import random import time import csv import sys import pandas as pd import matplotlib.pyplot as plt sys.setrecursionlimit(20000) def ll_insert(head, name, phone): current = head while current is not None: if current['name'] == name: current['phone'] = phone return head current = current['next'] new_node = {'name': name, 'phone': phone, 'next': None} if head is None: return new_node current = head while current['next'] is not None: current = current['next'] current['next'] = new_node return head def ll_find(head, name): current = head while current is not None: if current['name'] == name: return current['phone'] current = current['next'] return None def ll_delete(head, name): if head is None: return None if head['name'] == name: return head['next'] prev = head current = head['next'] while current is not None: if current['name'] == name: prev['next'] = current['next'] return head prev = current current = current['next'] return head def ll_list_all(head): records = [] current = head while current is not None: records.append((current['name'], current['phone'])) current = current['next'] records.sort(key=lambda x: x[0]) return records HASH_SIZE = 997 def hash_func(name, size): return hash(name) % size def ht_create(): return [None] * HASH_SIZE def ht_insert(table, name, phone): idx = hash_func(name, len(table)) table[idx] = ll_insert(table[idx], name, phone) return table def ht_find(table, name): idx = hash_func(name, len(table)) return ll_find(table[idx], name) def ht_delete(table, name): idx = hash_func(name, len(table)) table[idx] = ll_delete(table[idx], name) return table def ht_list_all(table): all_records = [] for head in table: current = head while current is not None: all_records.append((current['name'], current['phone'])) current = current['next'] all_records.sort(key=lambda x: x[0]) return all_records def bst_create_node(name, phone): return {'name': name, 'phone': phone, 'left': None, 'right': None} def bst_insert(root, name, phone): if root is None: return bst_create_node(name, phone) if name == root['name']: root['phone'] = phone elif name < root['name']: root['left'] = bst_insert(root['left'], name, phone) else: root['right'] = bst_insert(root['right'], name, phone) return root def bst_find(root, name): if root is None: return None if name == root['name']: return root['phone'] elif name < root['name']: return bst_find(root['left'], name) else: return bst_find(root['right'], name) def bst_find_min(node): while node['left'] is not None: node = node['left'] return node def bst_delete(root, name): if root is None: return None if name < root['name']: root['left'] = bst_delete(root['left'], name) elif name > root['name']: root['right'] = bst_delete(root['right'], name) else: if root['left'] is None: return root['right'] if root['right'] is None: return root['left'] min_node = bst_find_min(root['right']) root['name'] = min_node['name'] root['phone'] = min_node['phone'] root['right'] = bst_delete(root['right'], min_node['name']) return root def bst_list_all(root): result = [] def inorder(node): if node is None: return inorder(node['left']) result.append((node['name'], node['phone'])) inorder(node['right']) inorder(root) return result def generate_records(num_records, seed=42): random.seed(seed) records = [] for i in range(1, num_records + 1): name = f"User_{i:05d}" phone = f"{random.randint(100,999)}-{random.randint(1000,9999)}" records.append((name, phone)) return records def prepare_datasets(base_records): shuffled = base_records.copy() random.shuffle(shuffled) sorted_records = sorted(base_records, key=lambda x: x[0]) return shuffled, sorted_records def run_experiment_for_structure(struct_funcs, records, mode_name, repeats=5): results = [] for rep in range(repeats): ds = struct_funcs['create']() start = time.perf_counter() for name, phone in records: ds = struct_funcs['insert'](ds, name, phone) insert_time = time.perf_counter() - start existing_names = [rec[0] for rec in records] sample_existing = random.sample(existing_names, 100) nonexistent = [f"None_{i}" for i in range(10)] search_names = sample_existing + nonexistent random.shuffle(search_names) start = time.perf_counter() for name in search_names: _ = struct_funcs['find'](ds, name) find_time = time.perf_counter() - start to_delete = random.sample(existing_names, 50) start = time.perf_counter() for name in to_delete: ds = struct_funcs['delete'](ds, name) delete_time = time.perf_counter() - start results.append({ 'structure': struct_funcs['name'], 'mode': mode_name, 'repetition': rep + 1, 'insert_time': insert_time, 'find_time': find_time, 'delete_time': delete_time }) return results def main_experiment(): N = 10000 REPEATS = 5 print("Генерация тестовых данных...") base_records = generate_records(N) shuffled_records, sorted_records = prepare_datasets(base_records) print(f"Создано {N} записей. Случайный порядок и отсортированный готовы.") structures = { 'LinkedList': { 'name': 'LinkedList', 'create': lambda: None, 'insert': ll_insert, 'find': ll_find, 'delete': ll_delete }, 'HashTable': { 'name': 'HashTable', 'create': ht_create, 'insert': ht_insert, 'find': ht_find, 'delete': ht_delete }, 'BST': { 'name': 'BST', 'create': lambda: None, 'insert': bst_insert, 'find': bst_find, 'delete': bst_delete } } all_results = [] for struct_name, funcs in structures.items(): print(f"Тестирование {struct_name} на случайном порядке...") all_results.extend(run_experiment_for_structure(funcs, shuffled_records, 'random', REPEATS)) print(f"Тестирование {struct_name} на отсортированном порядке...") all_results.extend(run_experiment_for_structure(funcs, sorted_records, 'sorted', REPEATS)) csv_file = "experiment_results.csv" with open(csv_file, 'w', newline='', encoding='utf-8') as f: writer = csv.writer(f) writer.writerow(['Structure', 'Mode', 'Repeat', 'Insert (sec)', 'Search (sec)', 'Delete (sec)']) for rec in all_results: writer.writerow([ rec['structure'], rec['mode'], rec['repetition'], f"{rec['insert_time']:.6f}", f"{rec['find_time']:.6f}", f"{rec['delete_time']:.6f}" ]) print(f"Результаты сохранены в {csv_file}") plot_results(csv_file) def plot_results(csv_path): df = pd.read_csv(csv_path) mean_times = df.groupby(['Structure', 'Mode'])[['Insert (sec)', 'Search (sec)', 'Delete (sec)']].mean().reset_index() structures = mean_times['Structure'].unique() modes = mean_times['Mode'].unique() fig, axes = plt.subplots(1, 3, figsize=(15, 5)) operations = ['Insert (sec)', 'Search (sec)', 'Delete (sec)'] titles = ['Вставка', 'Поиск', 'Удаление'] for ax, op, title in zip(axes, operations, titles): x = range(len(structures)) width = 0.35 random_vals = [] sorted_vals = [] for s in structures: rand_row = mean_times[(mean_times['Structure'] == s) & (mean_times['Mode'] == 'random')] sort_row = mean_times[(mean_times['Structure'] == s) & (mean_times['Mode'] == 'sorted')] random_vals.append(rand_row[op].values[0] if not rand_row.empty else 0) sorted_vals.append(sort_row[op].values[0] if not sort_row.empty else 0) ax.bar([i - width/2 for i in x], random_vals, width, label='Случайный порядок') ax.bar([i + width/2 for i in x], sorted_vals, width, label='Отсортированный порядок') ax.set_xticks(x) ax.set_xticklabels(structures) ax.set_ylabel('Время (секунды)') ax.set_title(title) ax.legend() plt.tight_layout() plt.savefig('performance_comparison.png', dpi=150) plt.show() print("График сохранён как performance_comparison.png") if __name__ == "__main__": main_experiment()