2026-rff_mp/tseremonnikovaaa/task 1/docs/data/main.py

412 lines
14 KiB
Python
Raw Normal View History

2026-05-22 19:08:31 +00:00
import time
import random
import csv
import sys
import matplotlib.pyplot as plt
import numpy as np
sys.setrecursionlimit(20000)
REPEATS = 5
N = 10000
def ll_insert(head, name, phone):
current = head
prev = None
while current is not None:
if current['name'] == name:
current['phone'] = phone
return head
prev = current
current = current['next']
new_node = {'name': name, 'phone': phone, 'next': None}
if prev is None:
return new_node
else:
prev['next'] = new_node
return head
def ll_find(head, name):
current = head
while current is not None:
if current['name'] == name:
return current['phone']
current = current['next']
return None
def ll_delete(head, name):
if head is None:
return None
if head['name'] == name:
return head['next']
current = head
while current['next'] is not None:
if current['next']['name'] == name:
current['next'] = current['next']['next']
return head
current = current['next']
return head
def ll_collect_all(head):
records = []
current = head
while current is not None:
records.append((current['name'], current['phone']))
current = current['next']
records.sort(key=lambda x: x[0])
return records
2026-05-22 19:59:13 +00:00
def hash_function(name, size):
total = 0
for ch in name:
total = (total * 31 + ord(ch)) % size
return total
def ht_create(size=2000):
return [None] * size
def ht_insert(buckets, name, phone):
idx = hash_function(name, len(buckets))
buckets[idx] = ll_insert(buckets[idx], name, phone)
def ht_find(buckets, name):
idx = hash_function(name, len(buckets))
return ll_find(buckets[idx], name)
def ht_delete(buckets, name):
idx = hash_function(name, len(buckets))
buckets[idx] = ll_delete(buckets[idx], name)
def ht_collect_all(buckets):
all_records = []
for bucket in buckets:
current = bucket
while current is not None:
all_records.append((current['name'], current['phone']))
current = current['next']
all_records.sort(key=lambda x: x[0])
return all_records
def bst_insert(root, name, phone):
new_node = {'name': name, 'phone': phone, 'left': None, 'right': None}
if root is None:
return new_node
current = root
while True:
if name < current['name']:
if current['left'] is None:
current['left'] = new_node
break
current = current['left']
elif name > current['name']:
if current['right'] is None:
current['right'] = new_node
break
current = current['right']
else:
current['phone'] = phone
break
return root
def bst_find(root, name):
current = root
while current is not None:
if name < current['name']:
current = current['left']
elif name > current['name']:
current = current['right']
else:
return current['phone']
return None
def bst_find_min(node):
while node['left'] is not None:
node = node['left']
return node
def bst_delete(root, name):
parent = None
current = root
while current is not None and current['name'] != name:
parent = current
if name < current['name']:
current = current['left']
else:
current = current['right']
if current is None:
return root
if current['left'] is None and current['right'] is None:
if parent is None:
return None
if parent['left'] is current:
parent['left'] = None
else:
parent['right'] = None
return root
if current['left'] is None:
if parent is None:
return current['right']
if parent['left'] is current:
parent['left'] = current['right']
else:
parent['right'] = current['right']
return root
if current['right'] is None:
if parent is None:
return current['left']
if parent['left'] is current:
parent['left'] = current['left']
else:
parent['right'] = current['left']
return root
succ_parent = current
succ = current['right']
while succ['left'] is not None:
succ_parent = succ
succ = succ['left']
current['name'] = succ['name']
current['phone'] = succ['phone']
if succ_parent['left'] is succ:
succ_parent['left'] = succ['right']
else:
succ_parent['right'] = succ['right']
return root
def bst_inorder_collect(root, records=None):
if records is None:
records = []
if root is not None:
bst_inorder_collect(root['left'], records)
records.append((root['name'], root['phone']))
bst_inorder_collect(root['right'], records)
return records
def generate_records(N=10000):
records = []
for i in range(N):
name = f"User_{i:05d}"
phone = f"+7-999-{random.randint(1000000, 9999999)}"
records.append((name, phone))
return records
def measure_insertion(struct_type, records):
times = []
for _ in range(REPEATS):
if struct_type == 'll':
head = None
start = time.perf_counter()
for name, phone in records:
head = ll_insert(head, name, phone)
end = time.perf_counter()
elif struct_type == 'ht':
buckets = ht_create(2000)
start = time.perf_counter()
for name, phone in records:
ht_insert(buckets, name, phone)
end = time.perf_counter()
else:
root = None
start = time.perf_counter()
for name, phone in records:
root = bst_insert(root, name, phone)
end = time.perf_counter()
times.append(end - start)
return times
def build_structure(struct_type, records):
if struct_type == 'll':
head = None
for name, phone in records:
head = ll_insert(head, name, phone)
return head
elif struct_type == 'ht':
buckets = ht_create(2000)
for name, phone in records:
ht_insert(buckets, name, phone)
return buckets
else:
root = None
for name, phone in records:
root = bst_insert(root, name, phone)
return root
def measure_search(struct_type, structure, records):
times = []
N_records = len(records)
for _ in range(REPEATS):
indices = random.sample(range(N_records), 100)
existing_names = [records[i][0] for i in indices]
missing_names = [f"None_{i}" for i in range(10)]
search_names = existing_names + missing_names
random.shuffle(search_names)
start = time.perf_counter()
if struct_type == 'll':
for name in search_names:
ll_find(structure, name)
elif struct_type == 'ht':
for name in search_names:
ht_find(structure, name)
else:
for name in search_names:
bst_find(structure, name)
times.append(time.perf_counter() - start)
return times
def measure_deletion(struct_type, records):
times = []
N_records = len(records)
for _ in range(REPEATS):
indices = random.sample(range(N_records), 50)
delete_names = [records[i][0] for i in indices]
if struct_type == 'll':
head = None
for name, phone in records:
head = ll_insert(head, name, phone)
start = time.perf_counter()
for name in delete_names:
head = ll_delete(head, name)
end = time.perf_counter()
elif struct_type == 'ht':
buckets = ht_create(2000)
for name, phone in records:
ht_insert(buckets, name, phone)
start = time.perf_counter()
for name in delete_names:
ht_delete(buckets, name)
end = time.perf_counter()
else:
root = None
for name, phone in records:
root = bst_insert(root, name, phone)
start = time.perf_counter()
for name in delete_names:
root = bst_delete(root, name)
end = time.perf_counter()
times.append(end - start)
return times
def plot_bar_charts(insert_data, search_data, delete_data):
"""Построение столбчатых диаграмм"""
structures = ['ll', 'ht', 'bst']
labels = ['Связный список', 'Хеш-таблица', 'Двоичное дерево']
mode_labels = ['Случайный порядок', 'Отсортированный порядок']
colors = ['skyblue', 'salmon']
x = np.arange(len(structures))
width = 0.35
# График вставки
fig1, ax1 = plt.subplots(figsize=(10, 6))
means_sh = [sum(insert_data[s]['shuffled'])/len(insert_data[s]['shuffled']) for s in structures]
means_so = [sum(insert_data[s]['sorted'])/len(insert_data[s]['sorted']) for s in structures]
rects1 = ax1.bar(x - width/2, means_sh, width, label=mode_labels[0], color=colors[0])
rects2 = ax1.bar(x + width/2, means_so, width, label=mode_labels[1], color=colors[1])
ax1.set_ylabel('Время (секунды)')
ax1.set_title('Вставка всех записей (10000 шт.)')
ax1.set_xticks(x)
ax1.set_xticklabels(labels)
ax1.legend()
ax1.set_yscale('log')
for rect in rects1 + rects2:
h = rect.get_height()
ax1.annotate(f'{h:.4f}', xy=(rect.get_x() + rect.get_width()/2, h),
xytext=(0, 3), textcoords="offset points", ha='center', va='bottom', fontsize=8)
plt.tight_layout()
plt.savefig('insert_comparison.png', dpi=150)
plt.show()
print(" График вставки сохранён: insert_comparison.png")
# График поиска
fig2, ax2 = plt.subplots(figsize=(10, 6))
means_sh = [sum(search_data[s]['shuffled'])/len(search_data[s]['shuffled']) for s in structures]
means_so = [sum(search_data[s]['sorted'])/len(search_data[s]['sorted']) for s in structures]
rects1 = ax2.bar(x - width/2, means_sh, width, label=mode_labels[0], color=colors[0])
rects2 = ax2.bar(x + width/2, means_so, width, label=mode_labels[1], color=colors[1])
ax2.set_ylabel('Время (секунды)')
ax2.set_title('Поиск (100 существующих + 10 отсутствующих)')
ax2.set_xticks(x)
ax2.set_xticklabels(labels)
ax2.legend()
for rect in rects1 + rects2:
h = rect.get_height()
ax2.annotate(f'{h:.6f}', xy=(rect.get_x() + rect.get_width()/2, h),
xytext=(0, 3), textcoords="offset points", ha='center', va='bottom', fontsize=8)
plt.tight_layout()
plt.savefig('search_comparison.png', dpi=150)
plt.show()
print(" График поиска сохранён: search_comparison.png")
# График удаления
fig3, ax3 = plt.subplots(figsize=(10, 6))
means_sh = [sum(delete_data[s]['shuffled'])/len(delete_data[s]['shuffled']) for s in structures]
means_so = [sum(delete_data[s]['sorted'])/len(delete_data[s]['sorted']) for s in structures]
rects1 = ax3.bar(x - width/2, means_sh, width, label=mode_labels[0], color=colors[0])
rects2 = ax3.bar(x + width/2, means_so, width, label=mode_labels[1], color=colors[1])
ax3.set_ylabel('Время (секунды)')
ax3.set_title('Удаление 50 случайных записей')
ax3.set_xticks(x)
ax3.set_xticklabels(labels)
ax3.legend()
for rect in rects1 + rects2:
h = rect.get_height()
ax3.annotate(f'{h:.6f}', xy=(rect.get_x() + rect.get_width()/2, h),
xytext=(0, 3), textcoords="offset points", ha='center', va='bottom', fontsize=8)
plt.tight_layout()
plt.savefig('delete_comparison.png', dpi=150)
plt.show()
print(" График удаления сохранён: delete_comparison.png")
def plot_attempts_graphs(data, op_name, op_title):
"""Построение графиков по 5 попыткам"""
fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 5))
struct_config = [
('ll', 'Связный список', 'red', 'o'),
('ht', 'Хеш-таблица', 'green', 's'),
('bst', 'Двоичное дерево', 'blue', '^')
]
# Случайный порядок
for struct, label, color, marker in struct_config:
times = data[struct]['shuffled']
x = range(1, len(times) + 1)
ax1.plot(x, times, marker=marker, color=color, label=label,
linestyle='--', linewidth=1)
ax1.scatter(x, times, color=color, s=60, zorder=5)
ax1.set_xlabel('Номер попытки')
ax1.set_ylabel('Время (секунды)')
ax1.set_title(f'{op_title} случайный порядок')
ax1.legend()
ax1.grid(True, linestyle=':', alpha=0.7)
# Отсортированный порядок
for struct, label, color, marker in struct_config:
times = data[struct]['sorted']
x = range(1, len(times) + 1)
ax2.plot(x, times, marker=marker, color=color, label=label,
linestyle='--', linewidth=1)
ax2.scatter(x, times, color=color, s=60, zorder=5)
ax2.set_xlabel('Номер попытки')
ax2.set_ylabel('Время (секунды)')
ax2.set_title(f'{op_title} отсортированный порядок')
ax2.legend()
ax2.grid(True, linestyle=':', alpha=0.7)
plt.tight_layout()
plt.savefig(f'{op_name}_5attempts.png', dpi=150)
plt.show()
print(f" График {op_name}_5attempts.png сохранён")