import time import random import csv import os import matplotlib.pyplot as plt import numpy as np import sys sys.setrecursionlimit(20000) # 1. LinkedList def ll_insert(head, name, phone): new_node = {'name': name, 'phone': phone, 'next': None} if head is None: return new_node if head['name'] == name: head['phone'] = phone return head current = head while current['next'] is not None: if current['next']['name'] == name: current['next']['phone'] = phone return head current = current['next'] current['next'] = new_node return head def ll_find(head, name): current = head while current is not None: if current['name'] == name: return current['phone'] current = current['next'] return None def ll_delete(head, name): if head is None: return None if head['name'] == name: return head['next'] current = head while current['next'] is not None: if current['next']['name'] == name: current['next'] = current['next']['next'] return head current = current['next'] return head def ll_list_all(head): records = [] current = head while current is not None: records.append((current['name'], current['phone'])) current = current['next'] records.sort(key=lambda x: x[0]) return records # 2. Hash Function def hash_function(name, table_size): return sum(ord(c) for c in name) % table_size def ht_create(size=1000): return [None] * size def ht_insert(buckets, name, phone): size = len(buckets) index = hash_function(name, size) buckets[index] = ll_insert(buckets[index], name, phone) def ht_find(buckets, name): size = len(buckets) index = hash_function(name, size) return ll_find(buckets[index], name) def ht_delete(buckets, name): size = len(buckets) index = hash_function(name, size) buckets[index] = ll_delete(buckets[index], name) def ht_list_all(buckets): records = [] for bucket in buckets: current = bucket while current is not None: records.append((current['name'], current['phone'])) current = current['next'] records.sort(key=lambda x: x[0]) return records #3. Tree function def bst_insert(root, name, phone): if root is None: return {'name': name, 'phone': phone, 'left': None, 'right': None} if name < root['name']: root['left'] = bst_insert(root['left'], name, phone) elif name > root['name']: root['right'] = bst_insert(root['right'], name, phone) else: root['phone'] = phone return root def bst_find(root, name): current = root while current is not None: if name == current['name']: return current['phone'] elif name < current['name']: current = current['left'] else: current = current['right'] return None def bst_find_min(node): current = node while current['left'] is not None: current = current['left'] return current def bst_delete(root, name): if root is None: return None if name < root['name']: root['left'] = bst_delete(root['left'], name) elif name > root['name']: root['right'] = bst_delete(root['right'], name) else: if root['left'] is None: return root['right'] elif root['right'] is None: return root['left'] min_node = bst_find_min(root['right']) root['name'] = min_node['name'] root['phone'] = min_node['phone'] root['right'] = bst_delete(root['right'], min_node['name']) return root def bst_list_all(root): records = [] def inorder_traversal(node): if node is not None: inorder_traversal(node['left']) records.append((node['name'], node['phone'])) inorder_traversal(node['right']) inorder_traversal(root) return records #EXPERIMENTAL PART # 1. Test data generation def generate_records(count=10000): records = [] for i in range(count): name = f"User_{i:05d}" phone = f"+7-{random.randint(100,999)}-{random.randint(100,999)}-{random.randint(1000,9999)}" records.append((name, phone)) shuffled = records.copy() random.shuffle(shuffled) sorted_records = sorted(records, key=lambda x: x[0]) return shuffled, sorted_records # 2. Timing def measure_insertion(structure_name, records): times = [] filled_structure = None for run in range(5): if structure_name == "linked_list": structure = None elif structure_name == "hash_table": structure = ht_create(1000) elif structure_name == "bst": structure = None start = time.perf_counter() for name, phone in records: if structure_name == "linked_list": structure = ll_insert(structure, name, phone) elif structure_name == "hash_table": ht_insert(structure, name, phone) elif structure_name == "bst": structure = bst_insert(structure, name, phone) end = time.perf_counter() times.append(end - start) if run == 4: filled_structure = structure return times, filled_structure def measure_search(structure_name, structure, search_names): times = [] for run in range(5): start = time.perf_counter() for name in search_names: if structure_name == "linked_list": ll_find(structure, name) elif structure_name == "hash_table": ht_find(structure, name) elif structure_name == "bst": bst_find(structure, name) end = time.perf_counter() times.append(end - start) return times def measure_deletion(structure_name, original_structure, delete_names): times = [] for run in range(5): if structure_name == "linked_list": all_records = ll_list_all(original_structure) test_structure = None for name, phone in all_records: test_structure = ll_insert(test_structure, name, phone) elif structure_name == "hash_table": all_records = ht_list_all(original_structure) test_structure = ht_create(1000) for name, phone in all_records: ht_insert(test_structure, name, phone) elif structure_name == "bst": all_records = bst_list_all(original_structure) test_structure = None for name, phone in all_records: test_structure = bst_insert(test_structure, name, phone) start = time.perf_counter() for name in delete_names: if structure_name == "linked_list": test_structure = ll_delete(test_structure, name) elif structure_name == "hash_table": ht_delete(test_structure, name) elif structure_name == "bst": test_structure = bst_delete(test_structure, name) end = time.perf_counter() times.append(end - start) return times # 3. Launch and save results def run_experiment(): current_dir = os.path.dirname(__file__) docs_dir = os.path.dirname(current_dir) csv_file = os.path.join(docs_dir, "experiment_results.csv") print("=" * 70) print("ЭКСПЕРИМЕНТАЛЬНОЕ СРАВНЕНИЕ СТРУКТУР ДАННЫХ") print("Телефонный справочник - 10000 записей") print("=" * 70) print(f"\n📁 Результаты будут сохранены в: {csv_file}") print("\n1. Генерация тестовых данных...") shuffled_records, sorted_records = generate_records(10000) print(f" Сгенерировано 10000 записей") existing_names = [shuffled_records[i][0] for i in random.sample(range(10000), 100)] nonexisting_names = [f"NotExist_{i}" for i in range(10)] search_names = existing_names + nonexisting_names delete_names = [shuffled_records[i][0] for i in random.sample(range(10000), 50)] results = [["Структура", "Режим", "Операция", "Замер1(с)", "Замер2(с)", "Замер3(с)", "Замер4(с)", "Замер5(с)", "Среднее(с)"]] for mode_name, records in [("случайный", shuffled_records), ("отсортированный", sorted_records)]: print(f"\n2. Тестирование режима: {mode_name}") print("-" * 50) for struct_name in ["linked_list", "hash_table", "bst"]: print(f"\n {struct_name.upper()}:") print(" Вставка 10000 записей...") insert_times, filled_struct = measure_insertion(struct_name, records) avg_insert = sum(insert_times) / 5 print(f" Время: {avg_insert:.4f} сек (среднее)") print(" Поиск 110 записей...") search_times = measure_search(struct_name, filled_struct, search_names) avg_search = sum(search_times) / 5 print(f" Время: {avg_search:.4f} сек (среднее)") print(" Удаление 50 записей...") delete_times = measure_deletion(struct_name, filled_struct, delete_names) avg_delete = sum(delete_times) / 5 print(f" Время: {avg_delete:.4f} сек (среднее)") results.append([struct_name, mode_name, "вставка"] + insert_times + [avg_insert]) results.append([struct_name, mode_name, "поиск"] + search_times + [avg_search]) results.append([struct_name, mode_name, "удаление"] + delete_times + [avg_delete]) print("\n3. Сохранение результатов...") with open(csv_file, "w", newline="", encoding="utf-8") as f: writer = csv.writer(f) writer.writerows(results) print(f" ✅ Результаты сохранены в: {csv_file}") print("\n" + "=" * 70) print("СВОДНАЯ ТАБЛИЦА РЕЗУЛЬТАТОВ") print("=" * 70) print(f"{'Структура':<15} {'Режим':<12} {'Операция':<10} {'Среднее время (сек)':<20}") print("-" * 70) for row in results[1:]: struct, mode, op, t1, t2, t3, t4, t5, avg = row print(f"{struct:<15} {mode:<12} {op:<10} {avg:<20.6f}") return results, docs_dir # 4. Graphics def create_graphs(results, docs_dir): print("\n4. Построение графиков...") data = {} for row in results[1:]: struct = row[0] mode = row[1] op = row[2] avg = row[8] if struct not in data: data[struct] = {} if mode not in data[struct]: data[struct][mode] = {} data[struct][mode][op] = avg struct_labels = { 'linked_list': 'LinkedList', 'hash_table': 'HashTable', 'bst': 'BST' } colors = { 'linked_list': '#3498db', 'hash_table': '#2ecc71', 'bst': '#e74c3c' } fig, axes = plt.subplots(1, 3, figsize=(15, 6)) fig.suptitle('Сравнение производительности структур данных', fontsize=16, fontweight='bold') operations = ['вставка', 'поиск', 'удаление'] operation_titles = ['Вставка\n(10000 записей)', 'Поиск\n(110 запросов)', 'Удаление\n(50 записей)'] modes = ['случайный', 'отсортированный'] mode_labels = ['Случайный', 'Отсортированный'] for idx, (op, op_title) in enumerate(zip(operations, operation_titles)): ax = axes[idx] # Позиции для групп столбцов x = np.arange(len(modes)) # [0, 1] width = 0.25 # ширина одного столбца multiplier = 0 for struct in ['linked_list', 'hash_table', 'bst']: values = [data[struct][mode][op] for mode in modes] offset = width * multiplier bars = ax.bar(x + offset, values, width, label=struct_labels[struct], color=colors[struct], edgecolor='black', linewidth=0.5) for bar, val in zip(bars, values): if val < 0.01: ax.text(bar.get_x() + bar.get_width()/2, bar.get_height() + val*0.05, f'{val:.5f}', ha='center', va='bottom', fontsize=8, rotation=0) else: ax.text(bar.get_x() + bar.get_width()/2, bar.get_height() + val*0.02, f'{val:.4f}', ha='center', va='bottom', fontsize=8, rotation=0) multiplier += 1 ax.set_title(op_title, fontsize=12, fontweight='bold') ax.set_ylabel('Время (секунды)', fontsize=10) ax.set_xlabel('Режим данных', fontsize=10) ax.set_xticks(x + width) ax.set_xticklabels(mode_labels) ax.legend(loc='upper left', fontsize=8) ax.grid(True, alpha=0.3, axis='y') all_values = [data[s][m][op] for s in ['linked_list', 'hash_table', 'bst'] for m in modes] if max(all_values) / min(all_values) > 100: ax.set_yscale('log') ax.set_ylabel('Время (секунды) - логарифмическая шкала', fontsize=9) plt.tight_layout() graph_path = os.path.join(docs_dir, "performance_graphs.png") plt.savefig(graph_path, dpi=150, bbox_inches='tight') plt.close() print(f" ✅ Графики сохранены в: {graph_path}") return graph_path # 5. Main program if __name__ == "__main__": results, docs_dir = run_experiment() try: graph_file = create_graphs(results, docs_dir) print("\n" + "=" * 70) print("ЭКСПЕРИМЕНТ ЗАВЕРШЕН УСПЕШНО!") print("=" * 70) print("\n📂 СОЗДАННЫЕ ФАЙЛЫ:") print(f" 📊 Данные: {os.path.join(docs_dir, 'experiment_results.csv')}") print(f" 📈 Графики: {graph_file}") except Exception as e: print(f"\n⚠️ Ошибка при построении графиков: {e}") print(" Убедитесь, что установлен matplotlib: pip install matplotlib") print("\n" + "=" * 70) print("ЭКСПЕРИМЕНТ ЗАВЕРШЕН (без графиков)") print("=" * 70) print(f"\n📂 CSV файл сохранен: {os.path.join(docs_dir, 'experiment_results.csv')}")