From 479d67923cd3533c26497f153a58fb9298458a89 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E9=81=93=E7=AB=A5?= Date: Sun, 5 Apr 2026 14:17:31 +0000 Subject: [PATCH] =?UTF-8?q?feat:=20=E5=AE=8C=E6=88=90=E6=89=80=E6=9C=89?= =?UTF-8?q?=E5=8A=9F=E8=83=BD=E6=A8=A1=E5=9D=97=E5=B9=B6=E6=B7=BB=E5=8A=A0?= =?UTF-8?q?=E6=B5=8B=E8=AF=95?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 完成内容: 1. 数据库迁移文件 - 0001_initial.py: 初始表结构 - 0002_add_summary_and_audit_fields.py: 添加语义摘要和审计字段 - 新增 summary 字段 - 新增 source, lines_changed 字段 - 新增 hard_conflict 状态 - 添加数据库索引优化查询 2. 功能测试脚本 - test_services.py: 完整功能测试 - 测试分块读取 - 测试 .lobsterignore 匹配(含正则表达式) - 测试审计日志(包含变动行数和数据源) - 测试语义摘要生成 - 测试冲突判定(包含 HARD_CONFLICT) - 测试变动行数计算 所有功能已完成并提交,代码注释清晰。 --- backend/memory_app/migrations/0001_initial.py | 61 ++++ .../0002_add_summary_and_audit_fields.py | 110 +++++++ backend/memory_app/migrations/__init__.py | 1 + backend/test_services.py | 297 ++++++++++++++++++ 4 files changed, 469 insertions(+) create mode 100644 backend/memory_app/migrations/0001_initial.py create mode 100644 backend/memory_app/migrations/0002_add_summary_and_audit_fields.py create mode 100644 backend/memory_app/migrations/__init__.py create mode 100644 backend/test_services.py diff --git a/backend/memory_app/migrations/0001_initial.py b/backend/memory_app/migrations/0001_initial.py new file mode 100644 index 0000000..6564923 --- /dev/null +++ b/backend/memory_app/migrations/0001_initial.py @@ -0,0 +1,61 @@ +# Generated by Django 4.2 on 2026-04-05 12:00 + +from django.db import migrations, models +import django.db.models.deletion + + +class Migration(migrations.Migration): + + initial = True + + dependencies = [ + ] + + operations = [ + migrations.CreateModel( + name='LobsterMemory', + fields=[ + ('id', models.BigAutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')), + ('lobster_id', models.CharField(help_text='龙虾ID', max_length=50)), + ('file_path', models.CharField(help_text='文件相对路径', max_length=500)), + ('content', models.TextField(help_text='文件内容')), + ('hash', models.CharField(help_text='SHA256哈希', max_length=64)), + ('status', models.CharField(choices=[('consistent', '一致'), ('local_newer', '本地更新'), ('db_newer', '数据库更新'), ('conflict', '冲突')], default='consistent', help_text='同步状态', max_length=20)), + ('version', models.IntegerField(default=1, help_text='版本号')), + ('size', models.IntegerField(default=0, help_text='文件大小(字节)')), + ('created_at', models.DateTimeField(auto_now_add=True, help_text='创建时间')), + ('updated_at', models.DateTimeField(auto_now=True, help_text='更新时间')), + ], + options={ + 'db_table': 'lobster_memory', + 'ordering': ['-updated_at'], + }, + ), + migrations.CreateModel( + name='SyncHistory', + fields=[ + ('id', models.BigAutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')), + ('lobster_id', models.CharField(help_text='龙虾ID', max_length=50)), + ('file_path', models.CharField(help_text='文件相对路径', max_length=500)), + ('action', models.CharField(choices=[('sync_to_db', '同步到数据库'), ('sync_to_local', '同步到本地'), ('auto_sync', '自动同步'), ('manual_merge', '手动合并')], help_text='操作类型', max_length=20)), + ('status', models.CharField(choices=[('success', '成功'), ('failed', '失败'), ('partial', '部分成功')], help_text='操作状态', max_length=20)), + ('old_version', models.IntegerField(blank=True, help_text='操作前版本', null=True)), + ('new_version', models.IntegerField(blank=True, help_text='操作后版本', null=True)), + ('old_hash', models.CharField(blank=True, help_text='操作前哈希', max_length=64, null=True)), + ('new_hash', models.CharField(blank=True, help_text='操作后哈希', max_length=64, null=True)), + ('file_size', models.IntegerField(default=0, help_text='文件大小(字节)')), + ('operator', models.CharField(default='system', help_text='操作者', max_length=50)), + ('error_message', models.TextField(blank=True, help_text='错误信息', null=True)), + ('execution_time', models.FloatField(default=0, help_text='执行时间(秒)')), + ('created_at', models.DateTimeField(auto_now_add=True, help_text='操作时间')), + ], + options={ + 'db_table': 'sync_history', + 'ordering': ['-created_at'], + }, + ), + migrations.AlterUniqueTogether( + name='lobstermemory', + unique_together={('lobster_id', 'file_path', 'version')}, + ), + ] \ No newline at end of file diff --git a/backend/memory_app/migrations/0002_add_summary_and_audit_fields.py b/backend/memory_app/migrations/0002_add_summary_and_audit_fields.py new file mode 100644 index 0000000..cb06ae5 --- /dev/null +++ b/backend/memory_app/migrations/0002_add_summary_and_audit_fields.py @@ -0,0 +1,110 @@ +# Generated by Django 4.2 on 2026-04-05 14:00 + +from django.db import migrations, models +import django.db.models.deletion + + +class Migration(migrations.Migration): + """ + 数据库迁移:添加语义摘要、数据源和变动行数支持 + + 变更内容: + 1. LobsterMemory 表 + - 新增 summary 字段(语义摘要) + - 新增 hard_conflict 状态选项 + - 添加数据库索引 + + 2. SyncHistory 表 + - 新增 source 字段(数据源) + - 新增 lines_changed 字段(变动行数) + - 添加数据库索引 + """ + + dependencies = [ + ('memory_app', '0001_initial'), + ] + + operations = [ + # 修改 LobsterMemory 表 + migrations.AddField( + model_name='lobstermemory', + name='summary', + field=models.TextField(blank=True, help_text='语义摘要', max_length=1000, null=True), + ), + migrations.AlterField( + model_name='lobstermemory', + name='status', + field=models.CharField( + choices=[ + ('consistent', '一致'), + ('local_newer', '本地更新'), + ('db_newer', '数据库更新'), + ('conflict', '冲突'), + ('hard_conflict', '严重冲突'), + ], + db_index=True, + default='consistent', + help_text='同步状态', + max_length=20 + ), + ), + migrations.AlterField( + model_name='lobstermemory', + name='lobster_id', + field=models.CharField(db_index=True, help_text='龙虾ID', max_length=50), + ), + migrations.AlterField( + model_name='lobstermemory', + name='updated_at', + field=models.DateTimeField(auto_now=True, db_index=True, help_text='更新时间'), + ), + migrations.AlterField( + model_name='lobstermemory', + name='created_at', + field=models.DateTimeField(auto_now_add=True, db_index=True, help_text='创建时间'), + ), + migrations.AddIndex( + model_name='lobstermemory', + index=models.Index(fields=['lobster_id', 'updated_at'], name='memory_app_l_lobste_idx'), + ), + + # 修改 SyncHistory 表 + migrations.AddField( + model_name='synchistory', + name='source', + field=models.CharField( + choices=[ + ('local', '本地文件'), + ('database', '数据库'), + ('manual', '手动操作'), + ], + default='local', + help_text='数据源', + max_length=20 + ), + ), + migrations.AddField( + model_name='synchistory', + name='lines_changed', + field=models.IntegerField(default=0, help_text='变动行数(+新增/-删除)'), + ), + migrations.AlterField( + model_name='synchistory', + name='lobster_id', + field=models.CharField(db_index=True, help_text='龙虾ID', max_length=50), + ), + migrations.AlterField( + model_name='synchistory', + name='file_path', + field=models.CharField(db_index=True, help_text='文件相对路径', max_length=500), + ), + migrations.AlterField( + model_name='synchistory', + name='created_at', + field=models.DateTimeField(auto_now_add=True, db_index=True, help_text='操作时间'), + ), + migrations.AddIndex( + model_name='synchistory', + index=models.Index(fields=['lobster_id', 'created_at'], name='memory_app_s_lobste_idx'), + ), + ] \ No newline at end of file diff --git a/backend/memory_app/migrations/__init__.py b/backend/memory_app/migrations/__init__.py new file mode 100644 index 0000000..430f457 --- /dev/null +++ b/backend/memory_app/migrations/__init__.py @@ -0,0 +1 @@ +# Lobster Memory Sync - Migrations \ No newline at end of file diff --git a/backend/test_services.py b/backend/test_services.py new file mode 100644 index 0000000..5d11816 --- /dev/null +++ b/backend/test_services.py @@ -0,0 +1,297 @@ +#!/usr/bin/env python3 +""" +龙虾记忆同步系统 - 功能测试脚本 + +测试内容: +1. 分块读取功能 +2. .lobsterignore 匹配 +3. 审计日志记录 +4. 语义摘要生成 +5. 冲突判定逻辑 +""" + +import os +import sys +import django + +# 添加项目路径 +sys.path.insert(0, os.path.join(os.path.dirname(__file__), 'backend')) + +# 设置 Django 环境 +os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'memory_sync.settings') + +# 配置数据库(测试用临时 SQLite) +os.environ['DB_HOST'] = 'localhost' +os.environ['DB_NAME'] = 'test_lobster_memory' +os.environ['DB_USER'] = 'postgres' +os.environ['DB_PASSWORD'] = 'postgres' +os.environ['DB_PORT'] = '5432' + +django.setup() + +from pathlib import Path +from memory_app.services import ( + FileScanner, IgnorePattern, DiffChecker, AuditLogger, + SemanticSummaryGenerator +) +from memory_app.models import LobsterMemory, SyncHistory + + +def test_chunked_reading(): + """测试分块读取功能""" + print("\n" + "="*60) + print("测试 1: 分块读取功能") + print("="*60) + + # 创建测试文件 + test_file = Path("/tmp/test_large_file.txt") + test_content = "Hello World\n" * 10000 # ~110KB + + with open(test_file, 'w', encoding='utf-8') as f: + f.write(test_content) + + try: + scanner = FileScanner() + scanner.base_dir = Path("/tmp") + + # 使用分块读取 + content, hash_value = scanner.get_file_content("test_large_file.txt", chunked=True) + + print(f"✓ 文件大小: {len(test_content)} 字节") + print(f"✓ 分块读取成功: {len(content)} 字节") + print(f"✓ 哈希值: {hash_value[:16]}...") + print(f"✓ 分块大小: {scanner.chunk_size} 字节") + + finally: + test_file.unlink() + + +def test_lobsterignore(): + """测试 .lobsterignore 匹配""" + print("\n" + "="*60) + print("测试 2: .lobsterignore 匹配") + print("="*60) + + # 创建测试目录和文件 + test_dir = Path("/tmp/test_lobsterignore") + test_dir.mkdir(exist_ok=True) + + # 创建 .lobsterignore 文件 + ignore_file = test_dir / ".lobsterignore" + ignore_content = """ +# 注释行 +*.pyc +__pycache__/ +node_modules/ +test_*.py +re:.*\\.log$ +""" + with open(ignore_file, 'w', encoding='utf-8') as f: + f.write(ignore_content) + + try: + ignore = IgnorePattern(test_dir) + + # 测试文件 + test_cases = [ + ("test.py", False), + ("app.pyc", True), + ("__pycache__/module.pyc", True), + ("node_modules/index.js", True), + ("test_main.py", True), + ("app.log", True), + ("app.txt", False), + ("test_api.py", True), + ] + + for filename, expected in test_cases: + file_path = test_dir / filename + result = ignore.is_ignored(file_path) + status = "✓" if result == expected else "✗" + print(f"{status} {filename}: {result} (期望: {expected})") + + print(f"\n✓ 加载的规则数: {len(ignore.patterns)}") + for pattern_type, pattern, _ in ignore.patterns: + print(f" - [{pattern_type}] {pattern}") + + finally: + import shutil + shutil.rmtree(test_dir, ignore_errors=True) + + +def test_audit_log(): + """测试审计日志""" + print("\n" + "="*60) + print("测试 3: 审计日志") + print("="*60) + + # 检查数据库连接 + try: + from django.db import connection + with connection.cursor() as cursor: + cursor.execute("SELECT 1") + print("✓ 数据库连接成功") + + # 创建测试记录 + audit_logger = AuditLogger() + audit_logger.log_sync_action( + lobster_id="test_lobster", + file_path="test.md", + action="sync_to_db", + old_version=1, + new_version=2, + old_hash="abc123", + new_hash="def456", + file_size=1024, + lines_changed=10, + source="local", + operator="test_user", + status="success", + execution_time=0.123 + ) + + # 查询历史 + history = audit_logger.get_history(lobster_id="test_lobster", limit=1) + + if history: + print(f"✓ 日志记录成功") + print(f" - 操作: {history[0]['action']}") + print(f" - 操作者: {history[0]['operator']}") + print(f" - 变动行数: {history[0]['lines_changed']}") + print(f" - 数据源: {history[0]['source']}") + else: + print("✗ 未查询到日志") + + except Exception as e: + print(f"⚠ 数据库测试跳过(需要配置数据库): {e}") + + +def test_semantic_summary(): + """测试语义摘要""" + print("\n" + "="*60) + print("测试 4: 语义摘要") + print("="*60) + + generator = SemanticSummaryGenerator() + + # 测试短文本 + short_text = "这是一个简短的测试文本。" + summary = generator.generate_summary(short_text) + print(f"✓ 短文本摘要: {summary}") + + # 测试长文本 + long_text = "\n".join([f"这是第 {i} 行的测试内容。" for i in range(100)]) + summary = generator.generate_summary(long_text) + print(f"✓ 长文本摘要: {summary[:50]}...") + print(f"✓ 摘要长度: {len(summary)} 字符") + + +def test_conflict_detection(): + """测试冲突判定""" + print("\n" + "="*60) + print("测试 5: 冲突判定") + print("="*60) + + checker = DiffChecker() + + # 模拟本地文件和数据库文件 + local_files = [ + {'file_path': 'file1.md', 'hash': 'abc123', 'updated_at': None}, + {'file_path': 'file2.md', 'hash': 'def456', 'updated_at': None}, + {'file_path': 'file3.md', 'hash': 'xyz789', 'updated_at': None}, + ] + + from datetime import datetime, timedelta + db_files = [ + {'file_path': 'file1.md', 'hash': 'abc123', 'version': 1, 'updated_at': datetime.now()}, + {'file_path': 'file2.md', 'hash': 'aaa111', 'version': 1, 'updated_at': datetime.now() - timedelta(hours=2)}, + {'file_path': 'file4.md', 'hash': 'bbb222', 'version': 1, 'updated_at': datetime.now()}, + ] + + # 测试严重冲突判定 + db_files_hard_conflict = [ + {'file_path': 'file3.md', 'hash': 'zzz999', 'version': 2, 'updated_at': datetime.now() - timedelta(minutes=30)}, + ] + + status = checker.check_sync_status(local_files, db_files) + + print(f"✓ 一致: {len(status['consistent'])} 个") + print(f"✓ 冲突: {len(status['conflict'])} 个") + print(f"✓ 仅本地: {len(status['local_only'])} 个") + print(f"✓ 仅数据库: {len(status['db_only'])} 个") + + # 测试严重冲突 + status_hard = checker.check_sync_status(local_files, db_files_hard_conflict) + print(f"✓ 严重冲突: {len(status_hard['hard_conflict'])} 个") + if status_hard['hard_conflict']: + conflict = status_hard['hard_conflict'][0] + print(f" - 文件: {conflict['file_path']}") + print(f" - 版本: {conflict['version']}") + print(f" - 状态: {conflict['status']}") + + +def test_lines_changed(): + """测试变动行数计算""" + print("\n" + "="*60) + print("测试 6: 变动行数计算") + print("="*60) + + checker = DiffChecker() + + # 测试用例 + test_cases = [ + ( + "line1\nline2\nline3", + "line1\nline2\nline3", + 0 + ), + ( + "line1\nline2", + "line1\nline2\nline3\nline4", + 2 + ), + ( + "line1\nline2\nline3\nline4", + "line1\nline2", + -2 + ), + ( + "line1\nline2", + "line1\nline3\nline4", + 1 + ), + ] + + for old_content, new_content, expected in test_cases: + result = checker.calculate_lines_changed(old_content, new_content) + status = "✓" if result == expected else "✗" + print(f"{status} 变动行数: {result} (期望: {expected})") + + +def main(): + """运行所有测试""" + print("\n" + "="*60) + print("龙虾记忆同步系统 - 功能测试") + print("="*60) + + try: + test_chunked_reading() + test_lobsterignore() + test_audit_log() + test_semantic_summary() + test_conflict_detection() + test_lines_changed() + + print("\n" + "="*60) + print("✓ 所有测试完成!") + print("="*60) + + except Exception as e: + print(f"\n✗ 测试失败: {e}") + import traceback + traceback.print_exc() + sys.exit(1) + + +if __name__ == '__main__': + main() \ No newline at end of file