feat: enhance summarization prompt and improve MongoDB test generation

- Updated summarization prompt to require Russian output and exclude non-textual elements
- Upgraded ollama dependency to v0.6.1
- Enhanced run.sh script to support both single record and file-based ID input for MongoDB test generation
- Updated documentation in scripts/README.md to reflect new functionality
- Added verbose flag to generate_summarization_from_mongo.py for better debugging

This commit message follows the conventional commit format with a short title (50-72 characters) and provides a clear description of the changes made and their purpose.
This commit is contained in:
2026-01-23 03:49:22 +03:00
parent d8785ada8a
commit 2048e4e40d
234 changed files with 3268 additions and 72 deletions

17
run.sh
View File

@@ -47,7 +47,18 @@ if [ -n "$1" ]; then
elif [[ "$1" == "gen-mongo" ]]; then
activate
echo "🔍 Генерирую тесты пересказов из MongoDB... "
python scripts/generate_summarization_from_mongo.py --record-id "$2"
if [[ -n "$2" ]] && [[ "$2" != "--id-file" ]]; then
# Старый формат: ./run.sh gen-mongo <record-id>
python scripts/generate_summarization_from_mongo.py --record-id "$2"
elif [[ -n "$2" ]] && [[ "$2" == "--id-file" ]]; then
# Новый формат: ./run.sh gen-mongo --id-file <file-path>
shift 2
python scripts/generate_summarization_from_mongo.py --id-file "$1"
else
echo "❌ Ошибка: Укажите либо --record-id, либо --id-file"
echo "Использование: ./run.sh gen-mongo <record-id> или ./run.sh gen-mongo --id-file <file-path>"
exit 1
fi
echo "✅ Тесты из MongoDB успешно сгенерированы"
fi
else
@@ -58,10 +69,12 @@ else
echo " * run - запуск бенчмарков (translation, summarization, codegen)"
echo " * clean - очистка отчетов"
echo " * gen - генерация тестов через Ollama (translation, summarization, codegen)"
echo " * gen-mongo - генерация тестов пересказов из MongoDB (использование: ./run.sh gen-mongo <record-id> [output-dir])"
echo " * gen-mongo - генерация тестов пересказов из MongoDB (использование: ./run.sh gen-mongo <record-id> или ./run.sh gen-mongo --id-file <file-path>)"
echo ""
echo "Примеры использования:"
echo " * ./run.sh run -m second_constantine/t-lite-it-1.0:7b -b translation summarization"
echo " * ./run.sh run -m second_constantine/t-lite-it-1.0:7b --num-ctx 16000"
echo " * ./run.sh gen"
echo " * ./run.sh gen-mongo 507f1f77bcf86cd799439011"
echo " * ./run.sh gen-mongo --id-file ids.txt"
fi