commit
f94df248d0
7 changed files with 2729 additions and 0 deletions
@ -0,0 +1,221 @@ |
|||||||
|
# Byte-compiled / optimized / DLL files |
||||||
|
__pycache__/ |
||||||
|
*.py[cod] |
||||||
|
*$py.class |
||||||
|
|
||||||
|
# C extensions |
||||||
|
*.so |
||||||
|
|
||||||
|
# Distribution / packaging |
||||||
|
.Python |
||||||
|
build/ |
||||||
|
develop-eggs/ |
||||||
|
dist/ |
||||||
|
downloads/ |
||||||
|
eggs/ |
||||||
|
.eggs/ |
||||||
|
lib/ |
||||||
|
lib64/ |
||||||
|
parts/ |
||||||
|
sdist/ |
||||||
|
var/ |
||||||
|
wheels/ |
||||||
|
share/python-wheels/ |
||||||
|
*.egg-info/ |
||||||
|
.installed.cfg |
||||||
|
*.egg |
||||||
|
MANIFEST |
||||||
|
|
||||||
|
# PyInstaller |
||||||
|
# Usually these files are written by a python script from a template |
||||||
|
# before PyInstaller builds the exe, so as to inject date/other infos into it. |
||||||
|
*.manifest |
||||||
|
*.spec |
||||||
|
|
||||||
|
# Installer logs |
||||||
|
pip-log.txt |
||||||
|
pip-delete-this-directory.txt |
||||||
|
|
||||||
|
# Unit test / coverage reports |
||||||
|
htmlcov/ |
||||||
|
.tox/ |
||||||
|
.nox/ |
||||||
|
.coverage |
||||||
|
.coverage.* |
||||||
|
.cache |
||||||
|
nosetests.xml |
||||||
|
coverage.xml |
||||||
|
*.cover |
||||||
|
*.py,cover |
||||||
|
.hypothesis/ |
||||||
|
.pytest_cache/ |
||||||
|
cover/ |
||||||
|
|
||||||
|
# Translations |
||||||
|
*.mo |
||||||
|
*.pot |
||||||
|
|
||||||
|
# Django stuff: |
||||||
|
*.log |
||||||
|
local_settings.py |
||||||
|
db.sqlite3 |
||||||
|
db.sqlite3-journal |
||||||
|
|
||||||
|
# Flask stuff: |
||||||
|
instance/ |
||||||
|
.webassets-cache |
||||||
|
|
||||||
|
# Scrapy stuff: |
||||||
|
.scrapy |
||||||
|
|
||||||
|
# Sphinx documentation |
||||||
|
docs/_build/ |
||||||
|
|
||||||
|
# PyBuilder |
||||||
|
.pybuilder/ |
||||||
|
target/ |
||||||
|
|
||||||
|
# Jupyter Notebook |
||||||
|
.ipynb_checkpoints |
||||||
|
|
||||||
|
# IPython |
||||||
|
profile_default/ |
||||||
|
ipython_config.py |
||||||
|
|
||||||
|
# pyenv |
||||||
|
# For a library or package, you might want to ignore these files since the code is |
||||||
|
# intended to run in multiple environments; otherwise, check them in: |
||||||
|
# .python-version |
||||||
|
|
||||||
|
# pipenv |
||||||
|
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. |
||||||
|
# However, in case of collaboration, if having platform-specific dependencies or dependencies |
||||||
|
# having no cross-platform support, pipenv may install dependencies that don't work, or not |
||||||
|
# install all needed dependencies. |
||||||
|
#Pipfile.lock |
||||||
|
|
||||||
|
# poetry |
||||||
|
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. |
||||||
|
# This is especially recommended for binary packages to ensure reproducibility, and is more |
||||||
|
# commonly ignored for libraries. |
||||||
|
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control |
||||||
|
#poetry.lock |
||||||
|
|
||||||
|
# pdm |
||||||
|
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control. |
||||||
|
#pdm.lock |
||||||
|
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it |
||||||
|
# in version control. |
||||||
|
# https://pdm.fming.dev/#use-with-ide |
||||||
|
.pdm.toml |
||||||
|
|
||||||
|
# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm |
||||||
|
__pypackages__/ |
||||||
|
|
||||||
|
# Celery stuff |
||||||
|
celerybeat-schedule |
||||||
|
celerybeat.pid |
||||||
|
|
||||||
|
# SageMath parsed files |
||||||
|
*.sage.py |
||||||
|
|
||||||
|
# Environments |
||||||
|
.env |
||||||
|
.venv |
||||||
|
env/ |
||||||
|
venv/ |
||||||
|
ENV/ |
||||||
|
env.bak/ |
||||||
|
venv.bak/ |
||||||
|
|
||||||
|
# Spyder project settings |
||||||
|
.spyderproject |
||||||
|
.spyproject |
||||||
|
|
||||||
|
# Rope project settings |
||||||
|
.ropeproject |
||||||
|
|
||||||
|
# mkdocs documentation |
||||||
|
/site |
||||||
|
|
||||||
|
# mypy |
||||||
|
.mypy_cache/ |
||||||
|
.dmypy.json |
||||||
|
dmypy.json |
||||||
|
|
||||||
|
# Pyre type checker |
||||||
|
.pyre/ |
||||||
|
|
||||||
|
# pytype static type analyzer |
||||||
|
.pytype/ |
||||||
|
|
||||||
|
# Cython debug symbols |
||||||
|
cython_debug/ |
||||||
|
|
||||||
|
# PyCharm |
||||||
|
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can |
||||||
|
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore |
||||||
|
# and can be added to the global gitignore or merged into this file. For a more nuclear |
||||||
|
# option (not recommended) you can ignore the whole idea folder. |
||||||
|
.idea/ |
||||||
|
|
||||||
|
# VS Code |
||||||
|
.vscode/ |
||||||
|
*.code-workspace |
||||||
|
|
||||||
|
# Data files |
||||||
|
*.db |
||||||
|
*.sqlite |
||||||
|
*.sqlite3 |
||||||
|
|
||||||
|
# ChromaDB database |
||||||
|
chroma_db/ |
||||||
|
|
||||||
|
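# AI Models (NOTE: git cannot re-include a file whose parent directory is ignored, so `!models/.gitkeep` has no effect after `models/`; use `models/*` to keep .gitkeep tracked) |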
||||||
|
models/ |
||||||
|
!models/.gitkeep |
||||||
|
|
||||||
|
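# Downloaded data (NOTE: git cannot re-include a file whose parent directory is ignored, so `!data/.gitkeep` has no effect after `data/`; use `data/*` to keep .gitkeep tracked) |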
||||||
|
data/ |
||||||
|
!data/.gitkeep |
||||||
|
|
||||||
|
# Temporary files |
||||||
|
*.tmp |
||||||
|
*.temp |
||||||
|
*.log |
||||||
|
|
||||||
|
# OS generated files |
||||||
|
.DS_Store |
||||||
|
.DS_Store? |
||||||
|
._* |
||||||
|
.Spotlight-V100 |
||||||
|
.Trashes |
||||||
|
ehthumbs.db |
||||||
|
Thumbs.db |
||||||
|
|
||||||
|
# Windows |
||||||
|
*.lnk |
||||||
|
|
||||||
|
# Application specific |
||||||
|
# rag_corpus.json |
||||||
|
config.json |
||||||
|
|
||||||
|
# LLM cache and temporary files |
||||||
|
.cache/ |
||||||
|
*.gguf.tmp |
||||||
|
|
||||||
|
# Logs |
||||||
|
logs/ |
||||||
|
*.log |
||||||
|
|
||||||
|
# Backup files |
||||||
|
*.bak |
||||||
|
*.backup |
||||||
|
|
||||||
|
# Local configuration |
||||||
|
local_config.py |
||||||
|
settings_local.py |
||||||
|
|
||||||
|
# Large files (add any files larger than 100 MB here, if there are any) |
||||||
|
# *.largefile |
||||||
|
/scripts/ |
||||||
@ -0,0 +1,26 @@ |
|||||||
|
# Medical RAG System with YandexGPT |
||||||
|
|
||||||
|
Система для автоматического преобразования кратких медицинских записей в развернутые формулировки жалоб пациентов с использованием RAG (Retrieval-Augmented Generation) и модели YandexGPT. |
||||||
|
|
||||||
|
## 🚀 Особенности |
||||||
|
|
||||||
|
- **RAG-архитектура**: Поиск релевантных медицинских примеров из базы знаний |
||||||
|
- **Гибкое использование GPU**: Автоматическое определение и использование GPU для ускорения работы |
||||||
|
- **Управление токенами**: Интеллектуальное ограничение длины контекста |
||||||
|
- **Русскоязычная оптимизация**: Специально настроена для работы с медицинскими текстами на русском языке |
||||||
|
- **Хранение состояния**: Сохранение векторной базы данных между сессиями |
||||||
|
|
||||||
|
## 📋 Требования |
||||||
|
|
||||||
|
### Аппаратные требования |
||||||
|
- **Минимально**: CPU и 8+ GB оперативной памяти (RAM) |
||||||
|
- **Рекомендуется**: GPU с 8+ GB VRAM (NVIDIA) |
||||||
|
- **Диск**: 10+ GB свободного места |
||||||
|
|
||||||
|
### Программные требования |
||||||
|
- Python 3.8+ |
||||||
|
- PyTorch (с поддержкой CUDA при наличии GPU) |
||||||
|
- Библиотеки: `chromadb`, `llama-cpp-python`, `sentence-transformers`, `tiktoken` |
||||||
|
|
||||||
|
### Модель |
||||||
|
[YandexGPT-5-Lite-8B-instruct-Q4_K_M](https://huggingface.co/yandex/YandexGPT-5-Lite-8B-instruct-GGUF/resolve/main/YandexGPT-5-Lite-8B-instruct-Q4_K_M.gguf?download=true) |
||||||
@ -0,0 +1,6 @@ |
|||||||
|
torch>=2.0.0 |
||||||
|
chromadb>=0.4.0 |
||||||
|
llama-cpp-python>=0.2.0 |
||||||
|
sentence-transformers>=2.2.0 |
||||||
|
tiktoken>=0.4.0 |
||||||
|
numpy>=1.21.0 |
||||||
Loading…
Reference in new issue