- Complete transformer implementation from scratch - Training pipeline with gradient accumulation and mixed precision - Optimized inference with KV caching - Multi-format data processing (PDFs, images, code, text) - Comprehensive documentation - Apache 2.0 license - Example training plots included in docs/images/
210 lines
2.4 KiB
Plaintext
210 lines
2.4 KiB
Plaintext
# Byte-compiled / optimized / DLL files
|
|
__pycache__/
|
|
*.py[cod]
|
|
*$py.class
|
|
|
|
# C extensions
|
|
*.so
|
|
|
|
# Distribution / packaging
|
|
.Python
|
|
build/
|
|
develop-eggs/
|
|
dist/
|
|
downloads/
|
|
eggs/
|
|
.eggs/
|
|
lib/
|
|
lib64/
|
|
parts/
|
|
sdist/
|
|
var/
|
|
wheels/
|
|
share/python-wheels/
|
|
*.egg-info/
|
|
.installed.cfg
|
|
*.egg
|
|
MANIFEST
|
|
|
|
# PyInstaller
|
|
*.manifest
|
|
*.spec
|
|
|
|
# Installer logs
|
|
pip-log.txt
|
|
pip-delete-this-directory.txt
|
|
|
|
# Unit test / coverage reports
|
|
htmlcov/
|
|
.tox/
|
|
.nox/
|
|
.coverage
|
|
.coverage.*
|
|
.cache
|
|
nosetests.xml
|
|
coverage.xml
|
|
*.cover
|
|
*.py,cover
|
|
.hypothesis/
|
|
.pytest_cache/
|
|
cover/
|
|
|
|
# Translations
|
|
*.mo
|
|
*.pot
|
|
|
|
# Django stuff:
|
|
*.log
|
|
local_settings.py
|
|
db.sqlite3
|
|
db.sqlite3-journal
|
|
|
|
# Flask stuff:
|
|
instance/
|
|
.webassets-cache
|
|
|
|
# Scrapy stuff:
|
|
.scrapy
|
|
|
|
# Sphinx documentation
|
|
docs/_build/
|
|
|
|
# PyBuilder
|
|
.pybuilder/
|
|
target/
|
|
|
|
# Jupyter Notebook
|
|
.ipynb_checkpoints
|
|
|
|
# IPython
|
|
profile_default/
|
|
ipython_config.py
|
|
|
|
# pyenv
|
|
.python-version
|
|
|
|
# pipenv
|
|
Pipfile.lock
|
|
|
|
# poetry
|
|
poetry.lock
|
|
|
|
# pdm
|
|
.pdm.toml
|
|
.pdm-python
|
|
.pdm-build/
|
|
|
|
# PEP 582
|
|
__pypackages__/
|
|
|
|
# Celery stuff
|
|
celerybeat-schedule
|
|
celerybeat.pid
|
|
|
|
# SageMath parsed files
|
|
*.sage.py
|
|
|
|
# Environments
|
|
.env
|
|
.venv
|
|
env/
|
|
venv/
|
|
ENV/
|
|
env.bak/
|
|
venv.bak/
|
|
|
|
# Spyder project settings
|
|
.spyderproject
|
|
.spyproject
|
|
|
|
# Rope project settings
|
|
.ropeproject
|
|
|
|
# mkdocs documentation
|
|
/site
|
|
|
|
# mypy
|
|
.mypy_cache/
|
|
.dmypy.json
|
|
dmypy.json
|
|
|
|
# Pyre type checker
|
|
.pyre/
|
|
|
|
# pytype static type analyzer
|
|
.pytype/
|
|
|
|
# Cython debug symbols
|
|
cython_debug/
|
|
|
|
# PyCharm
|
|
.idea/
|
|
|
|
# VS Code
|
|
.vscode/
|
|
|
|
# Custom entries
|
|
.cursor
|
|
papers/
|
|
# Ignore data files but keep the data/ directory structure
|
|
data/*.txt
|
|
data/*.json
|
|
data/*.csv
|
|
data/*.db
|
|
data/*.sqlite
|
|
data/*.sqlite3
|
|
# But NOT data/__init__.py (needed for Python module)
|
|
!data/__init__.py
|
|
# Ignore storage symlinks
|
|
data_storage
|
|
checkpoints_storage
|
|
|
|
# OS-specific
|
|
.DS_Store
|
|
.DS_Store?
|
|
._*
|
|
.Spotlight-V100
|
|
.Trashes
|
|
ehthumbs.db
|
|
Thumbs.db
|
|
|
|
# Checkpoints (if you don't want to track them)
|
|
checkpoints/
|
|
checkpoints_test/
|
|
|
|
# Training artifacts (generated plots and other image outputs)
|
|
# Ignore all images except PNG/JPG/JPEG files under docs/images (SVG files are not re-included and stay ignored everywhere)
|
|
*.png
|
|
*.jpg
|
|
*.jpeg
|
|
*.svg
|
|
!docs/images/
|
|
!docs/images/**/*.png
|
|
!docs/images/**/*.jpg
|
|
!docs/images/**/*.jpeg
|
|
|
|
# Training outputs (exclude from root, but allow in docs/images)
|
|
/training_curve.png
|
|
/loss_by_epoch.png
|
|
training_logs/
|
|
*.log
|
|
|
|
# Model checkpoints and weights
|
|
*.pt
|
|
*.pth
|
|
*.ckpt
|
|
*.safetensors
|
|
|
|
# Training metrics
|
|
metrics.json
|
|
training_metrics.json
|
|
wandb/
|
|
tensorboard_logs/
|
|
|
|
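# Data (data/ is ignored wholesale here, superseding the data/*.ext patterns above; NOTE: Git cannot re-include data/__init__.py once its parent directory is excluded)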
|
|
data/
|
|
data_storage/
|
|
*.db
|
|
*.sqlite
|
|
*.sqlite3
|