.gitignore 7.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313
  1. # Configs and keys
  2. ch05/07_gpt_to_llama/config.json
  3. ch07/02_dataset-utilities/config.json
  4. ch07/03_model-evaluation/config.json
  5. # Graphics
  6. appendix-D/01_main-chapter-code/1.pdf
  7. appendix-D/01_main-chapter-code/2.pdf
  8. appendix-D/01_main-chapter-code/3.pdf
  9. appendix-E/01_main-chapter-code/loss-plot.pdf
  10. ch05/01_main-chapter-code/loss-plot.pdf
  11. ch05/01_main-chapter-code/temperature-plot.pdf
  12. ch05/01_main-chapter-code/the-verdict.txt
  13. ch06/01_main-chapter-code/loss-plot.pdf
  14. ch06/01_main-chapter-code/accuracy-plot.pdf
  15. ch07/01_main-chapter-code/loss-plot.pdf
  16. ch07/01_main-chapter-code/loss-plot-standalone.pdf
  17. ch07/01_main-chapter-code/loss-plot-baseline.pdf
  18. ch07/01_main-chapter-code/loss-plot-mask-instructions.pdf
  19. ch07/01_main-chapter-code/loss-plot-phi3-prompt.pdf
  20. ch07/01_main-chapter-code/loss-plot-alpaca52k.pdf
  21. # Checkpoint files
  22. appendix-A/01_main-chapter-code/model.pth
  23. appendix-E/01_main-chapter-code/gpt2
  24. ch05/01_main-chapter-code/gpt2/
  25. ch05/02_alternative_weight_loading/checkpoints
  26. ch05/02_alternative_weight_loading/*.safetensors
  27. ch05/01_main-chapter-code/model.pth
  28. ch05/01_main-chapter-code/model_and_optimizer.pth
  29. ch05/03_bonus_pretraining_on_gutenberg/model_checkpoints
  30. ch05/06_user_interface/gpt2
  31. ch05/07_gpt_to_llama/.cache
  32. ch05/07_gpt_to_llama/Llama-2-7b
  33. ch05/07_gpt_to_llama/Llama-2-7b-chat
  34. ch05/07_gpt_to_llama/Llama-3-8B
  35. ch05/07_gpt_to_llama/Llama-3-8B-Instruct
  36. ch05/07_gpt_to_llama/Llama-3.1-8B
  37. ch05/07_gpt_to_llama/Llama-3.1-8B-Instruct
  38. ch05/07_gpt_to_llama/Llama-3.2-1B
  39. ch05/07_gpt_to_llama/Llama-3.2-1B-Instruct
  40. ch05/07_gpt_to_llama/Llama-3.2-3B
  41. ch05/07_gpt_to_llama/Llama-3.2-3B-Instruct
  42. ch05/07_gpt_to_llama/llama3.2-1B-instruct.pth
  43. ch05/07_gpt_to_llama/tokenizer.model
  44. ch05/10_llm-training-speed/middlemarch.txt
  45. ch05/10_llm-training-speed/loss.pdf
  46. ch05/10_llm-training-speed/model.pth
  47. ch05/11_qwen3/Qwen3-0.6B
  48. ch05/11_qwen3/Qwen3-0.6B-Base
  49. ch05/11_qwen3/Qwen3-1.7B
  50. ch05/11_qwen3/Qwen3-1.7B-Base
  51. ch05/11_qwen3/Qwen3-4B
  52. ch05/11_qwen3/Qwen3-4B-Base
  53. ch05/11_qwen3/Qwen3-8B
  54. ch05/11_qwen3/Qwen3-8B-Base
  55. ch05/11_qwen3/Qwen3-32B
  56. ch05/11_qwen3/Qwen3-32B-Base
  57. ch06/01_main-chapter-code/gpt2
  58. ch06/02_bonus_additional-experiments/gpt2
  59. ch06/03_bonus_imdb-classification/gpt2
  60. ch07/01_main-chapter-code/gpt2-medium355M-sft-baseline.pth
  61. ch07/01_main-chapter-code/gpt2-medium355M-sft-mask-instructions.pth
  62. ch07/01_main-chapter-code/gpt2-medium355M-sft-phi3-prompt.pth
  63. ch07/01_main-chapter-code/gpt2-medium355M-sft-alpaca52k.pth
  64. ch07/01_main-chapter-code/gpt2-medium355M-sft-lora.pth
  65. ch07/01_main-chapter-code/gpt2-medium355M-sft.pth
  66. ch07/01_main-chapter-code/gpt2-medium355M-sft-standalone.pth
  67. ch07/01_main-chapter-code/Smalltestmodel-sft-standalone.pth
  68. ch07/01_main-chapter-code/gpt2/
  69. # Datasets
  70. the-verdict.txt
  71. appendix-E/01_main-chapter-code/sms_spam_collection.zip
  72. appendix-E/01_main-chapter-code/sms_spam_collection
  73. appendix-E/01_main-chapter-code/train.csv
  74. appendix-E/01_main-chapter-code/test.csv
  75. appendix-E/01_main-chapter-code/validation.csv
  76. ch02/01_main-chapter-code/number-data.txt
  77. ch02/05_bpe-from-scratch/the-verdict.txt
  78. ch05/03_bonus_pretraining_on_gutenberg/gutenberg
  79. ch05/03_bonus_pretraining_on_gutenberg/gutenberg_preprocessed
  80. ch06/01_main-chapter-code/sms_spam_collection.zip
  81. ch06/01_main-chapter-code/sms_spam_collection
  82. ch06/01_main-chapter-code/test.csv
  83. ch06/01_main-chapter-code/train.csv
  84. ch06/01_main-chapter-code/validation.csv
  85. ch06/01_main-chapter-code/review_classifier.pth
  86. ch06/02_bonus_additional-experiments/test.csv
  87. ch06/02_bonus_additional-experiments/train.csv
  88. ch06/02_bonus_additional-experiments/validation.csv
  89. ch06/02_bonus_additional-experiments/sms_spam_collection.zip
  90. ch06/02_bonus_additional-experiments/sms_spam_collection
  91. ch06/03_bonus_imdb-classification/aclImdb/
  92. ch06/03_bonus_imdb-classification/aclImdb_v1.tar.gz
  93. ch06/03_bonus_imdb-classification/test.csv
  94. ch06/03_bonus_imdb-classification/train.csv
  95. ch06/03_bonus_imdb-classification/validation.csv
  96. ch07/01_main-chapter-code/instruction-data-with-response-standalone.json
  97. ch07/01_main-chapter-code/instruction-data-with-response-baseline.json
  98. ch07/01_main-chapter-code/instruction-data-with-response-mask-instructions.json
  99. ch07/01_main-chapter-code/loss-plot-lora.pdf
  100. ch07/01_main-chapter-code/instruction-data-with-response-alpaca52k.json
  101. ch07/01_main-chapter-code/instruction-data-with-response-lora.json
  102. ch07/01_main-chapter-code/instruction-data-with-response-phi3-prompt.json
  103. ch07/02_dataset-utilities/instruction-examples-modified.json
  104. ch07/04_preference-tuning-with-dpo/gpt2-medium355M-sft.pth
  105. ch07/04_preference-tuning-with-dpo/loss-plot.pdf
  106. # Tokenizer files
  107. ch02/05_bpe-from-scratch/bpe_merges.txt
  108. ch02/05_bpe-from-scratch/encoder.json
  109. ch02/05_bpe-from-scratch/vocab.bpe
  110. ch02/05_bpe-from-scratch/vocab.json
  111. encoder.json
  112. vocab.bpe
  113. vocab.json
  114. # Other
  115. ch0?/0?_user_interface/.chainlit/
  116. ch0?/0?_user_interface/chainlit.md
  117. ch0?/0?_user_interface/.files
  118. *.lock
  119. # Temporary OS-related files
  120. .DS_Store
  121. # Byte-compiled / optimized / DLL files
  122. __pycache__/
  123. *.py[cod]
  124. *$py.class
  125. *.key
  126. solution/
  127. # C extensions
  128. *.so
  129. # Distribution / packaging
  130. .Python
  131. build/
  132. develop-eggs/
  133. dist/
  134. downloads/
  135. eggs/
  136. .eggs/
  137. lib/
  138. lib64/
  139. parts/
  140. sdist/
  141. var/
  142. wheels/
  143. share/python-wheels/
  144. *.egg-info/
  145. .installed.cfg
  146. *.egg
  147. MANIFEST
  148. # PyInstaller
  149. # Usually these files are written by a Python script from a template
  150. # before PyInstaller builds the exe, so as to inject date/other information into it.
  151. *.manifest
  152. *.spec
  153. # Installer logs
  154. pip-log.txt
  155. pip-delete-this-directory.txt
  156. # Unit test / coverage reports
  157. htmlcov/
  158. .tox/
  159. .nox/
  160. .coverage
  161. .coverage.*
  162. .cache
  163. nosetests.xml
  164. coverage.xml
  165. *.cover
  166. *.py,cover
  167. .hypothesis/
  168. .pytest_cache/
  169. cover/
  170. # Translations
  171. *.mo
  172. *.pot
  173. # Django stuff:
  174. *.log
  175. local_settings.py
  176. db.sqlite3
  177. db.sqlite3-journal
  178. # Flask stuff:
  179. instance/
  180. .webassets-cache
  181. # Scrapy stuff:
  182. .scrapy
  183. # Sphinx documentation
  184. docs/_build/
  185. # PyBuilder
  186. .pybuilder/
  187. target/
  188. # Jupyter Notebook
  189. .ipynb_checkpoints
  190. # IPython
  191. profile_default/
  192. ipython_config.py
  193. # pyenv
  194. # For a library or package, you might want to ignore these files since the code is
  195. # intended to run in multiple environments; otherwise, check them in:
  196. # .python-version
  197. # pipenv
  198. # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
  199. # However, when collaborating, if there are platform-specific dependencies or dependencies
  200. # without cross-platform support, pipenv may install dependencies that don't work, or may not
  201. # install all needed dependencies.
  202. #Pipfile.lock  (NOTE: already ignored by the `*.lock` pattern in the "# Other" section)
  203. # poetry
  204. # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
  205. # This is especially recommended for binary packages to ensure reproducibility, and is more
  206. # commonly ignored for libraries.
  207. # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
  208. #poetry.lock  (NOTE: already ignored by the `*.lock` pattern in the "# Other" section)
  209. # pdm
  210. # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
  211. #pdm.lock  (NOTE: already ignored by the `*.lock` pattern in the "# Other" section)
  212. # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
  213. # in version control.
  214. # https://pdm.fming.dev/#use-with-ide
  215. .pdm.toml
  216. # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
  217. __pypackages__/
  218. # Celery stuff
  219. celerybeat-schedule
  220. celerybeat.pid
  221. # SageMath parsed files
  222. *.sage.py
  223. # Environments
  224. .env
  225. .venv
  226. .python-version
  227. uv.lock
  228. pixi.lock
  229. env/
  230. venv/
  231. ENV/
  232. env.bak/
  233. venv.bak/
  234. # Spyder project settings
  235. .spyderproject
  236. .spyproject
  237. # Rope project settings
  238. .ropeproject
  239. # mkdocs documentation
  240. /site
  241. # mypy
  242. .mypy_cache/
  243. .dmypy.json
  244. dmypy.json
  245. # Pyre type checker
  246. .pyre/
  247. # pytype static type analyzer
  248. .pytype/
  249. # Cython debug symbols
  250. cython_debug/
  251. # PyCharm
  252. # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
  253. # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
  254. # and can be added to the global gitignore or merged into this file. For a more nuclear
  255. # option (not recommended) you can uncomment the following to ignore the entire .idea folder.
  256. #.idea/
  257. # vscode
  258. .vscode/
  259. # pixi environments
  260. .pixi
  261. *.egg-info