.gitignore 6.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272
  1. # Configs and keys
  2. ch05/07_gpt_to_llama/config.json
  3. ch07/02_dataset-utilities/config.json
  4. ch07/03_model-evaluation/config.json
  5. # Graphics
  6. appendix-D/01_main-chapter-code/1.pdf
  7. appendix-D/01_main-chapter-code/2.pdf
  8. appendix-D/01_main-chapter-code/3.pdf
  9. appendix-E/01_main-chapter-code/loss-plot.pdf
  10. ch05/01_main-chapter-code/loss-plot.pdf
  11. ch05/01_main-chapter-code/temperature-plot.pdf
  12. ch05/01_main-chapter-code/the-verdict.txt
  13. ch06/01_main-chapter-code/loss-plot.pdf
  14. ch06/01_main-chapter-code/accuracy-plot.pdf
  15. ch07/01_main-chapter-code/loss-plot.pdf
  16. ch07/01_main-chapter-code/loss-plot-standalone.pdf
  17. ch07/01_main-chapter-code/loss-plot-baseline.pdf
  18. ch07/01_main-chapter-code/loss-plot-mask-instructions.pdf
  19. ch07/01_main-chapter-code/loss-plot-phi3-prompt.pdf
  20. ch07/01_main-chapter-code/loss-plot-alpaca52k.pdf
  21. # Checkpoint files
  22. appendix-A/01_main-chapter-code/model.pth
  23. appendix-E/01_main-chapter-code/gpt2
  24. ch05/01_main-chapter-code/gpt2/
  25. ch05/02_alternative_weight_loading/checkpoints
  26. ch05/01_main-chapter-code/model.pth
  27. ch05/01_main-chapter-code/model_and_optimizer.pth
  28. ch05/03_bonus_pretraining_on_gutenberg/model_checkpoints
  29. ch05/06_user_interface/gpt2
  30. ch05/07_gpt_to_llama/Llama-2-7b
  31. ch05/07_gpt_to_llama/Llama-2-7b-chat
  32. ch05/07_gpt_to_llama/.cache
  33. ch05/07_gpt_to_llama/llama3-files
  34. ch05/07_gpt_to_llama/llama31-files
  35. ch05/07_gpt_to_llama/llama32-files
  36. ch06/01_main-chapter-code/gpt2
  37. ch06/02_bonus_additional-experiments/gpt2
  38. ch06/03_bonus_imdb-classification/gpt2
  39. ch07/01_main-chapter-code/gpt2-medium355M-sft-baseline.pth
  40. ch07/01_main-chapter-code/gpt2-medium355M-sft-mask-instructions.pth
  41. ch07/01_main-chapter-code/gpt2-medium355M-sft-phi3-prompt.pth
  42. ch07/01_main-chapter-code/gpt2-medium355M-sft-alpaca52k.pth
  43. ch07/01_main-chapter-code/gpt2-medium355M-sft-lora.pth
  44. ch07/01_main-chapter-code/gpt2-medium355M-sft.pth
  45. ch07/01_main-chapter-code/gpt2-medium355M-sft-standalone.pth
  46. ch07/01_main-chapter-code/Smalltestmodel-sft-standalone.pth
  47. ch07/01_main-chapter-code/gpt2/
  48. # Datasets
  49. appendix-E/01_main-chapter-code/sms_spam_collection.zip
  50. appendix-E/01_main-chapter-code/sms_spam_collection
  51. appendix-E/01_main-chapter-code/train.csv
  52. appendix-E/01_main-chapter-code/test.csv
  53. appendix-E/01_main-chapter-code/validation.csv
  54. ch02/01_main-chapter-code/number-data.txt
  55. ch05/03_bonus_pretraining_on_gutenberg/gutenberg
  56. ch05/03_bonus_pretraining_on_gutenberg/gutenberg_preprocessed
  57. ch06/01_main-chapter-code/sms_spam_collection.zip
  58. ch06/01_main-chapter-code/sms_spam_collection
  59. ch06/01_main-chapter-code/test.csv
  60. ch06/01_main-chapter-code/train.csv
  61. ch06/01_main-chapter-code/validation.csv
  62. ch06/01_main-chapter-code/review_classifier.pth
  63. ch06/02_bonus_additional-experiments/test.csv
  64. ch06/02_bonus_additional-experiments/train.csv
  65. ch06/02_bonus_additional-experiments/validation.csv
  66. ch06/02_bonus_additional-experiments/sms_spam_collection.zip
  67. ch06/02_bonus_additional-experiments/sms_spam_collection
  68. ch06/03_bonus_imdb-classification/aclImdb/
  69. ch06/03_bonus_imdb-classification/aclImdb_v1.tar.gz
  70. ch06/03_bonus_imdb-classification/test.csv
  71. ch06/03_bonus_imdb-classification/train.csv
  72. ch06/03_bonus_imdb-classification/validation.csv
  73. ch07/01_main-chapter-code/instruction-data-with-response-standalone.json
  74. ch07/01_main-chapter-code/instruction-data-with-response-baseline.json
  75. ch07/01_main-chapter-code/instruction-data-with-response-mask-instructions.json
  76. ch07/01_main-chapter-code/loss-plot-lora.pdf
  77. ch07/01_main-chapter-code/instruction-data-with-response-alpaca52k.json
  78. ch07/01_main-chapter-code/instruction-data-with-response-lora.json
  79. ch07/01_main-chapter-code/instruction-data-with-response-phi3-prompt.json
  80. ch07/02_dataset-utilities/instruction-examples-modified.json
  81. ch07/04_preference-tuning-with-dpo/gpt2-medium355M-sft.pth
  82. ch07/04_preference-tuning-with-dpo/loss-plot.pdf
  83. # Other
  84. ch0?/0?_user_interface/.chainlit/
  85. ch0?/0?_user_interface/chainlit.md
  86. ch0?/0?_user_interface/.files
  87. *.lock
  88. # Temporary OS-related files
  89. .DS_Store
  90. # Byte-compiled / optimized / DLL files
  91. __pycache__/
  92. *.py[cod]
  93. *$py.class
  94. *.key
  95. solution/
  96. # C extensions
  97. *.so
  98. # Distribution / packaging
  99. .Python
  100. build/
  101. develop-eggs/
  102. dist/
  103. downloads/
  104. eggs/
  105. .eggs/
  106. lib/
  107. lib64/
  108. parts/
  109. sdist/
  110. var/
  111. wheels/
  112. share/python-wheels/
  113. *.egg-info/
  114. .installed.cfg
  115. *.egg
  116. MANIFEST
  117. # PyInstaller
  118. # Usually these files are written by a Python script from a template
  119. # before PyInstaller builds the exe, in order to inject the date and other information into it.
  120. *.manifest
  121. *.spec
  122. # Installer logs
  123. pip-log.txt
  124. pip-delete-this-directory.txt
  125. # Unit test / coverage reports
  126. htmlcov/
  127. .tox/
  128. .nox/
  129. .coverage
  130. .coverage.*
  131. .cache
  132. nosetests.xml
  133. coverage.xml
  134. *.cover
  135. *.py,cover
  136. .hypothesis/
  137. .pytest_cache/
  138. cover/
  139. # Translations
  140. *.mo
  141. *.pot
  142. # Django stuff:
  143. *.log
  144. local_settings.py
  145. db.sqlite3
  146. db.sqlite3-journal
  147. # Flask stuff:
  148. instance/
  149. .webassets-cache
  150. # Scrapy stuff:
  151. .scrapy
  152. # Sphinx documentation
  153. docs/_build/
  154. # PyBuilder
  155. .pybuilder/
  156. target/
  157. # Jupyter Notebook
  158. .ipynb_checkpoints
  159. # IPython
  160. profile_default/
  161. ipython_config.py
  162. # pyenv
  163. # For a library or package, you might want to ignore these files since the code is
  164. # intended to run in multiple environments; otherwise, check them in:
  165. # .python-version
  166. # pipenv
  167. # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
  168. # However, when collaborating on a project with platform-specific dependencies (or dependencies
  169. # without cross-platform support), pipenv may install dependencies that don't work, or fail to
  170. # install all needed dependencies. Note: the `*.lock` pattern above already ignores Pipfile.lock.
  171. #Pipfile.lock
  172. # poetry
  173. # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
  174. # This is especially recommended for binary packages to ensure reproducibility, and is more
  175. # commonly ignored for libraries.
  176. # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
  177. #poetry.lock
  178. # pdm
  179. # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
  180. #pdm.lock
  181. # pdm stores project-wide configuration in .pdm.toml, but it is recommended not to include it
  182. # in version control.
  183. # https://pdm.fming.dev/#use-with-ide
  184. .pdm.toml
  185. # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
  186. __pypackages__/
  187. # Celery stuff
  188. celerybeat-schedule
  189. celerybeat.pid
  190. # SageMath parsed files
  191. *.sage.py
  192. # Environments
  193. .env
  194. .venv
  195. env/
  196. venv/
  197. ENV/
  198. env.bak/
  199. venv.bak/
  200. # Spyder project settings
  201. .spyderproject
  202. .spyproject
  203. # Rope project settings
  204. .ropeproject
  205. # mkdocs documentation
  206. /site
  207. # mypy
  208. .mypy_cache/
  209. .dmypy.json
  210. dmypy.json
  211. # Pyre type checker
  212. .pyre/
  213. # pytype static type analyzer
  214. .pytype/
  215. # Cython debug symbols
  216. cython_debug/
  217. # PyCharm
  218. # A JetBrains-specific template is maintained in a separate JetBrains.gitignore that can
  219. # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
  220. # and can be added to the global gitignore or merged into this file. For a more nuclear
  221. # option (not recommended), you can uncomment the following to ignore the entire .idea folder.
  222. #.idea/
  223. # vscode
  224. .vscode/