ke-lly committed on
Commit
9835443
·
verified ·
1 Parent(s): 920d3d4

Training in progress, step 100

Browse files
Files changed (45) hide show
  1. adapter_config.json +33 -0
  2. adapter_model.safetensors +3 -0
  3. model.safetensors +1 -1
  4. runs/May23_09-17-27_gh008.hpc.nyu.edu/events.out.tfevents.1716470269.gh008.hpc.nyu.edu.1680318.0 +3 -0
  5. runs/May23_09-19-42_gh008.hpc.nyu.edu/events.out.tfevents.1716470404.gh008.hpc.nyu.edu.1680790.0 +3 -0
  6. runs/May23_09-21-20_gh008.hpc.nyu.edu/events.out.tfevents.1716470501.gh008.hpc.nyu.edu.1681292.0 +3 -0
  7. runs/May23_09-24-04_gh008.hpc.nyu.edu/events.out.tfevents.1716470666.gh008.hpc.nyu.edu.1681849.0 +3 -0
  8. runs/May23_09-42-15_gh008.hpc.nyu.edu/events.out.tfevents.1716471757.gh008.hpc.nyu.edu.1684717.0 +3 -0
  9. runs/May23_09-45-00_gh008.hpc.nyu.edu/events.out.tfevents.1716471922.gh008.hpc.nyu.edu.1685271.0 +3 -0
  10. runs/May23_09-50-20_gh008.hpc.nyu.edu/events.out.tfevents.1716472243.gh008.hpc.nyu.edu.1686093.0 +3 -0
  11. runs/May23_09-55-05_gh008.hpc.nyu.edu/events.out.tfevents.1716472528.gh008.hpc.nyu.edu.1687153.0 +3 -0
  12. runs/May23_10-00-21_gh008.hpc.nyu.edu/events.out.tfevents.1716472845.gh008.hpc.nyu.edu.1688009.0 +3 -0
  13. runs/May23_10-03-05_gh008.hpc.nyu.edu/events.out.tfevents.1716473005.gh008.hpc.nyu.edu.1688429.0 +3 -0
  14. runs/May23_10-03-08_ga040.hpc.nyu.edu/events.out.tfevents.1716473032.ga040.hpc.nyu.edu.911113.0 +3 -0
  15. runs/May23_10-08-13_gh008.hpc.nyu.edu/events.out.tfevents.1716473318.gh008.hpc.nyu.edu.1689599.0 +3 -0
  16. runs/May23_10-11-54_gh008.hpc.nyu.edu/events.out.tfevents.1716473537.gh008.hpc.nyu.edu.1690278.0 +3 -0
  17. runs/May23_10-15-06_gh008.hpc.nyu.edu/events.out.tfevents.1716473728.gh008.hpc.nyu.edu.1690907.0 +3 -0
  18. runs/May23_10-15-07_ga040.hpc.nyu.edu/events.out.tfevents.1716473745.ga040.hpc.nyu.edu.912882.0 +3 -0
  19. runs/May23_10-19-38_gh008.hpc.nyu.edu/events.out.tfevents.1716474002.gh008.hpc.nyu.edu.1691542.0 +3 -0
  20. runs/May23_10-24-33_gh008.hpc.nyu.edu/events.out.tfevents.1716474297.gh008.hpc.nyu.edu.1692311.0 +3 -0
  21. runs/May23_10-26-15_gh008.hpc.nyu.edu/events.out.tfevents.1716474398.gh008.hpc.nyu.edu.1692767.0 +3 -0
  22. runs/May23_10-26-16_ga040.hpc.nyu.edu/events.out.tfevents.1716474410.ga040.hpc.nyu.edu.915002.0 +3 -0
  23. runs/May23_10-29-12_gh008.hpc.nyu.edu/events.out.tfevents.1716474573.gh008.hpc.nyu.edu.1693185.0 +3 -0
  24. runs/May23_10-29-15_ga040.hpc.nyu.edu/events.out.tfevents.1716474585.ga040.hpc.nyu.edu.915764.0 +3 -0
  25. runs/May23_10-30-18_gh008.hpc.nyu.edu/events.out.tfevents.1716474643.gh008.hpc.nyu.edu.1693628.0 +3 -0
  26. runs/May23_10-32-06_ga040.hpc.nyu.edu/events.out.tfevents.1716474780.ga040.hpc.nyu.edu.916354.0 +3 -0
  27. runs/May23_10-34-15_gh008.hpc.nyu.edu/events.out.tfevents.1716475026.gh008.hpc.nyu.edu.1694553.0 +3 -0
  28. runs/May23_10-42-55_gh008.hpc.nyu.edu/events.out.tfevents.1716475421.gh008.hpc.nyu.edu.1696638.0 +3 -0
  29. runs/May23_10-45-21_gh008.hpc.nyu.edu/events.out.tfevents.1716475555.gh008.hpc.nyu.edu.1697347.0 +3 -0
  30. runs/May23_10-47-47_gh008.hpc.nyu.edu/events.out.tfevents.1716475850.gh008.hpc.nyu.edu.1698022.0 +3 -0
  31. runs/May23_10-52-12_gh008.hpc.nyu.edu/events.out.tfevents.1716476110.gh008.hpc.nyu.edu.1699180.0 +3 -0
  32. runs/May23_10-57-49_gh008.hpc.nyu.edu/events.out.tfevents.1716476333.gh008.hpc.nyu.edu.1700547.0 +3 -0
  33. runs/May23_11-04-50_gh008.hpc.nyu.edu/events.out.tfevents.1716476713.gh008.hpc.nyu.edu.1702280.0 +3 -0
  34. runs/May23_11-16-35_gh008.hpc.nyu.edu/events.out.tfevents.1716477418.gh008.hpc.nyu.edu.1706663.0 +3 -0
  35. runs/May23_11-21-39_gh008.hpc.nyu.edu/events.out.tfevents.1716477726.gh008.hpc.nyu.edu.1707933.0 +3 -0
  36. runs/May23_11-51-20_gh008.hpc.nyu.edu/events.out.tfevents.1716479506.gh008.hpc.nyu.edu.1714812.0 +3 -0
  37. runs/May23_13-33-24_gh008.hpc.nyu.edu/events.out.tfevents.1716485629.gh008.hpc.nyu.edu.1738478.0 +3 -0
  38. runs/May23_13-34-53_gh008.hpc.nyu.edu/events.out.tfevents.1716485719.gh008.hpc.nyu.edu.1738985.0 +3 -0
  39. runs/May23_13-46-07_gh008.hpc.nyu.edu/events.out.tfevents.1716486477.gh008.hpc.nyu.edu.1741687.0 +3 -0
  40. runs/May23_16-45-36_ga009.hpc.nyu.edu/events.out.tfevents.1716497438.ga009.hpc.nyu.edu.1538748.0 +3 -0
  41. special_tokens_map.json +21 -3
  42. tokenizer.json +0 -0
  43. tokenizer.model +3 -0
  44. tokenizer_config.json +32 -10
  45. training_args.bin +1 -1
adapter_config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "meta-llama/Llama-2-7b-chat-hf",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layers_pattern": null,
10
+ "layers_to_transform": null,
11
+ "loftq_config": {},
12
+ "lora_alpha": 32,
13
+ "lora_dropout": 0.05,
14
+ "megatron_config": null,
15
+ "megatron_core": "megatron.core",
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 16,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "q_proj",
23
+ "up_proj",
24
+ "k_proj",
25
+ "o_proj",
26
+ "gate_proj",
27
+ "down_proj",
28
+ "v_proj"
29
+ ],
30
+ "task_type": "CAUSAL_LM",
31
+ "use_dora": false,
32
+ "use_rslora": false
33
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31bda5918cdcd2694c0aa40bc33e4a639322ebcf39c29e9d7591662de8cf52eb
3
+ size 159967880
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df9763f0f2c61358cfdc3fd03d0d89bae99c3d79bca45d5276390e7b02d88d7e
3
  size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:445b6306bda265a64ed6d8a9b46e6aa929d3592601705f32909f6a6e3031865d
3
  size 497774208
runs/May23_09-17-27_gh008.hpc.nyu.edu/events.out.tfevents.1716470269.gh008.hpc.nyu.edu.1680318.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18ec2c2db78a13a4568d22c9ed4ea388cb4fe8bc9b51d211535f1b70ac0e82c9
3
+ size 4484
runs/May23_09-19-42_gh008.hpc.nyu.edu/events.out.tfevents.1716470404.gh008.hpc.nyu.edu.1680790.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:face84397a4b1f5e5e84939b28d2c841dda66211a5ea50892b5d0c2c79d6eb4a
3
+ size 4484
runs/May23_09-21-20_gh008.hpc.nyu.edu/events.out.tfevents.1716470501.gh008.hpc.nyu.edu.1681292.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb72c6c8867a5ff9bcc6de636721aa6d2ddf7bb8bde155315910378c13a5eec7
3
+ size 4484
runs/May23_09-24-04_gh008.hpc.nyu.edu/events.out.tfevents.1716470666.gh008.hpc.nyu.edu.1681849.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8795879268313a37e7e1f231dda96c2447c76b7382208b68e88398f804854be6
3
+ size 4484
runs/May23_09-42-15_gh008.hpc.nyu.edu/events.out.tfevents.1716471757.gh008.hpc.nyu.edu.1684717.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79b929c2b7c56e906434fed1b73dac2e30ccd2a740723acacfed02d91bddac88
3
+ size 4484
runs/May23_09-45-00_gh008.hpc.nyu.edu/events.out.tfevents.1716471922.gh008.hpc.nyu.edu.1685271.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b40bf4803f7a8e25260555a9978564ad5899232040a5f2649790754409c5202
3
+ size 4484
runs/May23_09-50-20_gh008.hpc.nyu.edu/events.out.tfevents.1716472243.gh008.hpc.nyu.edu.1686093.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aaac4bb3dcd7a9ec067569ff4077ddfd8a6507bdcfdb19ce534403bbc87bcf3
3
+ size 4484
runs/May23_09-55-05_gh008.hpc.nyu.edu/events.out.tfevents.1716472528.gh008.hpc.nyu.edu.1687153.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff1e1b55addf81394800071a1a45be8cd06a50757f9b2b434de78f2532874cd0
3
+ size 4484
runs/May23_10-00-21_gh008.hpc.nyu.edu/events.out.tfevents.1716472845.gh008.hpc.nyu.edu.1688009.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86365f0c3a9d46983d1c60c451466af73eb0f76e274afbaa022656a37346a3bd
3
+ size 4483
runs/May23_10-03-05_gh008.hpc.nyu.edu/events.out.tfevents.1716473005.gh008.hpc.nyu.edu.1688429.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c9a5ae38baa4ea56688ba1c86ad7f598feb2a033dab914dabf850cf9bc5105c
3
+ size 4483
runs/May23_10-03-08_ga040.hpc.nyu.edu/events.out.tfevents.1716473032.ga040.hpc.nyu.edu.911113.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc3423224948a50579c9c7864f6d97e9c229494106a3eee06841dea146c21b46
3
+ size 4483
runs/May23_10-08-13_gh008.hpc.nyu.edu/events.out.tfevents.1716473318.gh008.hpc.nyu.edu.1689599.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88882e622ab6bc1ad92f66b7a3a93b7df678fb4bf5164d37d0b9c5f88c32b9db
3
+ size 4483
runs/May23_10-11-54_gh008.hpc.nyu.edu/events.out.tfevents.1716473537.gh008.hpc.nyu.edu.1690278.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b4b5faca6513ad6cafce84d8fc93852224e7b6051787ef5e1afb9c9ad5f1e4d
3
+ size 4483
runs/May23_10-15-06_gh008.hpc.nyu.edu/events.out.tfevents.1716473728.gh008.hpc.nyu.edu.1690907.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed29b3508fb12ecb0e7977761040af07fcccddf1e627f9a67104e267a619f8d0
3
+ size 4483
runs/May23_10-15-07_ga040.hpc.nyu.edu/events.out.tfevents.1716473745.ga040.hpc.nyu.edu.912882.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78dfb5fcaae82c6d1f94ff4d647be052012d0a2be9a798b9cba7287c5bc7b087
3
+ size 4483
runs/May23_10-19-38_gh008.hpc.nyu.edu/events.out.tfevents.1716474002.gh008.hpc.nyu.edu.1691542.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52d9ac9b5eaf6df22c7082147ff02705c4efd81fb18f4325e845d8da0f9439c2
3
+ size 4482
runs/May23_10-24-33_gh008.hpc.nyu.edu/events.out.tfevents.1716474297.gh008.hpc.nyu.edu.1692311.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d132e29280054f0ccaf4ec2aa153b6ce800bf858e540ec4aeb9bb1923149f06
3
+ size 4482
runs/May23_10-26-15_gh008.hpc.nyu.edu/events.out.tfevents.1716474398.gh008.hpc.nyu.edu.1692767.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94a9b5f024417491544e1b434f0fb71d8cdfb65bddef5901d6719d77100d06ca
3
+ size 4482
runs/May23_10-26-16_ga040.hpc.nyu.edu/events.out.tfevents.1716474410.ga040.hpc.nyu.edu.915002.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6da6256a472c9d8a5a26a3f94c6ce003d1f53fc2194dbb46c7645bde3bf0f5f8
3
+ size 4482
runs/May23_10-29-12_gh008.hpc.nyu.edu/events.out.tfevents.1716474573.gh008.hpc.nyu.edu.1693185.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66559ecf40bc257f668ba1b8a501e7b7316ec4e2ef72db12ae77b710627108a5
3
+ size 4482
runs/May23_10-29-15_ga040.hpc.nyu.edu/events.out.tfevents.1716474585.ga040.hpc.nyu.edu.915764.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec1c802cee45811a3fb0d279ba7644ac563f46440a50169666a02a969d4682bc
3
+ size 4482
runs/May23_10-30-18_gh008.hpc.nyu.edu/events.out.tfevents.1716474643.gh008.hpc.nyu.edu.1693628.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f20789935231fff7a199f0fb241357f9f49b10b6af6e8e2a1100db0ac036eb12
3
+ size 4482
runs/May23_10-32-06_ga040.hpc.nyu.edu/events.out.tfevents.1716474780.ga040.hpc.nyu.edu.916354.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94bb4e7aa5aa473bd42547152e8665d72951ac66a4bb85d18556fbce5443aca1
3
+ size 4482
runs/May23_10-34-15_gh008.hpc.nyu.edu/events.out.tfevents.1716475026.gh008.hpc.nyu.edu.1694553.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f952313b5bb2a57d8939910c231c9253b250af32eeb39f1947251ca2ce3a0aea
3
+ size 4482
runs/May23_10-42-55_gh008.hpc.nyu.edu/events.out.tfevents.1716475421.gh008.hpc.nyu.edu.1696638.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:904571427eb76c577af06f07feb1fc53880815fd226144258f9b5e0fff2f345a
3
+ size 4483
runs/May23_10-45-21_gh008.hpc.nyu.edu/events.out.tfevents.1716475555.gh008.hpc.nyu.edu.1697347.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab0a70de4e7ba548001959cc0947fc36cf53d4097fa69e7066778a9c00c3cfb6
3
+ size 4483
runs/May23_10-47-47_gh008.hpc.nyu.edu/events.out.tfevents.1716475850.gh008.hpc.nyu.edu.1698022.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a975830f34f2a0ea88331a9e194aeb432016873981d44330e0b238ec6f03b52
3
+ size 346
runs/May23_10-52-12_gh008.hpc.nyu.edu/events.out.tfevents.1716476110.gh008.hpc.nyu.edu.1699180.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d00954e1235202bd5a21ba66e9ba0ad7cbe98af1c600ca12c8f4caebe86e2d9
3
+ size 4482
runs/May23_10-57-49_gh008.hpc.nyu.edu/events.out.tfevents.1716476333.gh008.hpc.nyu.edu.1700547.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3c6d7d6ef395e9d1f04fc08691fd9e66ead6f9b446eded4dab325019620b9e1
3
+ size 4482
runs/May23_11-04-50_gh008.hpc.nyu.edu/events.out.tfevents.1716476713.gh008.hpc.nyu.edu.1702280.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdabf37b2d97462b475553bccc8b89586e2a01ca94e1844c151dad691fcc9b8f
3
+ size 4482
runs/May23_11-16-35_gh008.hpc.nyu.edu/events.out.tfevents.1716477418.gh008.hpc.nyu.edu.1706663.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da756bdf09eab54df3e1ec24d490262f2693da70a7c2a53f4de8226447b0570e
3
+ size 4482
runs/May23_11-21-39_gh008.hpc.nyu.edu/events.out.tfevents.1716477726.gh008.hpc.nyu.edu.1707933.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca5820032dbd96149a6c634b7fe9137fc8aee0da2b48be555ca0c53d2e3943a5
3
+ size 5406
runs/May23_11-51-20_gh008.hpc.nyu.edu/events.out.tfevents.1716479506.gh008.hpc.nyu.edu.1714812.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f32af5242425b7692f75b0979821e3d2cc420ef706ca55e5958b8e39d46c8149
3
+ size 4483
runs/May23_13-33-24_gh008.hpc.nyu.edu/events.out.tfevents.1716485629.gh008.hpc.nyu.edu.1738478.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199cbab01d4dcfbcd178c5d3759f9e014461caefc974616a8ffa3c35b145d381
3
+ size 4483
runs/May23_13-34-53_gh008.hpc.nyu.edu/events.out.tfevents.1716485719.gh008.hpc.nyu.edu.1738985.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c33ded9c0b0c8745593aebf4d3aa5a554919dabe3f4bd975709ae1fae537a87
3
+ size 4637
runs/May23_13-46-07_gh008.hpc.nyu.edu/events.out.tfevents.1716486477.gh008.hpc.nyu.edu.1741687.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c39382ff776f2066f03c2cc4ac45b3020566ea7e16325bcff3dfdf8e7b2500ab
3
+ size 4741
runs/May23_16-45-36_ga009.hpc.nyu.edu/events.out.tfevents.1716497438.ga009.hpc.nyu.edu.1538748.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1b9e165460b595eb373577b896c7d598550e579b2b0febadf216f860004fdba
3
+ size 5049
special_tokens_map.json CHANGED
@@ -1,6 +1,24 @@
1
  {
2
- "bos_token": "<|endoftext|>",
3
- "eos_token": "<|endoftext|>",
 
 
 
 
 
 
 
 
 
 
 
 
4
  "pad_token": "#",
5
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
6
  }
 
1
  {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
  "pad_token": "#",
17
+ "unk_token": {
18
+ "content": "<unk>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
+ size 499723
tokenizer_config.json CHANGED
@@ -1,21 +1,43 @@
1
  {
 
2
  "add_eos": true,
3
- "add_prefix_space": false,
4
  "added_tokens_decoder": {
5
- "50256": {
6
- "content": "<|endoftext|>",
7
  "lstrip": false,
8
- "normalized": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9
  "rstrip": false,
10
  "single_word": false,
11
  "special": true
12
  }
13
  },
14
- "bos_token": "<|endoftext|>",
15
- "clean_up_tokenization_spaces": true,
16
- "eos_token": "<|endoftext|>",
17
- "model_max_length": 1024,
 
 
18
  "pad_token": "#",
19
- "tokenizer_class": "GPT2Tokenizer",
20
- "unk_token": "<|endoftext|>"
 
 
 
21
  }
 
1
  {
2
+ "add_bos_token": true,
3
  "add_eos": true,
4
+ "add_eos_token": false,
5
  "added_tokens_decoder": {
6
+ "0": {
7
+ "content": "<unk>",
8
  "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false,
12
+ "special": true
13
+ },
14
+ "1": {
15
+ "content": "<s>",
16
+ "lstrip": false,
17
+ "normalized": false,
18
+ "rstrip": false,
19
+ "single_word": false,
20
+ "special": true
21
+ },
22
+ "2": {
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": false,
26
  "rstrip": false,
27
  "single_word": false,
28
  "special": true
29
  }
30
  },
31
+ "bos_token": "<s>",
32
+ "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 and system_message != false %}{% set content = '<<SYS>>\\n' + system_message + '\\n<</SYS>>\\n\\n' + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ bos_token + '[INST] ' + content.strip() + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content.strip() + ' ' + eos_token }}{% endif %}{% endfor %}",
33
+ "clean_up_tokenization_spaces": false,
34
+ "eos_token": "</s>",
35
+ "legacy": false,
36
+ "model_max_length": 1000000000000000019884624838656,
37
  "pad_token": "#",
38
+ "padding_side": "right",
39
+ "sp_model_kwargs": {},
40
+ "tokenizer_class": "LlamaTokenizer",
41
+ "unk_token": "<unk>",
42
+ "use_default_system_prompt": false
43
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb0fec6293f9c6ee8ac8975b776f54669f53c2c96d2ea4dd7cde5aeabea2e5f5
3
  size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be3a3083b66353ca8787f4c78dce7b49a9e7e2f1d29b9995063b2852c517160d
3
  size 4283