Training in progress, step 100
Browse files- adapter_config.json +33 -0
- adapter_model.safetensors +3 -0
- model.safetensors +1 -1
- runs/May23_09-17-27_gh008.hpc.nyu.edu/events.out.tfevents.1716470269.gh008.hpc.nyu.edu.1680318.0 +3 -0
- runs/May23_09-19-42_gh008.hpc.nyu.edu/events.out.tfevents.1716470404.gh008.hpc.nyu.edu.1680790.0 +3 -0
- runs/May23_09-21-20_gh008.hpc.nyu.edu/events.out.tfevents.1716470501.gh008.hpc.nyu.edu.1681292.0 +3 -0
- runs/May23_09-24-04_gh008.hpc.nyu.edu/events.out.tfevents.1716470666.gh008.hpc.nyu.edu.1681849.0 +3 -0
- runs/May23_09-42-15_gh008.hpc.nyu.edu/events.out.tfevents.1716471757.gh008.hpc.nyu.edu.1684717.0 +3 -0
- runs/May23_09-45-00_gh008.hpc.nyu.edu/events.out.tfevents.1716471922.gh008.hpc.nyu.edu.1685271.0 +3 -0
- runs/May23_09-50-20_gh008.hpc.nyu.edu/events.out.tfevents.1716472243.gh008.hpc.nyu.edu.1686093.0 +3 -0
- runs/May23_09-55-05_gh008.hpc.nyu.edu/events.out.tfevents.1716472528.gh008.hpc.nyu.edu.1687153.0 +3 -0
- runs/May23_10-00-21_gh008.hpc.nyu.edu/events.out.tfevents.1716472845.gh008.hpc.nyu.edu.1688009.0 +3 -0
- runs/May23_10-03-05_gh008.hpc.nyu.edu/events.out.tfevents.1716473005.gh008.hpc.nyu.edu.1688429.0 +3 -0
- runs/May23_10-03-08_ga040.hpc.nyu.edu/events.out.tfevents.1716473032.ga040.hpc.nyu.edu.911113.0 +3 -0
- runs/May23_10-08-13_gh008.hpc.nyu.edu/events.out.tfevents.1716473318.gh008.hpc.nyu.edu.1689599.0 +3 -0
- runs/May23_10-11-54_gh008.hpc.nyu.edu/events.out.tfevents.1716473537.gh008.hpc.nyu.edu.1690278.0 +3 -0
- runs/May23_10-15-06_gh008.hpc.nyu.edu/events.out.tfevents.1716473728.gh008.hpc.nyu.edu.1690907.0 +3 -0
- runs/May23_10-15-07_ga040.hpc.nyu.edu/events.out.tfevents.1716473745.ga040.hpc.nyu.edu.912882.0 +3 -0
- runs/May23_10-19-38_gh008.hpc.nyu.edu/events.out.tfevents.1716474002.gh008.hpc.nyu.edu.1691542.0 +3 -0
- runs/May23_10-24-33_gh008.hpc.nyu.edu/events.out.tfevents.1716474297.gh008.hpc.nyu.edu.1692311.0 +3 -0
- runs/May23_10-26-15_gh008.hpc.nyu.edu/events.out.tfevents.1716474398.gh008.hpc.nyu.edu.1692767.0 +3 -0
- runs/May23_10-26-16_ga040.hpc.nyu.edu/events.out.tfevents.1716474410.ga040.hpc.nyu.edu.915002.0 +3 -0
- runs/May23_10-29-12_gh008.hpc.nyu.edu/events.out.tfevents.1716474573.gh008.hpc.nyu.edu.1693185.0 +3 -0
- runs/May23_10-29-15_ga040.hpc.nyu.edu/events.out.tfevents.1716474585.ga040.hpc.nyu.edu.915764.0 +3 -0
- runs/May23_10-30-18_gh008.hpc.nyu.edu/events.out.tfevents.1716474643.gh008.hpc.nyu.edu.1693628.0 +3 -0
- runs/May23_10-32-06_ga040.hpc.nyu.edu/events.out.tfevents.1716474780.ga040.hpc.nyu.edu.916354.0 +3 -0
- runs/May23_10-34-15_gh008.hpc.nyu.edu/events.out.tfevents.1716475026.gh008.hpc.nyu.edu.1694553.0 +3 -0
- runs/May23_10-42-55_gh008.hpc.nyu.edu/events.out.tfevents.1716475421.gh008.hpc.nyu.edu.1696638.0 +3 -0
- runs/May23_10-45-21_gh008.hpc.nyu.edu/events.out.tfevents.1716475555.gh008.hpc.nyu.edu.1697347.0 +3 -0
- runs/May23_10-47-47_gh008.hpc.nyu.edu/events.out.tfevents.1716475850.gh008.hpc.nyu.edu.1698022.0 +3 -0
- runs/May23_10-52-12_gh008.hpc.nyu.edu/events.out.tfevents.1716476110.gh008.hpc.nyu.edu.1699180.0 +3 -0
- runs/May23_10-57-49_gh008.hpc.nyu.edu/events.out.tfevents.1716476333.gh008.hpc.nyu.edu.1700547.0 +3 -0
- runs/May23_11-04-50_gh008.hpc.nyu.edu/events.out.tfevents.1716476713.gh008.hpc.nyu.edu.1702280.0 +3 -0
- runs/May23_11-16-35_gh008.hpc.nyu.edu/events.out.tfevents.1716477418.gh008.hpc.nyu.edu.1706663.0 +3 -0
- runs/May23_11-21-39_gh008.hpc.nyu.edu/events.out.tfevents.1716477726.gh008.hpc.nyu.edu.1707933.0 +3 -0
- runs/May23_11-51-20_gh008.hpc.nyu.edu/events.out.tfevents.1716479506.gh008.hpc.nyu.edu.1714812.0 +3 -0
- runs/May23_13-33-24_gh008.hpc.nyu.edu/events.out.tfevents.1716485629.gh008.hpc.nyu.edu.1738478.0 +3 -0
- runs/May23_13-34-53_gh008.hpc.nyu.edu/events.out.tfevents.1716485719.gh008.hpc.nyu.edu.1738985.0 +3 -0
- runs/May23_13-46-07_gh008.hpc.nyu.edu/events.out.tfevents.1716486477.gh008.hpc.nyu.edu.1741687.0 +3 -0
- runs/May23_16-45-36_ga009.hpc.nyu.edu/events.out.tfevents.1716497438.ga009.hpc.nyu.edu.1538748.0 +3 -0
- special_tokens_map.json +21 -3
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +32 -10
- training_args.bin +1 -1
adapter_config.json
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"alpha_pattern": {},
|
| 3 |
+
"auto_mapping": null,
|
| 4 |
+
"base_model_name_or_path": "meta-llama/Llama-2-7b-chat-hf",
|
| 5 |
+
"bias": "none",
|
| 6 |
+
"fan_in_fan_out": false,
|
| 7 |
+
"inference_mode": true,
|
| 8 |
+
"init_lora_weights": true,
|
| 9 |
+
"layers_pattern": null,
|
| 10 |
+
"layers_to_transform": null,
|
| 11 |
+
"loftq_config": {},
|
| 12 |
+
"lora_alpha": 32,
|
| 13 |
+
"lora_dropout": 0.05,
|
| 14 |
+
"megatron_config": null,
|
| 15 |
+
"megatron_core": "megatron.core",
|
| 16 |
+
"modules_to_save": null,
|
| 17 |
+
"peft_type": "LORA",
|
| 18 |
+
"r": 16,
|
| 19 |
+
"rank_pattern": {},
|
| 20 |
+
"revision": null,
|
| 21 |
+
"target_modules": [
|
| 22 |
+
"q_proj",
|
| 23 |
+
"up_proj",
|
| 24 |
+
"k_proj",
|
| 25 |
+
"o_proj",
|
| 26 |
+
"gate_proj",
|
| 27 |
+
"down_proj",
|
| 28 |
+
"v_proj"
|
| 29 |
+
],
|
| 30 |
+
"task_type": "CAUSAL_LM",
|
| 31 |
+
"use_dora": false,
|
| 32 |
+
"use_rslora": false
|
| 33 |
+
}
|
adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31bda5918cdcd2694c0aa40bc33e4a639322ebcf39c29e9d7591662de8cf52eb
|
| 3 |
+
size 159967880
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 497774208
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:445b6306bda265a64ed6d8a9b46e6aa929d3592601705f32909f6a6e3031865d
|
| 3 |
size 497774208
|
runs/May23_09-17-27_gh008.hpc.nyu.edu/events.out.tfevents.1716470269.gh008.hpc.nyu.edu.1680318.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18ec2c2db78a13a4568d22c9ed4ea388cb4fe8bc9b51d211535f1b70ac0e82c9
|
| 3 |
+
size 4484
|
runs/May23_09-19-42_gh008.hpc.nyu.edu/events.out.tfevents.1716470404.gh008.hpc.nyu.edu.1680790.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:face84397a4b1f5e5e84939b28d2c841dda66211a5ea50892b5d0c2c79d6eb4a
|
| 3 |
+
size 4484
|
runs/May23_09-21-20_gh008.hpc.nyu.edu/events.out.tfevents.1716470501.gh008.hpc.nyu.edu.1681292.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb72c6c8867a5ff9bcc6de636721aa6d2ddf7bb8bde155315910378c13a5eec7
|
| 3 |
+
size 4484
|
runs/May23_09-24-04_gh008.hpc.nyu.edu/events.out.tfevents.1716470666.gh008.hpc.nyu.edu.1681849.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8795879268313a37e7e1f231dda96c2447c76b7382208b68e88398f804854be6
|
| 3 |
+
size 4484
|
runs/May23_09-42-15_gh008.hpc.nyu.edu/events.out.tfevents.1716471757.gh008.hpc.nyu.edu.1684717.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79b929c2b7c56e906434fed1b73dac2e30ccd2a740723acacfed02d91bddac88
|
| 3 |
+
size 4484
|
runs/May23_09-45-00_gh008.hpc.nyu.edu/events.out.tfevents.1716471922.gh008.hpc.nyu.edu.1685271.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b40bf4803f7a8e25260555a9978564ad5899232040a5f2649790754409c5202
|
| 3 |
+
size 4484
|
runs/May23_09-50-20_gh008.hpc.nyu.edu/events.out.tfevents.1716472243.gh008.hpc.nyu.edu.1686093.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3aaac4bb3dcd7a9ec067569ff4077ddfd8a6507bdcfdb19ce534403bbc87bcf3
|
| 3 |
+
size 4484
|
runs/May23_09-55-05_gh008.hpc.nyu.edu/events.out.tfevents.1716472528.gh008.hpc.nyu.edu.1687153.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff1e1b55addf81394800071a1a45be8cd06a50757f9b2b434de78f2532874cd0
|
| 3 |
+
size 4484
|
runs/May23_10-00-21_gh008.hpc.nyu.edu/events.out.tfevents.1716472845.gh008.hpc.nyu.edu.1688009.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86365f0c3a9d46983d1c60c451466af73eb0f76e274afbaa022656a37346a3bd
|
| 3 |
+
size 4483
|
runs/May23_10-03-05_gh008.hpc.nyu.edu/events.out.tfevents.1716473005.gh008.hpc.nyu.edu.1688429.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c9a5ae38baa4ea56688ba1c86ad7f598feb2a033dab914dabf850cf9bc5105c
|
| 3 |
+
size 4483
|
runs/May23_10-03-08_ga040.hpc.nyu.edu/events.out.tfevents.1716473032.ga040.hpc.nyu.edu.911113.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc3423224948a50579c9c7864f6d97e9c229494106a3eee06841dea146c21b46
|
| 3 |
+
size 4483
|
runs/May23_10-08-13_gh008.hpc.nyu.edu/events.out.tfevents.1716473318.gh008.hpc.nyu.edu.1689599.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88882e622ab6bc1ad92f66b7a3a93b7df678fb4bf5164d37d0b9c5f88c32b9db
|
| 3 |
+
size 4483
|
runs/May23_10-11-54_gh008.hpc.nyu.edu/events.out.tfevents.1716473537.gh008.hpc.nyu.edu.1690278.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b4b5faca6513ad6cafce84d8fc93852224e7b6051787ef5e1afb9c9ad5f1e4d
|
| 3 |
+
size 4483
|
runs/May23_10-15-06_gh008.hpc.nyu.edu/events.out.tfevents.1716473728.gh008.hpc.nyu.edu.1690907.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed29b3508fb12ecb0e7977761040af07fcccddf1e627f9a67104e267a619f8d0
|
| 3 |
+
size 4483
|
runs/May23_10-15-07_ga040.hpc.nyu.edu/events.out.tfevents.1716473745.ga040.hpc.nyu.edu.912882.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78dfb5fcaae82c6d1f94ff4d647be052012d0a2be9a798b9cba7287c5bc7b087
|
| 3 |
+
size 4483
|
runs/May23_10-19-38_gh008.hpc.nyu.edu/events.out.tfevents.1716474002.gh008.hpc.nyu.edu.1691542.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52d9ac9b5eaf6df22c7082147ff02705c4efd81fb18f4325e845d8da0f9439c2
|
| 3 |
+
size 4482
|
runs/May23_10-24-33_gh008.hpc.nyu.edu/events.out.tfevents.1716474297.gh008.hpc.nyu.edu.1692311.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d132e29280054f0ccaf4ec2aa153b6ce800bf858e540ec4aeb9bb1923149f06
|
| 3 |
+
size 4482
|
runs/May23_10-26-15_gh008.hpc.nyu.edu/events.out.tfevents.1716474398.gh008.hpc.nyu.edu.1692767.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:94a9b5f024417491544e1b434f0fb71d8cdfb65bddef5901d6719d77100d06ca
|
| 3 |
+
size 4482
|
runs/May23_10-26-16_ga040.hpc.nyu.edu/events.out.tfevents.1716474410.ga040.hpc.nyu.edu.915002.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6da6256a472c9d8a5a26a3f94c6ce003d1f53fc2194dbb46c7645bde3bf0f5f8
|
| 3 |
+
size 4482
|
runs/May23_10-29-12_gh008.hpc.nyu.edu/events.out.tfevents.1716474573.gh008.hpc.nyu.edu.1693185.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66559ecf40bc257f668ba1b8a501e7b7316ec4e2ef72db12ae77b710627108a5
|
| 3 |
+
size 4482
|
runs/May23_10-29-15_ga040.hpc.nyu.edu/events.out.tfevents.1716474585.ga040.hpc.nyu.edu.915764.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec1c802cee45811a3fb0d279ba7644ac563f46440a50169666a02a969d4682bc
|
| 3 |
+
size 4482
|
runs/May23_10-30-18_gh008.hpc.nyu.edu/events.out.tfevents.1716474643.gh008.hpc.nyu.edu.1693628.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f20789935231fff7a199f0fb241357f9f49b10b6af6e8e2a1100db0ac036eb12
|
| 3 |
+
size 4482
|
runs/May23_10-32-06_ga040.hpc.nyu.edu/events.out.tfevents.1716474780.ga040.hpc.nyu.edu.916354.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:94bb4e7aa5aa473bd42547152e8665d72951ac66a4bb85d18556fbce5443aca1
|
| 3 |
+
size 4482
|
runs/May23_10-34-15_gh008.hpc.nyu.edu/events.out.tfevents.1716475026.gh008.hpc.nyu.edu.1694553.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f952313b5bb2a57d8939910c231c9253b250af32eeb39f1947251ca2ce3a0aea
|
| 3 |
+
size 4482
|
runs/May23_10-42-55_gh008.hpc.nyu.edu/events.out.tfevents.1716475421.gh008.hpc.nyu.edu.1696638.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:904571427eb76c577af06f07feb1fc53880815fd226144258f9b5e0fff2f345a
|
| 3 |
+
size 4483
|
runs/May23_10-45-21_gh008.hpc.nyu.edu/events.out.tfevents.1716475555.gh008.hpc.nyu.edu.1697347.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab0a70de4e7ba548001959cc0947fc36cf53d4097fa69e7066778a9c00c3cfb6
|
| 3 |
+
size 4483
|
runs/May23_10-47-47_gh008.hpc.nyu.edu/events.out.tfevents.1716475850.gh008.hpc.nyu.edu.1698022.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a975830f34f2a0ea88331a9e194aeb432016873981d44330e0b238ec6f03b52
|
| 3 |
+
size 346
|
runs/May23_10-52-12_gh008.hpc.nyu.edu/events.out.tfevents.1716476110.gh008.hpc.nyu.edu.1699180.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d00954e1235202bd5a21ba66e9ba0ad7cbe98af1c600ca12c8f4caebe86e2d9
|
| 3 |
+
size 4482
|
runs/May23_10-57-49_gh008.hpc.nyu.edu/events.out.tfevents.1716476333.gh008.hpc.nyu.edu.1700547.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3c6d7d6ef395e9d1f04fc08691fd9e66ead6f9b446eded4dab325019620b9e1
|
| 3 |
+
size 4482
|
runs/May23_11-04-50_gh008.hpc.nyu.edu/events.out.tfevents.1716476713.gh008.hpc.nyu.edu.1702280.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fdabf37b2d97462b475553bccc8b89586e2a01ca94e1844c151dad691fcc9b8f
|
| 3 |
+
size 4482
|
runs/May23_11-16-35_gh008.hpc.nyu.edu/events.out.tfevents.1716477418.gh008.hpc.nyu.edu.1706663.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da756bdf09eab54df3e1ec24d490262f2693da70a7c2a53f4de8226447b0570e
|
| 3 |
+
size 4482
|
runs/May23_11-21-39_gh008.hpc.nyu.edu/events.out.tfevents.1716477726.gh008.hpc.nyu.edu.1707933.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca5820032dbd96149a6c634b7fe9137fc8aee0da2b48be555ca0c53d2e3943a5
|
| 3 |
+
size 5406
|
runs/May23_11-51-20_gh008.hpc.nyu.edu/events.out.tfevents.1716479506.gh008.hpc.nyu.edu.1714812.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f32af5242425b7692f75b0979821e3d2cc420ef706ca55e5958b8e39d46c8149
|
| 3 |
+
size 4483
|
runs/May23_13-33-24_gh008.hpc.nyu.edu/events.out.tfevents.1716485629.gh008.hpc.nyu.edu.1738478.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:199cbab01d4dcfbcd178c5d3759f9e014461caefc974616a8ffa3c35b145d381
|
| 3 |
+
size 4483
|
runs/May23_13-34-53_gh008.hpc.nyu.edu/events.out.tfevents.1716485719.gh008.hpc.nyu.edu.1738985.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c33ded9c0b0c8745593aebf4d3aa5a554919dabe3f4bd975709ae1fae537a87
|
| 3 |
+
size 4637
|
runs/May23_13-46-07_gh008.hpc.nyu.edu/events.out.tfevents.1716486477.gh008.hpc.nyu.edu.1741687.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c39382ff776f2066f03c2cc4ac45b3020566ea7e16325bcff3dfdf8e7b2500ab
|
| 3 |
+
size 4741
|
runs/May23_16-45-36_ga009.hpc.nyu.edu/events.out.tfevents.1716497438.ga009.hpc.nyu.edu.1538748.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1b9e165460b595eb373577b896c7d598550e579b2b0febadf216f860004fdba
|
| 3 |
+
size 5049
|
special_tokens_map.json
CHANGED
|
@@ -1,6 +1,24 @@
|
|
| 1 |
{
|
| 2 |
-
"bos_token":
|
| 3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4 |
"pad_token": "#",
|
| 5 |
-
"unk_token":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"eos_token": {
|
| 10 |
+
"content": "</s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
"pad_token": "#",
|
| 17 |
+
"unk_token": {
|
| 18 |
+
"content": "<unk>",
|
| 19 |
+
"lstrip": false,
|
| 20 |
+
"normalized": false,
|
| 21 |
+
"rstrip": false,
|
| 22 |
+
"single_word": false
|
| 23 |
+
}
|
| 24 |
}
|
tokenizer.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer.model
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
|
| 3 |
+
size 499723
|
tokenizer_config.json
CHANGED
|
@@ -1,21 +1,43 @@
|
|
| 1 |
{
|
|
|
|
| 2 |
"add_eos": true,
|
| 3 |
-
"
|
| 4 |
"added_tokens_decoder": {
|
| 5 |
-
"
|
| 6 |
-
"content": "
|
| 7 |
"lstrip": false,
|
| 8 |
-
"normalized":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
"rstrip": false,
|
| 10 |
"single_word": false,
|
| 11 |
"special": true
|
| 12 |
}
|
| 13 |
},
|
| 14 |
-
"bos_token": "
|
| 15 |
-
"
|
| 16 |
-
"
|
| 17 |
-
"
|
|
|
|
|
|
|
| 18 |
"pad_token": "#",
|
| 19 |
-
"
|
| 20 |
-
"
|
|
|
|
|
|
|
|
|
|
| 21 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"add_bos_token": true,
|
| 3 |
"add_eos": true,
|
| 4 |
+
"add_eos_token": false,
|
| 5 |
"added_tokens_decoder": {
|
| 6 |
+
"0": {
|
| 7 |
+
"content": "<unk>",
|
| 8 |
"lstrip": false,
|
| 9 |
+
"normalized": false,
|
| 10 |
+
"rstrip": false,
|
| 11 |
+
"single_word": false,
|
| 12 |
+
"special": true
|
| 13 |
+
},
|
| 14 |
+
"1": {
|
| 15 |
+
"content": "<s>",
|
| 16 |
+
"lstrip": false,
|
| 17 |
+
"normalized": false,
|
| 18 |
+
"rstrip": false,
|
| 19 |
+
"single_word": false,
|
| 20 |
+
"special": true
|
| 21 |
+
},
|
| 22 |
+
"2": {
|
| 23 |
+
"content": "</s>",
|
| 24 |
+
"lstrip": false,
|
| 25 |
+
"normalized": false,
|
| 26 |
"rstrip": false,
|
| 27 |
"single_word": false,
|
| 28 |
"special": true
|
| 29 |
}
|
| 30 |
},
|
| 31 |
+
"bos_token": "<s>",
|
| 32 |
+
"chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 and system_message != false %}{% set content = '<<SYS>>\\n' + system_message + '\\n<</SYS>>\\n\\n' + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ bos_token + '[INST] ' + content.strip() + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content.strip() + ' ' + eos_token }}{% endif %}{% endfor %}",
|
| 33 |
+
"clean_up_tokenization_spaces": false,
|
| 34 |
+
"eos_token": "</s>",
|
| 35 |
+
"legacy": false,
|
| 36 |
+
"model_max_length": 1000000000000000019884624838656,
|
| 37 |
"pad_token": "#",
|
| 38 |
+
"padding_side": "right",
|
| 39 |
+
"sp_model_kwargs": {},
|
| 40 |
+
"tokenizer_class": "LlamaTokenizer",
|
| 41 |
+
"unk_token": "<unk>",
|
| 42 |
+
"use_default_system_prompt": false
|
| 43 |
}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4283
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be3a3083b66353ca8787f4c78dce7b49a9e7e2f1d29b9995063b2852c517160d
|
| 3 |
size 4283
|