totenwqh1101 committed on
Commit
77ba916
·
verified ·
1 Parent(s): 8c7ae28

Training in progress, epoch 0

Browse files
adapter_config.json CHANGED
@@ -27,11 +27,11 @@
27
  "rank_pattern": {},
28
  "revision": null,
29
  "target_modules": [
 
30
  "v_proj",
31
- "q_proj",
32
  "dense",
33
- "o_proj",
34
- "k_proj"
35
  ],
36
  "task_type": "CAUSAL_LM",
37
  "trainable_token_indices": null,
 
27
  "rank_pattern": {},
28
  "revision": null,
29
  "target_modules": [
30
+ "o_proj",
31
  "v_proj",
 
32
  "dense",
33
+ "k_proj",
34
+ "q_proj"
35
  ],
36
  "task_type": "CAUSAL_LM",
37
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0b21fdcdc9a65cf5f8d06ca171d6ec8e09e189ea26caf4edd762a75a3352e7f
3
  size 2732672640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b27cb8a4a92ba14d321837469faebebb769adb447a1e27584cc76e9086329795
3
  size 2732672640
runs/Jun04_06-21-54_raycluster-training-coreweave-gpu-group-worker-88787/events.out.tfevents.1749018154.raycluster-training-coreweave-gpu-group-worker-88787 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f074c68d798757aa3eaabbef68107b317fbca1ee525735cd4c273cec855cae8b
3
+ size 7028
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5541bcb592c19bf3a50648bfd7147f8e5f289ed96d239633694053ef71414502
3
- size 5816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7717fc4105221c10be7b9a08616747adabc4072c548785dd8f4dc567afb007f
3
+ size 6225