Training in progress, epoch 1
Browse files
eval/Information-Retrieval_evaluation_results.csv
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
epoch,steps,cosine-Accuracy@1,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@1,cosine-MRR@5,cosine-MRR@10,cosine-NDCG@1,cosine-NDCG@5,cosine-NDCG@10,cosine-MAP@100
|
| 2 |
0,0,0.98,1.0,1.0,0.98,0.98,0.3333333333333334,1.0,0.19999999999999996,1.0,0.09999999999999998,1.0,0.98,0.99,0.99,0.98,0.9926185950714291,0.9926185950714291,0.99
|
| 3 |
-
1.0,25,0.96,1.0,1.0,0.96,0.96,0.
|
|
|
|
| 1 |
epoch,steps,cosine-Accuracy@1,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@1,cosine-MRR@5,cosine-MRR@10,cosine-NDCG@1,cosine-NDCG@5,cosine-NDCG@10,cosine-MAP@100
|
| 2 |
0,0,0.98,1.0,1.0,0.98,0.98,0.3333333333333334,1.0,0.19999999999999996,1.0,0.09999999999999998,1.0,0.98,0.99,0.99,0.98,0.9926185950714291,0.9926185950714291,0.99
|
| 3 |
+
1.0,25,0.96,1.0,1.0,0.96,0.96,0.3333333333333334,1.0,0.19999999999999996,1.0,0.09999999999999998,1.0,0.96,0.9783333333333333,0.9783333333333333,0.96,0.9839278926071438,0.9839278926071438,0.9783333333333333
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1191586416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b59c305413a49854b41dceafe313ef4f47ad94567e58a99da0412915528ce695
|
| 3 |
size 1191586416
|
runs/Sep30_16-50-24_95c4d53e8554/events.out.tfevents.1759251025.95c4d53e8554.12407.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:530addc6d0ffa46e22a37c3fc57f86e4f31b19e6037fd3d4f49f91df98fd7d81
|
| 3 |
+
size 7448
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6225
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc77ed28663e3e0d4245d176d0327935fec8fb2ff97bfc66001a8f4bdf38be83
|
| 3 |
size 6225
|
training_config.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"model_variant": "0.6B",
|
| 3 |
"train_file": "data/train_queries.csv",
|
| 4 |
"output_dir": "models/qwen-finetuned",
|
| 5 |
-
"run_name": "20250930-
|
| 6 |
"epochs": 1,
|
| 7 |
"batch_size": 4,
|
| 8 |
"learning_rate": 5e-05,
|
|
@@ -19,6 +19,6 @@
|
|
| 19 |
"save_total_limit": null,
|
| 20 |
"logging_steps": null,
|
| 21 |
"gradient_accumulation_steps": 4,
|
| 22 |
-
"gradient_checkpointing":
|
| 23 |
"optim": "adamw_torch"
|
| 24 |
}
|
|
|
|
| 2 |
"model_variant": "0.6B",
|
| 3 |
"train_file": "data/train_queries.csv",
|
| 4 |
"output_dir": "models/qwen-finetuned",
|
| 5 |
+
"run_name": "20250930-165021",
|
| 6 |
"epochs": 1,
|
| 7 |
"batch_size": 4,
|
| 8 |
"learning_rate": 5e-05,
|
|
|
|
| 19 |
"save_total_limit": null,
|
| 20 |
"logging_steps": null,
|
| 21 |
"gradient_accumulation_steps": 4,
|
| 22 |
+
"gradient_checkpointing": true,
|
| 23 |
"optim": "adamw_torch"
|
| 24 |
}
|