Training in progress, epoch 1

Files changed (5) hide show

eval/Information-Retrieval_evaluation_results.csv CHANGED Viewed

@@ -1,3 +1,3 @@
 epoch,steps,cosine-Accuracy@1,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@1,cosine-MRR@5,cosine-MRR@10,cosine-NDCG@1,cosine-NDCG@5,cosine-NDCG@10,cosine-MAP@100
 0,0,0.98,1.0,1.0,0.98,0.98,0.3333333333333334,1.0,0.19999999999999996,1.0,0.09999999999999998,1.0,0.98,0.99,0.99,0.98,0.9926185950714291,0.9926185950714291,0.99
-1.0,25,0.96,1.0,1.0,0.96,0.96,0.33000000000000007,0.99,0.19999999999999996,1.0,0.09999999999999998,1.0,0.96,0.9775,0.9775,0.96,0.9832346581878777,0.9832346581878777,0.9775

 epoch,steps,cosine-Accuracy@1,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@1,cosine-MRR@5,cosine-MRR@10,cosine-NDCG@1,cosine-NDCG@5,cosine-NDCG@10,cosine-MAP@100
 0,0,0.98,1.0,1.0,0.98,0.98,0.3333333333333334,1.0,0.19999999999999996,1.0,0.09999999999999998,1.0,0.98,0.99,0.99,0.98,0.9926185950714291,0.9926185950714291,0.99
+1.0,25,0.96,1.0,1.0,0.96,0.96,0.3333333333333334,1.0,0.19999999999999996,1.0,0.09999999999999998,1.0,0.96,0.9783333333333333,0.9783333333333333,0.96,0.9839278926071438,0.9839278926071438,0.9783333333333333

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:684b8120f0e57c454b9b622fea8c21754012d1c7f37308d33ac36b92f663dfee
 size 1191586416

 version https://git-lfs.github.com/spec/v1
+oid sha256:b59c305413a49854b41dceafe313ef4f47ad94567e58a99da0412915528ce695
 size 1191586416

runs/Sep30_16-50-24_95c4d53e8554/events.out.tfevents.1759251025.95c4d53e8554.12407.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:530addc6d0ffa46e22a37c3fc57f86e4f31b19e6037fd3d4f49f91df98fd7d81
+size 7448

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af27db47276bcadd7c9fc56be13116529021dd1f8b4cd9ab529cbc107ded3fdb
 size 6225

 version https://git-lfs.github.com/spec/v1
+oid sha256:cc77ed28663e3e0d4245d176d0327935fec8fb2ff97bfc66001a8f4bdf38be83
 size 6225

training_config.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "model_variant": "0.6B",
   "train_file": "data/train_queries.csv",
   "output_dir": "models/qwen-finetuned",
-  "run_name": "20250930-164726",
   "epochs": 1,
   "batch_size": 4,
   "learning_rate": 5e-05,
@@ -19,6 +19,6 @@
   "save_total_limit": null,
   "logging_steps": null,
   "gradient_accumulation_steps": 4,
-  "gradient_checkpointing": false,
   "optim": "adamw_torch"
 }

   "model_variant": "0.6B",
   "train_file": "data/train_queries.csv",
   "output_dir": "models/qwen-finetuned",
+  "run_name": "20250930-165021",
   "epochs": 1,
   "batch_size": 4,
   "learning_rate": 5e-05,
   "save_total_limit": null,
   "logging_steps": null,
   "gradient_accumulation_steps": 4,
+  "gradient_checkpointing": true,
   "optim": "adamw_torch"
 }