Training in progress, step 10

Files changed (5) hide show

README.md CHANGED Viewed

@@ -4,8 +4,8 @@ library_name: transformers
 model_name: Qwen2.5-VL-3B-Instruct-trl-mpo-rlaif-v
 tags:
 - generated_from_trainer
-- trl
 - dpo
 licence: license
 ---

 model_name: Qwen2.5-VL-3B-Instruct-trl-mpo-rlaif-v
 tags:
 - generated_from_trainer
 - dpo
+- trl
 licence: license
 ---

adapter_config.json CHANGED Viewed

@@ -30,11 +30,11 @@
   "target_modules": [
     "k_proj",
     "q_proj",
     "gate_proj",
-    "v_proj",
     "up_proj",
-    "o_proj",
-    "down_proj"
   ],
   "task_type": null,
   "trainable_token_indices": null,

   "target_modules": [
     "k_proj",
     "q_proj",
+    "o_proj",
     "gate_proj",
     "up_proj",
+    "down_proj",
+    "v_proj"
   ],
   "task_type": null,
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a358fda16769da7583c241ffafbe176ace7b9b6cb405b1b41abb2541db609cf2
 size 79626296

 version https://git-lfs.github.com/spec/v1
+oid sha256:79cfcfc73bea9cced970eedbe70653a455398102956e76d775c026ae12170b94
 size 79626296

runs/Jul22_10-43-50_f851870d1cd3/events.out.tfevents.1753181341.f851870d1cd3.10684.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:f58493690b89d332d23e103f95eaddbf8c9b86ca8f98d764928d8641fb3f7c43
+size 10838

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0502123a77058b3edbf521c5a0e961dc6b1ad43bc7d54c9b018370ee752085ce
 size 6392

 version https://git-lfs.github.com/spec/v1
+oid sha256:944d27848448eac100fcbcc65d9dcd8a4ef82a3965ed43aae9c58fa04e0e89e5
 size 6392