Training in progress, epoch 1

Files changed (6) hide show

README.md CHANGED Viewed

@@ -34,10 +34,10 @@ This model was trained with SFT.
 ### Framework versions
-- TRL: 0.16.1
-- Transformers: 4.50.3
-- Pytorch: 2.2.2
-- Datasets: 3.5.0
 - Tokenizers: 0.21.1
 ## Citations

 ### Framework versions
+- TRL: 0.15.2
+- Transformers: 4.51.0
+- Pytorch: 2.6.0
+- Datasets: 3.3.2
 - Tokenizers: 0.21.1
 ## Citations

adapter_config.json CHANGED Viewed

@@ -3,7 +3,6 @@
   "auto_mapping": null,
   "base_model_name_or_path": "google/gemma-3-4b-pt",
   "bias": "none",
-  "corda_config": null,
   "eva_config": null,
   "exclude_modules": null,
   "fan_in_fan_out": false,
@@ -27,19 +26,19 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "k_proj",
-    "o_proj",
-    "up_proj",
     "down_proj",
-    "fc2",
-    "q_proj",
     "v_proj",
     "out_proj",
-    "fc1",
-    "gate_proj"
   ],
   "task_type": "CAUSAL_LM",
-  "trainable_token_indices": null,
   "use_dora": false,
   "use_rslora": false
 }

   "auto_mapping": null,
   "base_model_name_or_path": "google/gemma-3-4b-pt",
   "bias": "none",
   "eva_config": null,
   "exclude_modules": null,
   "fan_in_fan_out": false,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "down_proj",
+    "fc1",
+    "gate_proj",
+    "lm_head",
     "v_proj",
+    "q_proj",
+    "o_proj",
     "out_proj",
+    "up_proj",
+    "k_proj",
+    "fc2"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,
   "use_rslora": false
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a5946d970833815c70f617b28f76fd602c786c1e1e87398b229f355de32f86f6
 size 2839124552

 version https://git-lfs.github.com/spec/v1
+oid sha256:10a0983125ec85332be9a20afe7bea354a20e1c91fe76a8b79fc75e4717deeb9
 size 2839124552

runs/Apr08_08-52-32_krishnan-srinivas-nc40/events.out.tfevents.1744108008.krishnan-srinivas-nc40.4023.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f6d884688e6a5d25e173c90476bf1e2701e22ede66b814f1265385636788e84
+size 6786

runs/Apr08_10-27-18_krishnan-srinivas-nc40/events.out.tfevents.1744108046.krishnan-srinivas-nc40.4023.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:09c8d384cfeb08c1ff7516945ac631bdf96ac9ed7add6a0ee0ac14c48da05dd0
+size 7197

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:60349569af3e6bc0178144eab375e77102a48ac0f96cccdd0935772c31c6e0b2
-size 5752

 version https://git-lfs.github.com/spec/v1
+oid sha256:ebd1f8bb9b9e95ed8e54d12109eb1983e52ba023c81787751513b2ae39d2cdc6
+size 5624