Training in progress, step 2600
Files changed:
- adapter_config.json +6 -6
- adapter_model.safetensors +1 -1
- angle.config +4 -4
- runs/Mar23_02-16-23_instance-20240226-074643/events.out.tfevents.1711160195.instance-20240226-074643.3613579.0 +2 -2
- runs/Mar24_10-47-38_instance-20240226-074643/events.out.tfevents.1711277263.instance-20240226-074643.300367.0 +3 -0
- training_args.bin +1 -1
adapter_config.json
CHANGED
@@ -9,7 +9,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha":
+  "lora_alpha": 16,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -19,13 +19,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "o_proj",
-    "down_proj",
-    "up_proj",
-    "gate_proj",
     "v_proj",
+    "gate_proj",
+    "up_proj",
+    "o_proj",
     "q_proj",
-    "k_proj"
+    "k_proj",
+    "down_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false
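The "target_modules" set is unchanged by this commit (the list is only reordered in serialization); the effective edit is setting "lora_alpha" to 16. As a minimal sketch of the resulting adapter configuration (assuming the peft library; r=64 is taken from angle.config below, since adapter_config.json's own "r" field falls outside the hunk shown):

from peft import LoraConfig, TaskType

# Mirrors the "+" side of this diff; r=64 comes from angle.config.
lora_config = LoraConfig(
    task_type=TaskType.CAUSAL_LM,
    r=64,
    lora_alpha=16,
    lora_dropout=0.1,
    bias="none",
    target_modules=[
        "v_proj", "gate_proj", "up_proj", "o_proj",
        "q_proj", "k_proj", "down_proj",
    ],
)

With "use_rslora" left at false, the adapter update is scaled by lora_alpha / r = 16 / 64 = 0.25.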
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:da094212136e495b867fa5a2f74bf5324b02731577b79c6fe2bd4482708410e3
 size 639691872
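adapter_model.safetensors is tracked with Git LFS, so the repository stores only this three-line pointer (spec version, sha256 oid, byte size) rather than the ~640 MB weights. A minimal sketch for verifying a downloaded copy against the pointer's oid (the local path is an assumption):

import hashlib

def lfs_sha256(path: str, chunk_size: int = 1 << 20) -> str:
    # Compute the sha256 digest Git LFS records as the pointer's oid.
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            h.update(chunk)
    return h.hexdigest()

# Should print the oid from the pointer above if the download is intact:
# da094212136e495b867fa5a2f74bf5324b02731577b79c6fe2bd4482708410e3
print(lfs_sha256("adapter_model.safetensors"))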
angle.config
CHANGED
@@ -6,16 +6,16 @@
   "lora_config_kwargs": {
     "task_type": "CAUSAL_LM",
     "r": 64,
-    "lora_alpha":
+    "lora_alpha": 16,
     "lora_dropout": 0.1,
     "bias": "none",
     "target_modules": [
-      "q_proj",
       "v_proj",
-      "
+      "gate_proj",
       "up_proj",
+      "o_proj",
+      "q_proj",
       "k_proj",
-      "gate_proj",
       "down_proj"
     ]
   },
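angle.config groups the same LoRA hyperparameters under "lora_config_kwargs". How the AnglE training code consumes this file is not visible in this commit; a hedged sketch, assuming the file is plain JSON and the kwargs map one-to-one onto peft.LoraConfig:

import json
from peft import LoraConfig

with open("angle.config") as f:
    cfg = json.load(f)

# Assumption: the kwargs unpack directly into peft's LoraConfig;
# "task_type" is accepted as the string "CAUSAL_LM".
lora_config = LoraConfig(**cfg["lora_config_kwargs"])
print(lora_config.r, lora_config.lora_alpha, lora_config.target_modules)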
runs/Mar23_02-16-23_instance-20240226-074643/events.out.tfevents.1711160195.instance-20240226-074643.3613579.0
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
-size
+oid sha256:30ff47b9b05e08bc2234b76492784b8bc20c0745b898247fb9272ef96aa21f6f
+size 12941
runs/Mar24_10-47-38_instance-20240226-074643/events.out.tfevents.1711277263.instance-20240226-074643.300367.0
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d08acc73908603fe8cea89cf63c0945e253e754eced99ab1d365953c757e78ad
+size 10688
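Both events.out.tfevents.* files are TensorBoard logs written during training (the Mar24 run is newly added in this step-2600 push). As LFS pointers they hold only hashes, but a fetched copy can be read back with TensorBoard's event reader. A sketch, assuming the run-directory layout above and the trainer's usual "train/loss" scalar tag:

from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

acc = EventAccumulator("runs/Mar24_10-47-38_instance-20240226-074643")
acc.Reload()  # parses the events.out.tfevents.* file(s) in the directory

print(acc.Tags()["scalars"])          # available scalar tags
for ev in acc.Scalars("train/loss"):  # assumed tag; adjust to what Tags() lists
    print(ev.step, ev.value)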
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:0d25ac5d64e6b4d88ac8b861ed2a41d07744dcd0874dd58e5ddbad7c2e928dfb
 size 5048
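training_args.bin is the pickled transformers.TrainingArguments object the Trainer saves alongside checkpoints; its size (5048 bytes) is unchanged between pushes, only the contents and hence the hash differ. A sketch for inspecting it, assuming a transformers version compatible with the one that wrote it:

import torch

# The file is a pickled TrainingArguments object, not a tensor file,
# so newer torch versions need weights_only=False to unpickle it.
args = torch.load("training_args.bin", weights_only=False)
print(args.max_steps, args.learning_rate, args.per_device_train_batch_size)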