SeanLee97 committed
Commit 81db7c5
1 Parent(s): a44c6fa

Training in progress, step 500

adapter_config.json CHANGED
@@ -9,26 +9,23 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 32,
+  "lora_alpha": 16,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
-  "modules_to_save": [
-    "model.leaky_norm.weight",
-    "model.leaky_norm.bias"
-  ],
+  "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 32,
+  "r": 64,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "k_proj",
     "o_proj",
-    "q_proj",
-    "up_proj",
-    "v_proj",
     "down_proj",
-    "k_proj",
-    "gate_proj"
+    "v_proj",
+    "gate_proj",
+    "q_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e435f0aa476689f73a4533c0ed439a269faf4383a979cfce4c6c3bcbf39e055d
-size 319876032
+oid sha256:aee0d090b0541bb5167188b9198a2ab5f7292290651b09ba6ea477a2d4c1d6a5
+size 639691872
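The adapter roughly doubles in size (319,876,032 → 639,691,872 bytes), consistent with LoRA parameter count scaling linearly in the rank as r goes from 32 to 64. A small sketch for checking a pulled LFS blob against the pointer above (the local path assumes the repo has been cloned and `git lfs pull` run):

import hashlib
import os

path = "adapter_model.safetensors"  # local path after `git lfs pull`

# Stream the file through sha256 and compare with the LFS pointer.
digest = hashlib.sha256()
with open(path, "rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):
        digest.update(chunk)

assert os.path.getsize(path) == 639691872
assert digest.hexdigest() == "aee0d090b0541bb5167188b9198a2ab5f7292290651b09ba6ea477a2d4c1d6a5"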
angle.config CHANGED
@@ -5,10 +5,19 @@
   "pooling_strategy": "cls",
   "lora_config_kwargs": {
     "task_type": "CAUSAL_LM",
-    "r": 32,
-    "lora_alpha": 32,
+    "r": 64,
+    "lora_alpha": 16,
     "lora_dropout": 0.1,
-    "bias": "none"
+    "bias": "none",
+    "target_modules": [
+      "v_proj",
+      "gate_proj",
+      "k_proj",
+      "down_proj",
+      "q_proj",
+      "up_proj",
+      "o_proj"
+    ]
   },
   "apply_lora": 1
 }
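angle.config now records the same r, lora_alpha, and target_modules as adapter_config.json, so the AnglE-side LoRA settings and the saved PEFT adapter agree. A hedged sketch of loading the trained adapter with peft; both identifiers below are placeholders, since this commit names neither the base checkpoint nor the adapter repo id:

from transformers import AutoModelForCausalLM
from peft import PeftModel

# Placeholders: the base checkpoint and adapter repo id are not
# part of this diff.
base = AutoModelForCausalLM.from_pretrained("<base-model-id>")
model = PeftModel.from_pretrained(base, "<this-adapter-repo>")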
runs/Mar20_06-17-12_instance-20240226-074643/events.out.tfevents.1710915444.instance-20240226-074643.1721310.0 CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c90b97ddcede90885b0cc6bc66fb578c855a60808b3a7b4cc8a07df808d628f6
-size 14486
+oid sha256:09aea37f7e2efe0e4e90d82ccafddd3f98f1bef1f72ae98bd53c3e6329f9d4a5
+size 14840
runs/Mar20_13-21-43_instance-20240226-074643/events.out.tfevents.1710940908.instance-20240226-074643.1922101.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:092413b45d9f29c97a7d165bf3a6ec151e9f7430bac4f0043e8389335c9626eb
+size 6257
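The commit updates the earlier TensorBoard run and adds a new one for the Mar20_13-21-43 session. A sketch for reading the logged scalars once the LFS files are pulled, using TensorBoard's EventAccumulator (the "train/loss" tag is an assumption; actual tags depend on what the Trainer logged):

from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

ea = EventAccumulator("runs/Mar20_13-21-43_instance-20240226-074643")
ea.Reload()
print(ea.Tags()["scalars"])             # list the tags actually logged
for event in ea.Scalars("train/loss"):  # assumed tag name
    print(event.step, event.value)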
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a17c613d3e0e22264379b569a7ef021e7162704a72661d8fc663d1e63e01d8e
+oid sha256:0462a9ded0b9349dfe5bea51e9ef06739149993b3576240578be5b4934a7ceae
 size 5048
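training_args.bin is a pickled transformers.TrainingArguments object; only its hash changes here, while the size stays at 5048 bytes. A sketch for inspecting it (weights_only=False is needed on recent torch versions because this is an arbitrary pickled object, so only load files you trust):

import torch

# Not a tensor checkpoint: TrainingArguments is a pickled object,
# hence weights_only=False.
args = torch.load("training_args.bin", weights_only=False)
print(args.learning_rate, args.num_train_epochs)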