ramdhanfirdaus commited on
Commit
3fe056f
1 Parent(s): d15e673

Training in progress, step 1900, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -201,19 +201,7 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
201
  ## Training procedure
202
 
203
 
204
- The following `bitsandbytes` quantization config was used during training:
205
- - quant_method: bitsandbytes
206
- - load_in_8bit: False
207
- - load_in_4bit: True
208
- - llm_int8_threshold: 6.0
209
- - llm_int8_skip_modules: None
210
- - llm_int8_enable_fp32_cpu_offload: False
211
- - llm_int8_has_fp16_weight: False
212
- - bnb_4bit_quant_type: nf4
213
- - bnb_4bit_use_double_quant: True
214
- - bnb_4bit_compute_dtype: float16
215
-
216
  ### Framework versions
217
 
218
 
219
- - PEFT 0.6.0.dev0
 
201
  ## Training procedure
202
 
203
 
 
 
 
 
 
 
 
 
 
 
 
 
204
  ### Framework versions
205
 
206
 
207
+ - PEFT 0.6.0
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4d45db665dd61cf0b6b6c28a27c5cceb5550819457f7c9a4ac5d7e2bd6a4ab6
3
  size 50349441
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdfe09cab2aff62aca857964575ca03366c4ebc12dbf03ef7ddb00734bf8bf8e
3
  size 50349441
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfd1ba7d57b14e8adbac3874aa7b89e93f5ee2d0bcd59860947ea69f3e387a23
3
- size 100693001
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daa64d5ba82fa546d882dc9dce9b736527998c5935371e0b2ffc56cc6fd5c305
3
+ size 100691721
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1389c8fb4da5b08654d5ecff1c857ae43115866bad194f9289834fc2a0b6a9c8
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fbdd2b971dfbcc7cf5454c92a80f7cd63b0ae56a21c3ba0214c0de0e3064545
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0410ad60e6d0138b921a03b0a3e367fd27c6ab07cb9a5006fcb66ea8e5bbacc4
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2d4b4cadcabd3e17adcc39c43d8312038a1f5c7f53125f288ba4de5ed25396b
3
  size 627
last-checkpoint/special_tokens_map.json CHANGED
@@ -1,6 +1,24 @@
1
  {
2
- "bos_token": "<|endoftext|>",
3
- "eos_token": "<|endoftext|>",
 
 
 
 
 
 
 
 
 
 
 
 
4
  "pad_token": "<|endoftext|>",
5
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
6
  }
 
1
  {
2
+ "bos_token": {
3
+ "content": "<|endoftext|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
  "pad_token": "<|endoftext|>",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
  }
last-checkpoint/tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 512,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 1.5018609762191772,
3
- "best_model_checkpoint": "./outputs/checkpoint-1700",
4
- "epoch": 1.238615664845173,
5
  "eval_steps": 100,
6
- "global_step": 1700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -245,13 +245,41 @@
245
  "eval_samples_per_second": 43.536,
246
  "eval_steps_per_second": 5.447,
247
  "step": 1700
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
248
  }
249
  ],
250
  "logging_steps": 100,
251
  "max_steps": 4116,
252
  "num_train_epochs": 3,
253
  "save_steps": 100,
254
- "total_flos": 1.0135854358789325e+17,
255
  "trial_name": null,
256
  "trial_params": null
257
  }
 
1
  {
2
+ "best_metric": 1.4871549606323242,
3
+ "best_model_checkpoint": "./outputs/checkpoint-1800",
4
+ "epoch": 1.3846994535519126,
5
  "eval_steps": 100,
6
+ "global_step": 1900,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
245
  "eval_samples_per_second": 43.536,
246
  "eval_steps_per_second": 5.447,
247
  "step": 1700
248
+ },
249
+ {
250
+ "epoch": 1.31,
251
+ "learning_rate": 0.0002,
252
+ "loss": 1.4781,
253
+ "step": 1800
254
+ },
255
+ {
256
+ "epoch": 1.31,
257
+ "eval_loss": 1.4871549606323242,
258
+ "eval_runtime": 148.0177,
259
+ "eval_samples_per_second": 42.387,
260
+ "eval_steps_per_second": 5.303,
261
+ "step": 1800
262
+ },
263
+ {
264
+ "epoch": 1.38,
265
+ "learning_rate": 0.0002,
266
+ "loss": 1.4858,
267
+ "step": 1900
268
+ },
269
+ {
270
+ "epoch": 1.38,
271
+ "eval_loss": 1.498619794845581,
272
+ "eval_runtime": 133.9486,
273
+ "eval_samples_per_second": 46.839,
274
+ "eval_steps_per_second": 5.86,
275
+ "step": 1900
276
  }
277
  ],
278
  "logging_steps": 100,
279
  "max_steps": 4116,
280
  "num_train_epochs": 3,
281
  "save_steps": 100,
282
+ "total_flos": 1.1326135108192666e+17,
283
  "trial_name": null,
284
  "trial_params": null
285
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5641e8a6689f7acd324a9f463af2ea7fb0e928566e361888ca8bcd1f82571899
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01ce1b3e35021f8f6dfd4d75b8f2f8de9073bd529f840d1746890d9de9ab9328
3
  size 4155