ucmp137538 committed on
Commit
a3e8ec9
1 Parent(s): 49162e7

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -30,7 +30,7 @@
30
  "rotary_pct": 0.25,
31
  "tie_word_embeddings": false,
32
  "torch_dtype": "float32",
33
- "transformers_version": "4.39.1",
34
  "use_cache": true,
35
  "use_parallel_residual": true,
36
  "vocab_size": 50304
 
30
  "rotary_pct": 0.25,
31
  "tie_word_embeddings": false,
32
  "torch_dtype": "float32",
33
+ "transformers_version": "4.40.1",
34
  "use_cache": true,
35
  "use_parallel_residual": true,
36
  "vocab_size": 50304
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8ca79a8e54b9e30137efb27188ee29969b2e59b081c1c138e0280d0698b18df
3
  size 494780976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72d5995b3576a89c5280daba2c3a54fb79e3cee6415c24b25bc4360ad62a9dd5
3
  size 494780976
runs/Apr30_00-13-46_f0b30b8955e2/events.out.tfevents.1714436028.f0b30b8955e2.1367.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20bf8d89ce7ee30eaef3f4ce1b3fa0bcdf06a1a3066d7e1ae5c97a1c20295697
3
+ size 6097
tokenizer.json CHANGED
@@ -248,10 +248,30 @@
248
  "use_regex": true
249
  },
250
  "post_processor": {
251
- "type": "ByteLevel",
252
- "add_prefix_space": false,
253
- "trim_offsets": true,
254
- "use_regex": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
255
  },
256
  "decoder": {
257
  "type": "ByteLevel",
@@ -267,6 +287,7 @@
267
  "end_of_word_suffix": null,
268
  "fuse_unk": false,
269
  "byte_fallback": false,
 
270
  "vocab": {
271
  "<|endoftext|>": 0,
272
  "<|padding|>": 1,
 
248
  "use_regex": true
249
  },
250
  "post_processor": {
251
+ "type": "TemplateProcessing",
252
+ "single": [
253
+ {
254
+ "Sequence": {
255
+ "id": "A",
256
+ "type_id": 0
257
+ }
258
+ }
259
+ ],
260
+ "pair": [
261
+ {
262
+ "Sequence": {
263
+ "id": "A",
264
+ "type_id": 0
265
+ }
266
+ },
267
+ {
268
+ "Sequence": {
269
+ "id": "B",
270
+ "type_id": 1
271
+ }
272
+ }
273
+ ],
274
+ "special_tokens": {}
275
  },
276
  "decoder": {
277
  "type": "ByteLevel",
 
287
  "end_of_word_suffix": null,
288
  "fuse_unk": false,
289
  "byte_fallback": false,
290
+ "ignore_merges": false,
291
  "vocab": {
292
  "<|endoftext|>": 0,
293
  "<|padding|>": 1,
tokenizer_config.json CHANGED
@@ -1,4 +1,6 @@
1
  {
 
 
2
  "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
  "0": {
 
1
  {
2
+ "add_bos_token": false,
3
+ "add_eos_token": false,
4
  "add_prefix_space": false,
5
  "added_tokens_decoder": {
6
  "0": {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b1576b206a4cc952f87f11a226b4e26d7040ff2655ecd92466366a5f9d9eb95
3
- size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ccc0e0ed6c8c658dffe5084169e13d177d224738cd1b1b9dbb8cabeaf5abaa7
3
+ size 5048