vladkolev committed on
Commit
6159af3
1 Parent(s): 32cfdcf

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,12 +1,11 @@
1
  {
2
- "_name_or_path": "Geotrend/bert-base-bg-cased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
  "directionality": "bidi",
9
- "gradient_checkpointing": false,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
@@ -35,6 +34,7 @@
35
  "model_type": "bert",
36
  "num_attention_heads": 12,
37
  "num_hidden_layers": 12,
 
38
  "pad_token_id": 0,
39
  "pooler_fc_size": 768,
40
  "pooler_num_attention_heads": 12,
@@ -47,5 +47,5 @@
47
  "transformers_version": "4.27.4",
48
  "type_vocab_size": 2,
49
  "use_cache": true,
50
- "vocab_size": 12134
51
  }
 
1
  {
2
+ "_name_or_path": "DeepPavlov/bert-base-bg-cs-pl-ru-cased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
  "directionality": "bidi",
 
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
 
34
  "model_type": "bert",
35
  "num_attention_heads": 12,
36
  "num_hidden_layers": 12,
37
+ "output_past": true,
38
  "pad_token_id": 0,
39
  "pooler_fc_size": 768,
40
  "pooler_num_attention_heads": 12,
 
47
  "transformers_version": "4.27.4",
48
  "type_vocab_size": 2,
49
  "use_cache": true,
50
+ "vocab_size": 119547
51
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12046501283d8b26b21a61d7de45b49d27f8c1ab7010d34a4e70a1c074b2d9bd
3
- size 381535349
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:181740487ed0e6fe105166908b13c4280cf3ddd3f50e2d245de19e9025eba415
3
+ size 711508085
runs/Apr03_06-28-19_93e96c54436e/events.out.tfevents.1680503330.93e96c54436e.135.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b912062c0c3dd28ad5561e7de796ffcb2eaee36904da5cd00cffb3a0f9ee0462
3
- size 7164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4783c353ebfab23f67374512dd28560c644267aa430130e674a23eea919abc57
3
+ size 7518
runs/Apr03_06-28-19_93e96c54436e/events.out.tfevents.1680504601.93e96c54436e.135.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dd9835fd16917fc99d12ddcdbf76d530ee394634a4557c7884de4008e4541fc
3
+ size 457
runs/Apr03_06-58-30_93e96c54436e/1680505156.2080572/events.out.tfevents.1680505156.93e96c54436e.135.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c6076e8784053406a7f77e31ada8b2274679ff4914384b5dfd308aec8eeea02
3
+ size 5887
runs/Apr03_06-58-30_93e96c54436e/events.out.tfevents.1680505156.93e96c54436e.135.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1444ba48f5914fc4b3cc920705ea04b7d4645bfe034e74ed5f8cd7a3fede26f6
3
+ size 5054
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -3,11 +3,11 @@
3
  "do_basic_tokenize": true,
4
  "do_lower_case": false,
5
  "mask_token": "[MASK]",
6
- "model_max_length": 512,
7
  "never_split": null,
8
  "pad_token": "[PAD]",
9
  "sep_token": "[SEP]",
10
- "special_tokens_map_file": null,
11
  "strip_accents": null,
12
  "tokenize_chinese_chars": true,
13
  "tokenizer_class": "BertTokenizer",
 
3
  "do_basic_tokenize": true,
4
  "do_lower_case": false,
5
  "mask_token": "[MASK]",
6
+ "model_max_length": 1000000000000000019884624838656,
7
  "never_split": null,
8
  "pad_token": "[PAD]",
9
  "sep_token": "[SEP]",
10
+ "special_tokens_map_file": "/root/.cache/huggingface/hub/models--DeepPavlov--bert-base-bg-cs-pl-ru-cased/snapshots/0ab00895c22312978e0a8abd16bbec3fbf7f2bc8/special_tokens_map.json",
11
  "strip_accents": null,
12
  "tokenize_chinese_chars": true,
13
  "tokenizer_class": "BertTokenizer",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:707aaffd5f2e63e4dfee6c3803969edda413fb5138a5db5c7e358fb9e5606eba
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a35bf911db0770445e001b82f62698ef32e8be97f3d422b14ae72951bd03d9e5
3
  size 3579
vocab.txt CHANGED
The diff for this file is too large to render. See raw diff