mak050 committed on
Commit
c170788
1 Parent(s): 2ef70b9

Model save

Browse files
README.md CHANGED
@@ -5,7 +5,7 @@ tags:
5
  - trl
6
  - sft
7
  - generated_from_trainer
8
- base_model: vilsonrodrigues/falcon-7b-instruct-sharded
9
  model-index:
10
  - name: falcon7binstruct
11
  results: []
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # falcon7binstruct
18
 
19
- This model is a fine-tuned version of [vilsonrodrigues/falcon-7b-instruct-sharded](https://huggingface.co/vilsonrodrigues/falcon-7b-instruct-sharded) on the None dataset.
20
 
21
  ## Model description
22
 
@@ -47,10 +47,14 @@ The following hyperparameters were used during training:
47
  - training_steps: 10
48
  - mixed_precision_training: Native AMP
49
 
 
 
 
 
50
  ### Framework versions
51
 
52
- - PEFT 0.7.2.dev0
53
- - Transformers 4.36.2
54
- - Pytorch 2.1.0+cu121
55
- - Datasets 2.16.1
56
- - Tokenizers 0.15.0
 
5
  - trl
6
  - sft
7
  - generated_from_trainer
8
+ base_model: tiiuae/falcon-7b
9
  model-index:
10
  - name: falcon7binstruct
11
  results: []
 
16
 
17
  # falcon7binstruct
18
 
19
+ This model is a fine-tuned version of [tiiuae/falcon-7b](https://huggingface.co/tiiuae/falcon-7b) on the None dataset.
20
 
21
  ## Model description
22
 
 
47
  - training_steps: 10
48
  - mixed_precision_training: Native AMP
49
 
50
+ ### Training results
51
+
52
+
53
+
54
  ### Framework versions
55
 
56
+ - PEFT 0.9.1.dev0
57
+ - Transformers 4.38.2
58
+ - Pytorch 2.2.1+cu121
59
+ - Datasets 2.18.0
60
+ - Tokenizers 0.15.2
adapter_config.json CHANGED
@@ -1,11 +1,12 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "vilsonrodrigues/falcon-7b-instruct-sharded",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
 
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
11
  "loftq_config": {},
@@ -19,11 +20,12 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "dense_h_to_4h",
23
  "dense",
24
  "dense_4h_to_h",
25
- "query_key_value"
 
26
  ],
27
  "task_type": "CAUSAL_LM",
 
28
  "use_rslora": false
29
  }
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "tiiuae/falcon-7b",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
9
+ "layer_replication": null,
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "dense",
24
  "dense_4h_to_h",
25
+ "query_key_value",
26
+ "dense_h_to_4h"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
+ "use_dora": false,
30
  "use_rslora": false
31
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5967403586bbf8b5c66aabb2475c8cec61035cf4e1cb75cc2c4cb9c32ad60fcb
3
  size 130583912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a031bb464b6a0305756a52f74c1810ba5c3f2108a201b6f962628d638091cae7
3
  size 130583912
runs/Mar16_04-01-53_0bc99fd71e10/events.out.tfevents.1710561746.0bc99fd71e10.280.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7942ca6d75985a0fcc6863bdd1dcd87517b20fa88b709ba2c28fb5dfa8838fba
3
+ size 11707
tokenizer.json CHANGED
@@ -2,7 +2,7 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 1024,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 256,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d061ff7501cef667fce3218cf66f5de86959968a038ae3ec253026a3e5ee8545
3
- size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:565de370674ac9fedf70cd360599dbfb92c90f74bc34691d31c6396df6c8456d
3
+ size 4920