mav23 committed 4 days ago

Commit

80f7abe

•

1 Parent(s): 0a8e2c0

Upload folder using huggingface_hub

Browse files

Files changed (20) hide show

.gitattributes +17 -0
README.md +143 -0
config.json +24 -0
mistral-7b-instruct-v0.1.Q2_K.gguf +3 -0
mistral-7b-instruct-v0.1.Q3_K.gguf +3 -0
mistral-7b-instruct-v0.1.Q3_K_L.gguf +3 -0
mistral-7b-instruct-v0.1.Q3_K_M.gguf +3 -0
mistral-7b-instruct-v0.1.Q3_K_S.gguf +3 -0
mistral-7b-instruct-v0.1.Q4_0.gguf +3 -0
mistral-7b-instruct-v0.1.Q4_1.gguf +3 -0
mistral-7b-instruct-v0.1.Q4_K.gguf +3 -0
mistral-7b-instruct-v0.1.Q4_K_M.gguf +3 -0
mistral-7b-instruct-v0.1.Q4_K_S.gguf +3 -0
mistral-7b-instruct-v0.1.Q5_0.gguf +3 -0
mistral-7b-instruct-v0.1.Q5_1.gguf +3 -0
mistral-7b-instruct-v0.1.Q5_K.gguf +3 -0
mistral-7b-instruct-v0.1.Q5_K_M.gguf +3 -0
mistral-7b-instruct-v0.1.Q5_K_S.gguf +3 -0
mistral-7b-instruct-v0.1.Q6_K.gguf +3 -0
mistral-7b-instruct-v0.1.Q8_0.gguf +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,20 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q3_K.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q4_K.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q5_K.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
+mistral-7b-instruct-v0.1.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,143 @@

+---
+license: apache-2.0
+tags:
+- finetuned
+base_model: mistralai/Mistral-7B-v0.1
+pipeline_tag: text-generation
+inference: true
+widget:
+- messages:
+  - role: user
+    content: What is your favorite condiment?
+extra_gated_description: If you want to learn more about how we process your personal data, please read our <a href="https://mistral.ai/terms/">Privacy Policy</a>.
+---
+# Model Card for Mistral-7B-Instruct-v0.1
+## Encode and Decode with `mistral_common`
+```py
+from mistral_common.tokens.tokenizers.mistral import MistralTokenizer
+from mistral_common.protocol.instruct.messages import UserMessage
+from mistral_common.protocol.instruct.request import ChatCompletionRequest
+mistral_models_path = "MISTRAL_MODELS_PATH"
+tokenizer = MistralTokenizer.v1()
+completion_request = ChatCompletionRequest(messages=[UserMessage(content="Explain Machine Learning to me in a nutshell.")])
+tokens = tokenizer.encode_chat_completion(completion_request).tokens
+```
+## Inference with `mistral_inference`
+ ```py
+from mistral_inference.transformer import Transformer
+from mistral_inference.generate import generate
+model = Transformer.from_folder(mistral_models_path)
+out_tokens, _ = generate([tokens], model, max_tokens=64, temperature=0.0, eos_id=tokenizer.instruct_tokenizer.tokenizer.eos_id)
+result = tokenizer.decode(out_tokens[0])
+print(result)
+```
+## Inference with Hugging Face `transformers`
+```py
+from transformers import AutoModelForCausalLM
+model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
+model.to("cuda")
+generated_ids = model.generate(tokens, max_new_tokens=1000, do_sample=True)
+# decode with mistral tokenizer
+result = tokenizer.decode(generated_ids[0].tolist())
+print(result)
+```
+> [!TIP]
+> PRs to correct the `transformers` tokenizer so that it gives 1-to-1 the same results as the `mistral_common` reference implementation are very welcome!
+---
+The Mistral-7B-Instruct-v0.1 Large Language Model (LLM) is an instruct fine-tuned version of the [Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) generative text model using a variety of publicly available conversation datasets.
+For full details of this model please read our [paper](https://arxiv.org/abs/2310.06825) and [release blog post](https://mistral.ai/news/announcing-mistral-7b/).
+## Instruction format
+In order to leverage instruction fine-tuning, your prompt should be surrounded by `[INST]` and `[/INST]` tokens. The very first instruction should begin with a beginning-of-sentence token id. The next instructions should not. The assistant generation will be ended by the end-of-sentence token id.
+E.g.
+```
+text = "<s>[INST] What is your favourite condiment? [/INST]"
+"Well, I'm quite partial to a good squeeze of fresh lemon juice. It adds just the right amount of zesty flavour to whatever I'm cooking up in the kitchen!</s> "
+"[INST] Do you have mayonnaise recipes? [/INST]"
+```
+This format is available as a [chat template](https://huggingface.co/docs/transformers/main/chat_templating) via the `apply_chat_template()` method:
+```python
+from transformers import AutoModelForCausalLM, AutoTokenizer
+device = "cuda" # the device to load the model onto
+model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
+tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
+messages = [
+    {"role": "user", "content": "What is your favourite condiment?"},
+    {"role": "assistant", "content": "Well, I'm quite partial to a good squeeze of fresh lemon juice. It adds just the right amount of zesty flavour to whatever I'm cooking up in the kitchen!"},
+    {"role": "user", "content": "Do you have mayonnaise recipes?"}
+]
+encodeds = tokenizer.apply_chat_template(messages, return_tensors="pt")
+model_inputs = encodeds.to(device)
+model.to(device)
+generated_ids = model.generate(model_inputs, max_new_tokens=1000, do_sample=True)
+decoded = tokenizer.batch_decode(generated_ids)
+print(decoded[0])
+```
+## Model Architecture
+This instruction model is based on Mistral-7B-v0.1, a transformer model with the following architecture choices:
+- Grouped-Query Attention
+- Sliding-Window Attention
+- Byte-fallback BPE tokenizer
+## Troubleshooting
+- If you see the following error:
+```
+Traceback (most recent call last):
+File "<stdin>", line 1, in <module>
+File "/transformers/models/auto/auto_factory.py", line 482, in from_pretrained
+config, kwargs = AutoConfig.from_pretrained(
+File "/transformers/models/auto/configuration_auto.py", line 1022, in from_pretrained
+config_class = CONFIG_MAPPING[config_dict["model_type"]]
+File "/transformers/models/auto/configuration_auto.py", line 723, in __getitem__
+raise KeyError(key)
+KeyError: 'mistral'
+```
+Installing transformers from source should solve the issue:
+`pip install git+https://github.com/huggingface/transformers`
+This should not be required after transformers-v4.33.4.
+## Limitations
+The Mistral 7B Instruct model is a quick demonstration that the base model can be easily fine-tuned to achieve compelling performance.
+It does not have any moderation mechanisms. We're looking forward to engaging with the community on ways to
+make the model finely respect guardrails, allowing for deployment in environments requiring moderated outputs.
+## The Mistral AI Team
+Albert Jiang, Alexandre Sablayrolles, Arthur Mensch, Chris Bamford, Devendra Singh Chaplot, Diego de las Casas, Florian Bressand, Gianna Lengyel, Guillaume Lample, Lélio Renard Lavaud, Lucile Saulnier, Marie-Anne Lachaux, Pierre Stock, Teven Le Scao, Thibaut Lavril, Thomas Wang, Timothée Lacroix, William El Sayed.

config.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "architectures": [
+    "MistralForCausalLM"
+  ],
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 4096,
+  "initializer_range": 0.02,
+  "intermediate_size": 14336,
+  "max_position_embeddings": 32768,
+  "model_type": "mistral",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 32,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_theta": 10000.0,
+  "sliding_window": 4096,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.34.0.dev0",
+  "use_cache": true,
+  "vocab_size": 32000
+}

mistral-7b-instruct-v0.1.Q2_K.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aa26dc10c3739e2a68f327876344bbb238396bc81677a1e8b7672e1be80b1261
+size 2719243808

mistral-7b-instruct-v0.1.Q3_K.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3d1926c9ab518c5c2debf9dad208a4c20c2f49bf34e06cbcb79f4b4d9e36564
+size 3518987808

mistral-7b-instruct-v0.1.Q3_K_L.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad7675be40c656c8f4f1cd8ad1f4aa04fc145e468645402255d17d91ce7d7125
+size 3822026272

mistral-7b-instruct-v0.1.Q3_K_M.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3d1926c9ab518c5c2debf9dad208a4c20c2f49bf34e06cbcb79f4b4d9e36564
+size 3518987808

mistral-7b-instruct-v0.1.Q3_K_S.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5a10a9f3a42271df1ed117f6cbba589f8a2c36dc4c8fee6e08d73bc653f78b81
+size 3164569120

mistral-7b-instruct-v0.1.Q4_0.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5a7d4f43933ccf111c0a586ba027698e1d111173a595dd8e4bf28d00ae6cbeb
+size 4108918304

mistral-7b-instruct-v0.1.Q4_1.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9cf789fd37e33e9f01e71cae50e1a814dd44569ddedee3ec6192d439d0365a61
+size 4553317920

mistral-7b-instruct-v0.1.Q4_K.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:afe690a8d8dd5021f0b3abc1aa25e3379197c8fd7b1c712b4dc64d4bf3106ecb
+size 4368440864

mistral-7b-instruct-v0.1.Q4_K_M.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:afe690a8d8dd5021f0b3abc1aa25e3379197c8fd7b1c712b4dc64d4bf3106ecb
+size 4368440864

mistral-7b-instruct-v0.1.Q4_K_S.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3bc7ba03de9880339b9d9a8d5152ccfe9328ad1d49ed3441e003088dac49b3e6
+size 4140375584

mistral-7b-instruct-v0.1.Q5_0.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84a763fa1eae58959d60bb2f91180279540001e7cce22facfe991bf073d49ef0
+size 4997717536

mistral-7b-instruct-v0.1.Q5_1.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba782381352b7a518f9d0b76bc7c9010a5428dbd135bca2c7dd19a734296a621
+size 5442117152

mistral-7b-instruct-v0.1.Q5_K.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f8df439e21b9680cb7668e4483eb165ff31d2f54b11a44f6206006877c80ee00
+size 5131410976

mistral-7b-instruct-v0.1.Q5_K_M.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f8df439e21b9680cb7668e4483eb165ff31d2f54b11a44f6206006877c80ee00
+size 5131410976

mistral-7b-instruct-v0.1.Q5_K_S.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b44de61c1b7876a57269586ff79a387a88074a8100d9ff513b95a0222ceb4ac4
+size 4997717536

mistral-7b-instruct-v0.1.Q6_K.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b833423c65b573fd0803ce2d47c315a344dd6bf2ce679692dbd3129583e38a1c
+size 5942066720

mistral-7b-instruct-v0.1.Q8_0.gguf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc3ee6009901673dedbd30430dc599495b55407f6c1ccaf0b434fa016640456e
+size 7695859232