helenai committed
Commit 910cc45 · 1 Parent(s): 8478ce5

commit files to HF hub
Files changed (6)
  1. README.md +4 -2
  2. config.json +1 -1
  3. inference.py +2 -2
  4. openvino_model.bin +2 -2
  5. openvino_model.xml +0 -0
  6. tokenizer.json +2 -2
README.md CHANGED
````diff
@@ -7,9 +7,11 @@ tags:
 
 # mistralai/Mistral-7B-Instruct-v0.2
 
-This is the [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2) model, quantized with An example of how to do inference on this model:
+This is the [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2) model converted to [OpenVINO](https://openvino.ai), for accelerated inference.
+
+An example of how to do inference on this model:
 ```python
-from optimum.intel.openvino import OVModelForCausalLM
+from optimum.intel import OVModelForCausalLM
 from transformers import AutoTokenizer, pipeline
 
 # model_id should be set to either a local directory or a model available on the HuggingFace hub.
````
config.json CHANGED
```diff
@@ -21,7 +21,7 @@
   "sliding_window": null,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.37.2",
+  "transformers_version": "4.40.2",
   "use_cache": true,
   "vocab_size": 32000
 }
```
inference.py CHANGED
```diff
@@ -1,10 +1,10 @@
-from optimum.intel.openvino import OVModelForCausalLM
+from optimum.intel import OVModelForCausalLM
 from transformers import AutoTokenizer, pipeline
 
 # model_id should be set to either a local directory or a model available on the HuggingFace hub.
 model_id = "helenai/mistralai-Mistral-7B-Instruct-v0.2-ov"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
-model = OVModelForCausalLM.from_pretrained(model_id, revision='int8-ptq')
+model = OVModelForCausalLM.from_pretrained(model_id)
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
 result = pipe("hello world")
 print(result)
```
openvino_model.bin CHANGED
```diff
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c87aaf4a0409c66efe34b90babb9b874b306e69aa28ada4d4b448dd71ee22e95
-size 7280406372
+oid sha256:45dc61bad946196600fbbc9cd6cdaf4a87bb28f49abfe63c8c0f078e96ef4ffb
+size 14500241654
```
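What changed here is a Git LFS pointer, not the weights themselves: the tracked file grows from about 7.3 GB to about 14.5 GB, consistent with swapping int8-quantized weights for higher-precision ones. A pointer file is just three `key value` lines (version, oid, size). A minimal sketch of reading one in Python (the helper name is illustrative, not part of this repo):

```python
def parse_lfs_pointer(text: str) -> dict:
    """Parse a Git LFS pointer file into a {key: value} dict."""
    fields = {}
    for line in text.strip().splitlines():
        key, _, value = line.partition(" ")
        fields[key] = value
    return fields

# The new pointer contents from the diff above.
pointer = """\
version https://git-lfs.github.com/spec/v1
oid sha256:45dc61bad946196600fbbc9cd6cdaf4a87bb28f49abfe63c8c0f078e96ef4ffb
size 14500241654
"""

fields = parse_lfs_pointer(pointer)
size_gib = int(fields["size"]) / 2**30
print(fields["oid"])          # sha256:45dc61bad9...
print(f"{size_gib:.1f} GiB")  # 13.5 GiB
```

The `oid` is the SHA-256 of the real blob stored on the LFS server; git itself only versions this small pointer.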
openvino_model.xml CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer.json CHANGED
```diff
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc4f0bd70b3709312d9d1d9e5ba674794b6bc5abc17429897a540f93882f25fc
-size 1795303
+oid sha256:bdc45dc7f18a5c55e0dcb36f4f187a7c429d6aaa1693a17d20422b85081642d9
+size 1795331
```