Update README.md
README.md CHANGED
@@ -131,15 +131,15 @@ vllm serve \
 ```bash
 # Download model from Red Hat Registry via docker
 # Note: This downloads the model to ~/.cache/instructlab/models unless --model-dir is specified.
-ilab model download --repository docker://registry.redhat.io/rhelai1/mistral-small-3-1-24b-instruct-2503:1.5
+ilab model download --repository docker://registry.redhat.io/rhelai1/mistral-small-3-1-24b-instruct-2503-fp8-dynamic:1.5
 ```

 ```bash
 # Serve model via ilab
-ilab model serve --model-path ~/.cache/instructlab/models/mistral-small-3-1-24b-instruct-2503
+ilab model serve --model-path ~/.cache/instructlab/models/mistral-small-3-1-24b-instruct-2503-fp8-dynamic

 # Chat with model
-ilab model chat --model ~/.cache/instructlab/models/mistral-small-3-1-24b-instruct-2503
+ilab model chat --model ~/.cache/instructlab/models/mistral-small-3-1-24b-instruct-2503-fp8-dynamic
 ```
 See [Red Hat Enterprise Linux AI documentation](https://docs.redhat.com/en/documentation/red_hat_enterprise_linux_ai/1.4) for more details.
 </details>
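Once `ilab model serve` is running, the model can also be queried directly over its OpenAI-compatible API. The sketch below assumes the stock InstructLab default endpoint of `127.0.0.1:8000` (controlled by `serve.host_port` in `config.yaml`); the served model name may be registered as a full path rather than the bare directory name, so it is worth listing models first:

```bash
# List the served model name first; it may be the full --model-path rather
# than the bare directory name (the name used below is an assumption).
curl http://127.0.0.1:8000/v1/models

# Send a chat completion using the name reported above.
curl http://127.0.0.1:8000/v1/chat/completions \
  -H "Content-Type: application/json" \
  -d '{
    "model": "mistral-small-3-1-24b-instruct-2503-fp8-dynamic",
    "messages": [{"role": "user", "content": "What is the capital of France?"}]
  }'
```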
@@ -193,9 +193,9 @@ apiVersion: serving.kserve.io/v1beta1
 kind: InferenceService
 metadata:
   annotations:
-    openshift.io/display-name:
+    openshift.io/display-name: mistral-small-3-1-24b-instruct-2503-fp8-dynamic # OPTIONAL CHANGE
     serving.kserve.io/deploymentMode: RawDeployment
-  name:
+  name: mistral-small-3-1-24b-instruct-2503-fp8-dynamic # specify model name. This value will be used to invoke the model in the payload
   labels:
     opendatahub.io/dashboard: 'true'
 spec:
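The `metadata.name` set in this hunk is the value later passed as `"model"` in the request payload. As a quick check after applying the manifest (a sketch, reusing the `qwen-inferenceservice.yaml` file name from the `oc apply` step shown below), the service should report a URL and `READY=True`:

```bash
# Apply the InferenceService manifest; file name reused from the oc apply
# step later in this README.
oc apply -f qwen-inferenceservice.yaml

# READY should become True and URL should be populated once vLLM has started.
oc get inferenceservice mistral-small-3-1-24b-instruct-2503-fp8-dynamic
```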
@@ -244,7 +244,7 @@ oc apply -f qwen-inferenceservice.yaml
 curl https://<inference-service-name>-predictor-default.<domain>/v1/chat/completions \
   -H "Content-Type: application/json" \
   -d '{
-    "model": "
+    "model": "mistral-small-3-1-24b-instruct-2503-fp8-dynamic",
     "stream": true,
     "stream_options": {
       "include_usage": true
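The hunk above is cut off by the diff context, so the payload ends mid-object. For orientation, a complete streaming request would look roughly like the following sketch; the `messages` and `max_tokens` fields are assumptions, since the diff does not show the rest of the README's payload:

```bash
# Hedged sketch of the full request; everything after "stream_options" is an
# assumption about README content not visible in this diff.
curl https://<inference-service-name>-predictor-default.<domain>/v1/chat/completions \
  -H "Content-Type: application/json" \
  -d '{
    "model": "mistral-small-3-1-24b-instruct-2503-fp8-dynamic",
    "stream": true,
    "stream_options": {
      "include_usage": true
    },
    "max_tokens": 64,
    "messages": [{"role": "user", "content": "What is the capital of France?"}]
  }'
```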