jennyyyi committed on
Commit
2f6cd4a
·
verified ·
1 Parent(s): b08a314

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -221,7 +221,7 @@ oc apply -f qwen-inferenceservice.yaml
221
  curl https://<inference-service-name>-predictor-default.<domain>/v1/chat/completions
222
  -H "Content-Type: application/json" \
223
  -d '{
224
- "model": "Llama-4-Maverick-17B-128E-Instruct-FP8",
225
  "stream": true,
226
  "stream_options": {
227
  "include_usage": true
 
221
  curl https://<inference-service-name>-predictor-default.<domain>/v1/chat/completions
222
  -H "Content-Type: application/json" \
223
  -d '{
224
+ "model": "llama-3-3-70b-instruct-quantized-w4a16",
225
  "stream": true,
226
  "stream_options": {
227
  "include_usage": true