Example
import subprocess
def get_mesh_ip():
cmd = f"kubectl get svc seldon-mesh -n seldon -o jsonpath='{{.status.loadBalancer.ingress[0].ip}}'"
return subprocess.check_output(cmd, shell=True).decode('utf-8')!cat models/tiny-llama/model-settings.json{
"name": "tiny-llama",
"implementation": "mlserver_llm_local.runtime.Local",
"parameters": {
"extra": {
"backend": "vllm",
"config": {
"model_type": "chat.completions",
"model_settings": {
"model": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
"dtype": "float16"
}
},
"prompt_utils": {
"model_type": "compiled"
}
}
}
}
Last updated
Was this helpful?