We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent dcbf9df commit 498e666 (Copy full SHA for 498e666)
docs/kubernetes/README.md
@@ -53,6 +53,12 @@ Each backend has deployment examples and configuration options:
53
export NAMESPACE=dynamo-cloud
54
kubectl create namespace ${NAMESPACE}
55
56
+# Store your Hugging Face (HF) token in a Kubernetes secret so models can be pulled from HF
57
+export HF_TOKEN=<Token-Here>
58
+kubectl create secret generic hf-token-secret \
59
+ --from-literal=HF_TOKEN="$HF_TOKEN" \
60
+ -n ${NAMESPACE};
61
+
62
# Deploy any example (this uses vLLM with Qwen model using aggregated serving)
63
kubectl apply -f components/backends/vllm/deploy/agg.yaml -n ${NAMESPACE}
64
0 commit comments