diff --git a/runpodctl/reference/runpodctl-hub.mdx b/runpodctl/reference/runpodctl-hub.mdx index 2def79e6..9f8aca35 100644 --- a/runpodctl/reference/runpodctl-hub.mdx +++ b/runpodctl/reference/runpodctl-hub.mdx @@ -38,7 +38,7 @@ runpodctl hub list --owner runpod #### List flags -Filter by deployment type (`POD` or `SERVERLESS`). +Filter by deployment type (`POD` or `SERVERLESS`). This filter is applied client-side, so `--limit` may return fewer results than specified. @@ -83,7 +83,7 @@ runpodctl hub search stable-diffusion --limit 5 #### Search flags -Filter by deployment type (`POD` or `SERVERLESS`). +Filter by deployment type (`POD` or `SERVERLESS`). This filter is applied client-side, so `--limit` may return fewer results than specified. diff --git a/runpodctl/reference/runpodctl-serverless.mdx b/runpodctl/reference/runpodctl-serverless.mdx index d306b908..a09b2440 100644 --- a/runpodctl/reference/runpodctl-serverless.mdx +++ b/runpodctl/reference/runpodctl-serverless.mdx @@ -68,9 +68,14 @@ runpodctl serverless create --name "my-endpoint" --template-id "tpl_abc123" # Create from a Hub repo runpodctl hub search vllm # Find the hub ID runpodctl serverless create --hub-id cm8h09d9n000008jvh2rqdsmb --name "my-vllm" + +# Create from a Hub repo with custom environment variables +runpodctl serverless create --hub-id cm8h09d9n000008jvh2rqdsmb --name "my-vllm" \ + --env MODEL_NAME=meta-llama/Llama-3.1-8B-Instruct \ + --env MAX_TOKENS=4096 ``` -When using `--hub-id`, GPU IDs and container disk size are automatically pulled from the Hub release config. You can override the GPU type with `--gpu-id`. +When using `--hub-id`, GPU IDs and container disk size are automatically pulled from the Hub release config. You can override the GPU type with `--gpu-id`. Environment variables from the Hub release are included automatically, and you can override or add to them with `--env`. @@ -150,6 +155,10 @@ Enable or disable flash boot for faster worker startup. 
When enabled, workers st Execution timeout in seconds. Jobs that exceed this duration are terminated. The CLI accepts seconds but converts to milliseconds internally. + +Environment variable in `KEY=VALUE` format. Repeat `--env` to set multiple variables. When deploying with `--hub-id`, these values are merged with the Hub release defaults: matching keys are overridden and new keys are added. + + ### Update an endpoint Update endpoint configuration: