|
4 | 4 |
|
5 | 5 | import logging
|
6 | 6 | import os
|
7 |
| -import sys |
8 | 7 | from typing import Optional
|
9 | 8 |
|
10 | 9 | from vllm.config import KVTransferConfig
|
|
29 | 28 |
|
30 | 29 | logger = logging.getLogger(__name__)
|
31 | 30 |
|
32 |
| -DEFAULT_ENDPOINT = "dyn://dynamo.backend.generate" |
33 | 31 | DEFAULT_MODEL = "Qwen/Qwen3-0.6B"
|
34 | 32 |
|
35 | 33 | VALID_CONNECTORS = {"nixl", "lmcache", "kvbm", "null", "none"}
|
@@ -72,12 +70,6 @@ def parse_args() -> Config:
|
72 | 70 | parser.add_argument(
|
73 | 71 | "--version", action="version", version=f"Dynamo Backend VLLM {__version__}"
|
74 | 72 | )
|
75 |
| - parser.add_argument( |
76 |
| - "--endpoint", |
77 |
| - type=str, |
78 |
| - default=DEFAULT_ENDPOINT, |
79 |
| - help=f"Dynamo endpoint string in 'dyn://namespace.component.endpoint' format. Default: {DEFAULT_ENDPOINT}", |
80 |
| - ) |
81 | 73 | parser.add_argument(
|
82 | 74 | "--is-prefill-worker",
|
83 | 75 | action="store_true",
|
@@ -145,27 +137,9 @@ def parse_args() -> Config:
|
145 | 137 | # This becomes an `Option` on the Rust side
|
146 | 138 | config.served_model_name = None
|
147 | 139 |
|
148 |
| - namespace = os.environ.get("DYN_NAMESPACE", "dynamo") |
149 |
| - |
150 |
| - if args.is_prefill_worker: |
151 |
| - args.endpoint = f"dyn://{namespace}.prefill.generate" |
152 |
| - else: |
153 |
| - # For decode workers, also use the provided namespace instead of hardcoded "dynamo" |
154 |
| - args.endpoint = f"dyn://{namespace}.backend.generate" |
155 |
| - |
156 |
| - endpoint_str = args.endpoint.replace("dyn://", "", 1) |
157 |
| - endpoint_parts = endpoint_str.split(".") |
158 |
| - if len(endpoint_parts) != 3: |
159 |
| - logger.error( |
160 |
| - f"Invalid endpoint format: '{args.endpoint}'. Expected 'dyn://namespace.component.endpoint' or 'namespace.component.endpoint'." |
161 |
| - ) |
162 |
| - sys.exit(1) |
163 |
| - |
164 |
| - parsed_namespace, parsed_component_name, parsed_endpoint_name = endpoint_parts |
165 |
| - |
166 |
| - config.namespace = parsed_namespace |
167 |
| - config.component = parsed_component_name |
168 |
| - config.endpoint = parsed_endpoint_name |
| 140 | + config.namespace = os.environ.get("DYN_NAMESPACE", "dynamo") |
| 141 | + config.component = "prefill" if args.is_prefill_worker else "backend" |
| 142 | + config.endpoint = "generate" |
169 | 143 | config.engine_args = engine_args
|
170 | 144 | config.is_prefill_worker = args.is_prefill_worker
|
171 | 145 | config.migration_limit = args.migration_limit
|
|
0 commit comments