File tree Expand file tree Collapse file tree 1 file changed +2
-2
lines changed
Expand file tree Collapse file tree 1 file changed +2
-2
lines changed
Original file line number | Diff line number | Diff line change
 3  3   from centml.sdk.api import get_centml_client
 4  4   from centml.sdk import DeploymentType, CreateCServeV2DeploymentRequest, CServeV2Recipe
 5  5
 6    - def get_fastest_cserve_config(model):
    6 + def get_fastest_cserve_config(cclient, model):
 7  7       return cclient.get_cserve_recipe(model=model)[0].fastest
 8  8
 9  9   def get_default_cserve_config(model):
@@ -12,7 +12,7 @@ def get_default_cserve_config(model):
12 12   def main():
13 13       with get_centml_client() as cclient:
14 14           # Get fastest recipe for the Qwen model
15    -         qwen_config = get_fastest_config(model="Qwen/Qwen2-VL-7B-Instruct")
   15 +         qwen_config = get_fastest_cserve_config(cclient, model="Qwen/Qwen2-VL-7B-Instruct")
16 16
17 17           # Modify the recipe if necessary
18 18           qwen_config.recipe.additional_properties["max_num_seqs"] = 512
You can’t perform that action at this time.
0 commit comments