66 DeploymentStatus ,
77 CreateInferenceDeploymentRequest ,
88 CreateComputeDeploymentRequest ,
9- CreateCServeDeploymentRequest ,
9+ CreateCServeV2DeploymentRequest ,
1010)
1111
1212from centml .sdk import auth
@@ -32,16 +32,16 @@ def get_compute(self, id):
3232 return self ._api .get_compute_deployment_deployments_compute_deployment_id_get (id )
3333
def get_cserve(self, id):
    """Fetch a single CServe V2 deployment through the platform API client.

    Args:
        id: Identifier of the deployment; forwarded unchanged to the API
            client. The name shadows the builtin but is part of the public
            signature, so it is kept for keyword callers.

    Returns:
        Whatever the API client returns for the V2 deployment lookup.
    """
    # Only the V2 endpoint is called; the earlier non-V2 lookup was replaced.
    return self._api.get_cserve_v2_deployment_deployments_cserve_v2_deployment_id_get(id)
3636
def create_inference(self, request: CreateInferenceDeploymentRequest):
    """Submit an inference deployment creation request.

    Args:
        request: The creation request, passed through to the API client
            without modification.

    Returns:
        The API client's response to the creation call.
    """
    api = self._api
    return api.create_inference_deployment_deployments_inference_post(request)
3939
def create_compute(self, request: CreateComputeDeploymentRequest):
    """Submit a compute deployment creation request.

    Args:
        request: The creation request, passed through to the API client
            without modification.

    Returns:
        The API client's response to the creation call.
    """
    api = self._api
    return api.create_compute_deployment_deployments_compute_post(request)
4242
def create_cserve(self, request: CreateCServeV2DeploymentRequest):
    """Submit a CServe V2 deployment creation request.

    Args:
        request: The V2 creation request, passed through to the API client
            without modification.

    Returns:
        The API client's response to the V2 creation call.
    """
    # Only the V2 endpoint and request type are used; the non-V2 variant
    # of this method was replaced.
    return self._api.create_cserve_v2_deployment_deployments_cserve_v2_post(request)
4545
4646 def _update_status (self , id , new_status ):
4747 status_req = platform_api_python_client .DeploymentStatusRequest (status = new_status )
@@ -67,8 +67,16 @@ def get_hardware_instances(self, cluster_id=None):
def get_prebuilt_images(self, depl_type: DeploymentType):
    """Query the prebuilt images for a given deployment type.

    Args:
        depl_type: Deployment type, sent to the API client as its ``type``
            keyword argument.

    Returns:
        The API client's response to the prebuilt-images query.
    """
    api = self._api
    return api.get_prebuilt_images_prebuilt_images_get(type=depl_type)
6969
def get_cserve_recipe(self, model=None, hf_token=None):
    """Fetch CServe recipes, optionally narrowed by model and HF token.

    Args:
        model: Optional value forwarded as the ``model`` keyword of the
            recipe query. Defaults to ``None``.
        hf_token: Optional value forwarded as the ``hf_token`` keyword of
            the recipe query. Defaults to ``None``.

    Returns:
        The ``results`` attribute of the API client's response.
    """
    # Both parameters default to None, so existing zero-argument callers
    # keep working unchanged.
    response = self._api.get_cserve_recipe_deployments_cserve_recipes_get(
        model=model, hf_token=hf_token
    )
    return response.results
72+
def get_cluster_id(self, hardware_instance_id):
    """Return the cluster id of the hardware instance with the given id.

    Looks through ``self.get_hardware_instances()`` for the first entry
    whose ``id`` equals ``hardware_instance_id``.

    Args:
        hardware_instance_id: Identifier to match against each hardware
            instance's ``id`` attribute.

    Returns:
        The ``cluster_id`` attribute of the first matching instance.

    Raises:
        ValueError: If no hardware instance has the given id. ``ValueError``
            is a subclass of ``Exception``, so handlers written for the
            generic exception keep working.
    """
    # Stop at the first match instead of materializing every match in a list.
    match = next(
        (hw for hw in self.get_hardware_instances() if hw.id == hardware_instance_id),
        None,
    )
    if match is None:
        raise ValueError(f"Invalid hardware instance id {hardware_instance_id}")
    return match.cluster_id
7280
7381
7482@contextmanager
0 commit comments