@@ -105,7 +105,7 @@ async def list_deployments(
105
105
106
106
res = self ._request (
107
107
"GET" ,
108
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments" ,
108
+ f"/inference/v1beta1/regions/{ param_region } /deployments" ,
109
109
params = {
110
110
"name" : name ,
111
111
"order_by" : order_by ,
@@ -196,7 +196,7 @@ async def get_deployment(
196
196
197
197
res = self ._request (
198
198
"GET" ,
199
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } " ,
199
+ f"/inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } " ,
200
200
)
201
201
202
202
self ._throw_on_error (res )
@@ -287,14 +287,14 @@ async def create_deployment(
287
287
288
288
res = self ._request (
289
289
"POST" ,
290
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments" ,
290
+ f"/inference/v1beta1/regions/{ param_region } /deployments" ,
291
291
body = marshal_CreateDeploymentRequest (
292
292
CreateDeploymentRequest (
293
293
model_name = model_name ,
294
294
node_type = node_type ,
295
295
endpoints = endpoints ,
296
296
region = region ,
297
- name = name or random_name (prefix = "llm " ),
297
+ name = name or random_name (prefix = "inference " ),
298
298
project_id = project_id ,
299
299
accept_eula = accept_eula ,
300
300
tags = tags ,
@@ -344,7 +344,7 @@ async def update_deployment(
344
344
345
345
res = self ._request (
346
346
"PATCH" ,
347
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } " ,
347
+ f"/inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } " ,
348
348
body = marshal_UpdateDeploymentRequest (
349
349
UpdateDeploymentRequest (
350
350
deployment_id = deployment_id ,
@@ -389,7 +389,7 @@ async def delete_deployment(
389
389
390
390
res = self ._request (
391
391
"DELETE" ,
392
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } " ,
392
+ f"/inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } " ,
393
393
)
394
394
395
395
self ._throw_on_error (res )
@@ -424,7 +424,7 @@ async def get_deployment_certificate(
424
424
425
425
res = self ._request (
426
426
"GET" ,
427
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /certificate" ,
427
+ f"/inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /certificate" ,
428
428
)
429
429
430
430
self ._throw_on_error (res )
@@ -460,7 +460,7 @@ async def create_endpoint(
460
460
461
461
res = self ._request (
462
462
"POST" ,
463
- f"/llm- inference/v1beta1/regions/{ param_region } /endpoints" ,
463
+ f"/inference/v1beta1/regions/{ param_region } /endpoints" ,
464
464
body = marshal_CreateEndpointRequest (
465
465
CreateEndpointRequest (
466
466
deployment_id = deployment_id ,
@@ -505,7 +505,7 @@ async def update_endpoint(
505
505
506
506
res = self ._request (
507
507
"PATCH" ,
508
- f"/llm- inference/v1beta1/regions/{ param_region } /endpoints/{ param_endpoint_id } " ,
508
+ f"/inference/v1beta1/regions/{ param_region } /endpoints/{ param_endpoint_id } " ,
509
509
body = marshal_UpdateEndpointRequest (
510
510
UpdateEndpointRequest (
511
511
endpoint_id = endpoint_id ,
@@ -546,7 +546,7 @@ async def delete_endpoint(
546
546
547
547
res = self ._request (
548
548
"DELETE" ,
549
- f"/llm- inference/v1beta1/regions/{ param_region } /endpoints/{ param_endpoint_id } " ,
549
+ f"/inference/v1beta1/regions/{ param_region } /endpoints/{ param_endpoint_id } " ,
550
550
)
551
551
552
552
self ._throw_on_error (res )
@@ -583,7 +583,7 @@ async def list_deployment_acl_rules(
583
583
584
584
res = self ._request (
585
585
"GET" ,
586
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /acls" ,
586
+ f"/inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /acls" ,
587
587
params = {
588
588
"page" : page ,
589
589
"page_size" : page_size or self .client .default_page_size ,
@@ -660,7 +660,7 @@ async def add_deployment_acl_rules(
660
660
661
661
res = self ._request (
662
662
"POST" ,
663
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /acls" ,
663
+ f"/inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /acls" ,
664
664
body = marshal_AddDeploymentACLRulesRequest (
665
665
AddDeploymentACLRulesRequest (
666
666
deployment_id = deployment_id ,
@@ -704,7 +704,7 @@ async def set_deployment_acl_rules(
704
704
705
705
res = self ._request (
706
706
"PUT" ,
707
- f"/llm- inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /acls" ,
707
+ f"/inference/v1beta1/regions/{ param_region } /deployments/{ param_deployment_id } /acls" ,
708
708
body = marshal_SetDeploymentACLRulesRequest (
709
709
SetDeploymentACLRulesRequest (
710
710
deployment_id = deployment_id ,
@@ -744,7 +744,7 @@ async def delete_deployment_acl_rule(
744
744
745
745
res = self ._request (
746
746
"DELETE" ,
747
- f"/llm- inference/v1beta1/regions/{ param_region } /acls/{ param_acl_id } " ,
747
+ f"/inference/v1beta1/regions/{ param_region } /acls/{ param_acl_id } " ,
748
748
)
749
749
750
750
self ._throw_on_error (res )
@@ -784,7 +784,7 @@ async def list_models(
784
784
785
785
res = self ._request (
786
786
"GET" ,
787
- f"/llm- inference/v1beta1/regions/{ param_region } /models" ,
787
+ f"/inference/v1beta1/regions/{ param_region } /models" ,
788
788
params = {
789
789
"name" : name ,
790
790
"order_by" : order_by ,
@@ -870,7 +870,7 @@ async def get_model(
870
870
871
871
res = self ._request (
872
872
"GET" ,
873
- f"/llm- inference/v1beta1/regions/{ param_region } /models/{ param_model_id } " ,
873
+ f"/inference/v1beta1/regions/{ param_region } /models/{ param_model_id } " ,
874
874
)
875
875
876
876
self ._throw_on_error (res )
@@ -902,7 +902,7 @@ async def get_model_eula(
902
902
903
903
res = self ._request (
904
904
"GET" ,
905
- f"/llm- inference/v1beta1/regions/{ param_region } /models/{ param_model_id } /eula" ,
905
+ f"/inference/v1beta1/regions/{ param_region } /models/{ param_model_id } /eula" ,
906
906
)
907
907
908
908
self ._throw_on_error (res )
@@ -939,7 +939,7 @@ async def list_node_types(
939
939
940
940
res = self ._request (
941
941
"GET" ,
942
- f"/llm- inference/v1beta1/regions/{ param_region } /node-types" ,
942
+ f"/inference/v1beta1/regions/{ param_region } /node-types" ,
943
943
params = {
944
944
"include_disabled_types" : include_disabled_types ,
945
945
"page" : page ,
0 commit comments