Skip to content

Latest commit

 

History

History
40 lines (31 loc) · 1.53 KB

CreateRagDeploymentRequest.md

File metadata and controls

40 lines (31 loc) · 1.53 KB

CreateRagDeploymentRequest

Properties

| Name | Type | Description | Notes |
| ---- | ---- | ----------- | ----- |
| name | str | | |
| cluster_id | int | | |
| hardware_instance_id | int | | |
| recipe | CServeV2RecipeInput | | |
| hf_token | str | | [optional] |
| llm_model | str | | |
| centml_api_key | str | | |
| min_scale | int | | [optional] [default to 1] |
| max_scale | int | | [optional] [default to 1] |
| endpoint_certificate_authority | str | | [optional] |
| concurrency | int | | [optional] |
| env_vars | Dict[str, str] | | [optional] |

Example

from platform_api_python_client.models.create_rag_deployment_request import CreateRagDeploymentRequest

# TODO update the JSON string below; "{}" is only a placeholder and should be
# replaced with a payload carrying the properties not marked [optional] above
json = "{}"
# create an instance of CreateRagDeploymentRequest from a JSON string
create_rag_deployment_request_instance = CreateRagDeploymentRequest.from_json(json)
# print the JSON string representation of the object
# (serialize the instance built above; calling to_json() on the class itself
# has no object to serialize)
print(create_rag_deployment_request_instance.to_json())

# convert the object into a dict
create_rag_deployment_request_dict = create_rag_deployment_request_instance.to_dict()
# create an instance of CreateRagDeploymentRequest from a dict
create_rag_deployment_request_from_dict = CreateRagDeploymentRequest.from_dict(create_rag_deployment_request_dict)

[Back to Model list] [Back to API list] [Back to README]