Models
Create a Model
Creates a new custom model for the workspace. Provider credentials in the configuration are encrypted using the workspace encryption key before being persisted.
import orq_ai_sdk
from orq_ai_sdk import Orq
import os
# Example: create a new custom model for the workspace.
# The client is opened as a context manager; the API key is read from the
# ORQ_API_KEY environment variable (empty string when it is unset).
# NOTE: the "<id>" and "<value>" strings look like placeholders; substitute
# real values before running.
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    res = orq.models.create(
        configuration={},
        display_name="Albert_Emmerich25",
        has_functions=False,
        id="<id>",
        input_cost=2127.52,
        metadata=orq_ai_sdk.ModelMetadata(
            is_private=False,
        ),
        model_developer="<value>",
        model_family="<value>",
        model_id="<id>",
        model_type="<value>",
        output_cost=5446,
        parameters=[
            {
                "config": {},
                "name": "<value>",
                "parameter": "<value>",
                "parameter_type": "<value>",
            },
        ],
        provider="<value>",
    )

    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"configuration": Dict[str, Any], # required
"display_name": str, # required
"has_functions": bool, # required
"id": str, # required
"input_cost": float, # required
"metadata": { # required
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool, # required
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_1h": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_5m": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"input": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"output": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"reasoning": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"variants": { # optional
"cache_read": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_1h": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_5m": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"input": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"output": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"reasoning": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"when": str, # required
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": str, # required
"model_family": str, # required
"model_id": str, # required
"model_type": str, # required
"output_cost": float, # required
"parameters": { # required
"config": Dict[str, Any], # required
"description": Optional[str],
"hints": Optional[str],
"name": str, # required
"parameter": str, # required
"parameter_type": str, # required
"position": Optional[int],
},
"provider": str, # required
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Create Autorouter
Creates an autorouter model that routes between a strong and economical source model based on the requested profile. Both source models must already exist for the workspace and be marked autorouter-eligible in master data.
from orq_ai_sdk import Orq
import os
# Example: create an autorouter model from a strong and an economical model.
# The client is opened as a context manager; the API key is read from the
# ORQ_API_KEY environment variable (empty string when it is unset).
# NOTE: the "<key>" and "<value>" strings look like placeholders; substitute
# real values before running.
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    res = orq.models.create_autorouter(
        economical_model="<value>",
        key="<key>",
        strong_model="<value>",
    )

    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"economical_model": str, # required
"key": str, # required
"strong_model": str, # required
"profile": Optional[str],
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Update Autorouter
Re-configures an autorouter model. Each of key/strong_model/economical_model/profile falls back to the existing value when omitted. Changing the key enforces uniqueness and rewrites PRICING_KV.
from orq_ai_sdk import Orq
import os
# Example: update an existing autorouter model, passing only its id.
# The client is opened as a context manager; the API key is read from the
# ORQ_API_KEY environment variable (empty string when it is unset).
# NOTE: "<id>" looks like a placeholder; substitute a real value before running.
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    res = orq.models.update_autorouter(id="<id>")

    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"id": str, # required
"economical_model": Optional[str],
"key": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Create AWS Bedrock
Registers an AWS Bedrock inference profile as a custom model for the workspace. Credentials are resolved at request time via either the integration reference or pod-identity — nothing is stored with the model.
from orq_ai_sdk import Orq
import os

# The API key is read from the ORQ_API_KEY environment variable ("" if unset).
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    # All five keyword arguments below are marked required in the parameter list.
    res = orq.models.create_aws_bedrock(
        auth_mode="<value>",
        display_name="Shanon.Wintheiser",
        model_developer="<value>",
        model_id="<id>",
        region="<value>",
    )
    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"auth_mode": str, # required
"display_name": str, # required
"model_developer": str, # required
"model_id": str, # required
"region": str, # required
"assume_role_arn": Optional[str],
"assume_role_external_id": Optional[str],
"description": Optional[str],
"has_reasoning": Optional[bool],
"input_cost": Optional[float],
"integration_id": Optional[str],
"max_tokens": Optional[int],
"model_family": Optional[str],
"model_type": Optional[str],
"output_cost": Optional[float],
"supports_adaptive_reasoning": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_json_mode": Optional[bool],
"supports_json_schema": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_vision": Optional[bool],
"temperature": Optional[float],
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Validate AWS Bedrock
Performs a live Bedrock Converse probe to verify the inference profile ARN and credentials, then best-effort enriches the response from known system models.
from orq_ai_sdk import Orq
import os

# The API key is read from the ORQ_API_KEY environment variable ("" if unset).
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    # The return value is not captured in this example.
    orq.models.validate_aws_bedrock(
        auth_mode="<value>",
        inference_profile_arn="<value>",
        region="<value>",
    )
    # Use the SDK ...
Show Parameters
Show Parameters
{
"auth_mode": str, # required
"inference_profile_arn": str, # required
"region": str, # required
"assume_role_arn": Optional[str],
"assume_role_external_id": Optional[str],
"integration_id": Optional[str],
}
Update AWS Bedrock
Updates an AWS Bedrock custom model. ARN changes are format-validated (live AWS validation lives in the dedicated validate endpoint). Configuration and metadata are spread-merged. Parameters are replaced only when the request produces a non-empty list.
from orq_ai_sdk import Orq
import os

# The API key is read from the ORQ_API_KEY environment variable ("" if unset).
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    # Only `id` is required; every other field in the parameter list is optional.
    res = orq.models.update_aws_bedrock(id="<id>")
    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"id": str, # required
"assume_role_arn": Optional[str],
"assume_role_external_id": Optional[str],
"description": Optional[str],
"display_name": Optional[str],
"has_reasoning": Optional[bool],
"input_cost": Optional[float],
"max_tokens": Optional[int],
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": Optional[str],
"model_type": Optional[str],
"output_cost": Optional[float],
"region": Optional[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_json_mode": Optional[bool],
"supports_json_schema": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_vision": Optional[bool],
"temperature": Optional[float],
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Azure Foundry Deployments
Lists Azure Foundry deployments under the given base_url and joins each entry with the Orq master-data row. Only OpenAI-developed deployments in succeeded state with chat/completion/embedding/vision model types are returned.
from orq_ai_sdk import Orq
import os

# The API key is read from the ORQ_API_KEY environment variable ("" if unset).
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    # `api_key` here is an argument of the call itself, separate from the
    # ORQ_API_KEY value passed to the client above.
    res = orq.models.azure_foundry_deployments(
        api_key="<value>",
        base_url="https://admired-overcoat.info",
        provider="<value>",
    )
    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"api_key": str, # required
"base_url": str, # required
"provider": str, # required
"api_version": Optional[str],
}
Show Response
Show Response
{
"deployments": {
"id": str,
"master_data": { # optional
"has_functions": bool,
"id": str,
"input_cost": float,
"metadata": Dict[str, Any],
"model_developer": Nullable[str],
"model_family": Nullable[str],
"model_id": str,
"model_type": str,
"output_cost": float,
"parameters": List[Any],
},
"model": str,
},
"region": str,
}
Import LiteLLM
Bulk-imports a list of LiteLLM model definitions into the workspace model garden.
from orq_ai_sdk import Orq
import os

# The API key is read from the ORQ_API_KEY environment variable ("" if unset).
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    # `request` is a list of model definitions; this example sends one entry.
    res = orq.models.import_litellm(
        request=[
            {
                "litellm_params": {
                    "merge_reasoning_content_in_choices": False,
                    "model": "CX-9",
                    "use_in_pass_through": False,
                    "use_litellm_proxy": False,
                },
                "model_info": {
                    "db_model": True,
                    "id": "<id>",
                    "key": "<key>",
                    "litellm_provider": "<value>",
                    "mode": "<value>",
                },
                "model_name": "<value>",
            },
        ]
    )
    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"request": List[LiteLLMModel], # required
}
List LiteLLM
Fetches the list of models from the LiteLLM instance configured for the workspace. Requires a stored LiteLLM integration.
from orq_ai_sdk import Orq
import os

# The API key is read from the ORQ_API_KEY environment variable ("" if unset).
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    # This call takes no arguments in the example.
    res = orq.models.list_litellm()
    # Handle response
    print(res)
Create OpenAI Like
Creates a custom model backed by any OpenAI-compatible endpoint. The handler probes the target API with the supplied credentials before persisting the model.
from orq_ai_sdk import Orq
import os

# The API key is read from the ORQ_API_KEY environment variable ("" if unset).
with Orq(
    api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
    # `api_key` here is an argument of the call itself, separate from the
    # ORQ_API_KEY value passed to the client above.
    res = orq.models.create_openai_like(
        api_key="<value>",
        base_url="https://guilty-cap.org/",
        display_name="Richard.Beatty45",
        model_id="<id>",
        model_type="<value>",
        region="<value>",
    )
    # Handle response
    print(res)
Show Parameters
Show Parameters
{
"api_key": str, # required
"base_url": str, # required
"display_name": str, # required
"model_id": str, # required
"model_type": str, # required
"region": str, # required
"cost_per_image": Optional[float],
"description": Optional[str],
"has_reasoning": Optional[bool],
"input_cost": Optional[float],
"max_tokens": Optional[int],
"output_cost": Optional[float],
"supports_image_edit": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_vision": Optional[bool],
"temperature": Optional[float],
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Update OpenAI Like
Updates an OpenAI-compatible custom model. Live-re-probes the target API when base_url or model_id changes, using the stored encrypted api_key. Metadata is merged (existing preserved, new overrides).
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
res = orq.models.update_openai_like(id="<id>", display_name="Verlie82", model_type="<value>", region="<value>")
# Handle response
print(res)
Show Parameters
Show Parameters
{
"id": str, # required
"display_name": str, # required
"model_type": str, # required
"region": str, # required
"base_url": Optional[str],
"cost_per_image": Optional[float],
"description": Optional[str],
"has_reasoning": Optional[bool],
"input_cost": Optional[float],
"max_tokens": Optional[int],
"model_id": Optional[str],
"output_cost": Optional[float],
"supports_image_edit": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_vision": Optional[bool],
"temperature": Optional[float],
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Validate a Model
Validates a provider endpoint by performing a minimal live probe. Currently supports Azure OpenAI. Response includes the resolved region, whether the model is known to Orq, and either the full model document or a synthesized default.
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
orq.models.validate(api_key="<value>", provider="<value>")
# Use the SDK ...
Show Parameters
Show Parameters
{
"api_key": str, # required
"provider": str, # required
"api_version": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"subtype": Optional[str],
}
Create Vertex
Registers a Google Vertex AI model as a custom model for the workspace. The service account credentials are probed against Vertex AI with a minimal GenerateContent call before persisting.
import orq_ai_sdk
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
res = orq.models.create_vertex(configuration=orq_ai_sdk.VertexConfiguration(
location="<value>",
model_configuration=orq_ai_sdk.VertexModelConfiguration(
capabilities=orq_ai_sdk.VertexCapabilities(
structured_output=True,
support_tool_calling=False,
vision=True,
),
id="<id>",
input_cost=6100.6,
output_cost=4860.06,
parameters=orq_ai_sdk.VertexParameters(
max_tokens=orq_ai_sdk.VertexParamRangeInt(
max=816266,
min=370614,
),
temperature=orq_ai_sdk.VertexParamRange(
max=1989.61,
min=8564.64,
),
top_p=orq_ai_sdk.VertexParamRange(
max=3250.24,
min=8051.01,
),
),
),
project_id="<id>",
service_account={
"key": "<value>",
"key1": "<value>",
"key2": "<value>",
},
), display_name="Birdie_Bailey-Abernathy")
# Handle response
print(res)
Show Parameters
Show Parameters
{
"configuration": { # required
"location": str, # required
"model_configuration": { # required
"capabilities": { # required
"structured_output": bool, # required
"support_tool_calling": bool, # required
"vision": bool, # required
},
"id": str, # required
"input_cost": float, # required
"output_cost": float, # required
"parameters": { # required
"max_tokens": { # required
"max": int, # required
"min": int, # required
},
"temperature": { # required
"max": float, # required
"min": float, # required
},
"top_p": { # required
"max": float, # required
"min": float, # required
},
},
},
"project_id": str, # required
"service_account": Dict[str, Any], # required
},
"display_name": str, # required
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Delete a Model
Deletes a custom model from the workspace. System models cannot be deleted. Returns 200 with an explanatory message if the model is a system model or is still referenced by experiments.
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
orq.models.delete(id="<id>")
# Use the SDK ...
Show Parameters
Show Parameters
{
"id": str, # required
}
Update a Model
Updates a custom model. Only fields present in the request body are modified, except for metadata and parameters, which are fully replaced when present (preserved from the legacy handler’s behavior).
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
res = orq.models.update(id="<id>")
# Handle response
print(res)
Show Parameters
Show Parameters
{
"id": str, # required
"display_name": Optional[str],
"has_functions": Optional[bool],
"input_cost": Optional[float],
"metadata": { # optional
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool, # required
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_1h": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_5m": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"input": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"output": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"reasoning": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"variants": { # optional
"cache_read": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_1h": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"cache_write_5m": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"input": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"output": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"reasoning": { # optional
"cost": float, # required
"currency": str, # required
"per": int, # required
"unit": str, # required
},
"when": str, # required
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_type": Optional[str],
"output_cost": Optional[float],
"parameters": { # optional
"config": Dict[str, Any],
"description": Optional[str],
"hints": Optional[str],
"id": str, # required
"is_active": Optional[bool],
"name": Optional[str],
"parameter": Optional[str],
"parameter_type": Optional[str],
"position": Optional[int],
},
}
Show Response
Show Response
{
"configuration": {
"api_key_env": Optional[str],
"api_version": Optional[str],
"auth_mode": Optional[str],
"auth_type": Optional[str],
"base_url": Optional[str],
"deployment_name": Optional[str],
"endpoint": Optional[str],
"inference_profile_arn": Optional[str],
"integration_id": Optional[str],
"is_openai_compatible": Optional[bool],
"is_tuned_model": Optional[bool],
"location": Optional[str],
"project_id": Optional[str],
"provider": str,
"region": Optional[str],
"should_use_beta_features": Optional[bool],
"subtype": Optional[str],
"workspace_id": Optional[str],
},
"created": date,
"description": Nullable[str],
"display_name": str,
"docs_url": Nullable[str],
"enabled": bool,
"enabled_for_endpoints": bool,
"enabled_for_playground": bool,
"has_cpu_pricing": bool,
"has_functions": bool,
"id": str,
"input_cost": Nullable[float],
"input_currency": str,
"is_active": bool,
"metadata": {
"allowed_passthrough_parameters": List[str],
"autorouter": { # optional
"economical_model": Optional[str],
"id": Optional[str],
"profile": Optional[str],
"strong_model": Optional[str],
"version": Optional[str],
},
"cached_image_input_cost": Optional[float],
"cached_input_cost": Optional[float],
"chain_of_thought": Optional[bool],
"context_length": Optional[int],
"context_window": Optional[int],
"cost_efficiency_rating": Optional[int],
"cost_per_image": Optional[float],
"deprecation_date": Optional[str],
"embedding_dimensions": Optional[int],
"extended_context_pricing_mode": Optional[str],
"extended_context_threshold": Optional[int],
"generate_audio": Optional[bool],
"image_input_cost": Optional[float],
"image_output_cost": Optional[float],
"image_token_cost": Optional[float],
"intelligence_rating": Optional[int],
"is_private": bool,
"is_realtime": Optional[bool],
"knowledge_cutoff": Optional[str],
"max_images_per_request": Optional[int],
"max_input_tokens": Optional[int],
"max_output_tokens": Optional[int],
"million_searches_cost": Optional[float],
"million_tokens_above_128k_cache_read_cost": Optional[float],
"million_tokens_above_128k_cache_write_cost": Optional[float],
"million_tokens_above_128k_input_cost": Optional[float],
"million_tokens_above_128k_output_cost": Optional[float],
"million_tokens_above_200k_cache_read_cost": Optional[float],
"million_tokens_above_200k_cache_write_cost": Optional[float],
"million_tokens_above_200k_input_cost": Optional[float],
"million_tokens_above_200k_output_cost": Optional[float],
"million_tokens_audio_input_cost": Optional[float],
"million_tokens_audio_output_cost": Optional[float],
"million_tokens_batches_input_cost": Optional[float],
"million_tokens_batches_output_cost": Optional[float],
"million_tokens_cache_read_cost": Optional[float],
"million_tokens_cache_write_1h_cost": Optional[float],
"million_tokens_cache_write_5m_cost": Optional[float],
"million_tokens_cache_write_cost": Optional[float],
"million_tokens_input_cost": Optional[float],
"million_tokens_output_cost": Optional[float],
"million_tokens_reasoning_cost": Optional[float],
"multilingual": Optional[bool],
"offline": Optional[bool],
"per_video_second_cost": Optional[float],
"per_video_second_cost_1080p": Optional[float],
"pricing": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"variants": { # optional
"cache_read": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_1h": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"cache_write_5m": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"input": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"output": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"reasoning": { # optional
"cost": float,
"currency": str,
"per": int,
"unit": str,
},
"when": str,
},
},
"reasoning_cost": Optional[float],
"reasoning_tokens": Optional[int],
"region": Optional[str],
"speed_rating": Optional[int],
"supported_video_aspect_ratios": List[str],
"supported_video_durations": List[int],
"supported_video_frame_images": List[str],
"supported_video_resolutions": List[str],
"supported_video_sizes": List[str],
"supports_adaptive_reasoning": Optional[bool],
"supports_audio_input": Optional[bool],
"supports_audio_output": Optional[bool],
"supports_b64_json_response_format": Optional[bool],
"supports_batch_api": Optional[bool],
"supports_code_execution": Optional[bool],
"supports_commercial_use": Optional[bool],
"supports_computer_use": Optional[bool],
"supports_developer_message": Optional[bool],
"supports_direct_cost": Optional[bool],
"supports_distillation": Optional[bool],
"supports_extended_thinking": Optional[bool],
"supports_fine_tuning": Optional[bool],
"supports_image_edit": Optional[bool],
"supports_image_input": Optional[bool],
"supports_image_output": Optional[bool],
"supports_images": Optional[bool],
"supports_json_mode_response_format": Optional[bool],
"supports_json_schema_response_format": Optional[bool],
"supports_max_completion_tokens": Optional[bool],
"supports_openai_sdk": Optional[bool],
"supports_parallel_tool_calls": Optional[bool],
"supports_pdf_input": Optional[bool],
"supports_prompt_caching": Optional[bool],
"supports_reasoning": Optional[bool],
"supports_reasoning_effort_default": Optional[bool],
"supports_reasoning_effort_high": Optional[bool],
"supports_reasoning_effort_low": Optional[bool],
"supports_reasoning_effort_medium": Optional[bool],
"supports_reasoning_effort_minimal": Optional[bool],
"supports_reasoning_effort_none": Optional[bool],
"supports_reasoning_effort_xhigh": Optional[bool],
"supports_responses_api": Optional[bool],
"supports_sampling_params": Optional[bool],
"supports_streaming": Optional[bool],
"supports_strict_tool": Optional[bool],
"supports_structured_outputs": Optional[bool],
"supports_system_message": Optional[bool],
"supports_text": Optional[bool],
"supports_text_input": Optional[bool],
"supports_text_output": Optional[bool],
"supports_tool_calling": Optional[bool],
"supports_tool_choice": Optional[bool],
"supports_url_context": Optional[bool],
"supports_url_response_format": Optional[bool],
"supports_video_input": Optional[bool],
"supports_video_output": Optional[bool],
"supports_video_seed": Optional[bool],
"supports_vision": Optional[bool],
"supports_web_search": Optional[bool],
"supports_zdr": Optional[bool],
"thinking_enforced": Optional[bool],
},
"model_developer": Optional[str],
"model_family": Optional[str],
"model_id": str,
"model_type": str,
"output_cost": Nullable[float],
"output_currency": str,
"owner": str,
"parameters": {
"config": Dict[str, Any],
"description": Nullable[str],
"hints": Optional[str],
"id": str,
"is_active": bool,
"name": str,
"parameter": str,
"parameter_type": str,
"position": Optional[int],
},
"pricing_url": Nullable[str],
"provider": str,
"ref_id": str,
"updated": date,
}
Enable a Model
Adds the model to the workspace’s enabled set. Idempotent: re-enabling an already-enabled model returns 204 with no state change.
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
orq.models.enable(model_id="<id>")
# Use the SDK ...
Show Parameters
Show Parameters
{
"model_id": str, # required
}
Disable a Model
Removes the model from the workspace’s enabled set. Idempotent: disabling an already-disabled model returns 204.
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
orq.models.disable(model_id="<id>")
# Use the SDK ...
Show Parameters
Show Parameters
{
"model_id": str, # required
}
List Models
Lists all models available through the AI Router. Returns each model in OpenAI-compatible shape with its provider, ID, and creation timestamp.
from orq_ai_sdk import Orq
import os
with Orq(
api_key=os.getenv("ORQ_API_KEY", ""),
) as orq:
res = orq.models.list()
# Handle response
print(res)
Show Response
Show Response
{
"data": {
"created": int,
"id": str,
"object": Literal["model"],
"owned_by": str,
},
"object": Literal["list"],
}