Getting Started
Spaces Guide
Tools Guide
Developer Guide
API REFERENCE
- Spaces
- Data
- Chat
- Assistants
- Documents
PULZE ACADEMY
Update Space And Models
Update a Space’s configuration.
curl --request PUT \
--url https://api.pulze.ai/v1/apps/update \
--header 'Authorization: Bearer <token>' \
--header 'Content-Type: application/json' \
--data '{
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"sandbox_of": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"use_parent_custom_data": true,
"benchmark_model_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"name": "<string>",
"description": "<string>",
"app_logo": "<string>",
"weights": {
"cost": 0,
"latency": 0,
"quality": 1
},
"policies": {
"privacy_level": 1,
"max_cost": 0.02,
"max_switch_model_retries": 1,
"max_same_model_retries": 1,
"optimize_internal_requests": 0,
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
},
"has_failover_chain": true,
"settings": {
"assistant_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"assistant_version_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"instructions": "<string>",
"max_tokens": 4096,
"temperature": 0.7
}
}'
{
"main": {
"app": {
"auth0_id": "<string>",
"modified_by": "<string>",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"hashed_key": "<string>",
"key_end": "<string>",
"name": "<string>",
"description": "<string>",
"app_logo": "<string>",
"is_active": true,
"rate_limit": 123,
"has_failover_chain": true,
"weights": {
"cost": 123,
"latency": 123,
"quality": 123
},
"policies": {
"privacy_level": 1,
"max_cost": 1.0001,
"max_switch_model_retries": 2,
"max_same_model_retries": 1,
"optimize_internal_requests": 0,
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
},
"settings": {
"assistant_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"assistant_version_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"instructions": "<string>",
"max_tokens": 123,
"temperature": 0.5
},
"sandbox_of": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"use_parent_custom_data": true,
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"benchmark_model_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"benchmark_model": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt": {
"prompt": "<string>",
"title": "<string>",
"description": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"tokens": 123,
"published_on": "2023-11-07T05:31:56Z",
"reviewed_on": "2023-11-07T05:31:56Z",
"approved_on": "2023-11-07T05:31:56Z",
"decline_reason": "<string>",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
}
},
"active_models": 123,
"base_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"custom_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"failover_models": [
{
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
}
],
"current_user_permissions": [
"<string>"
]
},
"sandbox": {
"app": {
"auth0_id": "<string>",
"modified_by": "<string>",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"hashed_key": "<string>",
"key_end": "<string>",
"name": "<string>",
"description": "<string>",
"app_logo": "<string>",
"is_active": true,
"rate_limit": 123,
"has_failover_chain": true,
"weights": {
"cost": 123,
"latency": 123,
"quality": 123
},
"policies": {
"privacy_level": 1,
"max_cost": 1.0001,
"max_switch_model_retries": 2,
"max_same_model_retries": 1,
"optimize_internal_requests": 0,
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
},
"settings": {
"assistant_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"assistant_version_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"instructions": "<string>",
"max_tokens": 123,
"temperature": 0.5
},
"sandbox_of": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"use_parent_custom_data": true,
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"benchmark_model_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"benchmark_model": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt": {
"prompt": "<string>",
"title": "<string>",
"description": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"tokens": 123,
"published_on": "2023-11-07T05:31:56Z",
"reviewed_on": "2023-11-07T05:31:56Z",
"approved_on": "2023-11-07T05:31:56Z",
"decline_reason": "<string>",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
}
},
"active_models": 123,
"base_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"custom_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"failover_models": [
{
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
}
],
"current_user_permissions": [
"<string>"
]
},
"sandbox_status": "outdated"
}
Authorizations
Bearer authentication header of the form Bearer <token>, where <token> is your auth token.
Body
The app this sandbox relates to
Used to update the benchmark model
1
Prioritizes cost when selecting the most optimized models for your use case.
Prioritizes latency and reduces the time delay between submitting a request and receiving the response.
Prioritizes the quality and readability of the generated responses.
The level of privacy for a given request
0 = (UNSUPPORTED -- public logs)
1 = Log request, response and all of its metadata (Normal mode)
2 = Log neither the request prompt nor the response text. Logs are still visible, and all of the request metadata is accessible. Retrievable as a log. (TBD)
3 = Do not log at all. Internally, a minimal representation may be stored for billing: model name, tokens used, which app it belongs to, and timestamp. Not retrievable as a log. (TBD)
1, 2, 3
The maximum cost allowed for a request. Only works with compounded requests that require multiple LLM calls. If the value is reached, it will exit with an exception.
x > 0.0001
If an LLM call fails, how many other models should Pulze try, chosen by quality descending? It will be a maximum of N+1 models (original + N other models)
0 < x < 5
If an LLM call fails, how many times should Pulze retry the call to the same LLM? There will be a maximum of N+1 calls (original + N retries)
0 < x < 3
Optimize the internal / intermediate LLM requests, for a big gain in speed and cost savings, at the cost of a potential, and very slight, penalty on quality. The final request ("SYNTHESIZE") is always performed using your original settings.
0, 1
Prompt ID that we will use for requests
Response
The Auth0ID of the creator of the app
The Auth0ID of the last person to modify the table
The hashed value of the API Key which we store in our database
The last characters of the API key
A name for this app
True if the app is active (not soft-deleted, etc.), false otherwise
A Failover chain, when enabled, skips the SMART router and instead calls the failover chain in order.
Compare the results of LLMs against this model (for speed, quality, cost...)
Compare the results of LLMs against this model (for speed, quality, cost...)
True if the model supports function/tool call
True if the model supports json-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool call
True if the model supports json-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The Prompt associated to the app, if any
1 - 60
1 - 200
Reason for decline
The Org to which this App belongs
If any, the ID of the prompt associated with this app
A description for this app
A logo for this app
Prioritizes cost when selecting the most optimized models for your use case.
Prioritizes latency and reduces the time delay between submitting a request and receiving the response.
Prioritizes the quality and readability of the generated responses.
The level of privacy for a given request
0 = (UNSUPPORTED -- public logs)
1 = Log request, response and all of its metadata (Normal mode)
2 = Log neither the request prompt nor the response text. Logs are still visible, and all of the request metadata is accessible. Retrievable as a log. (TBD)
3 = Do not log at all. Internally, a minimal representation may be stored for billing: model name, tokens used, which app it belongs to, and timestamp. Not retrievable as a log. (TBD)
1, 2, 3
The maximum cost allowed for a request. Only works with compounded requests that require multiple LLM calls. If the value is reached, it will exit with an exception.
x > 0.0001
If an LLM call fails, how many other models should Pulze try, chosen by quality descending? It will be a maximum of N+1 models (original + N other models)
0 < x < 5
If an LLM call fails, how many times should Pulze retry the call to the same LLM? There will be a maximum of N+1 calls (original + N retries)
0 < x < 3
Optimize the internal / intermediate LLM requests, for a big gain in speed and cost savings, at the cost of a potential, and very slight, penalty on quality. The final request ("SYNTHESIZE") is always performed using your original settings.
0, 1
Prompt ID that we will use for requests
The app might be a (testing) sandbox of a different App.
If true, the app will use the custom data of the parent app
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Used to uniquely target models when we enable/disable them
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool call
True if the model supports json-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool call
True if the model supports json-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The ID of prompt, used for this model
Whether the model is active for the app.
Whether the model is active for the org.
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Used to uniquely target models when we enable/disable them
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool call
True if the model supports json-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool call
True if the model supports json-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The ID of prompt, used for this model
Whether the model is active for the app.
Whether the model is active for the org.
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The ID of prompt, used for this model
The Auth0ID of the creator of the app
The Auth0ID of the last person to modify the table
The hashed value of the API Key which we store in our database
The last characters of the API key
A name for this app
True if the app is active (not soft-deleted, etc.), false otherwise
A Failover chain, when enabled, skips the SMART router and instead calls the failover chain in order.
Compare the results of LLMs against this model (for speed, quality, cost...)
Compare the results of LLMs against this model (for speed, quality, cost...)
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The Prompt associated to the app, if any
1 - 60
1 - 200
Reason for decline
The Org to which this App belongs
If any, the ID of the prompt associated with this app
A description for this app
A logo for this app
Prioritizes cost when selecting the most optimized models for your use case.
Prioritizes latency and reduces the time delay between submitting a request and receiving the response.
Prioritizes the quality and readability of the generated responses.
The level of privacy for a given request
0 = (UNSUPPORTED -- public logs)
1 = Log request, response and all of its metadata (Normal mode)
2 = Log neither the request prompt nor the response text. Logs are still visible, and all of the request metadata is accessible. Retrievable as a log. (TBD)
3 = Do not log at all. Internally, a minimal representation may be stored for billing: model name, tokens used, which app it belongs to, and timestamp. Not retrievable as a log. (TBD)
1
, 2
, 3
The maximum cost allowed for a request. Only works with compounded requests that require multiple LLM calls. If the value is reached, it will exit with an exception.
x > 0.0001
If an LLM call fails, how many other models should Pulze try, chosen by quality descending? It will be a maximum of N+1 models (original + N other models)
0 < x < 5
If an LLM call fails, how many times should Pulze retry the call to the same LLM? There will be a maximum of N+1 calls (original + N retries)
0 < x < 3
Optimize the internal / intermediate LLM requests, for a big gain in speed and cost savings, at the cost of a potential, and very slight, penalty on quality. The final request ("SYNTHESIZE") is always performed using your original settings.
0
, 1
Prompt ID that we will use for requests
The app might be a (testing) sandbox of a different App.
If true, the app will use the custom data of the parent app
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Used to uniquely target models when we enable/disable them
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The ID of prompt, used for this model
Whether the model is active for the app.
Whether the model is active for the org.
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Used to uniquely target models when we enable/disable them
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The ID of prompt, used for this model
Whether the model is active for the app.
Whether the model is active for the org.
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
True if the model supports function/tool calls
True if the model supports JSON-formatted responses
True if the model supports n and best_of -- i.e., multiple responses
True if the model supports frequency_penalty and presence_penalty
True if the model supports streaming responses
True if the model supports image recognition (vision)
The cost of a completion token, in USD
The cost of a prompt token, in USD
A (usually 0) cost added on top of a request. Some models charge per request, not only per token
The unit of billing for this model
tokens
, characters
The name of the model. Can belong to many providers
The fully qualified (namespaced) model name
The max_tokens for this model
The most recent data this model has been trained with
A description of the model
A URL to the model's page or more information
Whether it's rag-tuned or not
Whether it's fine-tuned or not
True if the model is open source
True if the model complies with GDPR
True if the model is of type Chat Completions, False if it's a Text Completion model.
The ID of this model
The app_id that has access to this model (if only one)
The org_id that has access to this model
The user (auth0_id) who created the model
When the model was added. Auto-populated in DB
When the model was updated. Auto-populated in DB
True if the model is publicly accessible to all
Test models are only used for testing and do not perform any LLM requests
Model has been created and shared by Pulze
This determines if the model will be available + pre-selected when users create new apps.
The provider for the model.
The owner of the model. Sometimes, for a provider/model combination, many instances exist, trained on different data
Extra model settings inferred from namespace
Store the name of the model the API requires
For models whose deprecation date is known (past or future), to show errors and deny service, or show warnings
The ID of parent, in case it's not a base model
The ID of prompt, used for this model
The ID of prompt, used for this model
The ID of prompt, used for this model
outdated
Was this page helpful?
curl --request PUT \
--url https://api.pulze.ai/v1/apps/update \
--header 'Authorization: Bearer <token>' \
--header 'Content-Type: application/json' \
--data '{
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"sandbox_of": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"use_parent_custom_data": true,
"benchmark_model_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"name": "<string>",
"description": "<string>",
"app_logo": "<string>",
"weights": {
"cost": 0,
"latency": 0,
"quality": 1
},
"policies": {
"privacy_level": 1,
"max_cost": 0.02,
"max_switch_model_retries": 1,
"max_same_model_retries": 1,
"optimize_internal_requests": 0,
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
},
"has_failover_chain": true,
"settings": {
"assistant_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"assistant_version_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"instructions": "<string>",
"max_tokens": 4096,
"temperature": 0.7
}
}'
{
"main": {
"app": {
"auth0_id": "<string>",
"modified_by": "<string>",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"hashed_key": "<string>",
"key_end": "<string>",
"name": "<string>",
"description": "<string>",
"app_logo": "<string>",
"is_active": true,
"rate_limit": 123,
"has_failover_chain": true,
"weights": {
"cost": 123,
"latency": 123,
"quality": 123
},
"policies": {
"privacy_level": 1,
"max_cost": 1.0001,
"max_switch_model_retries": 2,
"max_same_model_retries": 1,
"optimize_internal_requests": 0,
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
},
"settings": {
"assistant_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"assistant_version_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"instructions": "<string>",
"max_tokens": 123,
"temperature": 0.5
},
"sandbox_of": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"use_parent_custom_data": true,
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"benchmark_model_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"benchmark_model": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt": {
"prompt": "<string>",
"title": "<string>",
"description": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"tokens": 123,
"published_on": "2023-11-07T05:31:56Z",
"reviewed_on": "2023-11-07T05:31:56Z",
"approved_on": "2023-11-07T05:31:56Z",
"decline_reason": "<string>",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
}
},
"active_models": 123,
"base_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"custom_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"failover_models": [
{
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
}
],
"current_user_permissions": [
"<string>"
]
},
"sandbox": {
"app": {
"auth0_id": "<string>",
"modified_by": "<string>",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"hashed_key": "<string>",
"key_end": "<string>",
"name": "<string>",
"description": "<string>",
"app_logo": "<string>",
"is_active": true,
"rate_limit": 123,
"has_failover_chain": true,
"weights": {
"cost": 123,
"latency": 123,
"quality": 123
},
"policies": {
"privacy_level": 1,
"max_cost": 1.0001,
"max_switch_model_retries": 2,
"max_same_model_retries": 1,
"optimize_internal_requests": 0,
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
},
"settings": {
"assistant_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"assistant_version_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"instructions": "<string>",
"max_tokens": 123,
"temperature": 0.5
},
"sandbox_of": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"use_parent_custom_data": true,
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"benchmark_model_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"benchmark_model": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt": {
"prompt": "<string>",
"title": "<string>",
"description": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"tokens": 123,
"published_on": "2023-11-07T05:31:56Z",
"reviewed_on": "2023-11-07T05:31:56Z",
"approved_on": "2023-11-07T05:31:56Z",
"decline_reason": "<string>",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a"
}
},
"active_models": 123,
"base_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"custom_model_settings": [
{
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"active": true,
"globally_disabled": true
}
],
"failover_models": [
{
"supports_functions": true,
"supports_json": true,
"supports_n": true,
"supports_penalties": true,
"supports_stream": true,
"supports_vision": true,
"completion_token_cost": 123,
"prompt_token_cost": 123,
"base_cost": 123,
"price_unit": "tokens",
"model": "<string>",
"provider": "<string>",
"owner": "<string>",
"namespace": "<string>",
"at": "<string>",
"context_window": 123,
"until": "2023-11-07T05:31:56Z",
"description": "<string>",
"url": "<string>",
"api_target": "<string>",
"deprecated_on": "2023-11-07T05:31:56Z",
"parent_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"parent": {},
"prompt_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"is_rag": true,
"is_ft": true,
"is_open_source": true,
"is_gdpr": true,
"is_chat": true,
"id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"app_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"org_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
"added_by": "<string>",
"added_on": "2023-11-07T05:31:56Z",
"modified_on": "2023-11-07T05:31:56Z",
"is_public": true,
"is_test_model": true,
"is_pulze_owner": true,
"default_active": true
}
],
"current_user_permissions": [
"<string>"
]
},
"sandbox_status": "outdated"
}