|
Up
|
|
|
|
|
access.md
|
|
|
|
|
activates-a-deployment-associated-with-an-environment.md
|
|
|
|
|
activates-a-deployment.md
|
|
|
|
|
activates-a-development-deployment.md
|
|
|
|
|
advanced-features.md
|
|
|
|
|
all-mpnet-base-v2.md
|
|
|
|
|
api-keys.md
|
|
|
|
|
async.md
|
|
|
|
|
autoscaling-engines.md
|
|
|
|
|
autoscaling.md
|
|
|
|
|
b10cache.md
|
|
|
|
|
base-images.md
|
|
|
|
|
basics.md
|
|
|
|
|
bei-bert.md
|
|
|
|
|
bei-reference.md
|
|
|
|
|
bei.md
|
|
|
|
|
binary.md
|
|
|
|
|
binaryio.md
|
|
|
|
|
bis-llm-config.md
|
|
|
|
|
build-commands.md
|
|
|
|
|
build-your-first-model.md
|
|
|
|
|
cache.md
|
|
|
|
|
calling-your-model.md
|
|
|
|
|
cancel-async-request.md
|
|
|
|
|
cancel-promotion.md
|
|
|
|
|
chains-audio-transcription.md
|
|
|
|
|
chains-build-rag.md
|
|
|
|
|
chains-cli.md
|
|
|
|
|
chains.md
|
|
|
|
|
chat-completions.md
|
|
|
|
|
checkpointing.md
|
|
|
|
|
cleanup.md
|
|
|
|
|
code-first-development.md
|
|
|
|
|
comfyui.md
|
|
|
|
|
concepts.md
|
|
|
|
|
concurrency.md
|
|
|
|
|
configuration.md
|
|
|
|
|
configure.md
|
|
|
|
|
container.md
|
|
|
|
|
create-a-chain-environment.md
|
|
|
|
|
create-an-environment.md
|
|
|
|
|
create-training-project.md
|
|
|
|
|
creates-a-team-api-key.md
|
|
|
|
|
creates-a-team-training-project.md
|
|
|
|
|
creates-an-api-key.md
|
|
|
|
|
custom-engine-builder.md
|
|
|
|
|
custom-health-checks.md
|
|
|
|
|
custom-server.md
|
|
|
|
|
data-directory.md
|
|
|
|
|
datadog.md
|
|
|
|
|
deactivates-a-deployment-associated-with-an-environment.md
|
|
|
|
|
deactivates-a-deployment.md
|
|
|
|
|
deactivates-a-development-deployment.md
|
|
|
|
|
deepseek-r1-qwen-7b.md
|
|
|
|
|
deepseek-r1.md
|
|
|
|
|
delete-an-api-key.md
|
|
|
|
|
deletes-a-chain-by-id.md
|
|
|
|
|
deletes-a-chain-deployment-by-id.md
|
|
|
|
|
deletes-a-model-by-id.md
|
|
|
|
|
deletes-a-models-deployment-by-id.md
|
|
|
|
|
deploy-and-iterate.md
|
|
|
|
|
deploy-your-first-model.md
|
|
|
|
|
deploy.md
|
|
|
|
|
deployment-async-predict.md
|
|
|
|
|
deployment-async-run-remote.md
|
|
|
|
|
deployment-from-training-and-s3.md
|
|
|
|
|
deployment-get-async-queue-status.md
|
|
|
|
|
deployment-predict.md
|
|
|
|
|
deployment-run-remote.md
|
|
|
|
|
deployment-wake.md
|
|
|
|
|
deployment-websocket.md
|
|
|
|
|
deployment.md
|
|
|
|
|
deployments.md
|
|
|
|
|
deprecation.md
|
|
|
|
|
design.md
|
|
|
|
|
development-async-predict.md
|
|
|
|
|
development-async-run-remote.md
|
|
|
|
|
development-get-async-queue-status.md
|
|
|
|
|
development-predict.md
|
|
|
|
|
development-run-remote.md
|
|
|
|
|
development-wake.md
|
|
|
|
|
development-websocket.md
|
|
|
|
|
docker.md
|
|
|
|
|
download-training-job.md
|
|
|
|
|
engine-builder-config.md
|
|
|
|
|
engine-builder-customization.md
|
|
|
|
|
engine-builder-models.md
|
|
|
|
|
engine-builder-overview.md
|
|
|
|
|
environments-async-predict.md
|
|
|
|
|
environments-async-run-remote.md
|
|
|
|
|
environments-get-async-queue-status.md
|
|
|
|
|
environments-predict.md
|
|
|
|
|
environments-run-remote.md
|
|
|
|
|
environments-websocket.md
|
|
|
|
|
environments.md
|
|
|
|
|
errorhandling.md
|
|
|
|
|
files.md
|
|
|
|
|
flux-schnell.md
|
|
|
|
|
function-calling.md
|
|
|
|
|
gemma-3-27b-it.md
|
|
|
|
|
get-a-chain-environments-details.md
|
|
|
|
|
get-all-chain-environments.md
|
|
|
|
|
get-all-environments.md
|
|
|
|
|
get-an-environments-details.md
|
|
|
|
|
get-async-request-status.md
|
|
|
|
|
get-training-job-checkpoint-files.md
|
|
|
|
|
get-training-job-checkpoints.md
|
|
|
|
|
get-training-job-logs.md
|
|
|
|
|
get-training-job-metrics.md
|
|
|
|
|
get-training-job.md
|
|
|
|
|
get-training-projects.md
|
|
|
|
|
gets-a-chain-by-id.md
|
|
|
|
|
gets-a-chain-deployment-by-id.md
|
|
|
|
|
gets-a-model-by-id.md
|
|
|
|
|
gets-a-models-deployment-by-id.md
|
|
|
|
|
gets-a-models-development-deployment.md
|
|
|
|
|
gets-a-models-production-deployment.md
|
|
|
|
|
gets-all-chain-deployments.md
|
|
|
|
|
gets-all-chains.md
|
|
|
|
|
gets-all-deployments-of-a-model.md
|
|
|
|
|
gets-all-instance-types.md
|
|
|
|
|
gets-all-models.md
|
|
|
|
|
gets-all-secrets.md
|
|
|
|
|
gets-all-team-secrets.md
|
|
|
|
|
gets-instance-type-prices.md
|
|
|
|
|
getting-started.md
|
|
|
|
|
grafana.md
|
|
|
|
|
grpc.md
|
|
|
|
|
health.md
|
|
|
|
|
howbasetenworks.md
|
|
|
|
|
image-generation.md
|
|
|
|
|
image.md
|
|
|
|
|
implementation.md
|
|
|
|
|
index.md
|
|
|
|
|
inference.md
|
|
|
|
|
init.md
|
|
|
|
|
integrations.md
|
|
|
|
|
invocation.md
|
|
|
|
|
kokoro.md
|
|
|
|
|
lifecycle.md
|
|
|
|
|
list-training-jobs.md
|
|
|
|
|
lists-all-teams.md
|
|
|
|
|
lists-the-users-api-keys.md
|
|
|
|
|
llama-33-70b-instruct.md
|
|
|
|
|
llms-full.txt
|
|
|
|
|
llms.txt
|
|
|
|
|
loading.md
|
|
|
|
|
localdev.md
|
|
|
|
|
login.md
|
|
|
|
|
lookahead-decoding.md
|
|
|
|
|
lora-support.md
|
|
|
|
|
management.md
|
|
|
|
|
mars6.md
|
|
|
|
|
metrics.md
|
|
|
|
|
model-cache.md
|
|
|
|
|
model-logs.md
|
|
|
|
|
multinode.md
|
|
|
|
|
new-relic.md
|
|
|
|
|
nomic-embed-v1-5.md
|
|
|
|
|
overview.md
|
|
|
|
|
performance-client.md
|
|
|
|
|
performance-optimization.md
|
|
|
|
|
predict.md
|
|
|
|
|
private-registries.md
|
|
|
|
|
production-wake.md
|
|
|
|
|
prometheus.md
|
|
|
|
|
promotes-a-chain-deployment-to-an-environment.md
|
|
|
|
|
promotes-a-deployment-to-an-environment.md
|
|
|
|
|
promotes-a-deployment-to-production.md
|
|
|
|
|
promotes-a-development-deployment-to-production.md
|
|
|
|
|
push.md
|
|
|
|
|
quantization-guide.md
|
|
|
|
|
quickstart.md
|
|
|
|
|
qwen-2-5-32b-coder-instruct.md
|
|
|
|
|
rate-limits-and-budgets.md
|
|
|
|
|
reasoning.md
|
|
|
|
|
recreate-training-job.md
|
|
|
|
|
requests.md
|
|
|
|
|
resources.md
|
|
|
|
|
responses.md
|
|
|
|
|
restricted-environments.md
|
|
|
|
|
run-python.md
|
|
|
|
|
sdxl-lightning.md
|
|
|
|
|
search-training-jobs.md
|
|
|
|
|
secrets.md
|
|
|
|
|
security.md
|
|
|
|
|
sglang.md
|
|
|
|
|
speculative-decoding.md
|
|
|
|
|
status.md
|
|
|
|
|
stop-training-job.md
|
|
|
|
|
streaming.md
|
|
|
|
|
structured-output.md
|
|
|
|
|
structured-outputs.md
|
|
|
|
|
stub.md
|
|
|
|
|
subclassing.md
|
|
|
|
|
supported-metrics.md
|
|
|
|
|
teams.md
|
|
|
|
|
tensorrt-llm.md
|
|
|
|
|
text-to-speech.md
|
|
|
|
|
torch-compile-cache.md
|
|
|
|
|
tracing.md
|
|
|
|
|
training-cli.md
|
|
|
|
|
training.md
|
|
|
|
|
truss-configuration.md
|
|
|
|
|
truss.md
|
|
|
|
|
update-a-chain-environments-settings.md
|
|
|
|
|
update-a-chainlet-environments-autoscaling-settings.md
|
|
|
|
|
update-a-chainlet-environments-instance-type-settings.md
|
|
|
|
|
update-an-environments-settings.md
|
|
|
|
|
updates-a-deployments-autoscaling-settings.md
|
|
|
|
|
updates-a-development-deployments-autoscaling-settings.md
|
|
|
|
|
upserts-a-secret.md
|
|
|
|
|
upserts-a-team-secret.md
|
|
|
|
|
usage.md
|
|
|
|
|
vllm.md
|
|
|
|
|
watch.md
|
|
|
|
|
websockets.md
|
|
|
|
|
whisper-v3-fastest.md
|
|
|
|
|
whoami.md
|
|
|
|
|
whybaseten.md
|
|
|
|