diff --git a/providers/cloudflare-ai-gateway/generate_models.sh b/providers/cloudflare-ai-gateway/generate_models.sh
new file mode 100755
index 000000000..b9a84ba0b
--- /dev/null
+++ b/providers/cloudflare-ai-gateway/generate_models.sh
@@ -0,0 +1,392 @@
+#!/usr/bin/env bash
+#
+# Generate model TOML files for Cloudflare AI Gateway
+#
+# Required environment variables:
+#   CLOUDFLARE_API_TOKEN - Your Cloudflare API token
+#   CLOUDFLARE_ACCOUNT_ID - Your Cloudflare account ID
+#   CLOUDFLARE_GATEWAY_ID - Your AI Gateway name/ID
+#
+# Required tools: curl, jq, awk
+#
+# Usage:
+#   CLOUDFLARE_API_TOKEN=xxx CLOUDFLARE_ACCOUNT_ID=xxx CLOUDFLARE_GATEWAY_ID=xxx ./generate_models.sh
+#
+
+set -eo pipefail
+
+# =============================================================================
+# CONFIGURATION: Providers and models to include
+# =============================================================================
+
+# Providers to include ALL models from (generated with defaults)
+INCLUDE_ALL_PROVIDERS="workers-ai replicate"
+
+# Providers to cross-reference from source provider files
+CROSS_REFERENCE_PROVIDERS="openai anthropic"
+
+# For cross-referenced providers, only include these well-known models (regex patterns)
+# Format: "provider/model-pattern"
+# Use $ anchor for exact matches to avoid dated versions and variants.
+# Literal dots are escaped: an unescaped "." matches any character, so
+# "claude-haiku-4.5$" would also admit "claude-haiku-4-5" and emit a duplicate
+# model file next to the canonical one.
+WELL_KNOWN_MODELS=(
+  # OpenAI - canonical names only, no dated versions
+  'openai/gpt-5\.1$'
+  'openai/gpt-5\.1-codex$'
+  'openai/gpt-4o$'
+  'openai/gpt-4o-mini$'
+  'openai/gpt-4-turbo$'
+  'openai/gpt-4$'
+  'openai/gpt-3\.5-turbo$'
+  'openai/o1$'
+  'openai/o1-mini$'
+  'openai/o1-preview$'
+  'openai/o3$'
+  'openai/o3-mini$'
+  'openai/o3-pro$'
+  'openai/o4-mini$'
+
+  # Anthropic - canonical names only, no dated versions or duplicates
+  'anthropic/claude-sonnet-4\.5$'
+  'anthropic/claude-opus-4\.5$'
+  'anthropic/claude-haiku-4\.5$'
+  'anthropic/claude-opus-4\.1$'
+  'anthropic/claude-sonnet-4$'
+  'anthropic/claude-opus-4$'
+  'anthropic/claude-3\.5-sonnet$'
+  'anthropic/claude-3\.5-haiku$'
+  'anthropic/claude-3-opus$'
+  'anthropic/claude-3-sonnet$'
+  'anthropic/claude-3-haiku$'
+)
+
+# =============================================================================
+# Helper function to get mapped model name for source file lookup
+# =============================================================================
+# Arguments: $1 - model name with the provider prefix already removed
+# Outputs:   file stem to look up in the source provider's models directory;
+#            names without a mapping are echoed back unchanged
+get_mapped_name() {
+  local model_name="$1"
+  case "${model_name}" in
+    # Anthropic mappings (Cloudflare uses dots, source uses dashes)
+    "claude-sonnet-4.5") echo "claude-sonnet-4-5" ;;
+    "claude-opus-4.5") echo "claude-opus-4-5" ;;
+    "claude-haiku-4.5") echo "claude-haiku-4-5" ;;
+    "claude-opus-4.1") echo "claude-opus-4-1" ;;
+    "claude-sonnet-4") echo "claude-sonnet-4-0" ;;
+    "claude-opus-4") echo "claude-opus-4-0" ;;
+    "claude-3.5-sonnet") echo "claude-3-5-sonnet-20241022" ;;
+    "claude-3.5-haiku") echo "claude-3-5-haiku-latest" ;;
+    "claude-3-opus") echo "claude-3-opus-20240229" ;;
+    "claude-3-sonnet") echo "claude-3-sonnet-20240229" ;;
+    "claude-3-haiku") echo "claude-3-haiku-20240307" ;;
+    *) echo "${model_name}" ;;
+  esac
+}
+
+# =============================================================================
+# Helper function to check if a model should be included
+# =============================================================================
+# Arguments: $1 - full model ID ("provider/model-name")
+# Returns:   0 when the model should be written, 1 when it should be skipped
+should_include_model() {
+  local model_id="$1"
+  # Provider is the first path segment of the model ID
+  local provider="${model_id%%/*}"
+  local p pattern regex
+
+  # Check if provider is in the "include all" list
+  for p in ${INCLUDE_ALL_PROVIDERS}; do
+    if [[ "${provider}" == "${p}" ]]; then
+      return 0 # Include
+    fi
+  done
+
+  # Check if model matches any well-known pattern
+  for pattern in "${WELL_KNOWN_MODELS[@]}"; do
+    regex="^${pattern}"
+    if [[ "${model_id}" =~ ${regex} ]]; then
+      return 0 # Include
+    fi
+  done
+
+  return 1 # Exclude
+}
+
+# =============================================================================
+# Helper function to find source file for cross-referenced models
+# =============================================================================
+# Globals:   CROSS_REFERENCE_PROVIDERS, PROVIDERS_DIR (read)
+# Arguments: $1 - provider, $2 - model name without the provider prefix
+# Outputs:   path of the matching source TOML file, when one exists
+# Returns:   0 when a file was found, 1 otherwise
+find_source_file() {
+  local provider="$1"
+  local model_name="$2"
+  local p
+
+  # Check if provider is in cross-reference list
+  local is_cross_ref=false
+  for p in ${CROSS_REFERENCE_PROVIDERS}; do
+    if [[ "${provider}" == "${p}" ]]; then
+      is_cross_ref=true
+      break
+    fi
+  done
+
+  if [[ "${is_cross_ref}" != "true" ]]; then
+    return 1
+  fi
+
+  # Get mapped name
+  local mapped_name
+  mapped_name=$(get_mapped_name "${model_name}")
+
+  local source_file="${PROVIDERS_DIR}/${provider}/models/${mapped_name}.toml"
+
+  if [[ -f "${source_file}" ]]; then
+    echo "${source_file}"
+    return 0
+  fi
+
+  # Try original name if mapping didn't work
+  if [[ "${mapped_name}" != "${model_name}" ]]; then
+    source_file="${PROVIDERS_DIR}/${provider}/models/${model_name}.toml"
+    if [[ -f "${source_file}" ]]; then
+      echo "${source_file}"
+      return 0
+    fi
+  fi
+
+  return 1
+}
+
+# =============================================================================
+# Helper function to build a human-readable name from a model ID
+# =============================================================================
+# Arguments: $1 - full model ID
+# Outputs:   last path segment with dashes replaced by spaces and the first
+#            letter of every word upper-cased
+display_name_from_id() {
+  local base="${1##*/}"
+  # awk replaces sed's \b and \u escapes, which are GNU extensions; where they
+  # are unsupported the name comes out lowercase (e.g. "claude 3 haiku").
+  awk '{
+    for (i = 1; i <= NF; i++) {
+      $i = toupper(substr($i, 1, 1)) substr($i, 2)
+    }
+    print
+  }' <<<"${base//-/ }"
+}
+
+# =============================================================================
+# Helper function to convert a per-token cost into a per-million-token cost
+# =============================================================================
+# Arguments: $1 - cost per token as printed by jq
+# Outputs:   cost per 1M tokens as a plain decimal without trailing zeros;
+#            "0" for null, negative or non-numeric input
+cost_per_million() {
+  # awk accepts exponent notation such as "8e-7", which bc cannot parse, and
+  # the fixed "%.8f" format always contains a decimal point, so stripping
+  # trailing zeros can never eat the zeros of a whole number.
+  awk -v cost="$1" 'BEGIN {
+    value = cost * 1000000
+    if (!(value > 0)) {
+      value = 0
+    }
+    text = sprintf("%.8f", value)
+    sub(/0+$/, "", text)
+    sub(/\.$/, "", text)
+    print text
+  }'
+}
+
+# =============================================================================
+# Main script
+# =============================================================================
+
+# Validate required environment variables
+if [[ -z "${CLOUDFLARE_API_TOKEN:-}" ]]; then
+  echo "Error: CLOUDFLARE_API_TOKEN environment variable is required" >&2
+  exit 1
+fi
+
+if [[ -z "${CLOUDFLARE_ACCOUNT_ID:-}" ]]; then
+  echo "Error: CLOUDFLARE_ACCOUNT_ID environment variable is required" >&2
+  exit 1
+fi
+
+if [[ -z "${CLOUDFLARE_GATEWAY_ID:-}" ]]; then
+  echo "Error: CLOUDFLARE_GATEWAY_ID environment variable is required" >&2
+  exit 1
+fi
+
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+MODELS_DIR="${SCRIPT_DIR}/models"
+# This script lives in providers/cloudflare-ai-gateway/, so the sibling provider
+# directories (openai/, anthropic/) are one level up. Two levels up is the
+# repository root, where every source lookup misses and cross-referenced
+# models silently fall back to generated defaults.
+PROVIDERS_DIR="$(cd "${SCRIPT_DIR}/.." && pwd)"
+
+# Fetch models from Cloudflare AI Gateway
+echo "Fetching models from Cloudflare AI Gateway..."
+API_URL="https://gateway.ai.cloudflare.com/v1/${CLOUDFLARE_ACCOUNT_ID}/${CLOUDFLARE_GATEWAY_ID}/compat/models"
+
+# -S keeps transport errors visible while -s hides the progress meter
+RESPONSE=$(curl -sS -H "Authorization: Bearer ${CLOUDFLARE_API_TOKEN}" "${API_URL}")
+
+# Check if the response is valid JSON with data
+if ! jq -e '.data' <<<"${RESPONSE}" > /dev/null 2>&1; then
+  echo "Error: Invalid API response or no data returned" >&2
+  echo "Response: ${RESPONSE}" >&2
+  exit 1
+fi
+
+MODEL_COUNT=$(jq '.data | length' <<<"${RESPONSE}")
+
+if [[ "${MODEL_COUNT}" -eq 0 ]]; then
+  echo "Error: No models found in API response" >&2
+  exit 1
+fi
+
+echo "Found ${MODEL_COUNT} models from API"
+
+# Create a temporary file to track API model files
+API_MODEL_FILES=$(mktemp)
+# Single quotes defer expansion until the trap fires and keep the path quoted
+trap 'rm -f -- "${API_MODEL_FILES}"' EXIT
+
+SKIPPED_COUNT=0
+CROSS_REF_COUNT=0
+
+# Process each model from the API response.
+# The loop is fed through process substitution on fd 3 instead of a pipeline:
+# a pipeline stage runs in a subshell, which would discard the counters, and
+# a dedicated descriptor keeps commands in the body off the model stream.
+while IFS= read -r MODEL_JSON <&3; do
+  MODEL_ID=$(jq -r '.id' <<<"${MODEL_JSON}")
+  COST_IN=$(jq -r '.cost_in // 0' <<<"${MODEL_JSON}")
+  COST_OUT=$(jq -r '.cost_out // 0' <<<"${MODEL_JSON}")
+  CREATED_AT=$(jq -r '.created_at // 0' <<<"${MODEL_JSON}")
+
+  # Skip empty IDs
+  if [[ -z "${MODEL_ID}" || "${MODEL_ID}" == "null" ]]; then
+    continue
+  fi
+
+  # Check if this model should be included
+  if ! should_include_model "${MODEL_ID}"; then
+    SKIPPED_COUNT=$((SKIPPED_COUNT + 1))
+    continue
+  fi
+
+  # Extract provider and model name
+  PROVIDER="${MODEL_ID%%/*}"
+  MODEL_NAME="${MODEL_ID#*/}"
+
+  # Convert model ID to file path based on the API format:
+  # - "workers-ai/@cf/vendor/model-name" -> "workers-ai/model-name.toml"
+  # - "anthropic/claude-opus-4-5" -> "anthropic/claude-opus-4-5.toml"
+  # - "replicate/meta/llama-3" -> "replicate/meta/llama-3.toml"
+  if [[ "${MODEL_ID}" == workers-ai/@cf/* ]]; then
+    # Workers AI model: drop the "@cf/vendor/" part of the ID
+    MODEL_NAME="${MODEL_ID#workers-ai/@cf/}"
+    MODEL_NAME="${MODEL_NAME#*/}"
+    MODEL_PATH="workers-ai/${MODEL_NAME}.toml"
+  else
+    # All other models: keep the path structure as-is
+    MODEL_PATH="${MODEL_ID}.toml"
+  fi
+
+  FULL_PATH="${MODELS_DIR}/${MODEL_PATH}"
+  echo "${FULL_PATH}" >> "${API_MODEL_FILES}"
+
+  # Create directory if needed
+  mkdir -p "$(dirname "${FULL_PATH}")"
+
+  # Check if we should cross-reference from source provider
+  SOURCE_FILE=$(find_source_file "${PROVIDER}" "${MODEL_NAME}" || true)
+
+  if [[ -n "${SOURCE_FILE}" && -f "${SOURCE_FILE}" ]]; then
+    echo "Cross-referencing: ${MODEL_PATH} <- ${SOURCE_FILE#"${PROVIDERS_DIR}"/}"
+    cp "${SOURCE_FILE}" "${FULL_PATH}"
+    CROSS_REF_COUNT=$((CROSS_REF_COUNT + 1))
+  else
+    # Generate file with defaults for workers-ai, replicate, etc.
+    echo "Generating: ${MODEL_PATH}"
+
+    # Generate a human-readable name from model ID (use the last part)
+    DISPLAY_NAME=$(display_name_from_id "${MODEL_ID}")
+
+    # Convert created_at timestamp to date (YYYY-MM-DD); BSD date takes the
+    # epoch via -r N, GNU date via -d "@N". UTC keeps the generated date
+    # independent of the time zone of the machine running the script.
+    if [[ "${CREATED_AT}" != "0" && "${CREATED_AT}" != "null" ]]; then
+      RELEASE_DATE=$(date -u -r "${CREATED_AT}" +%Y-%m-%d 2>/dev/null || date -u -d "@${CREATED_AT}" +%Y-%m-%d 2>/dev/null || date +%Y-%m-%d)
+    else
+      RELEASE_DATE=$(date +%Y-%m-%d)
+    fi
+
+    # API returns cost per token, we need cost per 1M tokens
+    COST_IN_PER_M=$(cost_per_million "${COST_IN}")
+    COST_OUT_PER_M=$(cost_per_million "${COST_OUT}")
+
+    # Always overwrite to ensure data is up to date
+    cat > "${FULL_PATH}" << EOF
+name = "${DISPLAY_NAME}"
+release_date = "${RELEASE_DATE}"
+last_updated = "${RELEASE_DATE}"
+attachment = false
+reasoning = false
+temperature = true
+tool_call = false
+open_weights = false
+
+[cost]
+input = ${COST_IN_PER_M}
+output = ${COST_OUT_PER_M}
+
+[limit]
+context = 128000
+output = 16384
+
+[modalities]
+input = ["text"]
+output = ["text"]
+EOF
+  fi
+done 3< <(jq -c '.data[]' <<<"${RESPONSE}")
+
+# Find and remove models that are not in the API response
+echo ""
+echo "Checking for models to remove..."
+REMOVED_COUNT=0
+
+# Find all existing .toml files in models directory
+while IFS= read -r -d '' EXISTING_FILE; do
+  if ! grep -qxF -- "${EXISTING_FILE}" "${API_MODEL_FILES}"; then
+    REL_PATH="${EXISTING_FILE#"${MODELS_DIR}"/}"
+    echo "Removing model not in API: ${REL_PATH}"
+    rm -f -- "${EXISTING_FILE}"
+    REMOVED_COUNT=$((REMOVED_COUNT + 1))
+  fi
+done < <(find "${MODELS_DIR}" -name "*.toml" -type f -print0)
+
+# Clean up empty directories
+find "${MODELS_DIR}" -type d -empty -delete 2>/dev/null || true
+
+FINAL_COUNT=$(find "${MODELS_DIR}" -name "*.toml" -type f | wc -l | tr -d ' ')
+
+echo ""
+echo "Summary:"
+echo " Models from API: ${MODEL_COUNT}"
+echo " Models included: ${FINAL_COUNT}"
+echo " Models skipped: ${SKIPPED_COUNT}"
+echo " Cross-referenced: ${CROSS_REF_COUNT}"
+echo " Models removed: ${REMOVED_COUNT}"
+echo ""
+echo "Done!"
diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3-5-haiku.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-5-haiku.toml
new file mode 100644
index 000000000..cee577dbc
--- /dev/null
+++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-5-haiku.toml
@@ -0,0 +1,20 @@
+name = "claude 3 5 haiku"
+release_date = "2024-11-04"
+last_updated = "2024-11-04"
+attachment = false
+reasoning = false
+temperature = true
+tool_call = false
+open_weights = false
+
+[cost]
+input = 0
+output = 4
+
+[limit]
+context = 128000
+output = 16384
+
+[modalities]
+input = ["text"]
+output = ["text"]
diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3-haiku.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-haiku.toml
new file mode 100644
index 000000000..65ee2d9c7
--- /dev/null
+++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-haiku.toml
@@ -0,0 +1,20 @@
+name = "claude 3 haiku"
+release_date = "2024-07-31"
+last_updated = "2024-07-31"
+attachment = false
+reasoning = false
+temperature = true
+tool_call = false
+open_weights = false
+
+[cost]
+input = 0
+output = 1.25
+
+[limit]
+context = 128000
+output = 16384
+
+[modalities]
+input = ["text"]
+output = ["text"]
diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3-opus.toml
b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-opus.toml new file mode 100644 index 000000000..e29030abb --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-opus.toml @@ -0,0 +1,20 @@ +name = "claude 3 opus" +release_date = "2024-07-31" +last_updated = "2024-07-31" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 15 +output = 75 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3-sonnet.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-sonnet.toml new file mode 100644 index 000000000..7cd867290 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3-sonnet.toml @@ -0,0 +1,20 @@ +name = "claude 3 sonnet" +release_date = "2024-07-31" +last_updated = "2024-07-31" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 3 +output = 15 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-haiku.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-haiku.toml index 0afeca15b..76c00de87 100644 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-haiku.toml +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-haiku.toml @@ -1,23 +1,20 @@ -name = "Claude Haiku 3.5" -release_date = "2024-10-22" -last_updated = "2024-10-22" -attachment = true +name = "claude 3.5 haiku" +release_date = "2025-01-07" +last_updated = "2025-01-07" +attachment = false reasoning = false temperature = true -tool_call = true -knowledge = "2024-07-31" +tool_call = false open_weights = false [cost] -input = 0.80 -output = 4.00 -cache_read = 0.08 -cache_write = 1.00 +input = 0 +output = 4 [limit] -context = 200_000 -output = 8_192 
+context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-sonnet.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-sonnet.toml new file mode 100644 index 000000000..dc043e702 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-sonnet.toml @@ -0,0 +1,20 @@ +name = "claude 3.5 sonnet" +release_date = "2024-07-31" +last_updated = "2024-07-31" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 3 +output = 15 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3.7-sonnet.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.7-sonnet.toml deleted file mode 100644 index 5e4acc601..000000000 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-3.7-sonnet.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Claude Sonnet 3.7" -release_date = "2025-02-19" -last_updated = "2025-02-19" -attachment = true -reasoning = true -temperature = true -tool_call = true -knowledge = "2024-01" -open_weights = false - -[cost] -input = 15.00 -output = 75.00 -cache_read = 1.50 -cache_write = 18.75 - -[limit] -context = 200_000 -output = 128_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4-5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4-5.toml new file mode 100644 index 000000000..744b76eb5 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4-5.toml @@ -0,0 +1,20 @@ +name = "claude haiku 4 5" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 1 +output = 5 + 
+[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4.5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4.5.toml index 9476e8081..2d84e5ad8 100644 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4.5.toml +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4.5.toml @@ -1,23 +1,20 @@ -name = "Claude Haiku 4.5" -release_date = "2025-10-15" -last_updated = "2025-10-15" -attachment = true -reasoning = true +name = "claude haiku 4.5" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false temperature = true -tool_call = true -knowledge = "2025-02-28" +tool_call = false open_weights = false [cost] -input = 1.00 -output = 5.00 -cache_read = 0.10 -cache_write = 1.25 +input = 1 +output = 5 [limit] -context = 200_000 -output = 64_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4-1.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4-1.toml new file mode 100644 index 000000000..28477e4b8 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4-1.toml @@ -0,0 +1,20 @@ +name = "claude opus 4 1" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 15 +output = 75 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4-5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4-5.toml new file mode 100644 index 000000000..09ca2df60 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4-5.toml @@ -0,0 +1,20 @@ 
+name = "claude opus 4 5" +release_date = "2025-11-24" +last_updated = "2025-11-24" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 5 +output = 25 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.1.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.1.toml index a1f0975e2..8c6c46aef 100644 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.1.toml +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.1.toml @@ -1,23 +1,20 @@ -name = "Claude Opus 4.1" +name = "claude opus 4.1" release_date = "2025-08-05" last_updated = "2025-08-05" -attachment = true -reasoning = true +attachment = false +reasoning = false temperature = true -tool_call = true -knowledge = "2025-03-31" +tool_call = false open_weights = false [cost] -input = 15.00 -output = 75.00 -cache_read = 1.50 -cache_write = 18.75 +input = 15 +output = 75 [limit] -context = 200_000 -output = 32_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.5.toml index a9addac14..85110e5d8 100644 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.5.toml +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.5.toml @@ -1,23 +1,20 @@ -name = "Claude Opus 4.5" +name = "claude opus 4.5" release_date = "2025-11-24" last_updated = "2025-11-24" -attachment = true -reasoning = true +attachment = false +reasoning = false temperature = true -tool_call = true -knowledge = "2025-05-30" +tool_call = false open_weights = false [cost] -input = 5.00 -output = 25.00 -cache_read = 0.50 -cache_write = 6.25 +input = 5 +output = 25 [limit] -context = 200_000 -output 
= 32_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.toml index 96019db43..b7583a22e 100644 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.toml +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.toml @@ -1,23 +1,20 @@ -name = "Claude Opus 4" +name = "claude opus 4" release_date = "2025-05-22" last_updated = "2025-05-22" -attachment = true -reasoning = true +attachment = false +reasoning = false temperature = true -tool_call = true -knowledge = "2025-03-31" +tool_call = false open_weights = false [cost] -input = 15.00 -output = 75.00 -cache_read = 1.50 -cache_write = 18.75 +input = 15 +output = 75 [limit] -context = 200_000 -output = 32_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4-5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4-5.toml new file mode 100644 index 000000000..3619586a8 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4-5.toml @@ -0,0 +1,20 @@ +name = "claude sonnet 4 5" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 3 +output = 15 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.5.toml index 328e11098..7b433ba55 100644 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.5.toml +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.5.toml @@ 
-1,29 +1,20 @@ -name = "Claude Sonnet 4.5" -release_date = "2025-09-29" -last_updated = "2025-09-29" -attachment = true -reasoning = true +name = "claude sonnet 4.5" +release_date = "2025-10-08" +last_updated = "2025-10-08" +attachment = false +reasoning = false temperature = true -tool_call = true -knowledge = "2025-07-31" +tool_call = false open_weights = false [cost] -input = 3.00 -output = 15.00 -cache_read = 0.30 -cache_write = 3.75 - -[cost.context_over_200k] -input = 6.00 -output = 22.50 -cache_read = 0.60 -cache_write = 7.50 +input = 3 +output = 15 [limit] -context = 1_000_000 -output = 64_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.toml index 9ccbe8098..a55f90435 100644 --- a/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.toml +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.toml @@ -1,29 +1,20 @@ -name = "Claude Sonnet 4" +name = "claude sonnet 4" release_date = "2025-05-22" last_updated = "2025-05-22" -attachment = true -reasoning = true +attachment = false +reasoning = false temperature = true -tool_call = true -knowledge = "2025-03-31" +tool_call = false open_weights = false [cost] -input = 3.00 -output = 15.00 -cache_read = 0.30 -cache_write = 3.75 - -[cost.context_over_200k] -input = 6.00 -output = 22.50 -cache_read = 0.60 -cache_write = 7.50 +input = 3 +output = 15 [limit] -context = 200_000 -output = 64_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3-0324.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3-0324.toml deleted file mode 100644 index 94d71a57f..000000000 --- 
a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3-0324.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "deepseek/deepseek-chat-v3-0324:free" -name = "DeepSeek V3 0324" -release_date = "2025-03-24" -last_updated = "2025-03-24" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-10" -tool_call = false -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 16384, output = 8192 } - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3.1.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3.1.toml deleted file mode 100644 index 30b01d765..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3.1.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "DeepSeek-V3.1" -release_date = "2025-08-21" -last_updated = "2025-08-21" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-07" -tool_call = true -open_weights = true - -[cost] -input = 0.20 -output = 0.80 - -[limit] -context = 163_840 -output = 163_840 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528-qwen3-8b:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528-qwen3-8b:free.toml deleted file mode 100644 index 736ed3524..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528-qwen3-8b:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Deepseek R1 0528 Qwen3 8B (free)" -release_date = "2025-05-29" -last_updated = "2025-05-29" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 131_072 -output = 131_072 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git 
a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528:free.toml deleted file mode 100644 index 0d62f4504..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "R1 0528 (free)" -release_date = "2025-05-28" -last_updated = "2025-05-28" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 163_840 -output = 163_840 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-llama-70b.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-llama-70b.toml deleted file mode 100644 index cba6b81ff..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-llama-70b.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "deepseek/deepseek-r1-distill-llama-70b:free" -name = "DeepSeek R1 Distill Llama 70B" -release_date = "2025-01-23" -last_updated = "2025-01-23" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-10" -tool_call = false -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 8192, output = 8192 } - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-qwen-14b.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-qwen-14b.toml deleted file mode 100644 index 500930a64..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-qwen-14b.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "deepseek/deepseek-r1-distill-qwen-14b:free" -name = "DeepSeek R1 Distill Qwen 14B" -release_date = "2025-01-29" -last_updated = "2025-01-29" -attachment = false -reasoning 
= true -temperature = true -knowledge = "2024-10" -tool_call = false -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 64000, output = 8192 } - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1:free.toml deleted file mode 100644 index eabdfb36e..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "R1 (free)" -release_date = "2025-01-20" -last_updated = "2025-01-20" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 163_840 -output = 163_840 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3-base:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3-base:free.toml deleted file mode 100644 index c87d9aa1a..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3-base:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "DeepSeek V3 Base (free)" -release_date = "2025-03-29" -last_updated = "2025-03-29" -attachment = false -reasoning = false -temperature = true -knowledge = "2025-03" -tool_call = false -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 163_840 -output = 163_840 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus.toml deleted file mode 100644 index a78c43ba1..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "DeepSeek V3.1 
Terminus" -release_date = "2025-09-22" -last_updated = "2025-09-22" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-07" -tool_call = true -open_weights = true - -[cost] -input = 0.27 -output = 1.00 - -[limit] -context = 131_072 -output = 65_536 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus:exacto.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus:exacto.toml deleted file mode 100644 index 373c4b575..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus:exacto.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "DeepSeek V3.1 Terminus (exacto)" -release_date = "2025-09-22" -last_updated = "2025-09-22" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-07" -tool_call = true -open_weights = true - -[cost] -input = 0.27 -output = 1.00 - -[limit] -context = 131_072 -output = 65_536 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2-speciale.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2-speciale.toml deleted file mode 100644 index 023f7d0c8..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2-speciale.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "DeepSeek V3.2 Speciale" -release_date = "2025-12-01" -last_updated = "2025-12-01" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-07" -tool_call = true -open_weights = true - -[cost] -input = 0.27 -output = 0.41 - -[limit] -context = 163_840 -output = 65_536 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2.toml deleted file mode 100644 index ab57aee8b..000000000 --- a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2.toml +++ 
/dev/null @@ -1,21 +0,0 @@ -name = "DeepSeek V3.2" -release_date = "2025-12-01" -last_updated = "2025-12-01" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-07" -tool_call = true -open_weights = true - -[cost] -input = 0.28 -output = 0.40 - -[limit] -context = 163_840 -output = 65_536 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-001.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-001.toml deleted file mode 100644 index 5168a0cd2..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-001.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 2.0 Flash" -release_date = "2024-12-11" -last_updated = "2024-12-11" -attachment = true -reasoning = false -temperature = true -knowledge = "2024-06" -tool_call = true -open_weights = false - -[cost] -input = 0.10 -output = 0.40 -cache_read = 0.025 - -[limit] -context = 1_048_576 -output = 8_192 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-exp:free.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-exp:free.toml deleted file mode 100644 index ae135080e..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-exp:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Gemini 2.0 Flash Experimental (free)" -release_date = "2024-12-11" -last_updated = "2024-12-11" -attachment = true -reasoning = false -temperature = true -knowledge = "2024-12" -tool_call = true -open_weights = false - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 1_048_576 -output = 1_048_576 - -[modalities] -input = ["text", "image"] -output = ["text"] \ No newline at end of file diff --git 
a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite-preview-09-2025.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite-preview-09-2025.toml deleted file mode 100644 index f0dcb0495..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite-preview-09-2025.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 2.5 Flash Lite Preview 09-25" -release_date = "2025-09-25" -last_updated = "2025-09-25" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 0.10 -output = 0.40 -cache_read = 0.025 - -[limit] -context = 1_048_576 -output = 65_536 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite.toml deleted file mode 100644 index 4a534b571..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 2.5 Flash Lite" -release_date = "2025-06-17" -last_updated = "2025-06-17" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 0.10 -output = 0.40 -cache_read = 0.025 - -[limit] -context = 1_048_576 -output = 65_536 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-preview-09-2025.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-preview-09-2025.toml deleted file mode 100644 index 5ee14ca12..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-preview-09-2025.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 
2.5 Flash Preview 09-25" -release_date = "2025-09-25" -last_updated = "2025-09-25" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 0.30 -output = 2.50 -cache_read = 0.031 - -[limit] -context = 1_048_576 -output = 65_536 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash.toml deleted file mode 100644 index 3c4458c21..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 2.5 Flash" -release_date = "2025-07-17" -last_updated = "2025-07-17" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 0.30 -output = 2.50 -cache_read = 0.0375 - -[limit] -context = 1_048_576 -output = 65_536 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-05-06.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-05-06.toml deleted file mode 100644 index 3618677e9..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-05-06.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 2.5 Pro Preview 05-06" -release_date = "2025-05-06" -last_updated = "2025-05-06" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 1.25 -output = 10.00 -cache_read = 0.31 - -[limit] -context = 1_048_576 -output = 65_536 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-06-05.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-06-05.toml deleted file mode 100644 index 82ee677b3..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-06-05.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 2.5 Pro Preview 06-05" -release_date = "2025-06-05" -last_updated = "2025-06-05" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 1.25 -output = 10.00 -cache_read = 0.31 - -[limit] -context = 1_048_576 -output = 65_536 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro.toml deleted file mode 100644 index 0e0d4a881..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Gemini 2.5 Pro" -release_date = "2025-03-20" -last_updated = "2025-06-05" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 1.25 -output = 10.00 -cache_read = 0.31 - -[limit] -context = 1_048_576 -output = 65_536 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-3-pro-preview.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-3-pro-preview.toml deleted file mode 100644 index e05d22307..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-3-pro-preview.toml +++ /dev/null @@ -1,24 +0,0 @@ -name = "Gemini 3 Pro Preview" -release_date = "2025-11-18" -last_updated = "2025-11" -attachment = true -reasoning = true -temperature = true 
-knowledge = "2025-01" -tool_call = true -open_weights = false - -[cost] -input = 2.00 -output = 12.00 - -[limit] -context = 1_050_000 -output = 66_000 - -[modalities] -input = ["text", "image", "audio", "video", "pdf"] -output = ["text"] - -[provider] -npm = "@openrouter/ai-sdk-provider" diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-2-9b-it:free.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-2-9b-it:free.toml deleted file mode 100644 index 4de372415..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-2-9b-it:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Gemma 2 9B (free)" -release_date = "2024-06-28" -last_updated = "2024-06-28" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-06" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 8_192 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-12b-it.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-12b-it.toml deleted file mode 100644 index 8efc679b2..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-12b-it.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "google/gemma-3-12b-it:free" -name = "Gemma 3 12B IT" -release_date = "2025-03-13" -last_updated = "2025-03-13" -attachment = true -reasoning = false -temperature = true -knowledge = "2024-10" -tool_call = true -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 96000, output = 8192 } - -[modalities] -input = ["text", "image"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-27b-it.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-27b-it.toml deleted file mode 100644 index 5fc7e02d7..000000000 --- 
a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-27b-it.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "google/gemma-3-27b-it:free" -name = "Gemma 3 27B IT" -release_date = "2025-03-12" -last_updated = "2025-03-12" -attachment = true -reasoning = false -temperature = true -knowledge = "2024-10" -tool_call = true -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 96000, output = 8192 } - -[modalities] -input = ["text", "image"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it.toml deleted file mode 100644 index 03723bbb3..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "google/gemma-3n-e4b-it:free" -name = "Gemma 3n E4B IT" -release_date = "2025-05-20" -last_updated = "2025-05-20" -attachment = true -reasoning = false -temperature = true -knowledge = "2024-10" -tool_call = false -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 8192, output = 8192 } - -[modalities] -input = ["text", "image", "audio"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it:free.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it:free.toml deleted file mode 100644 index 190fcb985..000000000 --- a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Gemma 3n 4B (free)" -release_date = "2025-05-20" -last_updated = "2025-05-20" -attachment = true -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 8_192 -output = 8_192 - -[modalities] -input = ["text", "image", "audio"] -output = ["text"] \ No newline at end 
of file diff --git a/providers/cloudflare-ai-gateway/models/groq/deepseek-r1-distill-llama-70b.toml b/providers/cloudflare-ai-gateway/models/groq/deepseek-r1-distill-llama-70b.toml deleted file mode 100644 index 0b2502a3c..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/deepseek-r1-distill-llama-70b.toml +++ /dev/null @@ -1,19 +0,0 @@ -name = "DeepSeek R1 Distill Llama 70B" -release_date = "2025-01-20" -last_updated = "2025-01-20" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-07" -tool_call = true -open_weights = true -status = "deprecated" - - -[limit] -context = 131_072 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/gemma2-9b-it.toml b/providers/cloudflare-ai-gateway/models/groq/gemma2-9b-it.toml deleted file mode 100644 index 438069e93..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/gemma2-9b-it.toml +++ /dev/null @@ -1,18 +0,0 @@ -name = "Gemma 2 9B" -release_date = "2024-06-27" -last_updated = "2024-06-27" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-06" -tool_call = true -open_weights = true -status = "deprecated" - -[limit] -context = 8_192 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama-3.3-70b-versatile.toml b/providers/cloudflare-ai-gateway/models/groq/llama-3.3-70b-versatile.toml deleted file mode 100644 index f39ab2074..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/llama-3.3-70b-versatile.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Llama 3.3 70B Versatile" -release_date = "2024-12-06" -last_updated = "2024-12-06" -attachment = false -reasoning = false -temperature = true -knowledge = "2023-12" -tool_call = true -open_weights = true - -[limit] -context = 131_072 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/groq/llama3-70b-8192.toml b/providers/cloudflare-ai-gateway/models/groq/llama3-70b-8192.toml deleted file mode 100644 index bae5b60d1..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/llama3-70b-8192.toml +++ /dev/null @@ -1,19 +0,0 @@ -name = "Llama 3 70B" -release_date = "2024-04-18" -last_updated = "2024-04-18" -attachment = false -reasoning = false -temperature = true -knowledge = "2023-03" -tool_call = true -open_weights = true -status = "deprecated" - - -[limit] -context = 8_192 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama3-8b-8192.toml b/providers/cloudflare-ai-gateway/models/groq/llama3-8b-8192.toml deleted file mode 100644 index 2c28f1a84..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/llama3-8b-8192.toml +++ /dev/null @@ -1,18 +0,0 @@ -name = "Llama 3 8B" -release_date = "2024-04-18" -last_updated = "2024-04-18" -attachment = false -reasoning = false -temperature = true -knowledge = "2023-03" -tool_call = true -open_weights = true -status = "deprecated" - -[limit] -context = 8_192 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-maverick-17b-128e-instruct.toml b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-maverick-17b-128e-instruct.toml deleted file mode 100644 index f7ef6016e..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-maverick-17b-128e-instruct.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Llama 4 Maverick 17B" -release_date = "2025-04-05" -last_updated = "2025-04-05" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-08" -tool_call = true -open_weights = true - -[limit] -context = 131_072 -output = 8_192 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-scout-17b-16e-instruct.toml b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-scout-17b-16e-instruct.toml deleted file mode 100644 index a5fe7ff54..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-scout-17b-16e-instruct.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Llama 4 Scout 17B" -release_date = "2025-04-05" -last_updated = "2025-04-05" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-08" -tool_call = true -open_weights = true - -[limit] -context = 131_072 -output = 8_192 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-guard-4-12b.toml b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-guard-4-12b.toml deleted file mode 100644 index 7e257022c..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-guard-4-12b.toml +++ /dev/null @@ -1,16 +0,0 @@ -name = "Llama Guard 4 12B" -release_date = "2025-04-05" -last_updated = "2025-04-05" -attachment = false -reasoning = false -temperature = true -tool_call = false -open_weights = true - -[limit] -context = 131_072 -output = 128 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/mistral-saba-24b.toml b/providers/cloudflare-ai-gateway/models/groq/mistral-saba-24b.toml deleted file mode 100644 index 78b6968e5..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/mistral-saba-24b.toml +++ /dev/null @@ -1,19 +0,0 @@ -name = "Mistral Saba 24B" -release_date = "2025-02-06" -last_updated = "2025-02-06" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-08" -tool_call = true -open_weights = false -status = "deprecated" - - -[limit] -context = 32_768 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct-0905.toml b/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct-0905.toml deleted file mode 100644 index 7456acc02..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct-0905.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Kimi K2 Instruct 0905" -release_date = "2025-09-05" -last_updated = "2025-09-05" -attachment = false -reasoning = false -temperature = true -tool_call = true -knowledge = "2024-10" -open_weights = true - -[limit] -context = 262_144 -output = 16_384 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct.toml b/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct.toml deleted file mode 100644 index 821613e6f..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct.toml +++ /dev/null @@ -1,18 +0,0 @@ -name = "Kimi K2 Instruct" -release_date = "2025-07-14" -last_updated = "2025-07-14" -attachment = false -reasoning = false -temperature = true -tool_call = true -knowledge = "2024-10" -open_weights = true -status = "deprecated" - -[limit] -context = 131_072 -output = 16_384 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-120b.toml b/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-120b.toml deleted file mode 100644 index 02d65e606..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-120b.toml +++ /dev/null @@ -1,16 +0,0 @@ -name = "GPT OSS 120B" -release_date = "2025-08-05" -last_updated = "2025-08-05" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = true - -[limit] -context = 131_072 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-20b.toml 
b/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-20b.toml deleted file mode 100644 index 116e1f0de..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-20b.toml +++ /dev/null @@ -1,16 +0,0 @@ -name = "GPT OSS 20B" -release_date = "2025-08-05" -last_updated = "2025-08-05" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = true - -[limit] -context = 131_072 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/qwen-qwq-32b.toml b/providers/cloudflare-ai-gateway/models/groq/qwen-qwq-32b.toml deleted file mode 100644 index a1b0dd799..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/qwen-qwq-32b.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Qwen QwQ 32B" -release_date = "2024-11-27" -last_updated = "2024-11-27" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-09" -tool_call = true -open_weights = true - -[limit] -context = 131_072 -output = 16_384 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/qwen/qwen3-32b.toml b/providers/cloudflare-ai-gateway/models/groq/qwen/qwen3-32b.toml deleted file mode 100644 index 2afb927c3..000000000 --- a/providers/cloudflare-ai-gateway/models/groq/qwen/qwen3-32b.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Qwen3 32B" -release_date = "2024-12-23" -last_updated = "2024-12-23" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-11-08" -tool_call = true -open_weights = true - -[limit] -context = 131_072 -output = 16_384 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/codestral-2508.toml b/providers/cloudflare-ai-gateway/models/mistralai/codestral-2508.toml deleted file mode 100644 index 642db9246..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/codestral-2508.toml +++ /dev/null @@ -1,21 +0,0 
@@ -name = "Codestral 2508" -release_date = "2025-08-01" -last_updated = "2025-08-01" -attachment = false -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.30 -output = 0.90 - -[limit] -context = 256_000 -output = 256_000 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-medium-2507.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-medium-2507.toml deleted file mode 100644 index d514e4688..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/devstral-medium-2507.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Devstral Medium" -release_date = "2025-07-10" -last_updated = "2025-07-10" -attachment = false -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.40 -output = 2.00 - -[limit] -context = 131_072 -output = 131_072 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505.toml deleted file mode 100644 index 73ad4baee..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Devstral Small" -release_date = "2025-05-07" -last_updated = "2025-05-07" -attachment = false -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.06 -output = 0.12 - -[limit] -context = 128_000 -output = 128_000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505:free.toml deleted file mode 100644 index 86554a6a8..000000000 --- 
a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Devstral Small 2505 (free)" -release_date = "2025-05-21" -last_updated = "2025-05-21" -attachment = false -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 32_768 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2507.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2507.toml deleted file mode 100644 index 1738ab3c2..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2507.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Devstral Small 1.1" -release_date = "2025-07-10" -last_updated = "2025-07-10" -attachment = false -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = true - -[cost] -input = 0.10 -output = 0.30 - -[limit] -context = 131_072 -output = 131_072 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-7b-instruct:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-7b-instruct:free.toml deleted file mode 100644 index d10b1afc8..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/mistral-7b-instruct:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Mistral 7B Instruct (free)" -release_date = "2024-05-27" -last_updated = "2024-05-27" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-05" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 32_768 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.1.toml 
b/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.1.toml deleted file mode 100644 index 5dc17a5f3..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.1.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Mistral Medium 3.1" -release_date = "2025-08-12" -last_updated = "2025-08-12" -attachment = true -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = false - -[cost] -input = 0.40 -output = 2.00 - -[limit] -context = 262_144 -output = 262_144 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.toml deleted file mode 100644 index cbf57bcd8..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Mistral Medium 3" -release_date = "2025-05-07" -last_updated = "2025-05-07" -attachment = true -reasoning = false -temperature = true -knowledge = "2025-05" -tool_call = true -open_weights = false - -[cost] -input = 0.40 -output = 2.00 - -[limit] -context = 131_072 -output = 131_072 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-nemo:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-nemo:free.toml deleted file mode 100644 index cc5f6e5f1..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/mistral-nemo:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Mistral Nemo (free)" -release_date = "2024-07-19" -last_updated = "2024-07-19" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-07" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 131_072 -output = 131_072 - -[modalities] -input = ["text"] -output = ["text"] \ No newline at end of file diff --git 
a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.1-24b-instruct.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.1-24b-instruct.toml deleted file mode 100644 index fd7611b8b..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.1-24b-instruct.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "mistralai/mistral-small-3.1-24b-instruct:free" -name = "Mistral Small 3.1 24B Instruct" -release_date = "2025-03-17" -last_updated = "2025-03-17" -attachment = true -reasoning = false -temperature = true -knowledge = "2024-10" -tool_call = true -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 128000, output = 8192 } - -[modalities] -input = ["text", "image"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct.toml deleted file mode 100644 index 4cfdf7060..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct.toml +++ /dev/null @@ -1,16 +0,0 @@ -id = "mistralai/mistral-small-3.2-24b-instruct:free" -name = "Mistral Small 3.2 24B Instruct" -release_date = "2025-06-20" -last_updated = "2025-06-20" -attachment = true -reasoning = false -temperature = true -knowledge = "2024-10" -tool_call = true -open_weights = true -cost = { input = 0, output = 0 } -limit = { context = 96000, output = 8192 } - -[modalities] -input = ["text", "image"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct:free.toml deleted file mode 100644 index df55ac661..000000000 --- a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct:free.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "Mistral Small 3.2 24B 
(free)" -release_date = "2025-06-20" -last_updated = "2025-06-20" -attachment = true -reasoning = false -temperature = true -knowledge = "2025-06" -tool_call = true -open_weights = true - -[cost] -input = 0.00 -output = 0.00 - -[limit] -context = 96_000 -output = 96_000 - -[modalities] -input = ["text", "image"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-3.5-turbo.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-3.5-turbo.toml new file mode 100644 index 000000000..f425971d6 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-3.5-turbo.toml @@ -0,0 +1,20 @@ +name = "gpt 3.5 turuo" +release_date = "2025-02-10" +last_updated = "2025-02-10" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 1.5 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama-3.1-8b-instant.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4-turbo.toml similarity index 58% rename from providers/cloudflare-ai-gateway/models/groq/llama-3.1-8b-instant.toml rename to providers/cloudflare-ai-gateway/models/openai/gpt-4-turbo.toml index 90c84f3eb..32553f02d 100644 --- a/providers/cloudflare-ai-gateway/models/groq/llama-3.1-8b-instant.toml +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-4-turbo.toml @@ -1,16 +1,19 @@ -name = "Llama 3.1 8B Instant" +name = "gpt 4 turuo" release_date = "2024-07-23" last_updated = "2024-07-23" attachment = false reasoning = false temperature = true -knowledge = "2023-12" -tool_call = true -open_weights = true +tool_call = false +open_weights = false + +[cost] +input = 10 +output = 30 [limit] -context = 131_072 -output = 8_192 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-4.1-mini.toml 
b/providers/cloudflare-ai-gateway/models/openai/gpt-4.1-mini.toml deleted file mode 100644 index 748b01700..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-4.1-mini.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "GPT-4.1 Mini" -release_date = "2025-04-14" -last_updated = "2025-04-14" -attachment = true -reasoning = false -temperature = true -tool_call = true -knowledge = "2024-04" -open_weights = false - -[cost] -input = 0.40 -output = 1.60 -cache_read = 0.10 - -[limit] -context = 1_047_576 -output = 32_768 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-4.1.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4.1.toml deleted file mode 100644 index eca02a28f..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-4.1.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "GPT-4.1" -release_date = "2025-04-14" -last_updated = "2025-04-14" -attachment = true -reasoning = false -temperature = true -tool_call = true -knowledge = "2024-04" -open_weights = false - -[cost] -input = 2.00 -output = 8.00 -cache_read = 0.50 - -[limit] -context = 1_047_576 -output = 32_768 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama-guard-3-8b.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4.toml similarity index 65% rename from providers/cloudflare-ai-gateway/models/groq/llama-guard-3-8b.toml rename to providers/cloudflare-ai-gateway/models/openai/gpt-4.toml index 4e9ad068f..5ac55c331 100644 --- a/providers/cloudflare-ai-gateway/models/groq/llama-guard-3-8b.toml +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-4.toml @@ -1,17 +1,19 @@ -name = "Llama Guard 3 8B" +name = "gpt 4" release_date = "2024-07-23" last_updated = "2024-07-23" attachment = false reasoning = false temperature = true tool_call = false -open_weights = true -status = "deprecated" +open_weights = false +[cost] +input = 30 +output = 60 
[limit] -context = 8_192 -output = 8_192 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-4o-mini.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4o-mini.toml index 173e77421..35e6bdef9 100644 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-4o-mini.toml +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-4o-mini.toml @@ -1,22 +1,20 @@ -name = "GPT-4o-mini" -release_date = "2024-07-18" -last_updated = "2024-07-18" -attachment = true +name = "gpt 4o mini" +release_date = "2024-07-23" +last_updated = "2024-07-23" +attachment = false reasoning = false temperature = true -tool_call = true -knowledge = "2024-10" +tool_call = false open_weights = false [cost] -input = 0.15 -output = 0.60 -cache_read = 0.08 +input = 0 +output = 0 [limit] -context = 128_000 -output = 16_384 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-4o.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4o.toml new file mode 100644 index 000000000..c9a08570e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-4o.toml @@ -0,0 +1,20 @@ +name = "gpt 4o" +release_date = "2025-02-10" +last_updated = "2025-02-10" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 2.5 +output = 10 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-chat.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-chat.toml deleted file mode 100644 index 527aebdfc..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5-chat.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "GPT-5 Chat (latest)" -release_date = "2025-08-07" -last_updated = "2025-08-07" -attachment = true -reasoning = true -temperature = 
true -knowledge = "2024-09-30" -tool_call = false -open_weights = false - -[cost] -input = 1.25 -output = 10.00 - -[limit] -context = 400_000 -output = 128_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-codex.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-codex.toml deleted file mode 100644 index a3c834e57..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5-codex.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "GPT-5 Codex" -release_date = "2025-09-15" -last_updated = "2025-09-15" -attachment = true -reasoning = true -temperature = true -knowledge = "2024-10-01" -tool_call = true -open_weights = false - -[cost] -input = 1.25 -output = 10.00 -cache_read = 0.125 - -[limit] -context = 400_000 -output = 128_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-image.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-image.toml deleted file mode 100644 index 0ae97d15b..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5-image.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "GPT-5 Image" -release_date = "2025-10-14" -last_updated = "2025-10-14" -attachment = true -reasoning = true -temperature = true -knowledge = "2024-10-01" -tool_call = true -open_weights = false - -[cost] -input = 5.00 -output = 10.00 -cache_read = 1.25 - -[limit] -context = 400_000 -output = 128_000 - -[modalities] -input = ["text", "image", "pdf"] -output = ["text", "image"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-mini.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-mini.toml deleted file mode 100644 index 5437addce..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5-mini.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "GPT-5 Mini" -release_date = "2025-08-07" -last_updated = "2025-08-07" -attachment = true -reasoning = 
true -temperature = true -knowledge = "2024-10-01" -tool_call = true -open_weights = false - -[cost] -input = 0.25 -output = 2.00 - -[limit] -context = 400_000 -output = 128_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-nano.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-nano.toml deleted file mode 100644 index 284ee8d46..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5-nano.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "GPT-5 Nano" -release_date = "2025-08-07" -last_updated = "2025-08-07" -attachment = true -reasoning = true -temperature = true -knowledge = "2024-10-01" -tool_call = true -open_weights = false - -[cost] -input = 0.05 -output = 0.40 - -[limit] -context = 400_000 -output = 128_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-pro.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-pro.toml deleted file mode 100644 index a2a292d83..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5-pro.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "GPT-5 Pro" -release_date = "2025-10-06" -last_updated = "2025-10-06" -attachment = true -reasoning = true -temperature = false -knowledge = "2024-09-30" -tool_call = true -open_weights = false - -[cost] -input = 15.00 -output = 120.00 - -[limit] -context = 400_000 -output = 272_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-chat.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-chat.toml deleted file mode 100644 index 5287c7505..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-chat.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "GPT-5.1 Chat" -release_date = "2025-11-13" -last_updated = "2025-11-13" -attachment = true -reasoning = true -temperature = true -knowledge = "2024-09-30" -tool_call = true 
-structured_output = true -open_weights = false - -[cost] -input = 1.25 -output = 10.00 -cache_read = 0.125 - -[limit] -context = 128_000 -output = 16_384 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex-mini.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex-mini.toml deleted file mode 100644 index 0894af700..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex-mini.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "GPT-5.1-Codex-Mini" -release_date = "2025-11-13" -last_updated = "2025-11-13" -attachment = true -reasoning = true -temperature = true -knowledge = "2024-09-30" -tool_call = true -structured_output = true -open_weights = false - -[cost] -input = 0.25 -output = 2.00 -cache_read = 0.025 - -[limit] -context = 400_000 -output = 100_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex.toml index 38dabafaf..29e1c7a26 100644 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex.toml +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex.toml @@ -1,23 +1,20 @@ -name = "GPT-5.1-Codex" -release_date = "2025-11-13" -last_updated = "2025-11-13" -attachment = true -reasoning = true +name = "gpt 5.1 codex" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false temperature = true -knowledge = "2024-09-30" -tool_call = true -structured_output = true +tool_call = false open_weights = false [cost] input = 1.25 -output = 10.00 -cache_read = 0.125 +output = 10 [limit] -context = 400_000 -output = 128_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1.toml 
b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1.toml index 37eb1a25c..e6b64c234 100644 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1.toml +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1.toml @@ -1,23 +1,20 @@ -name = "GPT-5.1" -release_date = "2025-11-13" -last_updated = "2025-11-13" -attachment = true -reasoning = true +name = "gpt 5.1" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false temperature = true -knowledge = "2024-09-30" -tool_call = true -structured_output = true +tool_call = false open_weights = false [cost] input = 1.25 -output = 10.00 -cache_read = 0.125 +output = 10 [limit] -context = 400_000 -output = 128_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.toml deleted file mode 100644 index 2ca19f85e..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-5.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "GPT-5" -release_date = "2025-08-07" -last_updated = "2025-08-07" -attachment = true -reasoning = true -temperature = true -knowledge = "2024-10-01" -tool_call = true -open_weights = false - -[cost] -input = 1.25 -output = 10.00 - -[limit] -context = 400_000 -output = 128_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b.toml deleted file mode 100644 index 947815c8d..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b.toml +++ /dev/null @@ -1,20 +0,0 @@ -name = "GPT OSS 120B" -release_date = "2025-08-05" -last_updated = "2025-08-05" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = true - -[cost] -input = 0.072 -output = 0.28 - -[limit] -context = 131_072 -output = 
32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b:exacto.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b:exacto.toml deleted file mode 100644 index ec8055a44..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b:exacto.toml +++ /dev/null @@ -1,20 +0,0 @@ -name = "GPT OSS 120B (exacto)" -release_date = "2025-08-05" -last_updated = "2025-08-05" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = true - -[cost] -input = 0.05 -output = 0.24 - -[limit] -context = 131_072 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-20b.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-20b.toml deleted file mode 100644 index ade230e00..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-20b.toml +++ /dev/null @@ -1,20 +0,0 @@ -name = "GPT OSS 20B" -release_date = "2025-08-05" -last_updated = "2025-08-05" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = true - -[cost] -input = 0.05 -output = 0.20 - -[limit] -context = 131_072 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-safeguard-20b.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-safeguard-20b.toml deleted file mode 100644 index 844c6be72..000000000 --- a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-safeguard-20b.toml +++ /dev/null @@ -1,20 +0,0 @@ -name = "GPT OSS Safeguard 20B" -release_date = "2025-10-29" -last_updated = "2025-10-29" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = false - -[cost] -input = 0.075 -output = 0.30 - -[limit] -context = 131_072 -output = 65_536 - -[modalities] -input = ["text"] -output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/openai/o1-mini.toml b/providers/cloudflare-ai-gateway/models/openai/o1-mini.toml new file mode 100644 index 000000000..ff64059db --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/o1-mini.toml @@ -0,0 +1,20 @@ +name = "o1 mini" +release_date = "2025-02-10" +last_updated = "2025-02-10" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 1.1 +output = 4.4 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/o1-preview.toml b/providers/cloudflare-ai-gateway/models/openai/o1-preview.toml new file mode 100644 index 000000000..a2489701d --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/o1-preview.toml @@ -0,0 +1,20 @@ +name = "o1 preview" +release_date = "2024-09-12" +last_updated = "2024-09-12" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 15 +output = 60 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/o1.toml b/providers/cloudflare-ai-gateway/models/openai/o1.toml new file mode 100644 index 000000000..20868594a --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/o1.toml @@ -0,0 +1,20 @@ +name = "o1" +release_date = "2025-01-07" +last_updated = "2025-01-07" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 15 +output = 60 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/o3-mini.toml b/providers/cloudflare-ai-gateway/models/openai/o3-mini.toml new file mode 100644 index 000000000..6dc255e57 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/openai/o3-mini.toml @@ -0,0 +1,20 @@ +name = "o3 mini" +release_date = "2025-02-05" +last_updated = "2025-02-05" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 1.1 +output = 4.4 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/o3-pro.toml b/providers/cloudflare-ai-gateway/models/openai/o3-pro.toml new file mode 100644 index 000000000..fe184a6eb --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/o3-pro.toml @@ -0,0 +1,20 @@ +name = "o3 pro" +release_date = "2025-06-11" +last_updated = "2025-06-11" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 20 +output = 80 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/perplexity/sonar.toml b/providers/cloudflare-ai-gateway/models/openai/o3.toml similarity index 54% rename from providers/cloudflare-ai-gateway/models/perplexity/sonar.toml rename to providers/cloudflare-ai-gateway/models/openai/o3.toml index 90157ebef..f6ef3c17a 100644 --- a/providers/cloudflare-ai-gateway/models/perplexity/sonar.toml +++ b/providers/cloudflare-ai-gateway/models/openai/o3.toml @@ -1,16 +1,19 @@ -name = "Sonar" -release_date = "2024-01-01" -last_updated = "2025-09-01" +name = "o3" +release_date = "2025-06-10" +last_updated = "2025-06-10" attachment = false reasoning = false temperature = true tool_call = false -knowledge = "2025-09-01" open_weights = false +[cost] +input = 2 +output = 8 + [limit] -context = 128_000 -output = 4_096 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/o4-mini.toml b/providers/cloudflare-ai-gateway/models/openai/o4-mini.toml index 
6f24829b3..df5bb2143 100644 --- a/providers/cloudflare-ai-gateway/models/openai/o4-mini.toml +++ b/providers/cloudflare-ai-gateway/models/openai/o4-mini.toml @@ -1,22 +1,20 @@ -name = "o4 Mini" +name = "o4 mini" release_date = "2025-04-16" last_updated = "2025-04-16" -attachment = true -reasoning = true +attachment = false +reasoning = false temperature = true -tool_call = true -knowledge = "2024-06" +tool_call = false open_weights = false [cost] -input = 1.10 -output = 4.40 -cache_read = 0.28 +input = 1.1 +output = 4.4 [limit] -context = 200_000 -output = 100_000 +context = 128000 +output = 16384 [modalities] -input = ["text", "image"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/perplexity/sonar-pro.toml b/providers/cloudflare-ai-gateway/models/perplexity/sonar-pro.toml deleted file mode 100644 index 7fb6424a5..000000000 --- a/providers/cloudflare-ai-gateway/models/perplexity/sonar-pro.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Sonar Pro" -release_date = "2024-01-01" -last_updated = "2025-09-01" -attachment = true -reasoning = false -temperature = true -tool_call = false -knowledge = "2025-09-01" -open_weights = false - -[limit] -context = 200_000 -output = 8_192 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning-pro.toml b/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning-pro.toml deleted file mode 100644 index 502331a87..000000000 --- a/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning-pro.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Sonar Reasoning Pro" -release_date = "2024-01-01" -last_updated = "2025-09-01" -attachment = true -reasoning = true -temperature = true -tool_call = false -knowledge = "2025-09-01" -open_weights = false - -[limit] -context = 128_000 -output = 4_096 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning.toml b/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning.toml deleted file mode 100644 index c0e101623..000000000 --- a/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning.toml +++ /dev/null @@ -1,17 +0,0 @@ -name = "Sonar Reasoning" -release_date = "2024-01-01" -last_updated = "2025-09-01" -attachment = false -reasoning = true -temperature = true -tool_call = false -knowledge = "2025-09-01" -open_weights = false - -[limit] -context = 128_000 -output = 4_096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/replicate/deepseek-ai/deepseek-r1.toml b/providers/cloudflare-ai-gateway/models/replicate/deepseek-ai/deepseek-r1.toml new file mode 100644 index 000000000..39cfb3277 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/replicate/deepseek-ai/deepseek-r1.toml @@ -0,0 +1,20 @@ +name = "deepseek r1" +release_date = "2025-03-11" +last_updated = "2025-03-11" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 10 +output = 10 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3-70b-instruct.toml b/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3-70b-instruct.toml new file mode 100644 index 000000000..5e6913683 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3-70b-instruct.toml @@ -0,0 +1,20 @@ +name = "meta llama 3 70b instruct" +release_date = "2024-10-08" +last_updated = "2024-10-08" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 2.75 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git
a/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3-8b-instruct.toml b/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3-8b-instruct.toml new file mode 100644 index 000000000..f948fac4e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3-8b-instruct.toml @@ -0,0 +1,20 @@ +name = "meta llama 3 8b instruct" +release_date = "2025-02-05" +last_updated = "2025-02-05" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3.1-405b-instruct.toml b/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3.1-405b-instruct.toml new file mode 100644 index 000000000..8c9aa497b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/replicate/meta/meta-llama-3.1-405b-instruct.toml @@ -0,0 +1,20 @@ +name = "meta llama 3.1 405b instruct" +release_date = "2024-09-25" +last_updated = "2024-09-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 9.5 +output = 9.5 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/replicate/replicate-internal/llama-405b-instruct-vllm.toml b/providers/cloudflare-ai-gateway/models/replicate/replicate-internal/llama-405b-instruct-vllm.toml new file mode 100644 index 000000000..a1b225b37 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/replicate/replicate-internal/llama-405b-instruct-vllm.toml @@ -0,0 +1,20 @@ +name = "llama 405b instruct vllm" +release_date = "2024-08-27" +last_updated = "2024-08-27" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 9.5 +output = 9.5 + +[limit]
+context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/aura-1.toml b/providers/cloudflare-ai-gateway/models/workers-ai/aura-1.toml index 45bdc25d7..4c689b46e 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/aura-1.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/aura-1.toml @@ -1,23 +1,20 @@ -# https://developers.cloudflare.com/workers-ai/models/aura-1/ - -name = "@cf/deepgram/aura-1" +name = "aura 1" +release_date = "2025-11-14" +last_updated = "2025-11-14" attachment = false reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2025-08-27" -last_updated = "2025-07-07" +open_weights = false [cost] -# per 1k characters -input = 0.015 -output = 0.015 +input = 0 +output = 0 [limit] -context = 0 -output = 0 +context = 128000 +output = 16384 [modalities] input = ["text"] -output = ["audio"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/aura-2-en.toml b/providers/cloudflare-ai-gateway/models/workers-ai/aura-2-en.toml new file mode 100644 index 000000000..38981055e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/aura-2-en.toml @@ -0,0 +1,20 @@ +name = "aura 2 en" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/aura-2-es.toml b/providers/cloudflare-ai-gateway/models/workers-ai/aura-2-es.toml new file mode 100644 index 000000000..29f31f67b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/aura-2-es.toml @@ -0,0 +1,20 @@ +name = "aura 2 es" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false 
+reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/bart-large-cnn.toml b/providers/cloudflare-ai-gateway/models/workers-ai/bart-large-cnn.toml index a3267b1f3..2d51808ae 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/bart-large-cnn.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/bart-large-cnn.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/bart-large-cnn/ - -name = "@cf/facebook/bart-large-cnn" +name = "bart large cnn" +release_date = "2025-04-09" +last_updated = "2025-04-09" attachment = false reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2022-03-02" -last_updated = "2024-02-13" +open_weights = false [cost] input = 0 output = 0 [limit] -context = 0 -output = 0 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/bge-base-en-v1.5.toml b/providers/cloudflare-ai-gateway/models/workers-ai/bge-base-en-v1.5.toml new file mode 100644 index 000000000..d81e25d11 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/bge-base-en-v1.5.toml @@ -0,0 +1,20 @@ +name = "bge base en v1.5" +release_date = "2025-04-03" +last_updated = "2025-04-03" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/bge-large-en-v1.5.toml b/providers/cloudflare-ai-gateway/models/workers-ai/bge-large-en-v1.5.toml new file mode 100644 index 000000000..42b21fccf --- /dev/null +++
b/providers/cloudflare-ai-gateway/models/workers-ai/bge-large-en-v1.5.toml @@ -0,0 +1,20 @@ +name = "bge large en v1.5" +release_date = "2025-04-03" +last_updated = "2025-04-03" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/bge-m3.toml b/providers/cloudflare-ai-gateway/models/workers-ai/bge-m3.toml new file mode 100644 index 000000000..b3d3c4a58 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/bge-m3.toml @@ -0,0 +1,20 @@ +name = "bge m3" +release_date = "2025-04-03" +last_updated = "2025-04-03" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/bge-reranker-base.toml b/providers/cloudflare-ai-gateway/models/workers-ai/bge-reranker-base.toml new file mode 100644 index 000000000..7235cfdad --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/bge-reranker-base.toml @@ -0,0 +1,20 @@ +name = "bge reranker base" +release_date = "2025-04-09" +last_updated = "2025-04-09" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/bge-small-en-v1.5.toml b/providers/cloudflare-ai-gateway/models/workers-ai/bge-small-en-v1.5.toml new file mode 100644 index 000000000..ba59902a1 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/bge-small-en-v1.5.toml @@ -0,0 +1,20 @@ +name = "bge small en v1.5" +release_date =
"2025-04-03" +last_updated = "2025-04-03" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-base-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-base-awq.toml deleted file mode 100644 index f6440dc86..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-base-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/deepseek-coder-6.7b-base-awq/ - -name = "@hf/thebloke/deepseek-coder-6.7b-base-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-11-05" -last_updated = "2023-11-09" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-instruct-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-instruct-awq.toml deleted file mode 100644 index 01c3b009e..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-instruct-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/deepseek-coder-6.7b-instruct-awq/ - -name = "@hf/thebloke/deepseek-coder-6.7b-instruct-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-11-05" -last_updated = "2023-11-13" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-math-7b-instruct.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-math-7b-instruct.toml deleted file mode 100644 index 064b7343d..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-math-7b-instruct.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/deepseek-math-7b-instruct/ - -name = "@cf/deepseek-ai/deepseek-math-7b-instruct" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-02-05" -last_updated = "2024-02-06" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-r1-distill-qwen-32b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-r1-distill-qwen-32b.toml index 2ce921daa..39c9896ec 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-r1-distill-qwen-32b.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-r1-distill-qwen-32b.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/deepseek-r1-distill-qwen-32b/ - -name = "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b" +name = "deepseek r1 distill qwen 32b" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false -reasoning = true -tool_call = true +reasoning = false temperature = true -open_weights = true -release_date = "2025-01-20" -last_updated = "2025-02-24" +tool_call = false +open_weights = false [cost] -input = 0.5 +input = 0 output = 4.88 [limit] -context = 80000 -output = 80000 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/discolm-german-7b-v1-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/discolm-german-7b-v1-awq.toml deleted file mode 100644 index 57314cd84..000000000 --- 
a/providers/cloudflare-ai-gateway/models/workers-ai/discolm-german-7b-v1-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/discolm-german-7b-v1-awq/ - -name = "@cf/thebloke/discolm-german-7b-v1-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-01-18" -last_updated = "2024-01-24" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/distilbert-sst-2-int8.toml b/providers/cloudflare-ai-gateway/models/workers-ai/distilbert-sst-2-int8.toml new file mode 100644 index 000000000..bd756fe55 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/distilbert-sst-2-int8.toml @@ -0,0 +1,20 @@ +name = "distilbert sst 2 int8" +release_date = "2025-04-03" +last_updated = "2025-04-03" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/dreamshaper-8-lcm.toml b/providers/cloudflare-ai-gateway/models/workers-ai/dreamshaper-8-lcm.toml deleted file mode 100644 index 8d1712a0c..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/dreamshaper-8-lcm.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/dreamshaper-8-lcm/ - -name = "@cf/lykon/dreamshaper-8-lcm" -attachment = true -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2023-12-06" -last_updated = "2023-12-07" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git
a/providers/cloudflare-ai-gateway/models/workers-ai/falcon-7b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/falcon-7b-instruct.toml deleted file mode 100644 index 543fa2aef..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/falcon-7b-instruct.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/falcon-7b-instruct/ - -name = "@cf/tiiuae/falcon-7b-instruct" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-04-25" -last_updated = "2024-10-12" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/flux-1-schnell.toml b/providers/cloudflare-ai-gateway/models/workers-ai/flux-1-schnell.toml deleted file mode 100644 index 1480fe105..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/flux-1-schnell.toml +++ /dev/null @@ -1,24 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/flux-1-schnell/ - -name = "@cf/black-forest-labs/flux-1-schnell" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2024-07-31" -last_updated = "2024-08-16" - -[cost] -# per 512 by 512 tile -input = 0.000053 -# per step -output = 0.00011 - -[limit] -context = 2048 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-2b-it-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-2b-it-lora.toml deleted file mode 100644 index 6e76a054f..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-2b-it-lora.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/gemma-2b-it-lora/ - -name = "@cf/google/gemma-2b-it-lora" -attachment = false -reasoning = false -tool_call = true 
-temperature = true -open_weights = true -release_date = "2024-04-02" -last_updated = "2024-04-02" - -[cost] -input = 0 -output = 0 - -[limit] -context = 8192 -output = 8192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-3-12b-it.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-3-12b-it.toml index 0b0f15b18..21742dc78 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-3-12b-it.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-3-12b-it.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/gemma-3-12b-it/ - -name = "@cf/google/gemma-3-12b-it" +name = "gemma 3 12u it" +release_date = "2025-04-11" +last_updated = "2025-04-11" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2025-03-01" -last_updated = "2025-03-21" +tool_call = false +open_weights = false [cost] -input = 0.35 -output = 0.56 +input = 0 +output = 0 [limit] -context = 80000 -output = 80000 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it-lora.toml deleted file mode 100644 index 42e88d143..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it-lora.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/gemma-7b-it-lora/ - -name = "@cf/google/gemma-7b-it-lora" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-04-02" -last_updated = "2024-04-02" - -[cost] -input = 0 -output = 0 - -[limit] -context = 3500 -output = 3500 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it.toml deleted file mode 100644 index 7c1e98c99..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/gemma-7b-it/ - -name = "@hf/google/gemma-7b-it" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-02-13" -last_updated = "2024-08-14" - -[cost] -input = 0 -output = 0 - -[limit] -context = 8192 -output = 8192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-sea-lion-v4-27b-it.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-sea-lion-v4-27b-it.toml index ba1472b48..9dd256a1b 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-sea-lion-v4-27b-it.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-sea-lion-v4-27b-it.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/gemma-sea-lion-v4-27b-it/ - -name = "@cf/aisingapore/gemma-sea-lion-v4-27b-it" +name = "gemma sea lion v4 27u it" +release_date = "2025-09-25" +last_updated = "2025-09-25" attachment = false reasoning = false -tool_call = true -open_weights = false -release_date = "2025-09-23" -last_updated = "2025-12-02" temperature = true +tool_call = false +open_weights = false -[limit] -context = 128000 +[cost] +input = 0 output = 0 -[cost] -input = 0.35 -output = 0.56 +[limit] +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-120b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-120b.toml index ca7cc8cc3..834df0973 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-120b.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-120b.toml @@ -1,21 +1,19 @@ -# 
https://developers.cloudflare.com/workers-ai/models/gpt-oss-120b/ - -name = "@cf/openai/gpt-oss-120b" +name = "gpt oss 120b" +release_date = "2025-08-05" +last_updated = "2025-08-05" attachment = false -reasoning = true +reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2025-08-04" -last_updated = "2025-08-14" +open_weights = false [cost] -input = 0.35 -output = 0.75 +input = 0 +output = 0 [limit] context = 128000 -output = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-20b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-20b.toml index 4b5af26ab..5d811360d 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-20b.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-20b.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/gpt-oss-20b/ - -name = "@cf/openai/gpt-oss-20b" +name = "gpt oss 20b" +release_date = "2025-08-05" +last_updated = "2025-08-05" attachment = false -reasoning = true +reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2025-08-04" -last_updated = "2025-08-14" +open_weights = false [cost] -input = 0.2 -output = 0.3 +input = 0 +output = 0 [limit] context = 128000 -output = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/granite-4.0-h-micro.toml b/providers/cloudflare-ai-gateway/models/workers-ai/granite-4.0-h-micro.toml index 3ffe69a84..cc6eda186 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/granite-4.0-h-micro.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/granite-4.0-h-micro.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/granite-4.0-h-micro/ - -name = "@cf/ibm-granite/granite-4.0-h-micro" +name = "granite 4.0 h micro" +release_date = "2025-10-15" 
+last_updated = "2025-10-15" attachment = false reasoning = false -tool_call = true -open_weights = false -release_date = "2025-10-07" -last_updated = "2025-12-02" temperature = true +tool_call = false +open_weights = false -[limit] -context = 131000 +[cost] +input = 0 output = 0 -[cost] -input = 0.017 -output = 0.11 +[limit] +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/hermes-2-pro-mistral-7b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/hermes-2-pro-mistral-7b.toml deleted file mode 100644 index c8fe4427f..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/hermes-2-pro-mistral-7b.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/hermes-2-pro-mistral-7b/ - -name = "@hf/nousresearch/hermes-2-pro-mistral-7b" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-03-11" -last_updated = "2024-09-08" - -[cost] -input = 0 -output = 0 - -[limit] -context = 24000 -output = 24000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/indictrans2-en-indic-1B.toml b/providers/cloudflare-ai-gateway/models/workers-ai/indictrans2-en-indic-1B.toml new file mode 100644 index 000000000..b83d025bc --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/indictrans2-en-indic-1B.toml @@ -0,0 +1,20 @@ +name = "indictrans2 en indic 1B" +release_date = "2025-09-25" +last_updated = "2025-09-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-13b-chat-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-13b-chat-awq.toml deleted file mode 
100644 index 9c0bd41d1..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-13b-chat-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-2-13b-chat-awq/ - -name = "@hf/thebloke/llama-2-13b-chat-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-09-19" -last_updated = "2023-11-09" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-fp16.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-fp16.toml index 1a8538759..ae6c5bf03 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-fp16.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-fp16.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-2-7b-chat-fp16/ - -name = "@cf/meta/llama-2-7b-chat-fp16" +name = "llama 2 7u chat fp16" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2023-07-26" -last_updated = "2023-07-26" +tool_call = false +open_weights = false [cost] -input = 0.56 +input = 0 output = 6.67 [limit] -context = 4096 -output = 4096 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-hf-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-hf-lora.toml deleted file mode 100644 index 35172ab0c..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-hf-lora.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-2-7b-chat-hf-lora/ - -name = "@cf/meta-llama/llama-2-7b-chat-hf-lora" -attachment = 
false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-07-13" -last_updated = "2024-04-17" - -[cost] -input = 0 -output = 0 - -[limit] -context = 8192 -output = 8192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-int8.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-int8.toml deleted file mode 100644 index d9eb362c0..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-int8.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-2-7b-chat-int8/ - -name = "@cf/meta/llama-2-7b-chat-int8" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-09-25" -last_updated = "2023-09-25" - -[cost] -input = 0.556 -output = 6.667 - -[limit] -context = 8192 -output = 8192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct-awq.toml index 19de5777e..e38439032 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct-awq.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct-awq.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3-8b-instruct-awq/ - -name = "@cf/meta/llama-3-8b-instruct-awq" +name = "llama 3 8u instruct awq" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-05-09" -last_updated = "2024-05-09" +tool_call = false +open_weights = false [cost] -input = 0.12 -output = 0.27 +input = 0 +output = 0 [limit] -context = 8192 -output = 8192 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct.toml index 15410af48..92d3525f2 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3-8b-instruct/ - -name = "@cf/meta/llama-3-8b-instruct" +name = "llama 3 8u instruct" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-04-17" -last_updated = "2025-06-19" +tool_call = false +open_weights = false [cost] -input = 0.28 -output = 0.83 +input = 0 +output = 0 [limit] -context = 7968 -output = 7968 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-70b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-70b-instruct.toml deleted file mode 100644 index 307a85f63..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-70b-instruct.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.1-70b-instruct/ - -name = "@cf/meta/llama-3.1-70b-instruct" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-07-16" -last_updated = "2024-12-15" - -[cost] -input = 0.293 -output = 2.253 - -[limit] -context = 24000 -output = 24000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-awq.toml index 24b746f22..cd162c09a 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-awq.toml +++ 
b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-awq.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct-awq/ - -name = "@cf/meta/llama-3.1-8b-instruct-awq" +name = "llama 3.1 8u instruct awq" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-07-25" -last_updated = "2024-07-25" +tool_call = false +open_weights = false [cost] -input = 0.12 -output = 0.27 +input = 0 +output = 0 [limit] -context = 8192 -output = 8192 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fast.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fast.toml deleted file mode 100644 index cfff32d0e..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fast.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct-fast/ - -name = "@cf/meta/llama-3.1-8b-instruct-fast" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-07-18" -last_updated = "2024-09-25" - -[cost] -input = 0.045 -output = 0.384 - -[limit] -context = 128000 -output = 128000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fp8.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fp8.toml index 352fff5a9..b38b5c863 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fp8.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fp8.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct-fp8/ - -name = "@cf/meta/llama-3.1-8b-instruct-fp8" +name = 
"llama 3.1 8u instruct fp8" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-07-25" -last_updated = "2024-07-25" +tool_call = false +open_weights = false [cost] -input = 0.15 -output = 0.29 +input = 0 +output = 0 [limit] -context = 32000 -output = 32000 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct.toml index 26b2a40fe..22d701a33 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct/ - -name = "@cf/meta/llama-3.1-8b-instruct" +name = "llama 3.1 8u instruct" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-07-18" -last_updated = "2024-09-25" +tool_call = false +open_weights = false [cost] -input = 0.28 -output = 0.83 +input = 0 +output = 0 [limit] -context = 7968 -output = 7968 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-11b-vision-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-11b-vision-instruct.toml index d77963828..5ff407ff5 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-11b-vision-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-11b-vision-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.2-11b-vision-instruct/ - -name = "@cf/meta/llama-3.2-11b-vision-instruct" +name = "llama 3.2 11u vision instruct" 
+release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-09-18" -last_updated = "2024-12-04" +tool_call = false +open_weights = false [cost] -input = 0.049 -output = 0.68 +input = 0 +output = 0 [limit] context = 128000 -output = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-1b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-1b-instruct.toml index 9c6d02bf7..454c117da 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-1b-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-1b-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.2-1b-instruct/ - -name = "@cf/meta/llama-3.2-1b-instruct" +name = "llama 3.2 1u instruct" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-09-18" -last_updated = "2024-10-24" +tool_call = false +open_weights = false [cost] -input = 0.027 -output = 0.2 +input = 0 +output = 0 [limit] -context = 60000 -output = 60000 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-3b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-3b-instruct.toml index 6a0a2aa8b..d25baec63 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-3b-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-3b-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.2-3b-instruct/ - -name = "@cf/meta/llama-3.2-3b-instruct" +name = "llama 3.2 3u instruct" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false 
-tool_call = true temperature = true -open_weights = true -release_date = "2024-09-18" -last_updated = "2024-10-24" +tool_call = false +open_weights = false [cost] -input = 0.051 -output = 0.34 +input = 0 +output = 0 [limit] context = 128000 -output = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.3-70b-instruct-fp8-fast.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.3-70b-instruct-fp8-fast.toml index 51f436d4a..c91ce6229 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.3-70b-instruct-fp8-fast.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.3-70b-instruct-fp8-fast.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-3.3-70b-instruct-fp8-fast/ - -name = "@cf/meta/llama-3.3-70b-instruct-fp8-fast" +name = "llama 3.3 70u instruct fp8 fast" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-12-06" -last_updated = "2024-12-06" +tool_call = false +open_weights = false [cost] -input = 0.29 +input = 0 output = 2.25 [limit] -context = 24000 -output = 24000 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-4-scout-17b-16e-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-4-scout-17b-16e-instruct.toml index 27ba1174f..d30c849de 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-4-scout-17b-16e-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-4-scout-17b-16e-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-4-scout-17b-16e-instruct/ - -name = "@cf/meta/llama-4-scout-17b-16e-instruct" +name = "llama 4 scout 17u 16e instruct" +release_date = "2025-04-16" +last_updated = "2025-04-16" attachment = false 
reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2025-04-02" -last_updated = "2025-05-23" +tool_call = false +open_weights = false [cost] -input = 0.27 -output = 0.85 +input = 0 +output = 0 [limit] -context = 131000 -output = 131000 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-guard-3-8b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-guard-3-8b.toml index 3155b7c63..2516a845e 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llama-guard-3-8b.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-guard-3-8b.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/llama-guard-3-8b/ - -name = "@cf/meta/llama-guard-3-8b" +name = "llama guard 3 8b" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = false temperature = true -open_weights = true -release_date = "2024-07-22" -last_updated = "2024-10-11" +tool_call = false +open_weights = false [cost] -input = 0.48 -output = 0.03 +input = 0 +output = 0 [limit] -context = 131072 -output = 0 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llamaguard-7b-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llamaguard-7b-awq.toml deleted file mode 100644 index ddc2c123d..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llamaguard-7b-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/llamaguard-7b-awq/ - -name = "@hf/thebloke/llamaguard-7b-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-12-11" -last_updated = "2023-12-11" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = 
["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llava-1.5-7b-hf.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llava-1.5-7b-hf.toml deleted file mode 100644 index 6c371c836..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/llava-1.5-7b-hf.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/llava-1.5-7b-hf/ - -name = "@cf/llava-hf/llava-1.5-7b-hf" -attachment = true -reasoning = false -tool_call = false -temperature = true -open_weights = true -release_date = "2023-12-05" -last_updated = "2025-06-06" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["image","text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/lucid-origin.toml b/providers/cloudflare-ai-gateway/models/workers-ai/lucid-origin.toml deleted file mode 100644 index 523f2125a..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/lucid-origin.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/lucid-origin/ - -name = "@cf/leonardo/lucid-origin" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = false -release_date = "2025-08-25" -last_updated = "2025-08-05" - -[cost] -# 0.007 per 512x512 tile, 0.00013 per step -input = 0.007 -output = 0.007 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/m2m100-1.2b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/m2m100-1.2b.toml index 99024cf53..2ac034d80 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/m2m100-1.2b.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/m2m100-1.2b.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/m2m100-1.2b/ - -name = "@cf/meta/m2m100-1.2b" +name = "m2m100 1.2b" +release_date = "2025-04-03" +last_updated = 
"2025-04-03" attachment = false reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2022-03-02" -last_updated = "2023-11-16" +open_weights = false [cost] -input = 0.34 -output = 0.34 +input = 0 +output = 0 [limit] -context = 0 -output = 0 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/melotts.toml b/providers/cloudflare-ai-gateway/models/workers-ai/melotts.toml index 743028594..9e639f90d 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/melotts.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/melotts.toml @@ -1,23 +1,20 @@ -# https://developers.cloudflare.com/workers-ai/models/melotts/ - -name = "@cf/myshell-ai/melotts" -attachment = true +name = "melotts" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2024-07-19" -last_updated = "2024-07-19" +open_weights = false [cost] -# per audio minute -input = 0.0002 +input = 0 output = 0 [limit] -context = 0 -output = 0 +context = 128000 +output = 16384 [modalities] input = ["text"] -output = ["audio"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1-awq.toml deleted file mode 100644 index f91a3ade4..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.1-awq/ - -name = "@hf/thebloke/mistral-7b-instruct-v0.1-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-09-27" -last_updated = "2023-11-09" -status = "deprecated" - -[cost] -input = 0 -output = 0 - 
-[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1.toml index 74af9cc16..0299c79a4 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.1/ - -name = "@cf/mistral/mistral-7b-instruct-v0.1" +name = "mistral 7u instruct v0.1" +release_date = "2025-04-03" +last_updated = "2025-04-03" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2023-09-27" -last_updated = "2025-07-24" +tool_call = false +open_weights = false [cost] -input = 0.11 -output = 0.19 +input = 0 +output = 0 [limit] -context = 2824 -output = 2824 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2-lora.toml deleted file mode 100644 index 895418742..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2-lora.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.2-lora/ - -name = "@cf/mistral/mistral-7b-instruct-v0.2-lora" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-04-01" -last_updated = "2024-04-01" - -[cost] -input = 0 -output = 0 - -[limit] -context = 15000 -output = 15000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2.toml deleted file mode 100644 index c874e3df7..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.2/ - -name = "@hf/mistral/mistral-7b-instruct-v0.2" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-12-11" -last_updated = "2025-07-24" - -[cost] -input = 0 -output = 0 - -[limit] -context = 3072 -output = 4096 -input = 3072 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-small-3.1-24b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-small-3.1-24b-instruct.toml index 2019c66f8..a2fa6fa33 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-small-3.1-24b-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-small-3.1-24b-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/mistral-small-3.1-24b-instruct/ - -name = "@cf/mistralai/mistral-small-3.1-24b-instruct" +name = "mistral small 3.1 24u instruct" +release_date = "2025-04-11" +last_updated = "2025-04-11" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2025-03-11" -last_updated = "2025-07-28" +tool_call = false +open_weights = false [cost] -input = 0.35 -output = 0.56 +input = 0 +output = 0 [limit] context = 128000 -output = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/neural-chat-7b-v3-1-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/neural-chat-7b-v3-1-awq.toml deleted file mode 100644 index bac727eee..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/neural-chat-7b-v3-1-awq.toml +++ 
/dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/neural-chat-7b-v3-1-awq/ - -name = "@hf/thebloke/neural-chat-7b-v3-1-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-11-15" -last_updated = "2023-11-17" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/nova-3.toml b/providers/cloudflare-ai-gateway/models/workers-ai/nova-3.toml index 587477f4a..72c1cfb6e 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/nova-3.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/nova-3.toml @@ -1,22 +1,20 @@ -# https://developers.cloudflare.com/workers-ai/models/nova-3/ - -name = "@cf/deepgram/nova-3" +name = "nova 3" +release_date = "2025-11-14" +last_updated = "2025-11-14" attachment = false reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2025-06-05" -last_updated = "2025-07-08" +open_weights = false [cost] -input = 0.0052 -output = 0.0052 +input = 0 +output = 0 [limit] -context = 0 -output = 0 +context = 128000 +output = 16384 [modalities] -input = ["audio"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/openchat-3.5-0106.toml b/providers/cloudflare-ai-gateway/models/workers-ai/openchat-3.5-0106.toml deleted file mode 100644 index 8ae0ee82d..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/openchat-3.5-0106.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/openchat-3.5-0106/ - -name = "@cf/openchat/openchat-3.5-0106" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-01-07" -last_updated = "2024-05-18" -status = "deprecated" - -[cost] -input = 0 
-output = 0 - -[limit] -context = 8192 -output = 8192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/openhermes-2.5-mistral-7b-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/openhermes-2.5-mistral-7b-awq.toml deleted file mode 100644 index de9818c32..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/openhermes-2.5-mistral-7b-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/openhermes-2.5-mistral-7b-awq/ - -name = "@hf/thebloke/openhermes-2.5-mistral-7b-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-11-02" -last_updated = "2023-11-09" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/phi-2.toml b/providers/cloudflare-ai-gateway/models/workers-ai/phi-2.toml deleted file mode 100644 index f7b41a400..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/phi-2.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/phi-2/ - -name = "@cf/microsoft/phi-2" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-12-13" -last_updated = "2024-04-29" - -[cost] -input = 0 -output = 0 - -[limit] -context = 2048 -output = 2048 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/phoenix-1.0.toml b/providers/cloudflare-ai-gateway/models/workers-ai/phoenix-1.0.toml deleted file mode 100644 index cb9eff10a..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/phoenix-1.0.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/phoenix-1.0/ - -name = "@cf/leonardo/phoenix-1.0" 
-attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = false -release_date = "2025-08-25" -last_updated = "2025-08-25" - -[cost] -# 0.0058 per 512x512 step, 0.00011 per step -input = 0.0058 -output = 0.0058 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/plamo-embedding-1b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/plamo-embedding-1b.toml new file mode 100644 index 000000000..7430ec275 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/plamo-embedding-1b.toml @@ -0,0 +1,20 @@ +name = "plamo embedding 1b" +release_date = "2025-09-25" +last_updated = "2025-09-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-0.5b-chat.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-0.5b-chat.toml deleted file mode 100644 index 02a89d2e2..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-0.5b-chat.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/qwen1.5-0.5b-chat/ - -name = "@cf/qwen/qwen1.5-0.5b-chat" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-01-31" -last_updated = "2024-04-30" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 32000 -output = 32000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-1.8b-chat.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-1.8b-chat.toml deleted file mode 100644 index 8fc56a863..000000000 ---
a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-1.8b-chat.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/qwen1.5-1.8b-chat/ - -name = "@cf/qwen/qwen1.5-1.8b-chat" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-01-30" -last_updated = "2024-04-30" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 32000 -output = 32000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-14b-chat-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-14b-chat-awq.toml deleted file mode 100644 index 0ea4a2f81..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-14b-chat-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/qwen1.5-14b-chat-awq/ - -name = "@cf/qwen/qwen1.5-14b-chat-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-02-03" -last_updated = "2024-04-30" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 7500 -output = 7500 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-7b-chat-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-7b-chat-awq.toml deleted file mode 100644 index 2cfdd8f25..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-7b-chat-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/qwen1.5-7b-chat-awq/ - -name = "@cf/qwen/qwen1.5-7b-chat-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-02-03" -last_updated = "2024-04-30" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 20000 -output = 20000 - 
-[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen2.5-coder-32b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen2.5-coder-32b-instruct.toml index 639fb5929..ac2f93e96 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/qwen2.5-coder-32b-instruct.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen2.5-coder-32b-instruct.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/qwen2.5-coder-32b-instruct/ - -name = "@cf/qwen/qwen2.5-coder-32b-instruct" +name = "qwen2.5 coder 32b instruct" +release_date = "2025-04-11" +last_updated = "2025-04-11" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2024-11-06" -last_updated = "2025-01-12" +tool_call = false +open_weights = false [cost] -input = 0.66 +input = 0 output = 1 [limit] -context = 32768 -output = 32768 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-30b-a3b-fp8.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-30b-a3b-fp8.toml index 2e92e4d78..ab502d4e8 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-30b-a3b-fp8.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-30b-a3b-fp8.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/qwen3-30b-a3b-fp8/ - -name = "@cf/qwen/qwen3-30b-a3b-fp8" +name = "qwen3 30b a3b fp8" +release_date = "2025-11-14" +last_updated = "2025-11-14" attachment = false -reasoning = true -tool_call = true -open_weights = true -release_date = "2025-04-30" -last_updated = "2025-12-02" +reasoning = false temperature = true +tool_call = false +open_weights = false -[limit] -context = 32768 +[cost] +input = 0 output = 0 -[cost] -input = 0.051 -output = 0.34 +[limit] +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git
a/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-embedding-0.6b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-embedding-0.6b.toml new file mode 100644 index 000000000..2810abe76 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-embedding-0.6b.toml @@ -0,0 +1,20 @@ +name = "qwen3 embedding 0.6b" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwq-32b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwq-32b.toml index 1641cb43e..86f2db731 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/qwq-32b.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwq-32b.toml @@ -1,21 +1,19 @@ -# https://developers.cloudflare.com/workers-ai/models/qwq-32b/ - -name = "@cf/qwen/qwq-32b" +name = "qwq 32b" +release_date = "2025-04-11" +last_updated = "2025-04-11" attachment = false reasoning = false -tool_call = true temperature = true -open_weights = true -release_date = "2025-03-05" -last_updated = "2025-03-11" +tool_call = false +open_weights = false [cost] -input = 0.66 +input = 0 output = 1 [limit] -context = 24000 -output = 24000 +context = 128000 +output = 16384 [modalities] input = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/resnet-50.toml b/providers/cloudflare-ai-gateway/models/workers-ai/resnet-50.toml deleted file mode 100644 index 3c040ddbd..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/resnet-50.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/resnet-50/ - -name = "@cf/microsoft/resnet-50" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date =
"2022-03-16" -last_updated = "2024-02-13" - -[cost] -# per inference request -input = 0.0000025 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/smart-turn-v2.toml b/providers/cloudflare-ai-gateway/models/workers-ai/smart-turn-v2.toml new file mode 100644 index 000000000..2ba3ee7b1 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/smart-turn-v2.toml @@ -0,0 +1,20 @@ +name = "smart turn v2" +release_date = "2025-11-14" +last_updated = "2025-11-14" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = false + +[cost] +input = 0 +output = 0 + +[limit] +context = 128000 +output = 16384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/sqlcoder-7b-2.toml b/providers/cloudflare-ai-gateway/models/workers-ai/sqlcoder-7b-2.toml deleted file mode 100644 index 8c8e99942..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/sqlcoder-7b-2.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/sqlcoder-7b-2/ - -name = "@cf/defog/sqlcoder-7b-2" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-02-05" -last_updated = "2024-02-12" - -[cost] -input = 0 -output = 0 - -[limit] -context = 10000 -output = 10000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-img2img.toml b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-img2img.toml deleted file mode 100644 index 0f55cd660..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-img2img.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-v1-5-img2img/ - -name = 
"@cf/runwayml/stable-diffusion-v1-5-img2img" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2024-02-27" -last_updated = "2024-02-27" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-inpainting.toml b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-inpainting.toml deleted file mode 100644 index 2ad25e021..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-inpainting.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-v1-5-inpainting/ - -name = "@cf/runwayml/stable-diffusion-v1-5-inpainting" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2024-02-27" -last_updated = "2024-02-27" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-base-1.0.toml b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-base-1.0.toml deleted file mode 100644 index f0362810f..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-base-1.0.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-xl-base-1.0/ - -name = "@cf/stabilityai/stable-diffusion-xl-base-1.0" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2023-07-25" -last_updated = "2023-10-30" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-lightning.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-lightning.toml deleted file mode 100644 index bf716787a..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-lightning.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-xl-lightning/ - -name = "@cf/bytedance/stable-diffusion-xl-lightning" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2024-02-20" -last_updated = "2024-04-03" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["text"] -output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/starling-lm-7b-beta.toml b/providers/cloudflare-ai-gateway/models/workers-ai/starling-lm-7b-beta.toml deleted file mode 100644 index fa47b3f96..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/starling-lm-7b-beta.toml +++ /dev/null @@ -1,24 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/starling-lm-7b-beta/ - -name = "@hf/nexusflow/starling-lm-7b-beta" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2024-03-19" -last_updated = "2024-04-03" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 -input = 3072 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/tinyllama-1.1b-chat-v1.0.toml b/providers/cloudflare-ai-gateway/models/workers-ai/tinyllama-1.1b-chat-v1.0.toml deleted file mode 100644 index a1c067907..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/tinyllama-1.1b-chat-v1.0.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/tinyllama-1.1b-chat-v1.0/ - -name = "@cf/tinyllama/tinyllama-1.1b-chat-v1.0" -attachment = false -reasoning = false -tool_call = true 
-temperature = true -open_weights = true -release_date = "2023-12-30" -last_updated = "2024-03-17" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 2048 -output = 2048 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/uform-gen2-qwen-500m.toml b/providers/cloudflare-ai-gateway/models/workers-ai/uform-gen2-qwen-500m.toml deleted file mode 100644 index ce3a7db6e..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/uform-gen2-qwen-500m.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/uform-gen2-qwen-500m/ - -name = "@cf/unum/uform-gen2-qwen-500m" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2024-02-15" -last_updated = "2024-04-24" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["image","text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/una-cybertron-7b-v2-bf16.toml b/providers/cloudflare-ai-gateway/models/workers-ai/una-cybertron-7b-v2-bf16.toml deleted file mode 100644 index 0b43b8de0..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/una-cybertron-7b-v2-bf16.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/una-cybertron-7b-v2-bf16/ - -name = "@cf/fblgit/una-cybertron-7b-v2-bf16" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-12-02" -last_updated = "2024-03-08" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 15000 -output = 15000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/whisper-large-v3-turbo.toml b/providers/cloudflare-ai-gateway/models/workers-ai/whisper-large-v3-turbo.toml index f787da6ef..586f3110e 100644 --- 
a/providers/cloudflare-ai-gateway/models/workers-ai/whisper-large-v3-turbo.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/whisper-large-v3-turbo.toml @@ -1,23 +1,20 @@ -# https://developers.cloudflare.com/workers-ai/models/whisper-large-v3-turbo/ - -name = "@cf/openai/whisper-large-v3-turbo" +name = "whisper large v3 turbo" +release_date = "2025-11-14" +last_updated = "2025-11-14" attachment = false reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2024-10-01" -last_updated = "2024-10-04" +open_weights = false [cost] -# per audio minute -input = 0.00051 -output = 0.00051 +input = 0 +output = 0 [limit] -context = 0 -output = 0 +context = 128000 +output = 16384 [modalities] -input = ["audio"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/whisper-tiny-en.toml b/providers/cloudflare-ai-gateway/models/workers-ai/whisper-tiny-en.toml deleted file mode 100644 index 703086d37..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/whisper-tiny-en.toml +++ /dev/null @@ -1,22 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/whisper-tiny-en/ - -name = "@cf/openai/whisper-tiny-en" -attachment = false -reasoning = false -tool_call = false -temperature = false -open_weights = true -release_date = "2022-09-26" -last_updated = "2024-01-22" - -[cost] -input = 0 -output = 0 - -[limit] -context = 0 -output = 0 - -[modalities] -input = ["audio"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/whisper.toml b/providers/cloudflare-ai-gateway/models/workers-ai/whisper.toml index 442509455..b631e1d5e 100644 --- a/providers/cloudflare-ai-gateway/models/workers-ai/whisper.toml +++ b/providers/cloudflare-ai-gateway/models/workers-ai/whisper.toml @@ -1,23 +1,20 @@ -# https://developers.cloudflare.com/workers-ai/models/whisper/ - -name = "@cf/openai/whisper" +name = "whisper" +release_date = "2025-11-14"
+last_updated = "2025-11-14" attachment = false reasoning = false +temperature = true tool_call = false -temperature = false -open_weights = true -release_date = "2023-11-07" -last_updated = "2024-08-12" +open_weights = false [cost] -# per audio minute -input = 0.00045 -output = 0.00045 +input = 0 +output = 0 [limit] -context = 0 -output = 0 +context = 128000 +output = 16384 [modalities] -input = ["audio"] +input = ["text"] output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/zephyr-7b-beta-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/zephyr-7b-beta-awq.toml deleted file mode 100644 index db4c96fdd..000000000 --- a/providers/cloudflare-ai-gateway/models/workers-ai/zephyr-7b-beta-awq.toml +++ /dev/null @@ -1,23 +0,0 @@ -# https://developers.cloudflare.com/workers-ai/models/zephyr-7b-beta-awq/ - -name = "@hf/thebloke/zephyr-7b-beta-awq" -attachment = false -reasoning = false -tool_call = true -temperature = true -open_weights = true -release_date = "2023-10-27" -last_updated = "2023-11-09" -status = "deprecated" - -[cost] -input = 0 -output = 0 - -[limit] -context = 4096 -output = 4096 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-beta.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-beta.toml deleted file mode 100644 index 5f2c5141e..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-beta.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Grok 3 Beta" -release_date = "2025-02-17" -last_updated = "2025-02-17" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-11" -tool_call = true -open_weights = false - -[cost] -input = 3.00 -output = 15.00 -cache_read = 0.75 -cache_write = 15.00 - -[limit] -context = 131_072 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini-beta.toml 
b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini-beta.toml deleted file mode 100644 index 4bb152bb6..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini-beta.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Grok 3 Mini Beta" -release_date = "2025-02-17" -last_updated = "2025-02-17" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-11" -tool_call = true -open_weights = false - -[cost] -input = 0.30 -output = 0.50 -cache_read = 0.075 -cache_write = 0.50 - -[limit] -context = 131_072 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini.toml deleted file mode 100644 index c1652e201..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Grok 3 Mini" -release_date = "2025-02-17" -last_updated = "2025-02-17" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-11" -tool_call = true -open_weights = false - -[cost] -input = 0.30 -output = 0.50 -cache_read = 0.075 -cache_write = 0.50 - -[limit] -context = 131_072 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-3.toml deleted file mode 100644 index 56069a584..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-3.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Grok 3" -release_date = "2025-02-17" -last_updated = "2025-02-17" -attachment = false -reasoning = false -temperature = true -knowledge = "2024-11" -tool_call = true -open_weights = false - -[cost] -input = 3.00 -output = 15.00 -cache_read = 0.75 -cache_write = 15.00 - -[limit] -context = 131_072 -output = 8_192 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-4-fast.toml 
b/providers/cloudflare-ai-gateway/models/x-ai/grok-4-fast.toml deleted file mode 100644 index a592d3f13..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-4-fast.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Grok 4 Fast" -release_date = "2025-08-19" -last_updated = "2025-08-19" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-11" -tool_call = true -open_weights = false - -[cost] -input = 0.20 -output = 0.50 -cache_read = 0.05 -cache_write = 0.05 - -[limit] -context = 2_000_000 -output = 30_000 - -[modalities] -input = ["text", "image"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-4.1-fast.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-4.1-fast.toml deleted file mode 100644 index 17833565b..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-4.1-fast.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Grok 4.1 Fast" -release_date = "2025-11-19" -last_updated = "2025-11-19" -attachment = false -reasoning = true -temperature = true -knowledge = "2024-11" -tool_call = true -open_weights = false - -[cost] -input = 0.20 -output = 0.50 -cache_read = 0.05 -cache_write = 0.05 - -[limit] -context = 2_000_000 -output = 30_000 - -[modalities] -input = ["text", "image"] -output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-4.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-4.toml deleted file mode 100644 index ef04f7356..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-4.toml +++ /dev/null @@ -1,23 +0,0 @@ -name = "Grok 4" -release_date = "2025-07-09" -last_updated = "2025-07-09" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-07" -tool_call = true -open_weights = false - -[cost] -input = 3.00 -output = 15.00 -cache_read = 0.75 -cache_write = 15.00 - -[limit] -context = 256_000 -output = 64_000 - -[modalities] -input = ["text"] -output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/x-ai/grok-code-fast-1.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-code-fast-1.toml deleted file mode 100644 index 4ec798dd2..000000000 --- a/providers/cloudflare-ai-gateway/models/x-ai/grok-code-fast-1.toml +++ /dev/null @@ -1,22 +0,0 @@ -name = "Grok Code Fast 1" -release_date = "2025-08-26" -last_updated = "2025-08-26" -attachment = false -reasoning = true -temperature = true -knowledge = "2025-08" -tool_call = true -open_weights = false - -[cost] -input = 0.20 -output = 1.50 -cache_read = 0.02 - -[limit] -context = 256_000 -output = 10_000 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/cloudflare-ai-gateway/provider.toml b/providers/cloudflare-ai-gateway/provider.toml index 2fec3c9ec..369e34b75 100644 --- a/providers/cloudflare-ai-gateway/provider.toml +++ b/providers/cloudflare-ai-gateway/provider.toml @@ -1,4 +1,5 @@ name = "Cloudflare AI Gateway" env = ["CLOUDFLARE_API_TOKEN", "CLOUDFLARE_ACCOUNT_ID", "CLOUDFLARE_GATEWAY_ID"] -npm = "ai-gateway-provider" +npm = "@ai-sdk/openai-compatible" +api = "https://gateway.ai.cloudflare.com/v1/${CLOUDFLARE_ACCOUNT_ID}/${CLOUDFLARE_GATEWAY_ID}/compat/" doc = "https://developers.cloudflare.com/ai-gateway/"