diff --git a/providers/cloudflare-ai-gateway/logo.svg b/providers/cloudflare-ai-gateway/logo.svg new file mode 100644 index 000000000..f04d0959f --- /dev/null +++ b/providers/cloudflare-ai-gateway/logo.svg @@ -0,0 +1,6 @@ + + + + + + diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-haiku.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-haiku.toml new file mode 100644 index 000000000..0afeca15b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.5-haiku.toml @@ -0,0 +1,23 @@ +name = "Claude Haiku 3.5" +release_date = "2024-10-22" +last_updated = "2024-10-22" +attachment = true +reasoning = false +temperature = true +tool_call = true +knowledge = "2024-07-31" +open_weights = false + +[cost] +input = 0.80 +output = 4.00 +cache_read = 0.08 +cache_write = 1.00 + +[limit] +context = 200_000 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-3.7-sonnet.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.7-sonnet.toml new file mode 100644 index 000000000..5e4acc601 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-3.7-sonnet.toml @@ -0,0 +1,23 @@ +name = "Claude Sonnet 3.7" +release_date = "2025-02-19" +last_updated = "2025-02-19" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2024-01" +open_weights = false + +[cost] +input = 15.00 +output = 75.00 +cache_read = 1.50 +cache_write = 18.75 + +[limit] +context = 200_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4.5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4.5.toml new file mode 100644 index 000000000..9476e8081 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-haiku-4.5.toml @@ -0,0 +1,23 @@ +name = "Claude Haiku 4.5" 
+release_date = "2025-10-15" +last_updated = "2025-10-15" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-02-28" +open_weights = false + +[cost] +input = 1.00 +output = 5.00 +cache_read = 0.10 +cache_write = 1.25 + +[limit] +context = 200_000 +output = 64_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.1.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.1.toml new file mode 100644 index 000000000..a1f0975e2 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.1.toml @@ -0,0 +1,23 @@ +name = "Claude Opus 4.1" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-03-31" +open_weights = false + +[cost] +input = 15.00 +output = 75.00 +cache_read = 1.50 +cache_write = 18.75 + +[limit] +context = 200_000 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.5.toml new file mode 100644 index 000000000..a9addac14 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.5.toml @@ -0,0 +1,23 @@ +name = "Claude Opus 4.5" +release_date = "2025-11-24" +last_updated = "2025-11-24" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-05-30" +open_weights = false + +[cost] +input = 5.00 +output = 25.00 +cache_read = 0.50 +cache_write = 6.25 + +[limit] +context = 200_000 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.toml new file mode 100644 index 000000000..96019db43 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/anthropic/claude-opus-4.toml @@ -0,0 +1,23 @@ +name = "Claude Opus 4" +release_date = "2025-05-22" +last_updated = "2025-05-22" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-03-31" +open_weights = false + +[cost] +input = 15.00 +output = 75.00 +cache_read = 1.50 +cache_write = 18.75 + +[limit] +context = 200_000 +output = 32_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.5.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.5.toml new file mode 100644 index 000000000..328e11098 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.5.toml @@ -0,0 +1,29 @@ +name = "Claude Sonnet 4.5" +release_date = "2025-09-29" +last_updated = "2025-09-29" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-07-31" +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 +cache_write = 3.75 + +[cost.context_over_200k] +input = 6.00 +output = 22.50 +cache_read = 0.60 +cache_write = 7.50 + +[limit] +context = 1_000_000 +output = 64_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.toml b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.toml new file mode 100644 index 000000000..9ccbe8098 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/anthropic/claude-sonnet-4.toml @@ -0,0 +1,29 @@ +name = "Claude Sonnet 4" +release_date = "2025-05-22" +last_updated = "2025-05-22" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-03-31" +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.30 +cache_write = 3.75 + +[cost.context_over_200k] +input = 6.00 +output = 22.50 +cache_read = 0.60 +cache_write = 7.50 + +[limit] 
+context = 200_000 +output = 64_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3-0324.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3-0324.toml new file mode 100644 index 000000000..94d71a57f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3-0324.toml @@ -0,0 +1,16 @@ +id = "deepseek/deepseek-chat-v3-0324:free" +name = "DeepSeek V3 0324" +release_date = "2025-03-24" +last_updated = "2025-03-24" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-10" +tool_call = false +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 16384, output = 8192 } + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3.1.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3.1.toml new file mode 100644 index 000000000..30b01d765 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-chat-v3.1.toml @@ -0,0 +1,21 @@ +name = "DeepSeek-V3.1" +release_date = "2025-08-21" +last_updated = "2025-08-21" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-07" +tool_call = true +open_weights = true + +[cost] +input = 0.20 +output = 0.80 + +[limit] +context = 163_840 +output = 163_840 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528-qwen3-8b:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528-qwen3-8b:free.toml new file mode 100644 index 000000000..736ed3524 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528-qwen3-8b:free.toml @@ -0,0 +1,21 @@ +name = "Deepseek R1 0528 Qwen3 8B (free)" +release_date = "2025-05-29" +last_updated = "2025-05-29" +attachment = false +reasoning = true +temperature = 
true +knowledge = "2025-05" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 131_072 +output = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528:free.toml new file mode 100644 index 000000000..0d62f4504 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-0528:free.toml @@ -0,0 +1,21 @@ +name = "R1 0528 (free)" +release_date = "2025-05-28" +last_updated = "2025-05-28" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 163_840 +output = 163_840 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-llama-70b.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-llama-70b.toml new file mode 100644 index 000000000..cba6b81ff --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-llama-70b.toml @@ -0,0 +1,16 @@ +id = "deepseek/deepseek-r1-distill-llama-70b:free" +name = "DeepSeek R1 Distill Llama 70B" +release_date = "2025-01-23" +last_updated = "2025-01-23" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-10" +tool_call = false +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 8192, output = 8192 } + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-qwen-14b.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-qwen-14b.toml new file mode 100644 index 000000000..500930a64 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1-distill-qwen-14b.toml @@ -0,0 +1,16 @@ +id = "deepseek/deepseek-r1-distill-qwen-14b:free" +name = "DeepSeek R1 Distill Qwen 14B" +release_date = "2025-01-29" +last_updated = "2025-01-29" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-10" +tool_call = false +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 64000, output = 8192 } + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1:free.toml new file mode 100644 index 000000000..eabdfb36e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-r1:free.toml @@ -0,0 +1,21 @@ +name = "R1 (free)" +release_date = "2025-01-20" +last_updated = "2025-01-20" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 163_840 +output = 163_840 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3-base:free.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3-base:free.toml new file mode 100644 index 000000000..c87d9aa1a --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3-base:free.toml @@ -0,0 +1,21 @@ +name = "DeepSeek V3 Base (free)" +release_date = "2025-03-29" +last_updated = "2025-03-29" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-03" +tool_call = false +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 163_840 +output = 163_840 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git 
a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus.toml new file mode 100644 index 000000000..a78c43ba1 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus.toml @@ -0,0 +1,21 @@ +name = "DeepSeek V3.1 Terminus" +release_date = "2025-09-22" +last_updated = "2025-09-22" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-07" +tool_call = true +open_weights = true + +[cost] +input = 0.27 +output = 1.00 + +[limit] +context = 131_072 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus:exacto.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus:exacto.toml new file mode 100644 index 000000000..373c4b575 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.1-terminus:exacto.toml @@ -0,0 +1,21 @@ +name = "DeepSeek V3.1 Terminus (exacto)" +release_date = "2025-09-22" +last_updated = "2025-09-22" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-07" +tool_call = true +open_weights = true + +[cost] +input = 0.27 +output = 1.00 + +[limit] +context = 131_072 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2-speciale.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2-speciale.toml new file mode 100644 index 000000000..023f7d0c8 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2-speciale.toml @@ -0,0 +1,21 @@ +name = "DeepSeek V3.2 Speciale" +release_date = "2025-12-01" +last_updated = "2025-12-01" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-07" +tool_call = true +open_weights = true + +[cost] +input = 0.27 +output = 0.41 + +[limit] +context = 163_840 +output = 65_536 
+ +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2.toml b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2.toml new file mode 100644 index 000000000..ab57aee8b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/deepseek/deepseek-v3.2.toml @@ -0,0 +1,21 @@ +name = "DeepSeek V3.2" +release_date = "2025-12-01" +last_updated = "2025-12-01" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-07" +tool_call = true +open_weights = true + +[cost] +input = 0.28 +output = 0.40 + +[limit] +context = 163_840 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-001.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-001.toml new file mode 100644 index 000000000..5168a0cd2 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-001.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.0 Flash" +release_date = "2024-12-11" +last_updated = "2024-12-11" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-06" +tool_call = true +open_weights = false + +[cost] +input = 0.10 +output = 0.40 +cache_read = 0.025 + +[limit] +context = 1_048_576 +output = 8_192 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-exp:free.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-exp:free.toml new file mode 100644 index 000000000..ae135080e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.0-flash-exp:free.toml @@ -0,0 +1,21 @@ +name = "Gemini 2.0 Flash Experimental (free)" +release_date = "2024-12-11" +last_updated = "2024-12-11" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-12" +tool_call 
= true +open_weights = false + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 1_048_576 +output = 1_048_576 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite-preview-09-2025.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite-preview-09-2025.toml new file mode 100644 index 000000000..f0dcb0495 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite-preview-09-2025.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Lite Preview 09-25" +release_date = "2025-09-25" +last_updated = "2025-09-25" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = false + +[cost] +input = 0.10 +output = 0.40 +cache_read = 0.025 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite.toml new file mode 100644 index 000000000..4a534b571 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-lite.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Lite" +release_date = "2025-06-17" +last_updated = "2025-06-17" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = false + +[cost] +input = 0.10 +output = 0.40 +cache_read = 0.025 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-preview-09-2025.toml 
b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-preview-09-2025.toml new file mode 100644 index 000000000..5ee14ca12 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash-preview-09-2025.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash Preview 09-25" +release_date = "2025-09-25" +last_updated = "2025-09-25" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = false + +[cost] +input = 0.30 +output = 2.50 +cache_read = 0.031 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash.toml new file mode 100644 index 000000000..3c4458c21 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-flash.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Flash" +release_date = "2025-07-17" +last_updated = "2025-07-17" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = false + +[cost] +input = 0.30 +output = 2.50 +cache_read = 0.0375 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-05-06.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-05-06.toml new file mode 100644 index 000000000..3618677e9 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-05-06.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Pro Preview 05-06" +release_date = "2025-05-06" +last_updated = "2025-05-06" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" 
+tool_call = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.31 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-06-05.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-06-05.toml new file mode 100644 index 000000000..82ee677b3 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro-preview-06-05.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Pro Preview 06-05" +release_date = "2025-06-05" +last_updated = "2025-06-05" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.31 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro.toml new file mode 100644 index 000000000..0e0d4a881 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-2.5-pro.toml @@ -0,0 +1,22 @@ +name = "Gemini 2.5 Pro" +release_date = "2025-03-20" +last_updated = "2025-06-05" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.31 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-3-pro-preview.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-3-pro-preview.toml new file mode 100644 index 000000000..e05d22307 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemini-3-pro-preview.toml @@ -0,0 +1,24 @@ +name = "Gemini 3 Pro Preview" +release_date = "2025-11-18" +last_updated = "2025-11" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-01" +tool_call = true +open_weights = false + +[cost] +input = 2.00 +output = 12.00 + +[limit] +context = 1_050_000 +output = 66_000 + +[modalities] +input = ["text", "image", "audio", "video", "pdf"] +output = ["text"] + +[provider] +npm = "@openrouter/ai-sdk-provider" diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-2-9b-it:free.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-2-9b-it:free.toml new file mode 100644 index 000000000..4de372415 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-2-9b-it:free.toml @@ -0,0 +1,21 @@ +name = "Gemma 2 9B (free)" +release_date = "2024-06-28" +last_updated = "2024-06-28" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-06" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-12b-it.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-12b-it.toml new file mode 100644 index 000000000..8efc679b2 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-12b-it.toml @@ -0,0 +1,16 @@ +id = "google/gemma-3-12b-it:free" +name = "Gemma 3 12B IT" +release_date = "2025-03-13" +last_updated = "2025-03-13" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-10" +tool_call = true +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 96000, output = 8192 } + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git 
a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-27b-it.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-27b-it.toml new file mode 100644 index 000000000..5fc7e02d7 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3-27b-it.toml @@ -0,0 +1,16 @@ +id = "google/gemma-3-27b-it:free" +name = "Gemma 3 27B IT" +release_date = "2025-03-12" +last_updated = "2025-03-12" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-10" +tool_call = true +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 96000, output = 8192 } + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it.toml new file mode 100644 index 000000000..03723bbb3 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it.toml @@ -0,0 +1,16 @@ +id = "google/gemma-3n-e4b-it:free" +name = "Gemma 3n E4B IT" +release_date = "2025-05-20" +last_updated = "2025-05-20" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-10" +tool_call = false +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 8192, output = 8192 } + +[modalities] +input = ["text", "image", "audio"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it:free.toml b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it:free.toml new file mode 100644 index 000000000..190fcb985 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/google-ai-studio/gemma-3n-e4b-it:free.toml @@ -0,0 +1,21 @@ +name = "Gemma 3n 4B (free)" +release_date = "2025-05-20" +last_updated = "2025-05-20" +attachment = true +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = 
true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text", "image", "audio"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/groq/deepseek-r1-distill-llama-70b.toml b/providers/cloudflare-ai-gateway/models/groq/deepseek-r1-distill-llama-70b.toml new file mode 100644 index 000000000..0b2502a3c --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/deepseek-r1-distill-llama-70b.toml @@ -0,0 +1,19 @@ +name = "DeepSeek R1 Distill Llama 70B" +release_date = "2025-01-20" +last_updated = "2025-01-20" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-07" +tool_call = true +open_weights = true +status = "deprecated" + + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/gemma2-9b-it.toml b/providers/cloudflare-ai-gateway/models/groq/gemma2-9b-it.toml new file mode 100644 index 000000000..438069e93 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/gemma2-9b-it.toml @@ -0,0 +1,18 @@ +name = "Gemma 2 9B" +release_date = "2024-06-27" +last_updated = "2024-06-27" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-06" +tool_call = true +open_weights = true +status = "deprecated" + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama-3.1-8b-instant.toml b/providers/cloudflare-ai-gateway/models/groq/llama-3.1-8b-instant.toml new file mode 100644 index 000000000..90c84f3eb --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/llama-3.1-8b-instant.toml @@ -0,0 +1,17 @@ +name = "Llama 3.1 8B Instant" +release_date = "2024-07-23" +last_updated = "2024-07-23" +attachment = false +reasoning = false +temperature = true +knowledge = "2023-12" +tool_call = true 
+open_weights = true + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama-3.3-70b-versatile.toml b/providers/cloudflare-ai-gateway/models/groq/llama-3.3-70b-versatile.toml new file mode 100644 index 000000000..f39ab2074 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/llama-3.3-70b-versatile.toml @@ -0,0 +1,17 @@ +name = "Llama 3.3 70B Versatile" +release_date = "2024-12-06" +last_updated = "2024-12-06" +attachment = false +reasoning = false +temperature = true +knowledge = "2023-12" +tool_call = true +open_weights = true + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama-guard-3-8b.toml b/providers/cloudflare-ai-gateway/models/groq/llama-guard-3-8b.toml new file mode 100644 index 000000000..4e9ad068f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/llama-guard-3-8b.toml @@ -0,0 +1,18 @@ +name = "Llama Guard 3 8B" +release_date = "2024-07-23" +last_updated = "2024-07-23" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true +status = "deprecated" + + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/llama3-70b-8192.toml b/providers/cloudflare-ai-gateway/models/groq/llama3-70b-8192.toml new file mode 100644 index 000000000..bae5b60d1 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/llama3-70b-8192.toml @@ -0,0 +1,19 @@ +name = "Llama 3 70B" +release_date = "2024-04-18" +last_updated = "2024-04-18" +attachment = false +reasoning = false +temperature = true +knowledge = "2023-03" +tool_call = true +open_weights = true +status = "deprecated" + + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/groq/llama3-8b-8192.toml b/providers/cloudflare-ai-gateway/models/groq/llama3-8b-8192.toml new file mode 100644 index 000000000..2c28f1a84 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/llama3-8b-8192.toml @@ -0,0 +1,18 @@ +name = "Llama 3 8B" +release_date = "2024-04-18" +last_updated = "2024-04-18" +attachment = false +reasoning = false +temperature = true +knowledge = "2023-03" +tool_call = true +open_weights = true +status = "deprecated" + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-maverick-17b-128e-instruct.toml b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-maverick-17b-128e-instruct.toml new file mode 100644 index 000000000..f7ef6016e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-maverick-17b-128e-instruct.toml @@ -0,0 +1,17 @@ +name = "Llama 4 Maverick 17B" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-08" +tool_call = true +open_weights = true + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-scout-17b-16e-instruct.toml b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-scout-17b-16e-instruct.toml new file mode 100644 index 000000000..a5fe7ff54 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-4-scout-17b-16e-instruct.toml @@ -0,0 +1,17 @@ +name = "Llama 4 Scout 17B" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-08" +tool_call = true +open_weights = true + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = ["text"] diff 
--git a/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-guard-4-12b.toml b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-guard-4-12b.toml new file mode 100644 index 000000000..7e257022c --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/meta-llama/llama-guard-4-12b.toml @@ -0,0 +1,16 @@ +name = "Llama Guard 4 12B" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[limit] +context = 131_072 +output = 128 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/mistral-saba-24b.toml b/providers/cloudflare-ai-gateway/models/groq/mistral-saba-24b.toml new file mode 100644 index 000000000..78b6968e5 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/mistral-saba-24b.toml @@ -0,0 +1,19 @@ +name = "Mistral Saba 24B" +release_date = "2025-02-06" +last_updated = "2025-02-06" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-08" +tool_call = true +open_weights = false +status = "deprecated" + + +[limit] +context = 32_768 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct-0905.toml b/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct-0905.toml new file mode 100644 index 000000000..7456acc02 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct-0905.toml @@ -0,0 +1,17 @@ +name = "Kimi K2 Instruct 0905" +release_date = "2025-09-05" +last_updated = "2025-09-05" +attachment = false +reasoning = false +temperature = true +tool_call = true +knowledge = "2024-10" +open_weights = true + +[limit] +context = 262_144 +output = 16_384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct.toml 
b/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct.toml new file mode 100644 index 000000000..821613e6f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/moonshotai/kimi-k2-instruct.toml @@ -0,0 +1,18 @@ +name = "Kimi K2 Instruct" +release_date = "2025-07-14" +last_updated = "2025-07-14" +attachment = false +reasoning = false +temperature = true +tool_call = true +knowledge = "2024-10" +open_weights = true +status = "deprecated" + +[limit] +context = 131_072 +output = 16_384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-120b.toml b/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-120b.toml new file mode 100644 index 000000000..02d65e606 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-120b.toml @@ -0,0 +1,16 @@ +name = "GPT OSS 120B" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-20b.toml b/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-20b.toml new file mode 100644 index 000000000..116e1f0de --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/openai/gpt-oss-20b.toml @@ -0,0 +1,16 @@ +name = "GPT OSS 20B" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/qwen-qwq-32b.toml b/providers/cloudflare-ai-gateway/models/groq/qwen-qwq-32b.toml new file mode 100644 index 000000000..a1b0dd799 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/groq/qwen-qwq-32b.toml @@ -0,0 +1,17 @@ +name = "Qwen QwQ 32B" +release_date = "2024-11-27" +last_updated = "2024-11-27" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-09" +tool_call = true +open_weights = true + +[limit] +context = 131_072 +output = 16_384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/groq/qwen/qwen3-32b.toml b/providers/cloudflare-ai-gateway/models/groq/qwen/qwen3-32b.toml new file mode 100644 index 000000000..2afb927c3 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/groq/qwen/qwen3-32b.toml @@ -0,0 +1,17 @@ +name = "Qwen3 32B" +release_date = "2024-12-23" +last_updated = "2024-12-23" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-11-08" +tool_call = true +open_weights = true + +[limit] +context = 131_072 +output = 16_384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/codestral-2508.toml b/providers/cloudflare-ai-gateway/models/mistralai/codestral-2508.toml new file mode 100644 index 000000000..642db9246 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/codestral-2508.toml @@ -0,0 +1,21 @@ +name = "Codestral 2508" +release_date = "2025-08-01" +last_updated = "2025-08-01" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = true + +[cost] +input = 0.30 +output = 0.90 + +[limit] +context = 256_000 +output = 256_000 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-medium-2507.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-medium-2507.toml new file mode 100644 index 000000000..d514e4688 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/devstral-medium-2507.toml @@ -0,0 +1,21 @@ +name = "Devstral 
Medium" +release_date = "2025-07-10" +last_updated = "2025-07-10" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = true + +[cost] +input = 0.40 +output = 2.00 + +[limit] +context = 131_072 +output = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505.toml new file mode 100644 index 000000000..73ad4baee --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505.toml @@ -0,0 +1,21 @@ +name = "Devstral Small" +release_date = "2025-05-07" +last_updated = "2025-05-07" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = true + +[cost] +input = 0.06 +output = 0.12 + +[limit] +context = 128_000 +output = 128_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505:free.toml new file mode 100644 index 000000000..86554a6a8 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2505:free.toml @@ -0,0 +1,21 @@ +name = "Devstral Small 2505 (free)" +release_date = "2025-05-21" +last_updated = "2025-05-21" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 32_768 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2507.toml b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2507.toml new file mode 100644 index 000000000..1738ab3c2 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/mistralai/devstral-small-2507.toml @@ -0,0 +1,21 @@ +name = "Devstral Small 1.1" +release_date = "2025-07-10" +last_updated = "2025-07-10" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = true + +[cost] +input = 0.10 +output = 0.30 + +[limit] +context = 131_072 +output = 131_072 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-7b-instruct:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-7b-instruct:free.toml new file mode 100644 index 000000000..d10b1afc8 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/mistral-7b-instruct:free.toml @@ -0,0 +1,21 @@ +name = "Mistral 7B Instruct (free)" +release_date = "2024-05-27" +last_updated = "2024-05-27" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-05" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 32_768 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.1.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.1.toml new file mode 100644 index 000000000..5dc17a5f3 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.1.toml @@ -0,0 +1,21 @@ +name = "Mistral Medium 3.1" +release_date = "2025-08-12" +last_updated = "2025-08-12" +attachment = true +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = false + +[cost] +input = 0.40 +output = 2.00 + +[limit] +context = 262_144 +output = 262_144 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.toml new 
file mode 100644 index 000000000..cbf57bcd8 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/mistral-medium-3.toml @@ -0,0 +1,21 @@ +name = "Mistral Medium 3" +release_date = "2025-05-07" +last_updated = "2025-05-07" +attachment = true +reasoning = false +temperature = true +knowledge = "2025-05" +tool_call = true +open_weights = false + +[cost] +input = 0.40 +output = 2.00 + +[limit] +context = 131_072 +output = 131_072 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-nemo:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-nemo:free.toml new file mode 100644 index 000000000..cc5f6e5f1 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/mistral-nemo:free.toml @@ -0,0 +1,21 @@ +name = "Mistral Nemo (free)" +release_date = "2024-07-19" +last_updated = "2024-07-19" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-07" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 131_072 +output = 131_072 + +[modalities] +input = ["text"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.1-24b-instruct.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.1-24b-instruct.toml new file mode 100644 index 000000000..fd7611b8b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.1-24b-instruct.toml @@ -0,0 +1,16 @@ +id = "mistralai/mistral-small-3.1-24b-instruct:free" +name = "Mistral Small 3.1 24B Instruct" +release_date = "2025-03-17" +last_updated = "2025-03-17" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-10" +tool_call = true +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 128000, output = 8192 } + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file 
diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct.toml new file mode 100644 index 000000000..4cfdf7060 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct.toml @@ -0,0 +1,16 @@ +id = "mistralai/mistral-small-3.2-24b-instruct:free" +name = "Mistral Small 3.2 24B Instruct" +release_date = "2025-06-20" +last_updated = "2025-06-20" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-10" +tool_call = true +open_weights = true +cost = { input = 0, output = 0 } +limit = { context = 96000, output = 8192 } + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct:free.toml b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct:free.toml new file mode 100644 index 000000000..df55ac661 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/mistralai/mistral-small-3.2-24b-instruct:free.toml @@ -0,0 +1,21 @@ +name = "Mistral Small 3.2 24B (free)" +release_date = "2025-06-20" +last_updated = "2025-06-20" +attachment = true +reasoning = false +temperature = true +knowledge = "2025-06" +tool_call = true +open_weights = true + +[cost] +input = 0.00 +output = 0.00 + +[limit] +context = 96_000 +output = 96_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-4.1-mini.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4.1-mini.toml new file mode 100644 index 000000000..748b01700 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-4.1-mini.toml @@ -0,0 +1,22 @@ +name = "GPT-4.1 Mini" +release_date = "2025-04-14" +last_updated = "2025-04-14" +attachment = true +reasoning = false +temperature = true +tool_call 
= true +knowledge = "2024-04" +open_weights = false + +[cost] +input = 0.40 +output = 1.60 +cache_read = 0.10 + +[limit] +context = 1_047_576 +output = 32_768 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-4.1.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4.1.toml new file mode 100644 index 000000000..eca02a28f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-4.1.toml @@ -0,0 +1,22 @@ +name = "GPT-4.1" +release_date = "2025-04-14" +last_updated = "2025-04-14" +attachment = true +reasoning = false +temperature = true +tool_call = true +knowledge = "2024-04" +open_weights = false + +[cost] +input = 2.00 +output = 8.00 +cache_read = 0.50 + +[limit] +context = 1_047_576 +output = 32_768 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-4o-mini.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-4o-mini.toml new file mode 100644 index 000000000..173e77421 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-4o-mini.toml @@ -0,0 +1,22 @@ +name = "GPT-4o-mini" +release_date = "2024-07-18" +last_updated = "2024-07-18" +attachment = true +reasoning = false +temperature = true +tool_call = true +knowledge = "2024-10" +open_weights = false + +[cost] +input = 0.15 +output = 0.60 +cache_read = 0.08 + +[limit] +context = 128_000 +output = 16_384 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-chat.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-chat.toml new file mode 100644 index 000000000..527aebdfc --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5-chat.toml @@ -0,0 +1,21 @@ +name = "GPT-5 Chat (latest)" +release_date = "2025-08-07" +last_updated = "2025-08-07" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-09-30" +tool_call = false 
+open_weights = false + +[cost] +input = 1.25 +output = 10.00 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-codex.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-codex.toml new file mode 100644 index 000000000..a3c834e57 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5-codex.toml @@ -0,0 +1,22 @@ +name = "GPT-5 Codex" +release_date = "2025-09-15" +last_updated = "2025-09-15" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-10-01" +tool_call = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.125 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-image.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-image.toml new file mode 100644 index 000000000..0ae97d15b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5-image.toml @@ -0,0 +1,22 @@ +name = "GPT-5 Image" +release_date = "2025-10-14" +last_updated = "2025-10-14" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-10-01" +tool_call = true +open_weights = false + +[cost] +input = 5.00 +output = 10.00 +cache_read = 1.25 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image", "pdf"] +output = ["text", "image"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-mini.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-mini.toml new file mode 100644 index 000000000..5437addce --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5-mini.toml @@ -0,0 +1,21 @@ +name = "GPT-5 Mini" +release_date = "2025-08-07" +last_updated = "2025-08-07" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-10-01" +tool_call = 
true +open_weights = false + +[cost] +input = 0.25 +output = 2.00 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-nano.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-nano.toml new file mode 100644 index 000000000..284ee8d46 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5-nano.toml @@ -0,0 +1,21 @@ +name = "GPT-5 Nano" +release_date = "2025-08-07" +last_updated = "2025-08-07" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-10-01" +tool_call = true +open_weights = false + +[cost] +input = 0.05 +output = 0.40 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5-pro.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5-pro.toml new file mode 100644 index 000000000..a2a292d83 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5-pro.toml @@ -0,0 +1,21 @@ +name = "GPT-5 Pro" +release_date = "2025-10-06" +last_updated = "2025-10-06" +attachment = true +reasoning = true +temperature = false +knowledge = "2024-09-30" +tool_call = true +open_weights = false + +[cost] +input = 15.00 +output = 120.00 + +[limit] +context = 400_000 +output = 272_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-chat.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-chat.toml new file mode 100644 index 000000000..5287c7505 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-chat.toml @@ -0,0 +1,23 @@ +name = "GPT-5.1 Chat" +release_date = "2025-11-13" +last_updated = "2025-11-13" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-09-30" +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.25 
+output = 10.00 +cache_read = 0.125 + +[limit] +context = 128_000 +output = 16_384 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex-mini.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex-mini.toml new file mode 100644 index 000000000..0894af700 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex-mini.toml @@ -0,0 +1,23 @@ +name = "GPT-5.1-Codex-Mini" +release_date = "2025-11-13" +last_updated = "2025-11-13" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-09-30" +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 0.25 +output = 2.00 +cache_read = 0.025 + +[limit] +context = 400_000 +output = 100_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex.toml new file mode 100644 index 000000000..38dabafaf --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1-codex.toml @@ -0,0 +1,23 @@ +name = "GPT-5.1-Codex" +release_date = "2025-11-13" +last_updated = "2025-11-13" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-09-30" +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.125 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.1.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1.toml new file mode 100644 index 000000000..37eb1a25c --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5.1.toml @@ -0,0 +1,23 @@ +name = "GPT-5.1" +release_date = "2025-11-13" +last_updated = "2025-11-13" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-09-30" 
+tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 +cache_read = 0.125 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-5.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-5.toml new file mode 100644 index 000000000..2ca19f85e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-5.toml @@ -0,0 +1,21 @@ +name = "GPT-5" +release_date = "2025-08-07" +last_updated = "2025-08-07" +attachment = true +reasoning = true +temperature = true +knowledge = "2024-10-01" +tool_call = true +open_weights = false + +[cost] +input = 1.25 +output = 10.00 + +[limit] +context = 400_000 +output = 128_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b.toml new file mode 100644 index 000000000..947815c8d --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b.toml @@ -0,0 +1,20 @@ +name = "GPT OSS 120B" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.072 +output = 0.28 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b:exacto.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b:exacto.toml new file mode 100644 index 000000000..ec8055a44 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-120b:exacto.toml @@ -0,0 +1,20 @@ +name = "GPT OSS 120B (exacto)" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.05 +output = 
0.24 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-20b.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-20b.toml new file mode 100644 index 000000000..ade230e00 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-20b.toml @@ -0,0 +1,20 @@ +name = "GPT OSS 20B" +release_date = "2025-08-05" +last_updated = "2025-08-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.05 +output = 0.20 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/gpt-oss-safeguard-20b.toml b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-safeguard-20b.toml new file mode 100644 index 000000000..844c6be72 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/gpt-oss-safeguard-20b.toml @@ -0,0 +1,20 @@ +name = "GPT OSS Safeguard 20B" +release_date = "2025-10-29" +last_updated = "2025-10-29" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = false + +[cost] +input = 0.075 +output = 0.30 + +[limit] +context = 131_072 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/openai/o4-mini.toml b/providers/cloudflare-ai-gateway/models/openai/o4-mini.toml new file mode 100644 index 000000000..6f24829b3 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/openai/o4-mini.toml @@ -0,0 +1,22 @@ +name = "o4 Mini" +release_date = "2025-04-16" +last_updated = "2025-04-16" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2024-06" +open_weights = false + +[cost] +input = 1.10 +output = 4.40 +cache_read = 0.28 + +[limit] +context = 200_000 +output = 100_000 + +[modalities] +input = ["text", "image"] +output = ["text"] 
diff --git a/providers/cloudflare-ai-gateway/models/perplexity/sonar-pro.toml b/providers/cloudflare-ai-gateway/models/perplexity/sonar-pro.toml new file mode 100644 index 000000000..7fb6424a5 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/perplexity/sonar-pro.toml @@ -0,0 +1,17 @@ +name = "Sonar Pro" +release_date = "2024-01-01" +last_updated = "2025-09-01" +attachment = true +reasoning = false +temperature = true +tool_call = false +knowledge = "2025-09-01" +open_weights = false + +[limit] +context = 200_000 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning-pro.toml b/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning-pro.toml new file mode 100644 index 000000000..502331a87 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning-pro.toml @@ -0,0 +1,17 @@ +name = "Sonar Reasoning Pro" +release_date = "2024-01-01" +last_updated = "2025-09-01" +attachment = true +reasoning = true +temperature = true +tool_call = false +knowledge = "2025-09-01" +open_weights = false + +[limit] +context = 128_000 +output = 4_096 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning.toml b/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning.toml new file mode 100644 index 000000000..c0e101623 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/perplexity/sonar-reasoning.toml @@ -0,0 +1,17 @@ +name = "Sonar Reasoning" +release_date = "2024-01-01" +last_updated = "2025-09-01" +attachment = false +reasoning = true +temperature = true +tool_call = false +knowledge = "2025-09-01" +open_weights = false + +[limit] +context = 128_000 +output = 4_096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/perplexity/sonar.toml 
b/providers/cloudflare-ai-gateway/models/perplexity/sonar.toml new file mode 100644 index 000000000..90157ebef --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/perplexity/sonar.toml @@ -0,0 +1,17 @@ +name = "Sonar" +release_date = "2024-01-01" +last_updated = "2025-09-01" +attachment = false +reasoning = false +temperature = true +tool_call = false +knowledge = "2025-09-01" +open_weights = false + +[limit] +context = 128_000 +output = 4_096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/aura-1.toml b/providers/cloudflare-ai-gateway/models/workers-ai/aura-1.toml new file mode 100644 index 000000000..45bdc25d7 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/aura-1.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/aura-1/ + +name = "@cf/deepgram/aura-1" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2025-08-27" +last_updated = "2025-07-07" + +[cost] +# per 1k characters +input = 0.015 +output = 0.015 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["audio"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/bart-large-cnn.toml b/providers/cloudflare-ai-gateway/models/workers-ai/bart-large-cnn.toml new file mode 100644 index 000000000..a3267b1f3 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/bart-large-cnn.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/bart-large-cnn/ + +name = "@cf/facebook/bart-large-cnn" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2022-03-02" +last_updated = "2024-02-13" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-base-awq.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-base-awq.toml new file mode 100644 index 000000000..f6440dc86 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-base-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/deepseek-coder-6.7b-base-awq/ + +name = "@hf/thebloke/deepseek-coder-6.7b-base-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-11-05" +last_updated = "2023-11-09" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-instruct-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-instruct-awq.toml new file mode 100644 index 000000000..01c3b009e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-coder-6.7b-instruct-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/deepseek-coder-6.7b-instruct-awq/ + +name = "@hf/thebloke/deepseek-coder-6.7b-instruct-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-11-05" +last_updated = "2023-11-13" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-math-7b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-math-7b-instruct.toml new file mode 100644 index 000000000..064b7343d --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-math-7b-instruct.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/deepseek-math-7b-instruct/ + +name = "@cf/deepseek-ai/deepseek-math-7b-instruct" 
+attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-02-05" +last_updated = "2024-02-06" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-r1-distill-qwen-32b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-r1-distill-qwen-32b.toml new file mode 100644 index 000000000..2ce921daa --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/deepseek-r1-distill-qwen-32b.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/deepseek-r1-distill-qwen-32b/ + +name = "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b" +attachment = false +reasoning = true +tool_call = true +temperature = true +open_weights = true +release_date = "2025-01-20" +last_updated = "2025-02-24" + +[cost] +input = 0.5 +output = 4.88 + +[limit] +context = 80000 +output = 80000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/discolm-german-7b-v1-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/discolm-german-7b-v1-awq.toml new file mode 100644 index 000000000..57314cd84 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/discolm-german-7b-v1-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/discolm-german-7b-v1-awq/ + +name = "@cf/thebloke/discolm-german-7b-v1-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-01-18" +last_updated = "2024-01-24" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/dreamshaper-8-lcm.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/dreamshaper-8-lcm.toml new file mode 100644 index 000000000..8d1712a0c --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/dreamshaper-8-lcm.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/dreamshaper-8-lcm/ + +name = "@cf/lykon/dreamshaper-8-lcm" +attachment = true +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2023-12-06" +last_updated = "2023-12-07" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/falcon-7b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/falcon-7b-instruct.toml new file mode 100644 index 000000000..543fa2aef --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/falcon-7b-instruct.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/falcon-7b-instruct/ + +name = "@cf/tiiuae/falcon-7b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-04-25" +last_updated = "2024-10-12" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/flux-1-schnell.toml b/providers/cloudflare-ai-gateway/models/workers-ai/flux-1-schnell.toml new file mode 100644 index 000000000..1480fe105 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/flux-1-schnell.toml @@ -0,0 +1,24 @@ +# https://developers.cloudflare.com/workers-ai/models/flux-1-schnell/ + +name = "@cf/black-forest-labs/flux-1-schnell" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2024-07-31" +last_updated = "2024-08-16" + +[cost] +# per 512 by 512 tile 
+input = 0.000053 +# per step +output = 0.00011 + +[limit] +context = 2048 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-2b-it-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-2b-it-lora.toml new file mode 100644 index 000000000..6e76a054f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-2b-it-lora.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/gemma-2b-it-lora/ + +name = "@cf/google/gemma-2b-it-lora" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-04-02" +last_updated = "2024-04-02" + +[cost] +input = 0 +output = 0 + +[limit] +context = 8192 +output = 8192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-3-12b-it.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-3-12b-it.toml new file mode 100644 index 000000000..0b0f15b18 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-3-12b-it.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/gemma-3-12b-it/ + +name = "@cf/google/gemma-3-12b-it" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2025-03-01" +last_updated = "2025-03-21" + +[cost] +input = 0.35 +output = 0.56 + +[limit] +context = 80000 +output = 80000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it-lora.toml new file mode 100644 index 000000000..42e88d143 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it-lora.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/gemma-7b-it-lora/ + +name = "@cf/google/gemma-7b-it-lora" 
+attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-04-02" +last_updated = "2024-04-02" + +[cost] +input = 0 +output = 0 + +[limit] +context = 3500 +output = 3500 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it.toml new file mode 100644 index 000000000..7c1e98c99 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-7b-it.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/gemma-7b-it/ + +name = "@hf/google/gemma-7b-it" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-02-13" +last_updated = "2024-08-14" + +[cost] +input = 0 +output = 0 + +[limit] +context = 8192 +output = 8192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gemma-sea-lion-v4-27b-it.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-sea-lion-v4-27b-it.toml new file mode 100644 index 000000000..ba1472b48 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gemma-sea-lion-v4-27b-it.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/gemma-sea-lion-v4-27b-it/ + +name = "@cf/aisingapore/gemma-sea-lion-v4-27b-it" +attachment = false +reasoning = false +tool_call = true +open_weights = true +release_date = "2025-09-23" +last_updated = "2025-12-02" +temperature = true + +[limit] +context = 128000 +output = 0 + +[cost] +input = 0.35 +output = 0.56 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-120b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-120b.toml new file mode 100644 index 000000000..ca7cc8cc3 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-120b.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/gpt-oss-120b/ + +name = "@cf/openai/gpt-oss-120b" +attachment = false +reasoning = true +tool_call = false +temperature = false +open_weights = true +release_date = "2025-08-04" +last_updated = "2025-08-14" + +[cost] +input = 0.35 +output = 0.75 + +[limit] +context = 128000 +output = 128000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-20b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-20b.toml new file mode 100644 index 000000000..4b5af26ab --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/gpt-oss-20b.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/gpt-oss-20b/ + +name = "@cf/openai/gpt-oss-20b" +attachment = false +reasoning = true +tool_call = false +temperature = false +open_weights = true +release_date = "2025-08-04" +last_updated = "2025-08-14" + +[cost] +input = 0.2 +output = 0.3 + +[limit] +context = 128000 +output = 128000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/granite-4.0-h-micro.toml b/providers/cloudflare-ai-gateway/models/workers-ai/granite-4.0-h-micro.toml new file mode 100644 index 000000000..3ffe69a84 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/granite-4.0-h-micro.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/granite-4.0-h-micro/ + +name = "@cf/ibm-granite/granite-4.0-h-micro" +attachment = false +reasoning = false +tool_call = true +open_weights = true +release_date = "2025-10-07" +last_updated = "2025-12-02" +temperature = true + +[limit] +context = 131000 +output = 0 + +[cost] +input = 0.017 +output = 0.11 + +[modalities] +input = ["text"] +output = ["text"] diff --git 
a/providers/cloudflare-ai-gateway/models/workers-ai/hermes-2-pro-mistral-7b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/hermes-2-pro-mistral-7b.toml new file mode 100644 index 000000000..c8fe4427f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/hermes-2-pro-mistral-7b.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/hermes-2-pro-mistral-7b/ + +name = "@hf/nousresearch/hermes-2-pro-mistral-7b" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-03-11" +last_updated = "2024-09-08" + +[cost] +input = 0 +output = 0 + +[limit] +context = 24000 +output = 24000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-13b-chat-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-13b-chat-awq.toml new file mode 100644 index 000000000..9c0bd41d1 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-13b-chat-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-2-13b-chat-awq/ + +name = "@hf/thebloke/llama-2-13b-chat-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-09-19" +last_updated = "2023-11-09" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-fp16.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-fp16.toml new file mode 100644 index 000000000..1a8538759 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-fp16.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-2-7b-chat-fp16/ + +name = "@cf/meta/llama-2-7b-chat-fp16" +attachment = false +reasoning = false +tool_call 
= true +temperature = true +open_weights = true +release_date = "2023-07-26" +last_updated = "2023-07-26" + +[cost] +input = 0.56 +output = 6.67 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-hf-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-hf-lora.toml new file mode 100644 index 000000000..35172ab0c --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-hf-lora.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-2-7b-chat-hf-lora/ + +name = "@cf/meta-llama/llama-2-7b-chat-hf-lora" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-07-13" +last_updated = "2024-04-17" + +[cost] +input = 0 +output = 0 + +[limit] +context = 8192 +output = 8192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-int8.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-int8.toml new file mode 100644 index 000000000..d9eb362c0 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-2-7b-chat-int8.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-2-7b-chat-int8/ + +name = "@cf/meta/llama-2-7b-chat-int8" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-09-25" +last_updated = "2023-09-25" + +[cost] +input = 0.556 +output = 6.667 + +[limit] +context = 8192 +output = 8192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct-awq.toml new file mode 100644 index 000000000..19de5777e --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct-awq.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3-8b-instruct-awq/ + +name = "@cf/meta/llama-3-8b-instruct-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-05-09" +last_updated = "2024-05-09" + +[cost] +input = 0.12 +output = 0.27 + +[limit] +context = 8192 +output = 8192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct.toml new file mode 100644 index 000000000..15410af48 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3-8b-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3-8b-instruct/ + +name = "@cf/meta/llama-3-8b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-04-17" +last_updated = "2025-06-19" + +[cost] +input = 0.28 +output = 0.83 + +[limit] +context = 7968 +output = 7968 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-70b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-70b-instruct.toml new file mode 100644 index 000000000..307a85f63 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-70b-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.1-70b-instruct/ + +name = "@cf/meta/llama-3.1-70b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-07-16" +last_updated = "2024-12-15" + +[cost] +input = 0.293 +output = 2.253 + +[limit] +context = 24000 +output = 24000 + +[modalities] +input = ["text"] +output = ["text"] 
diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-awq.toml new file mode 100644 index 000000000..24b746f22 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-awq.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct-awq/ + +name = "@cf/meta/llama-3.1-8b-instruct-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-07-25" +last_updated = "2024-07-25" + +[cost] +input = 0.12 +output = 0.27 + +[limit] +context = 8192 +output = 8192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fast.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fast.toml new file mode 100644 index 000000000..cfff32d0e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fast.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct-fast/ + +name = "@cf/meta/llama-3.1-8b-instruct-fast" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-07-18" +last_updated = "2024-09-25" + +[cost] +input = 0.045 +output = 0.384 + +[limit] +context = 128000 +output = 128000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fp8.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fp8.toml new file mode 100644 index 000000000..352fff5a9 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct-fp8.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct-fp8/ + +name = 
"@cf/meta/llama-3.1-8b-instruct-fp8" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-07-25" +last_updated = "2024-07-25" + +[cost] +input = 0.15 +output = 0.29 + +[limit] +context = 32000 +output = 32000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct.toml new file mode 100644 index 000000000..26b2a40fe --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.1-8b-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.1-8b-instruct/ + +name = "@cf/meta/llama-3.1-8b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-07-18" +last_updated = "2024-09-25" + +[cost] +input = 0.28 +output = 0.83 + +[limit] +context = 7968 +output = 7968 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-11b-vision-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-11b-vision-instruct.toml new file mode 100644 index 000000000..d77963828 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-11b-vision-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.2-11b-vision-instruct/ + +name = "@cf/meta/llama-3.2-11b-vision-instruct" +attachment = true +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-09-18" +last_updated = "2024-12-04" + +[cost] +input = 0.049 +output = 0.68 + +[limit] +context = 128000 +output = 128000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-1b-instruct.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-1b-instruct.toml new file mode 100644 index 000000000..9c6d02bf7 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-1b-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.2-1b-instruct/ + +name = "@cf/meta/llama-3.2-1b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-09-18" +last_updated = "2024-10-24" + +[cost] +input = 0.027 +output = 0.2 + +[limit] +context = 60000 +output = 60000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-3b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-3b-instruct.toml new file mode 100644 index 000000000..6a0a2aa8b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.2-3b-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.2-3b-instruct/ + +name = "@cf/meta/llama-3.2-3b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-09-18" +last_updated = "2024-10-24" + +[cost] +input = 0.051 +output = 0.34 + +[limit] +context = 128000 +output = 128000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.3-70b-instruct-fp8-fast.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.3-70b-instruct-fp8-fast.toml new file mode 100644 index 000000000..51f436d4a --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-3.3-70b-instruct-fp8-fast.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-3.3-70b-instruct-fp8-fast/ + +name = "@cf/meta/llama-3.3-70b-instruct-fp8-fast" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = 
true +release_date = "2024-12-06" +last_updated = "2024-12-06" + +[cost] +input = 0.29 +output = 2.25 + +[limit] +context = 24000 +output = 24000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-4-scout-17b-16e-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-4-scout-17b-16e-instruct.toml new file mode 100644 index 000000000..27ba1174f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-4-scout-17b-16e-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-4-scout-17b-16e-instruct/ + +name = "@cf/meta/llama-4-scout-17b-16e-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2025-04-02" +last_updated = "2025-05-23" + +[cost] +input = 0.27 +output = 0.85 + +[limit] +context = 131000 +output = 131000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llama-guard-3-8b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llama-guard-3-8b.toml new file mode 100644 index 000000000..3155b7c63 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llama-guard-3-8b.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llama-guard-3-8b/ + +name = "@cf/meta/llama-guard-3-8b" +attachment = false +reasoning = false +tool_call = false +temperature = true +open_weights = true +release_date = "2024-07-22" +last_updated = "2024-10-11" + +[cost] +input = 0.48 +output = 0.03 + +[limit] +context = 131072 +output = 0 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llamaguard-7b-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llamaguard-7b-awq.toml new file mode 100644 index 000000000..ddc2c123d --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/workers-ai/llamaguard-7b-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/llamaguard-7b-awq/ + +name = "@hf/thebloke/llamaguard-7b-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-12-11" +last_updated = "2023-12-11" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/llava-1.5-7b-hf.toml b/providers/cloudflare-ai-gateway/models/workers-ai/llava-1.5-7b-hf.toml new file mode 100644 index 000000000..6c371c836 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/llava-1.5-7b-hf.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/llava-1.5-7b-hf/ + +name = "@cf/llava-hf/llava-1.5-7b-hf" +attachment = true +reasoning = false +tool_call = false +temperature = true +open_weights = true +release_date = "2023-12-05" +last_updated = "2025-06-06" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["image","text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/lucid-origin.toml b/providers/cloudflare-ai-gateway/models/workers-ai/lucid-origin.toml new file mode 100644 index 000000000..523f2125a --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/lucid-origin.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/lucid-origin/ + +name = "@cf/leonardo/lucid-origin" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = false +release_date = "2025-08-25" +last_updated = "2025-08-25" + +[cost] +# 0.007 per 512x512 tile, 0.00013 per step +input = 0.007 +output = 0.007 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git 
a/providers/cloudflare-ai-gateway/models/workers-ai/m2m100-1.2b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/m2m100-1.2b.toml new file mode 100644 index 000000000..99024cf53 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/m2m100-1.2b.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/m2m100-1.2b/ + +name = "@cf/meta/m2m100-1.2b" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2022-03-02" +last_updated = "2023-11-16" + +[cost] +input = 0.34 +output = 0.34 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/melotts.toml b/providers/cloudflare-ai-gateway/models/workers-ai/melotts.toml new file mode 100644 index 000000000..743028594 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/melotts.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/melotts/ + +name = "@cf/myshell-ai/melotts" +attachment = true +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2024-07-19" +last_updated = "2024-07-19" + +[cost] +# per audio minute +input = 0.0002 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["audio"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1-awq.toml new file mode 100644 index 000000000..f91a3ade4 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.1-awq/ + +name = "@hf/thebloke/mistral-7b-instruct-v0.1-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-09-27" 
+last_updated = "2023-11-09" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1.toml new file mode 100644 index 000000000..74af9cc16 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.1.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.1/ + +name = "@cf/mistral/mistral-7b-instruct-v0.1" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-09-27" +last_updated = "2025-07-24" + +[cost] +input = 0.11 +output = 0.19 + +[limit] +context = 2824 +output = 2824 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2-lora.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2-lora.toml new file mode 100644 index 000000000..895418742 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2-lora.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.2-lora/ + +name = "@cf/mistral/mistral-7b-instruct-v0.2-lora" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-04-01" +last_updated = "2024-04-01" + +[cost] +input = 0 +output = 0 + +[limit] +context = 15000 +output = 15000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2.toml new file mode 100644 index 000000000..c874e3df7 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-7b-instruct-v0.2.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/mistral-7b-instruct-v0.2/ + +name = "@hf/mistral/mistral-7b-instruct-v0.2" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-12-11" +last_updated = "2025-07-24" + +[cost] +input = 0 +output = 0 + +[limit] +context = 3072 +output = 4096 +input = 3072 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/mistral-small-3.1-24b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-small-3.1-24b-instruct.toml new file mode 100644 index 000000000..2019c66f8 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/mistral-small-3.1-24b-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/mistral-small-3.1-24b-instruct/ + +name = "@cf/mistralai/mistral-small-3.1-24b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2025-03-11" +last_updated = "2025-07-28" + +[cost] +input = 0.35 +output = 0.56 + +[limit] +context = 128000 +output = 128000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/neural-chat-7b-v3-1-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/neural-chat-7b-v3-1-awq.toml new file mode 100644 index 000000000..bac727eee --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/neural-chat-7b-v3-1-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/neural-chat-7b-v3-1-awq/ + +name = "@hf/thebloke/neural-chat-7b-v3-1-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-11-15" +last_updated = "2023-11-17" +status = "deprecated" + +[cost] +input = 0 +output = 
0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/nova-3.toml b/providers/cloudflare-ai-gateway/models/workers-ai/nova-3.toml new file mode 100644 index 000000000..587477f4a --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/nova-3.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/nova-3/ + +name = "@cf/deepgram/nova-3" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2025-06-05" +last_updated = "2025-07-08" + +[cost] +input = 0.0052 +output = 0.0052 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["audio"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/openchat-3.5-0106.toml b/providers/cloudflare-ai-gateway/models/workers-ai/openchat-3.5-0106.toml new file mode 100644 index 000000000..8ae0ee82d --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/openchat-3.5-0106.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/openchat-3.5-0106/ + +name = "@cf/openchat/openchat-3.5-0106" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-01-07" +last_updated = "2024-05-18" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 8192 +output = 8192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/openhermes-2.5-mistral-7b-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/openhermes-2.5-mistral-7b-awq.toml new file mode 100644 index 000000000..de9818c32 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/openhermes-2.5-mistral-7b-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/openhermes-2.5-mistral-7b-awq/ + +name = 
"@hf/thebloke/openhermes-2.5-mistral-7b-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-11-02" +last_updated = "2023-11-09" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/phi-2.toml b/providers/cloudflare-ai-gateway/models/workers-ai/phi-2.toml new file mode 100644 index 000000000..f7b41a400 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/phi-2.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/phi-2/ + +name = "@cf/microsoft/phi-2" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-12-13" +last_updated = "2024-04-29" + +[cost] +input = 0 +output = 0 + +[limit] +context = 2048 +output = 2048 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/phoenix-1.0.toml b/providers/cloudflare-ai-gateway/models/workers-ai/phoenix-1.0.toml new file mode 100644 index 000000000..cb9eff10a --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/phoenix-1.0.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/phoenix-1.0/ + +name = "@cf/leonardo/phoenix-1.0" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = false +release_date = "2025-08-25" +last_updated = "2025-08-25" + +[cost] +# 0.0058 per 512x512 tile, 0.00011 per step +input = 0.0058 +output = 0.0058 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-0.5b-chat.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-0.5b-chat.toml new file mode 100644 index 000000000..02a89d2e2 --- /dev/null +++ 
b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-0.5b-chat.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/qwen1.5-0.5b-chat/ + +name = "@cf/qwen/qwen1.5-0.5b-chat" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-01-31" +last_updated = "2024-04-30" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 32000 +output = 32000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-1.8b-chat.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-1.8b-chat.toml new file mode 100644 index 000000000..8fc56a863 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-1.8b-chat.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/qwen1.5-1.8b-chat/ + +name = "@cf/qwen/qwen1.5-1.8b-chat" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-01-30" +last_updated = "2024-04-30" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 32000 +output = 32000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-14b-chat-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-14b-chat-awq.toml new file mode 100644 index 000000000..0ea4a2f81 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-14b-chat-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/qwen1.5-14b-chat-awq/ + +name = "@cf/qwen/qwen1.5-14b-chat-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-02-03" +last_updated = "2024-04-30" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 7500 +output = 7500 + +[modalities] +input = ["text"] +output = 
["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-7b-chat-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-7b-chat-awq.toml new file mode 100644 index 000000000..2cfdd8f25 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen1.5-7b-chat-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/qwen1.5-7b-chat-awq/ + +name = "@cf/qwen/qwen1.5-7b-chat-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-02-03" +last_updated = "2024-04-30" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 20000 +output = 20000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen2.5-coder-32b-instruct.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen2.5-coder-32b-instruct.toml new file mode 100644 index 000000000..639fb5929 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen2.5-coder-32b-instruct.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/qwen2.5-coder-32b-instruct/ + +name = "@cf/qwen/qwen2.5-coder-32b-instruct" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-11-06" +last_updated = "2025-01-12" + +[cost] +input = 0.66 +output = 1 + +[limit] +context = 32768 +output = 32768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-30b-a3b-fp8.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-30b-a3b-fp8.toml new file mode 100644 index 000000000..2e92e4d78 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwen3-30b-a3b-fp8.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/qwen3-30b-a3b-fp8/ + +name = "@cf/qwen/qwen3-30b-a3b-fp8" +attachment = false +reasoning = true 
+tool_call = true +open_weights = true +release_date = "2025-04-30" +last_updated = "2025-12-02" +temperature = true + +[limit] +context = 32768 +output = 0 + +[cost] +input = 0.051 +output = 0.34 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/qwq-32b.toml b/providers/cloudflare-ai-gateway/models/workers-ai/qwq-32b.toml new file mode 100644 index 000000000..1641cb43e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/qwq-32b.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/qwq-32b/ + +name = "@cf/qwen/qwq-32b" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2025-03-05" +last_updated = "2025-03-11" + +[cost] +input = 0.66 +output = 1 + +[limit] +context = 24000 +output = 24000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/resnet-50.toml b/providers/cloudflare-ai-gateway/models/workers-ai/resnet-50.toml new file mode 100644 index 000000000..3c040ddbd --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/resnet-50.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/resnet-50/ + +name = "@cf/microsoft/resnet-50" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2022-03-16" +last_updated = "2024-02-13" + +[cost] +# per inference request +input = 0.0000025 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/sqlcoder-7b-2.toml b/providers/cloudflare-ai-gateway/models/workers-ai/sqlcoder-7b-2.toml new file mode 100644 index 000000000..8c8e99942 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/sqlcoder-7b-2.toml @@ -0,0 +1,22 @@ +# 
https://developers.cloudflare.com/workers-ai/models/sqlcoder-7b-2/ + +name = "@cf/defog/sqlcoder-7b-2" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-02-05" +last_updated = "2024-02-12" + +[cost] +input = 0 +output = 0 + +[limit] +context = 10000 +output = 10000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-img2img.toml b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-img2img.toml new file mode 100644 index 000000000..0f55cd660 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-img2img.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-v1-5-img2img/ + +name = "@cf/runwayml/stable-diffusion-v1-5-img2img" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2024-02-27" +last_updated = "2024-02-27" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-inpainting.toml b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-inpainting.toml new file mode 100644 index 000000000..2ad25e021 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-v1-5-inpainting.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-v1-5-inpainting/ + +name = "@cf/runwayml/stable-diffusion-v1-5-inpainting" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2024-02-27" +last_updated = "2024-02-27" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git 
a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-base-1.0.toml b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-base-1.0.toml new file mode 100644 index 000000000..f0362810f --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-base-1.0.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-xl-base-1.0/ + +name = "@cf/stabilityai/stable-diffusion-xl-base-1.0" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2023-07-25" +last_updated = "2023-10-30" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-lightning.toml b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-lightning.toml new file mode 100644 index 000000000..bf716787a --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/stable-diffusion-xl-lightning.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/stable-diffusion-xl-lightning/ + +name = "@cf/bytedance/stable-diffusion-xl-lightning" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2024-02-20" +last_updated = "2024-04-03" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["text"] +output = ["image"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/starling-lm-7b-beta.toml b/providers/cloudflare-ai-gateway/models/workers-ai/starling-lm-7b-beta.toml new file mode 100644 index 000000000..fa47b3f96 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/starling-lm-7b-beta.toml @@ -0,0 +1,24 @@ +# https://developers.cloudflare.com/workers-ai/models/starling-lm-7b-beta/ + +name = "@hf/nexusflow/starling-lm-7b-beta" 
+attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2024-03-19" +last_updated = "2024-04-03" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 +input = 3072 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/tinyllama-1.1b-chat-v1.0.toml b/providers/cloudflare-ai-gateway/models/workers-ai/tinyllama-1.1b-chat-v1.0.toml new file mode 100644 index 000000000..a1c067907 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/tinyllama-1.1b-chat-v1.0.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/tinyllama-1.1b-chat-v1.0/ + +name = "@cf/tinyllama/tinyllama-1.1b-chat-v1.0" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-12-30" +last_updated = "2024-03-17" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 2048 +output = 2048 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/uform-gen2-qwen-500m.toml b/providers/cloudflare-ai-gateway/models/workers-ai/uform-gen2-qwen-500m.toml new file mode 100644 index 000000000..ce3a7db6e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/uform-gen2-qwen-500m.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/uform-gen2-qwen-500m/ + +name = "@cf/unum/uform-gen2-qwen-500m" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2024-02-15" +last_updated = "2024-04-24" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["image","text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/una-cybertron-7b-v2-bf16.toml 
b/providers/cloudflare-ai-gateway/models/workers-ai/una-cybertron-7b-v2-bf16.toml new file mode 100644 index 000000000..0b43b8de0 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/una-cybertron-7b-v2-bf16.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/una-cybertron-7b-v2-bf16/ + +name = "@cf/fblgit/una-cybertron-7b-v2-bf16" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-12-02" +last_updated = "2024-03-08" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 15000 +output = 15000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/whisper-large-v3-turbo.toml b/providers/cloudflare-ai-gateway/models/workers-ai/whisper-large-v3-turbo.toml new file mode 100644 index 000000000..f787da6ef --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/whisper-large-v3-turbo.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/whisper-large-v3-turbo/ + +name = "@cf/openai/whisper-large-v3-turbo" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2024-10-01" +last_updated = "2024-10-04" + +[cost] +# per audio minute +input = 0.00051 +output = 0.00051 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["audio"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/whisper-tiny-en.toml b/providers/cloudflare-ai-gateway/models/workers-ai/whisper-tiny-en.toml new file mode 100644 index 000000000..703086d37 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/whisper-tiny-en.toml @@ -0,0 +1,22 @@ +# https://developers.cloudflare.com/workers-ai/models/whisper-tiny-en/ + +name = "@cf/openai/whisper-tiny-en" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = 
"2022-09-26" +last_updated = "2024-01-22" + +[cost] +input = 0 +output = 0 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["audio"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/whisper.toml b/providers/cloudflare-ai-gateway/models/workers-ai/whisper.toml new file mode 100644 index 000000000..442509455 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/whisper.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/whisper/ + +name = "@cf/openai/whisper" +attachment = false +reasoning = false +tool_call = false +temperature = false +open_weights = true +release_date = "2023-11-07" +last_updated = "2024-08-12" + +[cost] +# per audio minute +input = 0.00045 +output = 0.00045 + +[limit] +context = 0 +output = 0 + +[modalities] +input = ["audio"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/workers-ai/zephyr-7b-beta-awq.toml b/providers/cloudflare-ai-gateway/models/workers-ai/zephyr-7b-beta-awq.toml new file mode 100644 index 000000000..db4c96fdd --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/workers-ai/zephyr-7b-beta-awq.toml @@ -0,0 +1,23 @@ +# https://developers.cloudflare.com/workers-ai/models/zephyr-7b-beta-awq/ + +name = "@hf/thebloke/zephyr-7b-beta-awq" +attachment = false +reasoning = false +tool_call = true +temperature = true +open_weights = true +release_date = "2023-10-27" +last_updated = "2023-11-09" +status = "deprecated" + +[cost] +input = 0 +output = 0 + +[limit] +context = 4096 +output = 4096 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-beta.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-beta.toml new file mode 100644 index 000000000..5f2c5141e --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-beta.toml @@ -0,0 +1,23 @@ +name = "Grok 3 Beta" +release_date = "2025-02-17" +last_updated = "2025-02-17" +attachment = false 
+reasoning = false +temperature = true +knowledge = "2024-11" +tool_call = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.75 +cache_write = 15.00 + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini-beta.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini-beta.toml new file mode 100644 index 000000000..4bb152bb6 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini-beta.toml @@ -0,0 +1,23 @@ +name = "Grok 3 Mini Beta" +release_date = "2025-02-17" +last_updated = "2025-02-17" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-11" +tool_call = true +open_weights = false + +[cost] +input = 0.30 +output = 0.50 +cache_read = 0.075 +cache_write = 0.50 + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini.toml new file mode 100644 index 000000000..c1652e201 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-3-mini.toml @@ -0,0 +1,23 @@ +name = "Grok 3 Mini" +release_date = "2025-02-17" +last_updated = "2025-02-17" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-11" +tool_call = true +open_weights = false + +[cost] +input = 0.30 +output = 0.50 +cache_read = 0.075 +cache_write = 0.50 + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-3.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-3.toml new file mode 100644 index 000000000..56069a584 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-3.toml @@ -0,0 +1,23 @@ +name = "Grok 3" +release_date = "2025-02-17" +last_updated = "2025-02-17" +attachment = false +reasoning 
= false +temperature = true +knowledge = "2024-11" +tool_call = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.75 +cache_write = 15.00 + +[limit] +context = 131_072 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-4-fast.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-4-fast.toml new file mode 100644 index 000000000..a592d3f13 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-4-fast.toml @@ -0,0 +1,23 @@ +name = "Grok 4 Fast" +release_date = "2025-08-19" +last_updated = "2025-08-19" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-11" +tool_call = true +open_weights = false + +[cost] +input = 0.20 +output = 0.50 +cache_read = 0.05 +cache_write = 0.05 + +[limit] +context = 2_000_000 +output = 30_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-4.1-fast.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-4.1-fast.toml new file mode 100644 index 000000000..17833565b --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-4.1-fast.toml @@ -0,0 +1,23 @@ +name = "Grok 4.1 Fast" +release_date = "2025-11-19" +last_updated = "2025-11-19" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-11" +tool_call = true +open_weights = false + +[cost] +input = 0.20 +output = 0.50 +cache_read = 0.05 +cache_write = 0.05 + +[limit] +context = 2_000_000 +output = 30_000 + +[modalities] +input = ["text", "image"] +output = ["text"] \ No newline at end of file diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-4.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-4.toml new file mode 100644 index 000000000..ef04f7356 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-4.toml @@ -0,0 +1,23 @@ +name = "Grok 4" +release_date = "2025-07-09" +last_updated = "2025-07-09" 
+attachment = false +reasoning = true +temperature = true +knowledge = "2025-07" +tool_call = true +open_weights = false + +[cost] +input = 3.00 +output = 15.00 +cache_read = 0.75 +cache_write = 15.00 + +[limit] +context = 256_000 +output = 64_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/models/x-ai/grok-code-fast-1.toml b/providers/cloudflare-ai-gateway/models/x-ai/grok-code-fast-1.toml new file mode 100644 index 000000000..4ec798dd2 --- /dev/null +++ b/providers/cloudflare-ai-gateway/models/x-ai/grok-code-fast-1.toml @@ -0,0 +1,22 @@ +name = "Grok Code Fast 1" +release_date = "2025-08-26" +last_updated = "2025-08-26" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-08" +tool_call = true +open_weights = false + +[cost] +input = 0.20 +output = 1.50 +cache_read = 0.02 + +[limit] +context = 256_000 +output = 10_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/cloudflare-ai-gateway/provider.toml b/providers/cloudflare-ai-gateway/provider.toml new file mode 100644 index 000000000..2fec3c9ec --- /dev/null +++ b/providers/cloudflare-ai-gateway/provider.toml @@ -0,0 +1,4 @@ +name = "Cloudflare AI Gateway" +env = ["CLOUDFLARE_API_TOKEN", "CLOUDFLARE_ACCOUNT_ID", "CLOUDFLARE_GATEWAY_ID"] +npm = "ai-gateway-provider" +doc = "https://developers.cloudflare.com/ai-gateway/"