diff --git a/providers/novita-ai/models/sao10k/L3-8B-Stheno-v3.2.toml b/providers/novita-ai/models/Sao10K/L3-8B-Stheno-v3.2.toml similarity index 94% rename from providers/novita-ai/models/sao10k/L3-8B-Stheno-v3.2.toml rename to providers/novita-ai/models/Sao10K/L3-8B-Stheno-v3.2.toml index dc17bf621..910c5ca4c 100644 --- a/providers/novita-ai/models/sao10k/L3-8B-Stheno-v3.2.toml +++ b/providers/novita-ai/models/Sao10K/L3-8B-Stheno-v3.2.toml @@ -1,4 +1,5 @@ name = "L3 8B Stheno V3.2" +family = "llama" release_date = "2024-11-29" last_updated = "2024-11-29" attachment = false diff --git a/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-14b.toml b/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-14b.toml index 36a9d5d23..67c44946a 100644 --- a/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-14b.toml +++ b/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-14b.toml @@ -3,10 +3,9 @@ family = "deepseek-thinking" release_date = "2025-01-20" last_updated = "2025-01-20" attachment = false -reasoning = true +reasoning = false temperature = true tool_call = false -structured_output = true open_weights = true [cost] diff --git a/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-32b.toml b/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-32b.toml index 67362cf1c..99b7630b5 100644 --- a/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-32b.toml +++ b/providers/novita-ai/models/deepseek/deepseek-r1-distill-qwen-32b.toml @@ -3,10 +3,9 @@ family = "deepseek-thinking" release_date = "2025-01-20" last_updated = "2025-01-20" attachment = false -reasoning = true +reasoning = false temperature = true tool_call = false -structured_output = true open_weights = true [cost] diff --git a/providers/novita-ai/models/google/gemma-3-12b-it.toml b/providers/novita-ai/models/google/gemma-3-12b-it.toml index 0b11a0478..672f8fe9a 100644 --- a/providers/novita-ai/models/google/gemma-3-12b-it.toml +++ b/providers/novita-ai/models/google/gemma-3-12b-it.toml @@ -5,7 +5,6 @@ last_updated = "2025-03-13" attachment = true reasoning = false temperature = true -knowledge = "2024-10" tool_call = false open_weights = true diff --git a/providers/novita-ai/models/google/gemma-4-26b-a4b-it.toml b/providers/novita-ai/models/google/gemma-4-26b-a4b-it.toml index 7bc2cc537..8ddfe8a97 100644 --- a/providers/novita-ai/models/google/gemma-4-26b-a4b-it.toml +++ b/providers/novita-ai/models/google/gemma-4-26b-a4b-it.toml @@ -6,6 +6,7 @@ attachment = true reasoning = true temperature = true tool_call = true +structured_output = true open_weights = true [cost] diff --git a/providers/novita-ai/models/google/gemma-4-31b-it.toml b/providers/novita-ai/models/google/gemma-4-31b-it.toml index f09240ddb..426813f03 100644 --- a/providers/novita-ai/models/google/gemma-4-31b-it.toml +++ b/providers/novita-ai/models/google/gemma-4-31b-it.toml @@ -6,6 +6,7 @@ attachment = true reasoning = true temperature = true tool_call = true +structured_output = true open_weights = true [cost] diff --git a/providers/novita-ai/models/inclusionai/ling-2.6-flash.toml b/providers/novita-ai/models/inclusionai/ling-2.6-flash.toml new file mode 100644 index 000000000..efb3d3621 --- /dev/null +++ b/providers/novita-ai/models/inclusionai/ling-2.6-flash.toml @@ -0,0 +1,23 @@ +name = "Ling-2.6-flash" +family = "ling" +release_date = "2026-04-24" +last_updated = "2026-04-24" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.1 +output = 0.3 +cache_read = 0.02 + +[limit] +context = 262_144 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/meta-llama/llama-3.2-3b-instruct.toml b/providers/novita-ai/models/meta-llama/llama-3.2-3b-instruct.toml index 9ad1ed1e5..28c9b40b9 100644 --- a/providers/novita-ai/models/meta-llama/llama-3.2-3b-instruct.toml +++ b/providers/novita-ai/models/meta-llama/llama-3.2-3b-instruct.toml @@ -6,7 +6,6 @@ attachment = false reasoning = false temperature = true tool_call = false -structured_output = true open_weights = true [cost] diff --git a/providers/novita-ai/models/moonshotai/kimi-k2.6.toml b/providers/novita-ai/models/moonshotai/kimi-k2.6.toml index a0820d644..377bf6fed 100644 --- a/providers/novita-ai/models/moonshotai/kimi-k2.6.toml +++ b/providers/novita-ai/models/moonshotai/kimi-k2.6.toml @@ -1,27 +1,2 @@ -name = "Kimi K2.6" -family = "kimi" -release_date = "2026-04-21" -last_updated = "2026-04-21" -attachment = true -reasoning = true -temperature = true -tool_call = true -structured_output = true -knowledge = "2025-01" -open_weights = true - -[cost] -input = 0.95 -output = 4.0 -cache_read = 0.16 - -[limit] -context = 262_144 -output = 262_144 - -[interleaved] -field = "reasoning_content" - -[modalities] -input = ["text", "image", "video"] -output = ["text"] +[extends] +from = "moonshotai/kimi-k2.6" diff --git a/providers/novita-ai/models/qwen/qwen3.6-27b.toml b/providers/novita-ai/models/qwen/qwen3.6-27b.toml deleted file mode 100644 index a53da6569..000000000 --- a/providers/novita-ai/models/qwen/qwen3.6-27b.toml +++ /dev/null @@ -1,26 +0,0 @@ -name = "Qwen3.6-27B" -family = "qwen3.6" -release_date = "2026-04-02" -last_updated = "2026-04-02" -attachment = true -reasoning = true -temperature = true -knowledge = "2025-04" -tool_call = true -structured_output = true -open_weights = false - -[interleaved] -field = "reasoning_content" - -[cost] -input = 0.6 -output = 3.6 - -[limit] -context = 262_144 -output = 65_536 - -[modalities] -input = ["text", "image", "video"] -output = ["text"]