From a414765865c57211c2003411a834a72ea75ad6fb Mon Sep 17 00:00:00 2001 From: wassel alazhar Date: Fri, 12 Jun 2026 19:08:15 +0200 Subject: [PATCH 1/3] Update Umans AI Coding Plan and add Umans AI (pay-per-token) provider Umans AI Coding Plan (subscription): - Add umans-kimi-k2.7 (Kimi K2.7 Code) model - Add umans-flash-beta (deprecated alias for umans-flash) - Fix umans-glm-5.1: add vision modality (via handoff) and interleaved reasoning - Fix umans-flash: add interleaved reasoning field - Fix umans-qwen3.6-35b-a3b: add interleaved reasoning field - Add reasoning_options to all models - Add explicit name field to models using base_model Umans AI (new provider - pay-per-token for orgs): - New provider for organization service-account usage - Per-token pricing from the org billing page: - Kimi K2.6: $0.95/$4.00 (input/output), $0.20 cache read - Kimi K2.7 Code: $0.95/$4.00, $0.19 cache read - GLM 5.1: $1.40/$4.40, $0.29 cache read - Umans Flash (Qwen3.6-35B-A3B): $0.15/$1.00, $0.05 cache read - Umans Coder: routes to Kimi K2.6 rates - Same endpoint (api.code.umans.ai), different billing model --- .../models/umans-coder.toml | 2 +- .../models/umans-flash-beta.toml | 18 ++++++++++++ .../models/umans-flash.toml | 5 +++- .../models/umans-glm-5.1.toml | 4 +++ .../models/umans-kimi-k2.6.toml | 6 ++-- .../models/umans-kimi-k2.7.toml | 12 ++++++++ .../models/umans-qwen3.6-35b-a3b.toml | 5 +++- providers/umans-ai/logo.svg | 29 +++++++++++++++++++ providers/umans-ai/models/umans-coder.toml | 17 +++++++++++ providers/umans-ai/models/umans-flash.toml | 17 +++++++++++ providers/umans-ai/models/umans-glm-5.1.toml | 18 ++++++++++++ .../umans-ai/models/umans-kimi-k2.6.toml | 14 +++++++++ .../umans-ai/models/umans-kimi-k2.7.toml | 14 +++++++++ providers/umans-ai/provider.toml | 5 ++++ 14 files changed, 159 insertions(+), 7 deletions(-) create mode 100644 providers/umans-ai-coding-plan/models/umans-flash-beta.toml create mode 100644
providers/umans-ai-coding-plan/models/umans-kimi-k2.7.toml create mode 100644 providers/umans-ai/logo.svg create mode 100644 providers/umans-ai/models/umans-coder.toml create mode 100644 providers/umans-ai/models/umans-flash.toml create mode 100644 providers/umans-ai/models/umans-glm-5.1.toml create mode 100644 providers/umans-ai/models/umans-kimi-k2.6.toml create mode 100644 providers/umans-ai/models/umans-kimi-k2.7.toml create mode 100644 providers/umans-ai/provider.toml diff --git a/providers/umans-ai-coding-plan/models/umans-coder.toml b/providers/umans-ai-coding-plan/models/umans-coder.toml index 6f9cab75a9..a5a37bbf48 100644 --- a/providers/umans-ai-coding-plan/models/umans-coder.toml +++ b/providers/umans-ai-coding-plan/models/umans-coder.toml @@ -1,6 +1,6 @@ base_model = "moonshotai/kimi-k2.6" name = "Umans Coder" -temperature = false +reasoning_options = [{ type = "toggle" }] [interleaved] field = "reasoning_content" diff --git a/providers/umans-ai-coding-plan/models/umans-flash-beta.toml b/providers/umans-ai-coding-plan/models/umans-flash-beta.toml new file mode 100644 index 0000000000..8ab3c44b6b --- /dev/null +++ b/providers/umans-ai-coding-plan/models/umans-flash-beta.toml @@ -0,0 +1,18 @@ +base_model = "alibaba/qwen3.6-35b-a3b" +name = "Umans Flash Beta (deprecated)" +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" + +[cost] +input = 0 +output = 0 +cache_read = 0 +cache_write = 0 + +[limit] +output = 262_144 + +[modalities] +input = ["text", "image"] diff --git a/providers/umans-ai-coding-plan/models/umans-flash.toml b/providers/umans-ai-coding-plan/models/umans-flash.toml index 2c3c61f7b6..0b4bdf1af4 100644 --- a/providers/umans-ai-coding-plan/models/umans-flash.toml +++ b/providers/umans-ai-coding-plan/models/umans-flash.toml @@ -1,6 +1,9 @@ base_model = "alibaba/qwen3.6-35b-a3b" name = "Umans Flash" -temperature = false +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" 
[cost] input = 0 diff --git a/providers/umans-ai-coding-plan/models/umans-glm-5.1.toml b/providers/umans-ai-coding-plan/models/umans-glm-5.1.toml index 33237f3481..ff343e1e7f 100644 --- a/providers/umans-ai-coding-plan/models/umans-glm-5.1.toml +++ b/providers/umans-ai-coding-plan/models/umans-glm-5.1.toml @@ -1,5 +1,6 @@ base_model = "zhipuai/glm-5.1" name = "GLM 5.1" +reasoning_options = [{ type = "toggle" }] [interleaved] field = "reasoning_content" @@ -12,3 +13,6 @@ cache_write = 0 [limit] context = 204_800 + +[modalities] +input = ["text", "image"] diff --git a/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml b/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml index 321bfb0d5b..5e5d6a1185 100644 --- a/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml +++ b/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml @@ -1,5 +1,6 @@ base_model = "moonshotai/kimi-k2.6" -temperature = false +name = "Kimi K2.6" +reasoning_options = [{ type = "toggle" }] [interleaved] field = "reasoning_content" @@ -9,6 +10,3 @@ input = 0 output = 0 cache_read = 0 cache_write = 0 - -[modalities] -input = ["text", "image"] diff --git a/providers/umans-ai-coding-plan/models/umans-kimi-k2.7.toml b/providers/umans-ai-coding-plan/models/umans-kimi-k2.7.toml new file mode 100644 index 0000000000..6b066993ee --- /dev/null +++ b/providers/umans-ai-coding-plan/models/umans-kimi-k2.7.toml @@ -0,0 +1,12 @@ +base_model = "moonshotai/kimi-k2.7-code" +name = "Kimi K2.7 Code" +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" + +[cost] +input = 0 +output = 0 +cache_read = 0 +cache_write = 0 diff --git a/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml b/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml index 4743836bbe..dea5a2f6f1 100644 --- a/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml +++ b/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml @@ -1,6 +1,9 @@ base_model 
= "alibaba/qwen3.6-35b-a3b" name = "Qwen3.6 35B A3B" -temperature = false +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" [cost] input = 0 diff --git a/providers/umans-ai/logo.svg b/providers/umans-ai/logo.svg new file mode 100644 index 0000000000..511d4de99e --- /dev/null +++ b/providers/umans-ai/logo.svg @@ -0,0 +1,29 @@ + + + + + + + + + + + + + + + + + + + + + diff --git a/providers/umans-ai/models/umans-coder.toml b/providers/umans-ai/models/umans-coder.toml new file mode 100644 index 0000000000..a5f43d806a --- /dev/null +++ b/providers/umans-ai/models/umans-coder.toml @@ -0,0 +1,17 @@ +base_model = "moonshotai/kimi-k2.6" +name = "Umans Coder" +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" + +[cost] +input = 0.95 +output = 4.00 +cache_read = 0.20 + +[limit] +output = 32_768 + +[modalities] +input = ["text", "image"] diff --git a/providers/umans-ai/models/umans-flash.toml b/providers/umans-ai/models/umans-flash.toml new file mode 100644 index 0000000000..e4d7527c1c --- /dev/null +++ b/providers/umans-ai/models/umans-flash.toml @@ -0,0 +1,17 @@ +base_model = "alibaba/qwen3.6-35b-a3b" +name = "Umans Flash" +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" + +[cost] +input = 0.15 +output = 1.00 +cache_read = 0.05 + +[limit] +output = 32_768 + +[modalities] +input = ["text", "image"] diff --git a/providers/umans-ai/models/umans-glm-5.1.toml b/providers/umans-ai/models/umans-glm-5.1.toml new file mode 100644 index 0000000000..35efd66ebc --- /dev/null +++ b/providers/umans-ai/models/umans-glm-5.1.toml @@ -0,0 +1,18 @@ +base_model = "zhipuai/glm-5.1" +name = "GLM 5.1" +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" + +[cost] +input = 1.40 +output = 4.40 +cache_read = 0.29 + +[limit] +context = 204_800 +output = 131_072 + +[modalities] +input = ["text", "image"] diff --git 
a/providers/umans-ai/models/umans-kimi-k2.6.toml b/providers/umans-ai/models/umans-kimi-k2.6.toml new file mode 100644 index 0000000000..936d7b99f3 --- /dev/null +++ b/providers/umans-ai/models/umans-kimi-k2.6.toml @@ -0,0 +1,14 @@ +base_model = "moonshotai/kimi-k2.6" +name = "Kimi K2.6" +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" + +[cost] +input = 0.95 +output = 4.00 +cache_read = 0.20 + +[limit] +output = 32_768 diff --git a/providers/umans-ai/models/umans-kimi-k2.7.toml b/providers/umans-ai/models/umans-kimi-k2.7.toml new file mode 100644 index 0000000000..35aa47af5a --- /dev/null +++ b/providers/umans-ai/models/umans-kimi-k2.7.toml @@ -0,0 +1,14 @@ +base_model = "moonshotai/kimi-k2.7-code" +name = "Kimi K2.7 Code" +reasoning_options = [{ type = "toggle" }] + +[interleaved] +field = "reasoning_content" + +[cost] +input = 0.95 +output = 4.00 +cache_read = 0.19 + +[limit] +output = 32_768 diff --git a/providers/umans-ai/provider.toml b/providers/umans-ai/provider.toml new file mode 100644 index 0000000000..50c077cd38 --- /dev/null +++ b/providers/umans-ai/provider.toml @@ -0,0 +1,5 @@ +name = "Umans AI" +env = ["UMANS_AI_API_KEY"] +npm = "@ai-sdk/openai-compatible" +doc = "https://app.umans.ai/offers/code/docs/orgs" +api = "https://api.code.umans.ai/v1" From 735e5f7f08dafa544336327e97a17fcf49aafef9 Mon Sep 17 00:00:00 2001 From: wassel alazhar Date: Fri, 12 Jun 2026 19:16:05 +0200 Subject: [PATCH 2/3] Remove umans-flash-beta from Coding Plan (deprecated, sunset 2026-06-07) --- .../models/umans-flash-beta.toml | 18 ------------------ 1 file changed, 18 deletions(-) delete mode 100644 providers/umans-ai-coding-plan/models/umans-flash-beta.toml diff --git a/providers/umans-ai-coding-plan/models/umans-flash-beta.toml b/providers/umans-ai-coding-plan/models/umans-flash-beta.toml deleted file mode 100644 index 8ab3c44b6b..0000000000 --- a/providers/umans-ai-coding-plan/models/umans-flash-beta.toml +++ /dev/null @@ -1,18 +0,0 
@@ -base_model = "alibaba/qwen3.6-35b-a3b" -name = "Umans Flash Beta (deprecated)" -reasoning_options = [{ type = "toggle" }] - -[interleaved] -field = "reasoning_content" - -[cost] -input = 0 -output = 0 -cache_read = 0 -cache_write = 0 - -[limit] -output = 262_144 - -[modalities] -input = ["text", "image"] From 9fdad9f497ab176ece206f64a9e009095470e267 Mon Sep 17 00:00:00 2001 From: wassel alazhar Date: Fri, 12 Jun 2026 19:28:31 +0200 Subject: [PATCH 3/3] Add temperature = false for Kimi and Flash models (locked by Umans) --- providers/umans-ai-coding-plan/models/umans-coder.toml | 1 + providers/umans-ai-coding-plan/models/umans-flash.toml | 1 + providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml | 1 + providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml | 1 + providers/umans-ai/models/umans-coder.toml | 1 + providers/umans-ai/models/umans-flash.toml | 1 + providers/umans-ai/models/umans-kimi-k2.6.toml | 1 + 7 files changed, 7 insertions(+) diff --git a/providers/umans-ai-coding-plan/models/umans-coder.toml b/providers/umans-ai-coding-plan/models/umans-coder.toml index a5a37bbf48..8d4f7fa501 100644 --- a/providers/umans-ai-coding-plan/models/umans-coder.toml +++ b/providers/umans-ai-coding-plan/models/umans-coder.toml @@ -1,5 +1,6 @@ base_model = "moonshotai/kimi-k2.6" name = "Umans Coder" +temperature = false reasoning_options = [{ type = "toggle" }] [interleaved] diff --git a/providers/umans-ai-coding-plan/models/umans-flash.toml b/providers/umans-ai-coding-plan/models/umans-flash.toml index 0b4bdf1af4..31a3e8c262 100644 --- a/providers/umans-ai-coding-plan/models/umans-flash.toml +++ b/providers/umans-ai-coding-plan/models/umans-flash.toml @@ -1,5 +1,6 @@ base_model = "alibaba/qwen3.6-35b-a3b" name = "Umans Flash" +temperature = false reasoning_options = [{ type = "toggle" }] [interleaved] diff --git a/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml b/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml index 
5e5d6a1185..f1c2d0def6 100644 --- a/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml +++ b/providers/umans-ai-coding-plan/models/umans-kimi-k2.6.toml @@ -1,5 +1,6 @@ base_model = "moonshotai/kimi-k2.6" name = "Kimi K2.6" +temperature = false reasoning_options = [{ type = "toggle" }] [interleaved] diff --git a/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml b/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml index dea5a2f6f1..8ca6e3ee2b 100644 --- a/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml +++ b/providers/umans-ai-coding-plan/models/umans-qwen3.6-35b-a3b.toml @@ -1,5 +1,6 @@ base_model = "alibaba/qwen3.6-35b-a3b" name = "Qwen3.6 35B A3B" +temperature = false reasoning_options = [{ type = "toggle" }] [interleaved] diff --git a/providers/umans-ai/models/umans-coder.toml b/providers/umans-ai/models/umans-coder.toml index a5f43d806a..c7675426ad 100644 --- a/providers/umans-ai/models/umans-coder.toml +++ b/providers/umans-ai/models/umans-coder.toml @@ -1,5 +1,6 @@ base_model = "moonshotai/kimi-k2.6" name = "Umans Coder" +temperature = false reasoning_options = [{ type = "toggle" }] [interleaved] diff --git a/providers/umans-ai/models/umans-flash.toml b/providers/umans-ai/models/umans-flash.toml index e4d7527c1c..b0becf0ef2 100644 --- a/providers/umans-ai/models/umans-flash.toml +++ b/providers/umans-ai/models/umans-flash.toml @@ -1,5 +1,6 @@ base_model = "alibaba/qwen3.6-35b-a3b" name = "Umans Flash" +temperature = false reasoning_options = [{ type = "toggle" }] [interleaved] diff --git a/providers/umans-ai/models/umans-kimi-k2.6.toml b/providers/umans-ai/models/umans-kimi-k2.6.toml index 936d7b99f3..a8b29dd850 100644 --- a/providers/umans-ai/models/umans-kimi-k2.6.toml +++ b/providers/umans-ai/models/umans-kimi-k2.6.toml @@ -1,5 +1,6 @@ base_model = "moonshotai/kimi-k2.6" name = "Kimi K2.6" +temperature = false reasoning_options = [{ type = "toggle" }] [interleaved]