diff --git a/providers/huawei-cloud-maas/models/DeepSeek-V3.toml b/providers/huawei-cloud-maas/models/DeepSeek-V3.toml
new file mode 100644
index 000000000..b851e486a
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/DeepSeek-V3.toml
@@ -0,0 +1,23 @@
+name = "DeepSeek V3"
+family = "deepseek"
+release_date = "2025-09-29"
+last_updated = "2026-05-12"
+attachment = false
+reasoning = false
+temperature = true
+knowledge = "2024-07"
+tool_call = true
+open_weights = true
+
+[cost]
+input = 0.27
+output = 1.078
+
+[limit]
+context = 128_000
+input = 128_000
+output = 64_000
+
+[modalities]
+input = ["text"]
+output = ["text"]
diff --git a/providers/huawei-cloud-maas/models/deepseek-r1-250528.toml b/providers/huawei-cloud-maas/models/deepseek-r1-250528.toml
new file mode 100644
index 000000000..422fae4f9
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/deepseek-r1-250528.toml
@@ -0,0 +1,26 @@
+name = "DeepSeek R1 0528"
+family = "deepseek-thinking"
+release_date = "2025-09-29"
+last_updated = "2026-05-12"
+attachment = false
+reasoning = true
+temperature = false
+knowledge = "2024-07"
+tool_call = true
+open_weights = true
+
+[interleaved]
+field = "reasoning_content"
+
+[cost]
+input = 0.539
+output = 2.156
+
+[limit]
+context = 128_000
+input = 96_000
+output = 32_000
+
+[modalities]
+input = ["text"]
+output = ["text"]
diff --git a/providers/huawei-cloud-maas/models/deepseek-v3.1-terminus.toml b/providers/huawei-cloud-maas/models/deepseek-v3.1-terminus.toml
new file mode 100644
index 000000000..1cbdcc555
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/deepseek-v3.1-terminus.toml
@@ -0,0 +1,26 @@
+name = "DeepSeek V3.1"
+family = "deepseek-thinking"
+release_date = "2025-11-24"
+last_updated = "2026-05-12"
+attachment = false
+reasoning = true
+temperature = true
+knowledge = "2024-07"
+tool_call = true
+open_weights = true
+
+[interleaved]
+field = "reasoning_content"
+
+[cost]
+input = 0.539
+output = 1.617
+
+[limit]
+context = 128_000
+input = 96_000
+output = 32_000
+
+[modalities]
+input = ["text"]
+output = ["text"]
diff --git a/providers/huawei-cloud-maas/models/deepseek-v3.2.toml b/providers/huawei-cloud-maas/models/deepseek-v3.2.toml
new file mode 100644
index 000000000..a36ccedd8
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/deepseek-v3.2.toml
@@ -0,0 +1,26 @@
+name = "DeepSeek V3.2"
+family = "deepseek-thinking"
+release_date = "2025-12-15"
+last_updated = "2026-05-12"
+attachment = false
+reasoning = true
+temperature = true
+knowledge = "2024-07"
+tool_call = true
+open_weights = true
+
+[interleaved]
+field = "reasoning_content"
+
+[cost]
+input = 0.27
+output = 0.404
+
+[limit]
+context = 160_000
+input = 128_000
+output = 32_000
+
+[modalities]
+input = ["text"]
+output = ["text"]
diff --git a/providers/huawei-cloud-maas/models/deepseek-v4-flash.toml b/providers/huawei-cloud-maas/models/deepseek-v4-flash.toml
new file mode 100644
index 000000000..01ca98675
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/deepseek-v4-flash.toml
@@ -0,0 +1,14 @@
+last_updated = "2026-05-12"
+
+[extends]
+from = "deepseek/deepseek-v4-flash"
+omit = ["cost.cache_read", "structured_output"]
+
+[cost]
+input = 0.135
+output = 0.27
+
+[limit]
+context = 1_000_000
+input = 1_000_000
+output = 128_000
diff --git a/providers/huawei-cloud-maas/models/deepseek-v4-pro.toml b/providers/huawei-cloud-maas/models/deepseek-v4-pro.toml
new file mode 100644
index 000000000..c3d043190
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/deepseek-v4-pro.toml
@@ -0,0 +1,14 @@
+last_updated = "2026-05-12"
+
+[extends]
+from = "deepseek/deepseek-v4-pro"
+omit = ["cost.cache_read", "structured_output"]
+
+[cost]
+input = 1.617
+output = 3.235
+
+[limit]
+context = 1_000_000
+input = 1_000_000
+output = 128_000
diff --git a/providers/huawei-cloud-maas/models/glm-5.1.toml b/providers/huawei-cloud-maas/models/glm-5.1.toml
new file mode 100644
index 000000000..e7907b113
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/glm-5.1.toml
@@ -0,0 +1,20 @@
+release_date = "2026-04-07"
+last_updated = "2026-05-12"
+
+[extends]
+from = "zai/glm-5.1"
+omit = ["cost.cache_read", "cost.cache_write", "structured_output"]
+
+[cost]
+input = 0.809
+output = 3.235
+
+[[cost.tiers]]
+tier = { size = 32_000 }
+input = 1.078
+output = 3.774
+
+[limit]
+context = 198_000
+input = 192_000
+output = 128_000
diff --git a/providers/huawei-cloud-maas/models/glm-5.toml b/providers/huawei-cloud-maas/models/glm-5.toml
new file mode 100644
index 000000000..99635cc03
--- /dev/null
+++ b/providers/huawei-cloud-maas/models/glm-5.toml
@@ -0,0 +1,20 @@
+release_date = "2026-02-12"
+last_updated = "2026-05-12"
+
+[extends]
+from = "zai/glm-5"
+omit = ["cost.cache_read", "cost.cache_write"]
+
+[cost]
+input = 0.539
+output = 2.426
+
+[[cost.tiers]]
+tier = { size = 32_000 }
+input = 0.809
+output = 2.965
+
+[limit]
+context = 198_000
+input = 192_000
+output = 64_000
diff --git a/providers/huawei-cloud-maas/provider.toml b/providers/huawei-cloud-maas/provider.toml
new file mode 100644
index 000000000..ad0173871
--- /dev/null
+++ b/providers/huawei-cloud-maas/provider.toml
@@ -0,0 +1,5 @@
+name = "Huawei Cloud MaaS"
+env = ["HUAWEI_CLOUD_MAAS_API_KEY"]
+npm = "@ai-sdk/openai-compatible"
+api = "https://api-ap-southeast-1.modelarts-maas.com/openai/v1"
+doc = "https://support.huaweicloud.com/intl/en-us/model-call-maas/model-call-021.html"