Files
param-hub-python/data/models.json

223 lines
5.7 KiB
JSON
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
[
{
"id": "gpt4",
"name": "GPT-4",
"organization": "OpenAI",
"parameters": 1760,
"architecture": "Transformer",
"context_length": 8192,
"input_price": 0.03,
"output_price": 0.06,
"mmlu": 86.4,
"humaneval": 67,
"is_open_source": false,
"license": "Proprietary",
"description": "OpenAI最强大的多模态大模型",
"created_at": "2024-01-01",
"updated_at": "2026-04-28 11:57:02",
"raw_text": "\nGPT-4 Turbo version with 128K context length, price is $10 per 1M input tokens",
"subcategory_id": "chat",
"views": 0,
"images": [],
"publish_date": "2023-03-14"
},
{
"id": "gpt4turbo",
"name": "GPT-4 Turbo",
"organization": "OpenAI",
"parameters": 1760,
"architecture": "Transformer",
"context_length": 128000,
"input_price": 0.01,
"output_price": 0.03,
"mmlu": 86.4,
"humaneval": 67.0,
"is_open_source": false,
"license": "Proprietary",
"description": "GPT-4增强版128K上下文",
"created_at": "2024-01-01",
"subcategory_id": "chat",
"publish_date": "2023-11-06"
},
{
"id": "gpt35",
"name": "GPT-3.5 Turbo",
"organization": "OpenAI",
"parameters": 175,
"architecture": "Transformer",
"context_length": 16385,
"input_price": 0.0005,
"output_price": 0.0015,
"mmlu": 70.0,
"humaneval": 48.1,
"is_open_source": false,
"license": "Proprietary",
"description": "性价比高的通用模型",
"created_at": "2024-01-01",
"subcategory_id": "chat",
"publish_date": "2023-03-01"
},
{
"id": "claude3opus",
"name": "Claude 3 Opus",
"organization": "Anthropic",
"parameters": 400,
"architecture": "Transformer",
"context_length": 200000,
"input_price": 0.015,
"output_price": 0.075,
"mmlu": 86.8,
"humaneval": 84.9,
"is_open_source": false,
"license": "Proprietary",
"description": "Anthropic最强模型200K上下文",
"created_at": "2024-01-01",
"subcategory_id": "code",
"publish_date": "2024-03-04"
},
{
"id": "claude3sonnet",
"name": "Claude 3 Sonnet",
"organization": "Anthropic",
"parameters": 175,
"architecture": "Transformer",
"context_length": 200000,
"input_price": 0.003,
"output_price": 0.015,
"mmlu": 79.0,
"humaneval": 73.0,
"is_open_source": false,
"license": "Proprietary",
"description": "平衡性能与成本",
"created_at": "2024-01-01",
"subcategory_id": "chat",
"publish_date": "2024-03-04"
},
{
"id": "llama270b",
"name": "Llama 2 70B",
"organization": "Meta",
"parameters": 70,
"architecture": "Transformer",
"context_length": 4096,
"input_price": 0,
"output_price": 0,
"mmlu": 69.8,
"humaneval": 29.9,
"is_open_source": true,
"license": "Llama 2 Community",
"description": "Meta开源大模型70B参数",
"created_at": "2024-01-01",
"subcategory_id": "chat",
"publish_date": "2023-07-18"
},
{
"id": "llama3",
"name": "Llama 3 70B",
"organization": "Meta",
"parameters": 70,
"architecture": "Transformer",
"context_length": 8192,
"input_price": 0,
"output_price": 0,
"mmlu": 82.0,
"humaneval": 81.7,
"is_open_source": true,
"license": "Llama 3 Community",
"description": "Meta最新开源模型性能接近GPT-4",
"created_at": "2024-01-01",
"subcategory_id": "code",
"publish_date": "2024-04-18"
},
{
"id": "mistral7b",
"name": "Mistral 7B",
"organization": "Mistral AI",
"parameters": 7,
"architecture": "Transformer",
"context_length": 32768,
"input_price": 0,
"output_price": 0,
"mmlu": 62.5,
"humaneval": 26.8,
"is_open_source": true,
"license": "Apache 2.0",
"description": "小巧高效的开源模型",
"created_at": "2024-01-01",
"subcategory_id": "chat",
"publish_date": "2023-09-27"
},
{
"id": "mixtral8x7b",
"name": "Mixtral 8x7B",
"organization": "Mistral AI",
"parameters": 47,
"architecture": "MoE",
"context_length": 32768,
"input_price": 0,
"output_price": 0,
"mmlu": 70.6,
"humaneval": 40.2,
"is_open_source": true,
"license": "Apache 2.0",
"description": "MoE架构高效推理",
"created_at": "2024-01-01",
"subcategory_id": "chat",
"publish_date": "2023-12-11"
},
{
"id": "qwen72b",
"name": "Qwen 72B",
"organization": "Alibaba",
"parameters": 72,
"architecture": "Transformer",
"context_length": 32768,
"input_price": 0,
"output_price": 0,
"mmlu": 83.1,
"humaneval": 65.4,
"is_open_source": true,
"license": "Apache 2.0",
"description": "阿里开源大模型,中文能力强",
"created_at": "2024-01-01",
"subcategory_id": "chat",
"publish_date": "2024-02-05"
},
{
"id": "deepseekv3",
"name": "DeepSeek V3",
"organization": "DeepSeek",
"parameters": 685,
"architecture": "MoE",
"context_length": 128000,
"input_price": 0.00014,
"output_price": 0.00028,
"mmlu": 88.5,
"humaneval": 86.2,
"is_open_source": true,
"license": "MIT",
"description": "DeepSeek最新模型性价比极高",
"created_at": "2024-01-01",
"subcategory_id": "code",
"publish_date": "2024-12-26"
},
{
"id": "glm4",
"name": "GLM-4",
"organization": "Zhipu AI",
"parameters": 130,
"architecture": "Transformer",
"context_length": 128000,
"input_price": 0.014,
"output_price": 0.014,
"mmlu": 81.0,
"humaneval": 70.0,
"is_open_source": false,
"license": "Proprietary",
"description": "智谱AI大模型中文能力强",
"created_at": "2024-01-01",
"visible": true,
"subcategory_id": "chat",
"publish_date": "2024-01-01"
}
]