2b:["$","div",null,{"className":"space-y-4 max-w-4xl mx-auto","children":[["$","div",null,{"className":"text-center","children":[["$","h2",null,{"className":"text-2xl font-bold","children":"Performance Metrics"}],["$","p",null,{"className":"text-muted-foreground","children":"Context window and performance specifications"}]]}],["$","$L31",null,{"modelA":{"modelId":"gpt-4.1-mini-2025-04-14","name":"GPT-4.1 mini","organizationId":"openai","fineTunedFromModelId":null,"description":"GPT-4.1 mini provides a balance between intelligence, speed, and cost. It's a significant leap in small model performance, even beating GPT-4o in many benchmarks while reducing latency and cost.","releaseDate":"2025-04-14","announcementDate":"2025-04-14","licenseId":"proprietary","multimodal":true,"knowledgeCutoff":"2024-05-31","paramCount":null,"trainingTokens":null,"contextWindow":null,"availableInZeroeval":true,"sourceApiRef":"https://platform.openai.com/docs/models/gpt-4.1-mini","sourcePlayground":"https://platform.openai.com/playground?mode=chat&model=gpt-4.1-mini","sourcePaper":null,"sourceScorecardBlogLink":"https://openai.com/index/gpt-4-1/","sourceRepoLink":null,"sourceWeightsLink":null,"modelFamilyId":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.821Z","updatedAt":"$D2025-07-19T19:49:05.821Z","organization":{"organizationId":"openai","name":"OpenAI","website":"https://openai.com","description":"Leading AI research company","country":"US","manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.815Z","updatedAt":"$D2025-07-19T19:49:05.815Z"},"license":{"licenseId":"proprietary","name":"Proprietary","allowCommercial":false,"description":"Proprietary license - usage restrictions apply","createdAt":"$D2025-07-19T19:49:05.425Z","updatedAt":"$D2025-07-19T19:49:05.425Z"},"benchmarks":[{"modelBenchmarkId":20999674,"benchmarkId":"aider-polyglot","modelId":"gpt-4.1-mini-2025-04-14","score":0.347,"normalizedScore":0.347,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.382Z","updatedAt":"$D2025-07-19T19:56:12.382Z","benchmark":{"benchmarkId":"aider-polyglot","name":"Aider-Polyglot","category":null}},{"modelBenchmarkId":19775831,"benchmarkId":"aider-polyglot-edit","modelId":"gpt-4.1-mini-2025-04-14","score":0.316,"normalizedScore":0.316,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.801Z","updatedAt":"$D2025-07-19T19:56:13.801Z","benchmark":{"benchmarkId":"aider-polyglot-edit","name":"Aider-Polyglot Edit","category":null}},{"modelBenchmarkId":50596634,"benchmarkId":"aime-2024","modelId":"gpt-4.1-mini-2025-04-14","score":0.496,"normalizedScore":0.496,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.013Z","updatedAt":"$D2025-07-19T19:56:12.013Z","benchmark":{"benchmarkId":"aime-2024","name":"AIME 2024","category":null}},{"modelBenchmarkId":19268144,"benchmarkId":"charxiv-d","modelId":"gpt-4.1-mini-2025-04-14","score":0.884,"normalizedScore":0.884,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.327Z","updatedAt":"$D2025-07-19T19:56:15.327Z","benchmark":{"benchmarkId":"charxiv-d","name":"CharXiv-D","category":null}},{"modelBenchmarkId":48682364,"benchmarkId":"charxiv-r","modelId":"gpt-4.1-mini-2025-04-14","score":0.568,"normalizedScore":0.568,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.195Z","updatedAt":"$D2025-07-19T19:56:15.195Z","benchmark":{"benchmarkId":"charxiv-r","name":"CharXiv-R","category":null}},{"modelBenchmarkId":54800268,"benchmarkId":"collie","modelId":"gpt-4.1-mini-2025-04-14","score":0.546,"normalizedScore":0.546,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.255Z","updatedAt":"$D2025-07-19T19:56:15.255Z","benchmark":{"benchmarkId":"collie","name":"COLLIE","category":null}},{"modelBenchmarkId":14464711,"benchmarkId":"complexfuncbench","modelId":"gpt-4.1-mini-2025-04-14","score":0.493,"normalizedScore":0.493,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.339Z","updatedAt":"$D2025-07-19T19:56:15.339Z","benchmark":{"benchmarkId":"complexfuncbench","name":"ComplexFuncBench","category":null}},{"modelBenchmarkId":63047684,"benchmarkId":"gpqa","modelId":"gpt-4.1-mini-2025-04-14","score":0.65,"normalizedScore":0.65,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Diamond","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.752Z","updatedAt":"$D2025-07-19T19:56:11.752Z","benchmark":{"benchmarkId":"gpqa","name":"GPQA","category":null}},{"modelBenchmarkId":81783465,"benchmarkId":"graphwalks-bfs-<128k","modelId":"gpt-4.1-mini-2025-04-14","score":0.617,"normalizedScore":0.617,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.289Z","updatedAt":"$D2025-07-19T19:56:15.289Z","benchmark":{"benchmarkId":"graphwalks-bfs-<128k","name":"Graphwalks BFS <128k","category":null}},{"modelBenchmarkId":23207414,"benchmarkId":"graphwalks-bfs->128k","modelId":"gpt-4.1-mini-2025-04-14","score":0.15,"normalizedScore":0.15,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.298Z","updatedAt":"$D2025-07-19T19:56:15.298Z","benchmark":{"benchmarkId":"graphwalks-bfs->128k","name":"Graphwalks BFS >128k","category":null}},{"modelBenchmarkId":62920483,"benchmarkId":"graphwalks-parents-<128k","modelId":"gpt-4.1-mini-2025-04-14","score":0.605,"normalizedScore":0.605,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.306Z","updatedAt":"$D2025-07-19T19:56:15.306Z","benchmark":{"benchmarkId":"graphwalks-parents-<128k","name":"Graphwalks parents <128k","category":null}},{"modelBenchmarkId":25881624,"benchmarkId":"graphwalks-parents->128k","modelId":"gpt-4.1-mini-2025-04-14","score":0.11,"normalizedScore":0.11,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.319Z","updatedAt":"$D2025-07-19T19:56:15.319Z","benchmark":{"benchmarkId":"graphwalks-parents->128k","name":"Graphwalks parents >128k","category":null}},{"modelBenchmarkId":13385197,"benchmarkId":"ifeval","modelId":"gpt-4.1-mini-2025-04-14","score":0.841,"normalizedScore":0.841,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.299Z","updatedAt":"$D2025-07-19T19:56:12.299Z","benchmark":{"benchmarkId":"ifeval","name":"IFEval","category":null}},{"modelBenchmarkId":98018770,"benchmarkId":"internal-api-instruction-following-(hard)","modelId":"gpt-4.1-mini-2025-04-14","score":0.451,"normalizedScore":0.451,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.225Z","updatedAt":"$D2025-07-19T19:56:15.225Z","benchmark":{"benchmarkId":"internal-api-instruction-following-(hard)","name":"Internal API instruction following (hard)","category":null}},{"modelBenchmarkId":55383595,"benchmarkId":"mathvista","modelId":"gpt-4.1-mini-2025-04-14","score":0.731,"normalizedScore":0.731,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.114Z","updatedAt":"$D2025-07-19T19:56:12.114Z","benchmark":{"benchmarkId":"mathvista","name":"MathVista","category":null}},{"modelBenchmarkId":87196944,"benchmarkId":"mmlu","modelId":"gpt-4.1-mini-2025-04-14","score":0.875,"normalizedScore":0.875,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.317Z","updatedAt":"$D2025-07-19T19:56:11.317Z","benchmark":{"benchmarkId":"mmlu","name":"MMLU","category":null}},{"modelBenchmarkId":57899708,"benchmarkId":"mmmlu","modelId":"gpt-4.1-mini-2025-04-14","score":0.785,"normalizedScore":0.785,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.157Z","updatedAt":"$D2025-07-19T19:56:14.157Z","benchmark":{"benchmarkId":"mmmlu","name":"MMMLU","category":null}},{"modelBenchmarkId":3263010,"benchmarkId":"mmmu","modelId":"gpt-4.1-mini-2025-04-14","score":0.727,"normalizedScore":0.727,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.217Z","updatedAt":"$D2025-07-19T19:56:12.217Z","benchmark":{"benchmarkId":"mmmu","name":"MMMU","category":null}},{"modelBenchmarkId":88024590,"benchmarkId":"multichallenge","modelId":"gpt-4.1-mini-2025-04-14","score":0.358,"normalizedScore":0.358,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark (GPT-4o grader)","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.555Z","updatedAt":"$D2025-07-19T19:56:12.555Z","benchmark":{"benchmarkId":"multichallenge","name":"Multi-Challenge","category":null}},{"modelBenchmarkId":31261885,"benchmarkId":"multichallenge-(o3-mini-grader)","modelId":"gpt-4.1-mini-2025-04-14","score":0.422,"normalizedScore":0.422,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark (o3-mini grader, see footnote [3])","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.239Z","updatedAt":"$D2025-07-19T19:56:15.239Z","benchmark":{"benchmarkId":"multichallenge-(o3-mini-grader)","name":"MultiChallenge (o3-mini grader)","category":null}},{"modelBenchmarkId":3507329,"benchmarkId":"multi-if","modelId":"gpt-4.1-mini-2025-04-14","score":0.67,"normalizedScore":0.67,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.643Z","updatedAt":"$D2025-07-19T19:56:14.643Z","benchmark":{"benchmarkId":"multi-if","name":"Multi-IF","category":null}},{"modelBenchmarkId":89233557,"benchmarkId":"openai-mrcr:-2-needle-128k","modelId":"gpt-4.1-mini-2025-04-14","score":0.472,"normalizedScore":0.472,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.270Z","updatedAt":"$D2025-07-19T19:56:15.270Z","benchmark":{"benchmarkId":"openai-mrcr:-2-needle-128k","name":"OpenAI-MRCR: 2 needle 128k","category":null}},{"modelBenchmarkId":55508918,"benchmarkId":"openai-mrcr:-2-needle-1m","modelId":"gpt-4.1-mini-2025-04-14","score":0.333,"normalizedScore":0.333,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.282Z","updatedAt":"$D2025-07-19T19:56:15.282Z","benchmark":{"benchmarkId":"openai-mrcr:-2-needle-1m","name":"OpenAI-MRCR: 2 needle 1M","category":null}},{"modelBenchmarkId":77208761,"benchmarkId":"swe-bench-verified","modelId":"gpt-4.1-mini-2025-04-14","score":0.236,"normalizedScore":0.236,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Internal methodology, see source footnote [2]","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.852Z","updatedAt":"$D2025-07-19T19:56:13.852Z","benchmark":{"benchmarkId":"swe-bench-verified","name":"SWE-Bench Verified","category":null}},{"modelBenchmarkId":33227965,"benchmarkId":"tau-bench-airline","modelId":"gpt-4.1-mini-2025-04-14","score":0.36,"normalizedScore":0.36,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Avg 5 runs, no custom tools/prompting (footnote [4])","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.007Z","updatedAt":"$D2025-07-19T19:56:15.007Z","benchmark":{"benchmarkId":"tau-bench-airline","name":"TAU-bench Airline","category":null}},{"modelBenchmarkId":856642,"benchmarkId":"tau-bench-retail","modelId":"gpt-4.1-mini-2025-04-14","score":0.558,"normalizedScore":0.558,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"Avg 5 runs, no custom tools/prompting (footnote [4], GPT-4o user model)","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.978Z","updatedAt":"$D2025-07-19T19:56:14.978Z","benchmark":{"benchmarkId":"tau-bench-retail","name":"TAU-bench Retail","category":null}},{"modelBenchmarkId":22930371,"benchmarkId":"aime-2025","modelId":"gpt-4.1-mini-2025-04-14","score":0.402,"normalizedScore":0.402,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"GPT-4.1 mini with no tools - Competition mathematics (AIME 2025).","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-24T12:00:00.000Z","updatedAt":"$D2025-07-24T12:00:00.000Z","benchmark":{"benchmarkId":"aime-2025","name":"AIME 2025","category":null}},{"modelBenchmarkId":72477603,"benchmarkId":"humanity's-last-exam","modelId":"gpt-4.1-mini-2025-04-14","score":0.037,"normalizedScore":0.037,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"GPT-4.1 mini with no tools - Expert-level questions across subjects.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-24T12:00:00.000Z","updatedAt":"$D2025-07-24T12:00:00.000Z","benchmark":{"benchmarkId":"humanity's-last-exam","name":"Humanity's Last Exam","category":null}},{"modelBenchmarkId":80376631,"benchmarkId":"hmmt-2025","modelId":"gpt-4.1-mini-2025-04-14","score":0.35,"normalizedScore":0.35,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/introducing-gpt-5-for-developers/","verifiedByLlmstats":false,"analysisMethod":"GPT-4.1 mini with no tools - Harvard-MIT Mathematics Tournament.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-24T12:00:00.000Z","updatedAt":"$D2025-07-24T12:00:00.000Z","benchmark":{"benchmarkId":"hmmt-2025","name":"HMMT 2025","category":null}}],"providers":[{"modelProviderId":96073975,"modelId":"gpt-4.1-mini-2025-04-14","providerId":"openai","providerModelIdUsed":"gpt-4.1-mini-2025-04-14","deprecatedAt":null,"inputCentsPerMillionTokens":40,"outputCentsPerMillionTokens":160,"quantization":null,"maxInputTokens":1047576,"maxOutputTokens":32768,"throughput":150,"latency":5,"featureWebSearch":false,"featureFunctionCalling":true,"featureStructuredOutput":true,"featureCodeExecution":false,"featureBatchInference":true,"featureFinetuning":false,"inputModalityText":true,"inputModalityImage":true,"inputModalityAudio":false,"inputModalityVideo":false,"outputModalityText":true,"outputModalityImage":false,"outputModalityAudio":false,"outputModalityVideo":false,"createdAt":"$D2025-07-19T19:49:17.152Z","updatedAt":"$D2025-07-19T19:49:17.152Z","modelName":"GPT-4.1 mini","organizationId":"openai","provider":{"providerId":"openai","name":"OpenAI","website":"https://openai.com","createdAt":"$D2025-07-19T19:49:17.121Z","updatedAt":"$D2025-07-19T19:49:17.121Z"}},{"modelProviderId":8813777,"modelId":"gpt-4.1-mini-2025-04-14","providerId":"zeroeval","providerModelIdUsed":"gpt-4.1-mini-2025-04-14","deprecatedAt":null,"inputCentsPerMillionTokens":40,"outputCentsPerMillionTokens":160,"quantization":null,"maxInputTokens":1047576,"maxOutputTokens":32768,"throughput":150,"latency":5,"featureWebSearch":false,"featureFunctionCalling":true,"featureStructuredOutput":true,"featureCodeExecution":false,"featureBatchInference":true,"featureFinetuning":false,"inputModalityText":true,"inputModalityImage":true,"inputModalityAudio":false,"inputModalityVideo":false,"outputModalityText":true,"outputModalityImage":false,"outputModalityAudio":false,"outputModalityVideo":false,"createdAt":"$D2025-07-19T19:49:17.174Z","updatedAt":"$D2025-07-19T19:49:17.174Z","modelName":"GPT-4.1 mini","organizationId":"openai","provider":{"providerId":"zeroeval","name":"ZeroEval","website":"https://zeroeval.com","createdAt":"$D2025-07-15T06:36:02.543Z","updatedAt":"$D2025-07-15T06:36:02.543Z"}}]},"modelB":{"modelId":"granite-4.0-tiny-preview","name":"IBM Granite 4.0 Tiny Preview","organizationId":"ibm","fineTunedFromModelId":null,"description":"A preliminary version of the smallest model in the upcoming Granite 4.0 family, released May 2025. It utilizes a novel hybrid Mamba-2/Transformer, fine-grained mixture of experts (MoE) architecture (7B total parameters, 1B active at inference). This preview version is partially trained (2.5T tokens) but demonstrates significant memory efficiency and performance potential, validated for at least 128K context length without positional encoding.","releaseDate":"2025-05-02","announcementDate":"2025-05-02","licenseId":"apache_2_0","multimodal":false,"knowledgeCutoff":null,"paramCount":"$n7000000000","trainingTokens":"$n2500000000000","contextWindow":null,"availableInZeroeval":true,"sourceApiRef":"https://www.ibm.com/granite/docs/","sourcePlayground":"https://www.ibm.com/granite/playground/","sourcePaper":null,"sourceScorecardBlogLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","sourceRepoLink":null,"sourceWeightsLink":"https://huggingface.co/ibm-granite/granite-4.0-tiny-preview","modelFamilyId":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.720Z","updatedAt":"$D2025-07-19T19:49:05.720Z","organization":{"organizationId":"ibm","name":"IBM","website":"https://ibm.com","description":"Technology and consulting company","country":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.719Z","updatedAt":"$D2025-07-19T19:49:05.719Z"},"license":{"licenseId":"apache_2_0","name":"Apache 2.0","allowCommercial":true,"description":"Apache License 2.0 - allows commercial use","createdAt":"$D2025-07-19T19:49:05.605Z","updatedAt":"$D2025-07-19T19:49:05.605Z"},"benchmarks":[{"modelBenchmarkId":84495703,"benchmarkId":"alpacaeval-2.0","modelId":"granite-4.0-tiny-preview","score":0.3516,"normalizedScore":0.3516,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/ibm-granite/granite-4.0-tiny-preview","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.045Z","updatedAt":"$D2025-07-19T19:56:15.045Z","benchmark":{"benchmarkId":"alpacaeval-2.0","name":"AlpacaEval 2.0","category":null}},{"modelBenchmarkId":31062309,"benchmarkId":"arena-hard","modelId":"granite-4.0-tiny-preview","score":0.267,"normalizedScore":0.267,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/ibm-granite/granite-4.0-tiny-preview","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.108Z","updatedAt":"$D2025-07-19T19:56:14.108Z","benchmark":{"benchmarkId":"arena-hard","name":"Arena Hard","category":null}},{"modelBenchmarkId":1453040,"benchmarkId":"attaq","modelId":"granite-4.0-tiny-preview","score":0.861,"normalizedScore":0.861,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.083Z","updatedAt":"$D2025-07-19T19:56:15.083Z","benchmark":{"benchmarkId":"attaq","name":"AttaQ","category":null}},{"modelBenchmarkId":27482610,"benchmarkId":"big-bench-hard","modelId":"granite-4.0-tiny-preview","score":0.557,"normalizedScore":0.557,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.247Z","updatedAt":"$D2025-07-19T19:56:13.247Z","benchmark":{"benchmarkId":"big-bench-hard","name":"BIG-Bench Hard","category":null}},{"modelBenchmarkId":64206389,"benchmarkId":"drop","modelId":"granite-4.0-tiny-preview","score":0.462,"normalizedScore":0.462,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.009Z","updatedAt":"$D2025-07-19T19:56:13.009Z","benchmark":{"benchmarkId":"drop","name":"DROP","category":null}},{"modelBenchmarkId":45229738,"benchmarkId":"gsm8k","modelId":"granite-4.0-tiny-preview","score":0.701,"normalizedScore":0.701,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.094Z","updatedAt":"$D2025-07-19T19:56:13.094Z","benchmark":{"benchmarkId":"gsm8k","name":"GSM8k","category":null}},{"modelBenchmarkId":3067633,"benchmarkId":"humaneval","modelId":"granite-4.0-tiny-preview","score":0.824,"normalizedScore":0.824,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.663Z","updatedAt":"$D2025-07-19T19:56:12.663Z","benchmark":{"benchmarkId":"humaneval","name":"HumanEval","category":null}},{"modelBenchmarkId":74880951,"benchmarkId":"humaneval+","modelId":"granite-4.0-tiny-preview","score":0.783,"normalizedScore":0.783,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.074Z","updatedAt":"$D2025-07-19T19:56:14.074Z","benchmark":{"benchmarkId":"humaneval+","name":"HumanEval+","category":null}},{"modelBenchmarkId":33454641,"benchmarkId":"ifeval","modelId":"granite-4.0-tiny-preview","score":0.63,"normalizedScore":0.63,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.285Z","updatedAt":"$D2025-07-19T19:56:12.285Z","benchmark":{"benchmarkId":"ifeval","name":"IFEval","category":null}},{"modelBenchmarkId":5288234,"benchmarkId":"mmlu","modelId":"granite-4.0-tiny-preview","score":0.604,"normalizedScore":0.604,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.287Z","updatedAt":"$D2025-07-19T19:56:11.287Z","benchmark":{"benchmarkId":"mmlu","name":"MMLU","category":null}},{"modelBenchmarkId":87015563,"benchmarkId":"popqa","modelId":"granite-4.0-tiny-preview","score":0.229,"normalizedScore":0.229,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.075Z","updatedAt":"$D2025-07-19T19:56:15.075Z","benchmark":{"benchmarkId":"popqa","name":"PopQA","category":null}},{"modelBenchmarkId":20402547,"benchmarkId":"truthfulqa","modelId":"granite-4.0-tiny-preview","score":0.581,"normalizedScore":0.581,"isSelfReported":true,"selfReportedSourceLink":"https://www.ibm.com/new/announcements/ibm-granite-4-0-tiny-preview-sneak-peek","verifiedByLlmstats":false,"analysisMethod":"Score","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.358Z","updatedAt":"$D2025-07-19T19:56:11.358Z","benchmark":{"benchmarkId":"truthfulqa","name":"TruthfulQA","category":null}}],"providers":[]},"commonBenchmarks":[{"benchmarkId":"aider-polyglot","name":"Aider-Polyglot","category":null,"modelA":0.347,"modelB":0},{"benchmarkId":"aider-polyglot-edit","name":"Aider-Polyglot Edit","category":null,"modelA":0.316,"modelB":0},{"benchmarkId":"aime-2024","name":"AIME 2024","category":null,"modelA":0.496,"modelB":0},{"benchmarkId":"charxiv-d","name":"CharXiv-D","category":null,"modelA":0.884,"modelB":0},{"benchmarkId":"charxiv-r","name":"CharXiv-R","category":null,"modelA":0.568,"modelB":0},{"benchmarkId":"collie","name":"COLLIE","category":null,"modelA":0.546,"modelB":0},{"benchmarkId":"complexfuncbench","name":"ComplexFuncBench","category":null,"modelA":0.493,"modelB":0},{"benchmarkId":"gpqa","name":"GPQA","category":null,"modelA":0.65,"modelB":0},{"benchmarkId":"graphwalks-bfs-<128k","name":"Graphwalks BFS <128k","category":null,"modelA":0.617,"modelB":0},{"benchmarkId":"graphwalks-bfs->128k","name":"Graphwalks BFS >128k","category":null,"modelA":0.15,"modelB":0},{"benchmarkId":"graphwalks-parents-<128k","name":"Graphwalks parents <128k","category":null,"modelA":0.605,"modelB":0},{"benchmarkId":"graphwalks-parents->128k","name":"Graphwalks parents >128k","category":null,"modelA":0.11,"modelB":0},{"benchmarkId":"ifeval","name":"IFEval","category":null,"modelA":0.841,"modelB":0.63},{"benchmarkId":"internal-api-instruction-following-(hard)","name":"Internal API instruction following (hard)","category":null,"modelA":0.451,"modelB":0},{"benchmarkId":"mathvista","name":"MathVista","category":null,"modelA":0.731,"modelB":0},{"benchmarkId":"mmlu","name":"MMLU","category":null,"modelA":0.875,"modelB":0.604},{"benchmarkId":"mmmlu","name":"MMMLU","category":null,"modelA":0.785,"modelB":0},{"benchmarkId":"mmmu","name":"MMMU","category":null,"modelA":0.727,"modelB":0},{"benchmarkId":"multichallenge","name":"Multi-Challenge","category":null,"modelA":0.358,"modelB":0},{"benchmarkId":"multichallenge-(o3-mini-grader)","name":"MultiChallenge (o3-mini grader)","category":null,"modelA":0.422,"modelB":0},{"benchmarkId":"multi-if","name":"Multi-IF","category":null,"modelA":0.67,"modelB":0},{"benchmarkId":"openai-mrcr:-2-needle-128k","name":"OpenAI-MRCR: 2 needle 128k","category":null,"modelA":0.472,"modelB":0},{"benchmarkId":"openai-mrcr:-2-needle-1m","name":"OpenAI-MRCR: 2 needle 1M","category":null,"modelA":0.333,"modelB":0},{"benchmarkId":"swe-bench-verified","name":"SWE-Bench Verified","category":null,"modelA":0.236,"modelB":0},{"benchmarkId":"tau-bench-airline","name":"TAU-bench Airline","category":null,"modelA":0.36,"modelB":0},{"benchmarkId":"tau-bench-retail","name":"TAU-bench Retail","category":null,"modelA":0.558,"modelB":0},{"benchmarkId":"aime-2025","name":"AIME 2025","category":null,"modelA":0.402,"modelB":0},{"benchmarkId":"humanity's-last-exam","name":"Humanity's Last Exam","category":null,"modelA":0.037,"modelB":0},{"benchmarkId":"hmmt-2025","name":"HMMT 2025","category":null,"modelA":0.35,"modelB":0},{"benchmarkId":"alpacaeval-2.0","name":"AlpacaEval 2.0","category":null,"modelA":0,"modelB":0.3516},{"benchmarkId":"arena-hard","name":"Arena Hard","category":null,"modelA":0,"modelB":0.267},{"benchmarkId":"attaq","name":"AttaQ","category":null,"modelA":0,"modelB":0.861},{"benchmarkId":"big-bench-hard","name":"BIG-Bench Hard","category":null,"modelA":0,"modelB":0.557},{"benchmarkId":"drop","name":"DROP","category":null,"modelA":0,"modelB":0.462},{"benchmarkId":"gsm8k","name":"GSM8k","category":null,"modelA":0,"modelB":0.701},{"benchmarkId":"humaneval","name":"HumanEval","category":null,"modelA":0,"modelB":0.824},{"benchmarkId":"humaneval+","name":"HumanEval+","category":null,"modelA":0,"modelB":0.783},{"benchmarkId":"popqa","name":"PopQA","category":null,"modelA":0,"modelB":0.229},{"benchmarkId":"truthfulqa","name":"TruthfulQA","category":null,"modelA":0,"modelB":0.581}]}],"$L32"]}]

GPT-4.1 mini vs IBM Granite 4.0 Tiny Preview

Performance Metrics

Provider Availability & Performance