2b:["$","div",null,{"className":"space-y-4 max-w-4xl mx-auto","children":[["$","div",null,{"className":"text-center","children":[["$","h2",null,{"className":"text-2xl font-bold","children":"Performance Metrics"}],["$","p",null,{"className":"text-muted-foreground","children":"Context window and performance specifications"}]]}],["$","$L30",null,{"modelA":{"modelId":"gemma-3n-e2b-it","name":"Gemma 3n E2B Instructed","organizationId":"google","fineTunedFromModelId":null,"description":"$31","releaseDate":"2025-06-26","announcementDate":"2025-06-26","licenseId":"proprietary","multimodal":true,"knowledgeCutoff":"2024-06-01","paramCount":"$n8000000000","trainingTokens":"$n11000000000000","contextWindow":null,"availableInZeroeval":true,"sourceApiRef":"https://huggingface.co/blog/gemma3n","sourcePlayground":"https://aistudio.google.com/","sourcePaper":null,"sourceScorecardBlogLink":"https://ai.google.dev/gemma/docs/gemma-3n","sourceRepoLink":null,"sourceWeightsLink":"https://huggingface.co/google/gemma-3n-E2B-it","modelFamilyId":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.541Z","updatedAt":"$D2025-07-19T19:49:05.541Z","organization":{"organizationId":"google","name":"Google","website":"https://google.com","description":"Technology giant with AI research","country":"US","manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.437Z","updatedAt":"$D2025-07-19T19:49:05.437Z"},"license":{"licenseId":"proprietary","name":"Proprietary","allowCommercial":false,"description":"Proprietary license - usage restrictions apply","createdAt":"$D2025-07-19T19:49:05.425Z","updatedAt":"$D2025-07-19T19:49:05.425Z"},"benchmarks":[{"modelBenchmarkId":73331332,"benchmarkId":"aime-2025","modelId":"gemma-3n-e2b-it","score":0.067,"normalizedScore":0.067,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"Accuracy. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.437Z","updatedAt":"$D2025-07-19T19:56:12.437Z","benchmark":{"benchmarkId":"aime-2025","name":"AIME 2025","category":null}},{"modelBenchmarkId":16591705,"benchmarkId":"codegolf-v2.2","modelId":"gemma-3n-e2b-it","score":0.11,"normalizedScore":0.11,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"pass@1. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.787Z","updatedAt":"$D2025-07-19T19:56:13.787Z","benchmark":{"benchmarkId":"codegolf-v2.2","name":"Codegolf v2.2","category":null}},{"modelBenchmarkId":79591241,"benchmarkId":"eclektic","modelId":"gemma-3n-e2b-it","score":0.025,"normalizedScore":0.025,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"0-shot","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.575Z","updatedAt":"$D2025-07-19T19:56:13.575Z","benchmark":{"benchmarkId":"eclektic","name":"ECLeKTic","category":null}},{"modelBenchmarkId":25709715,"benchmarkId":"global-mmlu","modelId":"gemma-3n-e2b-it","score":0.551,"normalizedScore":0.551,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"0-shot","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.758Z","updatedAt":"$D2025-07-19T19:56:13.758Z","benchmark":{"benchmarkId":"global-mmlu","name":"Global-MMLU","category":null}},{"modelBenchmarkId":89220103,"benchmarkId":"global-mmlu-lite","modelId":"gemma-3n-e2b-it","score":0.59,"normalizedScore":0.59,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"Accuracy. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.560Z","updatedAt":"$D2025-07-19T19:56:13.560Z","benchmark":{"benchmarkId":"global-mmlu-lite","name":"Global-MMLU-Lite","category":null}},{"modelBenchmarkId":77750193,"benchmarkId":"gpqa","modelId":"gemma-3n-e2b-it","score":0.248,"normalizedScore":0.248,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"Diamond. 0-shot","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.641Z","updatedAt":"$D2025-07-19T19:56:11.641Z","benchmark":{"benchmarkId":"gpqa","name":"GPQA","category":null}},{"modelBenchmarkId":55000073,"benchmarkId":"hiddenmath","modelId":"gemma-3n-e2b-it","score":0.277,"normalizedScore":0.277,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"Accuracy. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.451Z","updatedAt":"$D2025-07-19T19:56:13.451Z","benchmark":{"benchmarkId":"hiddenmath","name":"HiddenMath","category":null}},{"modelBenchmarkId":13910732,"benchmarkId":"humaneval","modelId":"gemma-3n-e2b-it","score":0.665,"normalizedScore":0.665,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"pass@1. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.626Z","updatedAt":"$D2025-07-19T19:56:12.626Z","benchmark":{"benchmarkId":"humaneval","name":"HumanEval","category":null}},{"modelBenchmarkId":65008584,"benchmarkId":"include","modelId":"gemma-3n-e2b-it","score":0.386,"normalizedScore":0.386,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"0-shot","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.735Z","updatedAt":"$D2025-07-19T19:56:13.735Z","benchmark":{"benchmarkId":"include","name":"Include","category":null}},{"modelBenchmarkId":95105332,"benchmarkId":"livecodebench","modelId":"gemma-3n-e2b-it","score":0.132,"normalizedScore":0.132,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"pass@1. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.320Z","updatedAt":"$D2025-07-19T19:56:13.320Z","benchmark":{"benchmarkId":"livecodebench","name":"LiveCodeBench","category":null}},{"modelBenchmarkId":90227300,"benchmarkId":"livecodebench-v5","modelId":"gemma-3n-e2b-it","score":0.186,"normalizedScore":0.186,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"pass@1. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.777Z","updatedAt":"$D2025-07-19T19:56:13.777Z","benchmark":{"benchmarkId":"livecodebench-v5","name":"LiveCodeBench v5","category":null}},{"modelBenchmarkId":44312292,"benchmarkId":"mbpp","modelId":"gemma-3n-e2b-it","score":0.566,"normalizedScore":0.566,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"pass@1. 3-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.477Z","updatedAt":"$D2025-07-19T19:56:13.477Z","benchmark":{"benchmarkId":"mbpp","name":"MBPP","category":null}},{"modelBenchmarkId":82423968,"benchmarkId":"mgsm","modelId":"gemma-3n-e2b-it","score":0.531,"normalizedScore":0.531,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"0-shot","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.679Z","updatedAt":"$D2025-07-19T19:56:13.679Z","benchmark":{"benchmarkId":"mgsm","name":"MGSM","category":null}},{"modelBenchmarkId":78409353,"benchmarkId":"mmlu","modelId":"gemma-3n-e2b-it","score":0.601,"normalizedScore":0.601,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"Accuracy. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.234Z","updatedAt":"$D2025-07-19T19:56:11.234Z","benchmark":{"benchmarkId":"mmlu","name":"MMLU","category":null}},{"modelBenchmarkId":5201026,"benchmarkId":"mmlu-pro","modelId":"gemma-3n-e2b-it","score":0.405,"normalizedScore":0.405,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"Accuracy. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.439Z","updatedAt":"$D2025-07-19T19:56:11.439Z","benchmark":{"benchmarkId":"mmlu-pro","name":"MMLU-Pro","category":null}},{"modelBenchmarkId":35031274,"benchmarkId":"mmlu-prox","modelId":"gemma-3n-e2b-it","score":0.081,"normalizedScore":0.081,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"0-shot","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.746Z","updatedAt":"$D2025-07-19T19:56:13.746Z","benchmark":{"benchmarkId":"mmlu-prox","name":"MMLU-ProX","category":null}},{"modelBenchmarkId":32299646,"benchmarkId":"openai-mmlu","modelId":"gemma-3n-e2b-it","score":0.223,"normalizedScore":0.223,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"0-shot","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.047Z","updatedAt":"$D2025-07-19T19:56:14.047Z","benchmark":{"benchmarkId":"openai-mmlu","name":"OpenAI MMLU","category":null}},{"modelBenchmarkId":84702041,"benchmarkId":"wmt24++","modelId":"gemma-3n-e2b-it","score":0.427,"normalizedScore":0.427,"isSelfReported":true,"selfReportedSourceLink":"https://huggingface.co/google/gemma-3n-E2B-it","verifiedByLlmstats":false,"analysisMethod":"Character-level F-score. 0-shot.","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.592Z","updatedAt":"$D2025-07-19T19:56:13.592Z","benchmark":{"benchmarkId":"wmt24++","name":"WMT24++","category":null}}],"providers":[]},"modelB":{"modelId":"gpt-4.1-nano-2025-04-14","name":"GPT-4.1 nano","organizationId":"openai","fineTunedFromModelId":null,"description":"GPT-4.1 nano is OpenAI's fastest and cheapest model available in the GPT-4.1 family. It delivers exceptional performance at a small size with its 1 million token context window. Ideal for tasks like classification or autocompletion.","releaseDate":"2025-04-14","announcementDate":"2025-04-14","licenseId":"proprietary","multimodal":true,"knowledgeCutoff":"2024-05-31","paramCount":null,"trainingTokens":null,"contextWindow":null,"availableInZeroeval":true,"sourceApiRef":"https://platform.openai.com/docs/models/gpt-4.1-nano","sourcePlayground":"https://platform.openai.com/playground?mode=chat&model=gpt-4.1-nano","sourcePaper":null,"sourceScorecardBlogLink":"https://openai.com/index/gpt-4-1/","sourceRepoLink":null,"sourceWeightsLink":null,"modelFamilyId":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.827Z","updatedAt":"$D2025-07-19T19:49:05.827Z","organization":{"organizationId":"openai","name":"OpenAI","website":"https://openai.com","description":"Leading AI research company","country":"US","manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:49:05.815Z","updatedAt":"$D2025-07-19T19:49:05.815Z"},"license":{"licenseId":"proprietary","name":"Proprietary","allowCommercial":false,"description":"Proprietary license - usage restrictions apply","createdAt":"$D2025-07-19T19:49:05.425Z","updatedAt":"$D2025-07-19T19:49:05.425Z"},"benchmarks":[{"modelBenchmarkId":28966632,"benchmarkId":"gpqa","modelId":"gpt-4.1-nano-2025-04-14","score":0.503,"normalizedScore":0.503,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Diamond","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.756Z","updatedAt":"$D2025-07-19T19:56:11.756Z","benchmark":{"benchmarkId":"gpqa","name":"GPQA","category":null}},{"modelBenchmarkId":50563589,"benchmarkId":"aider-polyglot","modelId":"gpt-4.1-nano-2025-04-14","score":0.098,"normalizedScore":0.098,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.385Z","updatedAt":"$D2025-07-19T19:56:12.385Z","benchmark":{"benchmarkId":"aider-polyglot","name":"Aider-Polyglot","category":null}},{"modelBenchmarkId":40228686,"benchmarkId":"aider-polyglot-edit","modelId":"gpt-4.1-nano-2025-04-14","score":0.062,"normalizedScore":0.062,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:13.804Z","updatedAt":"$D2025-07-19T19:56:13.804Z","benchmark":{"benchmarkId":"aider-polyglot-edit","name":"Aider-Polyglot Edit","category":null}},{"modelBenchmarkId":79685580,"benchmarkId":"aime-2024","modelId":"gpt-4.1-nano-2025-04-14","score":0.294,"normalizedScore":0.294,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.016Z","updatedAt":"$D2025-07-19T19:56:12.016Z","benchmark":{"benchmarkId":"aime-2024","name":"AIME 2024","category":null}},{"modelBenchmarkId":60968493,"benchmarkId":"charxiv-d","modelId":"gpt-4.1-nano-2025-04-14","score":0.739,"normalizedScore":0.739,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.329Z","updatedAt":"$D2025-07-19T19:56:15.329Z","benchmark":{"benchmarkId":"charxiv-d","name":"CharXiv-D","category":null}},{"modelBenchmarkId":69763687,"benchmarkId":"charxiv-r","modelId":"gpt-4.1-nano-2025-04-14","score":0.405,"normalizedScore":0.405,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.199Z","updatedAt":"$D2025-07-19T19:56:15.199Z","benchmark":{"benchmarkId":"charxiv-r","name":"CharXiv-R","category":null}},{"modelBenchmarkId":57873323,"benchmarkId":"collie","modelId":"gpt-4.1-nano-2025-04-14","score":0.425,"normalizedScore":0.425,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.257Z","updatedAt":"$D2025-07-19T19:56:15.257Z","benchmark":{"benchmarkId":"collie","name":"COLLIE","category":null}},{"modelBenchmarkId":24000327,"benchmarkId":"complexfuncbench","modelId":"gpt-4.1-nano-2025-04-14","score":0.057,"normalizedScore":0.057,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.341Z","updatedAt":"$D2025-07-19T19:56:15.341Z","benchmark":{"benchmarkId":"complexfuncbench","name":"ComplexFuncBench","category":null}},{"modelBenchmarkId":10683071,"benchmarkId":"graphwalks-bfs-<128k","modelId":"gpt-4.1-nano-2025-04-14","score":0.25,"normalizedScore":0.25,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.291Z","updatedAt":"$D2025-07-19T19:56:15.291Z","benchmark":{"benchmarkId":"graphwalks-bfs-<128k","name":"Graphwalks BFS <128k","category":null}},{"modelBenchmarkId":79823219,"benchmarkId":"graphwalks-bfs->128k","modelId":"gpt-4.1-nano-2025-04-14","score":0.029,"normalizedScore":0.029,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.300Z","updatedAt":"$D2025-07-19T19:56:15.300Z","benchmark":{"benchmarkId":"graphwalks-bfs->128k","name":"Graphwalks BFS >128k","category":null}},{"modelBenchmarkId":53356392,"benchmarkId":"graphwalks-parents-<128k","modelId":"gpt-4.1-nano-2025-04-14","score":0.094,"normalizedScore":0.094,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.308Z","updatedAt":"$D2025-07-19T19:56:15.308Z","benchmark":{"benchmarkId":"graphwalks-parents-<128k","name":"Graphwalks parents <128k","category":null}},{"modelBenchmarkId":73650664,"benchmarkId":"graphwalks-parents->128k","modelId":"gpt-4.1-nano-2025-04-14","score":0.056,"normalizedScore":0.056,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.322Z","updatedAt":"$D2025-07-19T19:56:15.322Z","benchmark":{"benchmarkId":"graphwalks-parents->128k","name":"Graphwalks parents >128k","category":null}},{"modelBenchmarkId":99668791,"benchmarkId":"ifeval","modelId":"gpt-4.1-nano-2025-04-14","score":0.745,"normalizedScore":0.745,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.300Z","updatedAt":"$D2025-07-19T19:56:12.300Z","benchmark":{"benchmarkId":"ifeval","name":"IFEval","category":null}},{"modelBenchmarkId":50707194,"benchmarkId":"internal-api-instruction-following-(hard)","modelId":"gpt-4.1-nano-2025-04-14","score":0.316,"normalizedScore":0.316,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.227Z","updatedAt":"$D2025-07-19T19:56:15.227Z","benchmark":{"benchmarkId":"internal-api-instruction-following-(hard)","name":"Internal API instruction following (hard)","category":null}},{"modelBenchmarkId":63845223,"benchmarkId":"mathvista","modelId":"gpt-4.1-nano-2025-04-14","score":0.562,"normalizedScore":0.562,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.117Z","updatedAt":"$D2025-07-19T19:56:12.117Z","benchmark":{"benchmarkId":"mathvista","name":"MathVista","category":null}},{"modelBenchmarkId":3334690,"benchmarkId":"mmlu","modelId":"gpt-4.1-nano-2025-04-14","score":0.801,"normalizedScore":0.801,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:11.319Z","updatedAt":"$D2025-07-19T19:56:11.319Z","benchmark":{"benchmarkId":"mmlu","name":"MMLU","category":null}},{"modelBenchmarkId":15269168,"benchmarkId":"mmmlu","modelId":"gpt-4.1-nano-2025-04-14","score":0.669,"normalizedScore":0.669,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.159Z","updatedAt":"$D2025-07-19T19:56:14.159Z","benchmark":{"benchmarkId":"mmmlu","name":"MMMLU","category":null}},{"modelBenchmarkId":66885700,"benchmarkId":"mmmu","modelId":"gpt-4.1-nano-2025-04-14","score":0.554,"normalizedScore":0.554,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.220Z","updatedAt":"$D2025-07-19T19:56:12.220Z","benchmark":{"benchmarkId":"mmmu","name":"MMMU","category":null}},{"modelBenchmarkId":92717299,"benchmarkId":"multichallenge","modelId":"gpt-4.1-nano-2025-04-14","score":0.15,"normalizedScore":0.15,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark (GPT-4o grader)","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:12.557Z","updatedAt":"$D2025-07-19T19:56:12.557Z","benchmark":{"benchmarkId":"multichallenge","name":"Multi-Challenge","category":null}},{"modelBenchmarkId":1209227,"benchmarkId":"multichallenge-(o3-mini-grader)","modelId":"gpt-4.1-nano-2025-04-14","score":0.311,"normalizedScore":0.311,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark (o3-mini grader, see footnote [3])","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.241Z","updatedAt":"$D2025-07-19T19:56:15.241Z","benchmark":{"benchmarkId":"multichallenge-(o3-mini-grader)","name":"MultiChallenge (o3-mini grader)","category":null}},{"modelBenchmarkId":63618984,"benchmarkId":"multi-if","modelId":"gpt-4.1-nano-2025-04-14","score":0.572,"normalizedScore":0.572,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Standard benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.645Z","updatedAt":"$D2025-07-19T19:56:14.645Z","benchmark":{"benchmarkId":"multi-if","name":"Multi-IF","category":null}},{"modelBenchmarkId":47892249,"benchmarkId":"openai-mrcr:-2-needle-128k","modelId":"gpt-4.1-nano-2025-04-14","score":0.366,"normalizedScore":0.366,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.272Z","updatedAt":"$D2025-07-19T19:56:15.272Z","benchmark":{"benchmarkId":"openai-mrcr:-2-needle-128k","name":"OpenAI-MRCR: 2 needle 128k","category":null}},{"modelBenchmarkId":40440719,"benchmarkId":"openai-mrcr:-2-needle-1m","modelId":"gpt-4.1-nano-2025-04-14","score":0.12,"normalizedScore":0.12,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Internal benchmark","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.284Z","updatedAt":"$D2025-07-19T19:56:15.284Z","benchmark":{"benchmarkId":"openai-mrcr:-2-needle-1m","name":"OpenAI-MRCR: 2 needle 1M","category":null}},{"modelBenchmarkId":33929639,"benchmarkId":"tau-bench-airline","modelId":"gpt-4.1-nano-2025-04-14","score":0.14,"normalizedScore":0.14,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Avg 5 runs, no custom tools/prompting (footnote [4])","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:15.011Z","updatedAt":"$D2025-07-19T19:56:15.011Z","benchmark":{"benchmarkId":"tau-bench-airline","name":"TAU-bench Airline","category":null}},{"modelBenchmarkId":73811397,"benchmarkId":"tau-bench-retail","modelId":"gpt-4.1-nano-2025-04-14","score":0.226,"normalizedScore":0.226,"isSelfReported":true,"selfReportedSourceLink":"https://openai.com/index/gpt-4-1/","verifiedByLlmstats":false,"analysisMethod":"Avg 5 runs, no custom tools/prompting (footnote [4], GPT-4o user model)","verificationProviderId":null,"verificationHardware":null,"verificationDate":null,"verificationNotes":null,"manualEdits":null,"editedBy":null,"editedAt":null,"createdAt":"$D2025-07-19T19:56:14.982Z","updatedAt":"$D2025-07-19T19:56:14.982Z","benchmark":{"benchmarkId":"tau-bench-retail","name":"TAU-bench Retail","category":null}}],"providers":[{"modelProviderId":95388903,"modelId":"gpt-4.1-nano-2025-04-14","providerId":"openai","providerModelIdUsed":"gpt-4.1-nano-2025-04-14","deprecatedAt":null,"inputCentsPerMillionTokens":10,"outputCentsPerMillionTokens":40,"quantization":null,"maxInputTokens":1047576,"maxOutputTokens":32768,"throughput":200,"latency":2,"featureWebSearch":false,"featureFunctionCalling":true,"featureStructuredOutput":true,"featureCodeExecution":false,"featureBatchInference":true,"featureFinetuning":false,"inputModalityText":true,"inputModalityImage":true,"inputModalityAudio":false,"inputModalityVideo":false,"outputModalityText":true,"outputModalityImage":false,"outputModalityAudio":false,"outputModalityVideo":false,"createdAt":"$D2025-07-19T19:49:17.154Z","updatedAt":"$D2025-07-19T19:49:17.154Z","modelName":"GPT-4.1 nano","organizationId":"openai","provider":{"providerId":"openai","name":"OpenAI","website":"https://openai.com","createdAt":"$D2025-07-19T19:49:17.121Z","updatedAt":"$D2025-07-19T19:49:17.121Z"}}]},"commonBenchmarks":[{"benchmarkId":"aime-2025","name":"AIME 2025","category":null,"modelA":0.067,"modelB":0},{"benchmarkId":"codegolf-v2.2","name":"Codegolf v2.2","category":null,"modelA":0.11,"modelB":0},{"benchmarkId":"eclektic","name":"ECLeKTic","category":null,"modelA":0.025,"modelB":0},{"benchmarkId":"global-mmlu","name":"Global-MMLU","category":null,"modelA":0.551,"modelB":0},{"benchmarkId":"global-mmlu-lite","name":"Global-MMLU-Lite","category":null,"modelA":0.59,"modelB":0},{"benchmarkId":"gpqa","name":"GPQA","category":null,"modelA":0.248,"modelB":0.503},{"benchmarkId":"hiddenmath","name":"HiddenMath","category":null,"modelA":0.277,"modelB":0},{"benchmarkId":"humaneval","name":"HumanEval","category":null,"modelA":0.665,"modelB":0},{"benchmarkId":"include","name":"Include","category":null,"modelA":0.386,"modelB":0},{"benchmarkId":"livecodebench","name":"LiveCodeBench","category":null,"modelA":0.132,"modelB":0},{"benchmarkId":"livecodebench-v5","name":"LiveCodeBench v5","category":null,"modelA":0.186,"modelB":0},{"benchmarkId":"mbpp","name":"MBPP","category":null,"modelA":0.566,"modelB":0},{"benchmarkId":"mgsm","name":"MGSM","category":null,"modelA":0.531,"modelB":0},{"benchmarkId":"mmlu","name":"MMLU","category":null,"modelA":0.601,"modelB":0.801},{"benchmarkId":"mmlu-pro","name":"MMLU-Pro","category":null,"modelA":0.405,"modelB":0},{"benchmarkId":"mmlu-prox","name":"MMLU-ProX","category":null,"modelA":0.081,"modelB":0},{"benchmarkId":"openai-mmlu","name":"OpenAI MMLU","category":null,"modelA":0.223,"modelB":0},{"benchmarkId":"wmt24++","name":"WMT24++","category":null,"modelA":0.427,"modelB":0},{"benchmarkId":"aider-polyglot","name":"Aider-Polyglot","category":null,"modelA":0,"modelB":0.098},{"benchmarkId":"aider-polyglot-edit","name":"Aider-Polyglot Edit","category":null,"modelA":0,"modelB":0.062},{"benchmarkId":"aime-2024","name":"AIME 2024","category":null,"modelA":0,"modelB":0.294},{"benchmarkId":"charxiv-d","name":"CharXiv-D","category":null,"modelA":0,"modelB":0.739},{"benchmarkId":"charxiv-r","name":"CharXiv-R","category":null,"modelA":0,"modelB":0.405},{"benchmarkId":"collie","name":"COLLIE","category":null,"modelA":0,"modelB":0.425},{"benchmarkId":"complexfuncbench","name":"ComplexFuncBench","category":null,"modelA":0,"modelB":0.057},{"benchmarkId":"graphwalks-bfs-<128k","name":"Graphwalks BFS <128k","category":null,"modelA":0,"modelB":0.25},{"benchmarkId":"graphwalks-bfs->128k","name":"Graphwalks BFS >128k","category":null,"modelA":0,"modelB":0.029},{"benchmarkId":"graphwalks-parents-<128k","name":"Graphwalks parents <128k","category":null,"modelA":0,"modelB":0.094},{"benchmarkId":"graphwalks-parents->128k","name":"Graphwalks parents >128k","category":null,"modelA":0,"modelB":0.056},{"benchmarkId":"ifeval","name":"IFEval","category":null,"modelA":0,"modelB":0.745},{"benchmarkId":"internal-api-instruction-following-(hard)","name":"Internal API instruction following (hard)","category":null,"modelA":0,"modelB":0.316},{"benchmarkId":"mathvista","name":"MathVista","category":null,"modelA":0,"modelB":0.562},{"benchmarkId":"mmmlu","name":"MMMLU","category":null,"modelA":0,"modelB":0.669},{"benchmarkId":"mmmu","name":"MMMU","category":null,"modelA":0,"modelB":0.554},{"benchmarkId":"multichallenge","name":"Multi-Challenge","category":null,"modelA":0,"modelB":0.15},{"benchmarkId":"multichallenge-(o3-mini-grader)","name":"MultiChallenge (o3-mini grader)","category":null,"modelA":0,"modelB":0.311},{"benchmarkId":"multi-if","name":"Multi-IF","category":null,"modelA":0,"modelB":0.572},{"benchmarkId":"openai-mrcr:-2-needle-128k","name":"OpenAI-MRCR: 2 needle 128k","category":null,"modelA":0,"modelB":0.366},{"benchmarkId":"openai-mrcr:-2-needle-1m","name":"OpenAI-MRCR: 2 needle 1M","category":null,"modelA":0,"modelB":0.12},{"benchmarkId":"tau-bench-airline","name":"TAU-bench Airline","category":null,"modelA":0,"modelB":0.14},{"benchmarkId":"tau-bench-retail","name":"TAU-bench Retail","category":null,"modelA":0,"modelB":0.226}]}],"$L32"]}]

Gemma 3n E2B Instructed vs GPT-4.1 nano

Performance Metrics

Provider Availability & Performance