NeurIPS 2025 E2LM Competition: Early Training Evaluation of Language Models Leaderboard

{
  • "headers": [
    • "Submission ID",
    • "Team",
    • "Submitter",
    • "Signal Quality",
    • "Ranking Consistency",
    • "Scientific Compliance",
    • "Global Score",
    • "Submission Time",
    • "Description"
    ],
  • "data": [
    • [
      • "18ce18709a",
      • "Nobelist",
      • "pkuHaowei",
      • 0.96,
      • 0.84,
      • 0.42,
      • 0.73,
      • "2025-08-19T06:05:53",
      • "Another MMLU-Var test with updated hf_token"
      ],
    • [
      • "22fb4b9aa6",
      • "ShAIkespear",
      • "ESmike",
      • 0.16,
      • 0.49,
      • 0.07,
      • 0.16,
      • "2025-09-10T19:25:19",
      • "Second Test"
      ],
    • [
      • "5845c5c8be",
      • "morai",
      • "giovanivaldrighi",
      • 0.26,
      • 0.72,
      • 0.24,
      • 0.3,
      • "2025-08-22T11:53:41",
      • "Task focused in STEM topics for MMLU using prompt engineering."
      ]
    ],
  • "metadata": null
}