SaylorTwift's picture
SaylorTwift HF Staff
It's not really pretty; make it better. Also, I want the bottom part of the cards to be hidden and only shown when clicking the card.
77bb77e verified
<!DOCTYPE html>
<html lang="en">
<head>
  <meta charset="UTF-8">
  <meta name="viewport" content="width=device-width, initial-scale=1.0">
  <title>EvalFlip - AI Benchmark Universe</title>
  <link rel="stylesheet" href="style.css">
  <link href="https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&display=swap" rel="stylesheet">
  <script src="https://cdn.tailwindcss.com"></script>
  <!-- Feather Icons: load from a single CDN. A second copy would only
       re-download the library and redefine the same global. -->
  <script src="https://cdn.jsdelivr.net/npm/feather-icons/dist/feather.min.js"></script>
  <!-- Project scripts (contents not shown in this file). navbar.js presumably
       registers the <custom-navbar> element used in the body; verify. -->
  <script src="components/navbar.js"></script>
  <script src="components/footer.js"></script>
  <script src="script.js"></script>
</head>
<body class="bg-gray-50 min-h-screen flex flex-col">
<custom-navbar></custom-navbar>
<main class="flex-grow container mx-auto px-4 py-8">
<h1 class="text-4xl font-bold text-center mb-12 text-gray-800">AI Benchmark Universe</h1>
<div class="grid grid-cols-1 md:grid-cols-2 lg:grid-cols-3 gap-8">
<!-- GSM8k Benchmark Card -->
<!-- Two-faced card: .card-front holds the summary, .card-back holds the details.
     The .eval-card / .card-inner / .badge styling and any click behaviour come
     from style.css and script.js, which are not part of this file. -->
<div class="eval-card" data-eval="gsm8k">
  <div class="card-inner">
    <!-- Front face: title, tagline, topic badges and dataset size. -->
    <div class="card-front bg-indigo-600 text-white p-6 rounded-xl shadow-xl flex flex-col justify-between">
      <div>
        <div class="flex items-center gap-2 mb-4">
          <!-- Icons are decorative (text sits next to each one), so hide them from assistive tech. -->
          <i class="w-6 h-6" data-feather="cpu" aria-hidden="true"></i>
          <h2 class="text-2xl font-bold">GSM8k</h2>
        </div>
        <p class="text-indigo-100 mb-4">Grade School Math with 8.5K problems</p>
        <div class="flex flex-wrap gap-2">
          <span class="badge">Mathematics</span>
          <span class="badge">Reasoning</span>
        </div>
      </div>
      <div class="mt-4 text-sm text-indigo-200 flex items-center gap-1">
        <i data-feather="database" aria-hidden="true"></i>
        <span>8,500 examples</span>
      </div>
    </div>
    <!-- Back face: long description, evaluation type and a sample prompt.
         The padding utility must be spelled with an ASCII hyphen (p-6) for Tailwind to match it. -->
    <div class="card-back bg-white p-6 rounded-xl shadow-xl flex flex-col justify-between">
      <div>
        <h2 class="text-2xl font-bold text-indigo-600 mb-4">GSM8k Details</h2>
        <p class="text-gray-700 mb-4">A benchmark for mathematical reasoning, testing grade school math problems requiring multi-step reasoning.</p>
        <div class="space-y-3">
          <div>
            <h3 class="font-semibold text-gray-800">Evaluation Type:</h3>
            <p class="text-gray-600">Mathematics, Reasoning</p>
          </div>
          <div>
            <h3 class="font-semibold text-gray-800">Example:</h3>
            <p class="text-gray-600">"John has 5 apples. He gives 2 to Mary and buys 3 more. How many does he have now?"</p>
          </div>
        </div>
      </div>
      <a href="#" class="text-indigo-600 hover:text-indigo-800 text-sm flex items-center gap-1">
        <i data-feather="external-link" aria-hidden="true"></i>
        <span>View Full Details</span>
      </a>
    </div>
  </div>
</div>
<!-- GPQA Benchmark Card -->
<!-- Two-faced card: .card-front holds the summary, .card-back holds the details.
     The .eval-card / .card-inner / .badge styling and any click behaviour come
     from style.css and script.js, which are not part of this file. -->
<div class="eval-card" data-eval="gpqa">
  <div class="card-inner">
    <!-- Front face: title, tagline, topic badges and dataset scope. -->
    <div class="card-front bg-emerald-600 text-white p-6 rounded-xl shadow-xl flex flex-col justify-between">
      <div>
        <div class="flex items-center gap-2 mb-4">
          <!-- Icons are decorative (text sits next to each one), so hide them from assistive tech. -->
          <i class="w-6 h-6" data-feather="book" aria-hidden="true"></i>
          <h2 class="text-2xl font-bold">GPQA</h2>
        </div>
        <p class="text-emerald-100 mb-4">General Purpose Question Answering</p>
        <div class="flex flex-wrap gap-2">
          <span class="badge">QA</span>
          <span class="badge">Knowledge</span>
        </div>
      </div>
      <div class="mt-4 text-sm text-emerald-200 flex items-center gap-1">
        <i data-feather="database" aria-hidden="true"></i>
        <span>Multi-domain</span>
      </div>
    </div>
    <!-- Back face: long description, evaluation type and a sample prompt.
         The padding utility must be spelled with an ASCII hyphen (p-6) for Tailwind to match it. -->
    <div class="card-back bg-white p-6 rounded-xl shadow-xl flex flex-col justify-between">
      <div>
        <h2 class="text-2xl font-bold text-emerald-600 mb-4">GPQA Details</h2>
        <p class="text-gray-700 mb-4">A comprehensive benchmark testing general knowledge across multiple domains.</p>
        <div class="space-y-3">
          <div>
            <h3 class="font-semibold text-gray-800">Evaluation Type:</h3>
            <p class="text-gray-600">Question Answering</p>
          </div>
          <div>
            <h3 class="font-semibold text-gray-800">Example:</h3>
            <p class="text-gray-600">"What is the capital of France?"</p>
          </div>
        </div>
      </div>
      <a href="#" class="text-emerald-600 hover:text-emerald-800 text-sm flex items-center gap-1">
        <i data-feather="external-link" aria-hidden="true"></i>
        <span>View Full Details</span>
      </a>
    </div>
  </div>
</div>
<!-- MMLU Benchmark Card -->
<!-- Two-faced card: .card-front holds the summary, .card-back holds the details.
     The .eval-card / .card-inner / .badge styling and any click behaviour come
     from style.css and script.js, which are not part of this file. -->
<div class="eval-card" data-eval="mmlu">
  <div class="card-inner">
    <!-- Front face: title, tagline, topic badges and subject count. -->
    <div class="card-front bg-amber-600 text-white p-6 rounded-xl shadow-xl flex flex-col justify-between">
      <div>
        <div class="flex items-center gap-2 mb-4">
          <!-- Icons are decorative (text sits next to each one), so hide them from assistive tech. -->
          <i class="w-6 h-6" data-feather="layers" aria-hidden="true"></i>
          <h2 class="text-2xl font-bold">MMLU</h2>
        </div>
        <p class="text-amber-100 mb-4">Massive Multitask Language Understanding</p>
        <div class="flex flex-wrap gap-2">
          <span class="badge">ML</span>
          <span class="badge">Multitask</span>
        </div>
      </div>
      <div class="mt-4 text-sm text-amber-200 flex items-center gap-1">
        <i data-feather="database" aria-hidden="true"></i>
        <span>57 subjects</span>
      </div>
    </div>
    <!-- Back face: long description, evaluation type and a sample prompt.
         The padding utility must be spelled with an ASCII hyphen (p-6) for Tailwind to match it. -->
    <div class="card-back bg-white p-6 rounded-xl shadow-xl flex flex-col justify-between">
      <div>
        <h2 class="text-2xl font-bold text-amber-600 mb-4">MMLU Details</h2>
        <p class="text-gray-700 mb-4">Tests understanding across 57 subjects including STEM, humanities and more.</p>
        <div class="space-y-3">
          <div>
            <h3 class="font-semibold text-gray-800">Evaluation Type:</h3>
            <p class="text-gray-600">Multitask Understanding</p>
          </div>
          <div>
            <h3 class="font-semibold text-gray-800">Example:</h3>
            <p class="text-gray-600">"Explain the concept of entropy in thermodynamics."</p>
          </div>
        </div>
      </div>
      <!-- The original markup was cut off in the middle of this link's class attribute.
           It is completed here to mirror the GSM8k and GPQA cards, using this card's amber palette. -->
      <a href="#" class="text-amber-600 hover:text-amber-800 text-sm flex items-center gap-1">
        <i data-feather="external-link" aria-hidden="true"></i>
        <span>View Full Details</span>
      </a>
    </div>
  </div>
</div>
<!-- Close the card grid and the main landmark so the script that follows is a direct child of <body>. -->
</div>
</main>
<!-- NOTE(review): components/footer.js is loaded in <head>, but no footer element appears in this
     file; the truncation may have dropped it. Confirm whether a footer element belongs here. -->
<script src="https://huggingface.co/deepsite/deepsite-badge.js"></script>
</body>
</html>