<!--
luisrguerra's picture
Update index.html
cf01265 verified
raw
history blame
2.68 kB
-->
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>Guerra LLM Ranking</title>
<script src="https://cdn.jsdelivr.net/npm/chart.js@4.4.1/dist/chart.umd.min.js"></script>
</head>
<body>
<canvas id="radarChart" height="750"></canvas>
<script>
// Renders a radar chart comparing several LLMs across three benchmarks.
// Relies on the global `Chart` constructor provided by the Chart.js script
// loaded earlier in the page and on the <canvas id="radarChart"> element.

// Axis labels; every score array below follows this order.
const BENCHMARK_LABELS = ['MMLU', 'MT-bench', 'Arena Elo'];

// One row per model: [legend label, scores in BENCHMARK_LABELS order].
// A null entry leaves a gap on that axis (presumably the score was not
// available for that model).
const MODEL_SCORES = [
  ['GPT-4-Turbo', [null, 93.2, 124.9]],
  ['GPT-4-0314', [86.4, 86.4, 119.0]],
  ['GPT-3.5-Turbo-0314', [70.0, 79.4, 112.3]],
  ['Mistral Medium', [75.3, 86.1, 115.0]],
  ['Mixtral 8x7B Instruct v0.1', [70.6, 83.0, 112.3]],
  ['Claude 2.0', [78.5, 80.6, 113.1]],
  ['Claude 1.0', [77.0, 79.0, 114.9]],
  ['Claude Instant 1', [73.4, 78.5, 110.9]],
  ['Gemini Pro', [71.8, null, 111.4]],
  ['Yi 34B Chat', [73.5, null, 111.1]],
  ['Falcon 180B Chat', [68.0, null, 103.1]],
  ['LLama 2 70B Chat', [63.0, 68.6, 107.9]],
];

// Chart.js data object: one dataset per model, all drawn with the same
// outline width.
const data = {
  labels: BENCHMARK_LABELS,
  datasets: MODEL_SCORES.map(([label, scores]) => ({
    label,
    data: scores,
    borderWidth: 2,
  })),
};

const options = {
  responsive: true,
  // Let the chart fill the available height instead of forcing the default
  // aspect ratio.
  maintainAspectRatio: false,
  // Chart.js 3+ configures the radar chart's radial axis under `scales.r`.
  // The former v2-style `scale: { ticks: ... }` key is not read by the
  // v4 build this page loads, so the 10-point tick step was never applied.
  scales: {
    r: {
      ticks: {
        stepSize: 10,
      },
    },
  },
};

const ctx = document.getElementById('radarChart').getContext('2d');

new Chart(ctx, {
  type: 'radar',
  data,
  options,
});
</script>
</body>
</html>