Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 8 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -13,3 +13,11 @@ llmsql_workdir

evaluation_*
coverage.xml

.idea

# Sphinx build
docs/_build/
docs/.doctrees/
*.doctree
*.pickle
2 changes: 1 addition & 1 deletion docs/_build/html/.buildinfo
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# Sphinx build info version 1
# This file records the configuration used when building these files. When it is not found, a full rebuild will be done.
config: ba6688d44e6ba22fb6e40076d1af75c2
config: 3caef0746bc07fabd8f91030ce7b6533
tags: 645f666f9bcd5a90fca523b33c5a78b7
Binary file removed docs/_build/html/.doctrees/docs/index.doctree
Binary file not shown.
Binary file removed docs/_build/html/.doctrees/environment.pickle
Binary file not shown.
4 changes: 2 additions & 2 deletions docs/_build/html/_static/documentation_options.js
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
const DOCUMENTATION_OPTIONS = {
VERSION: '0.1.14',
VERSION: '0.1.15',
LANGUAGE: 'en',
COLLAPSE_INDEX: false,
BUILDER: 'html',
Expand All @@ -10,4 +10,4 @@ const DOCUMENTATION_OPTIONS = {
NAVIGATION_WITH_KEYS: false,
SHOW_SEARCH_SUMMARY: true,
ENABLE_SEARCH_SHORTCUTS: true,
};
};
106 changes: 106 additions & 0 deletions docs/_build/html/_static/leaderboard.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,106 @@
[
{
"model": "openai/gpt-oss-120b",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.9049,
"date": "2026-02-24"
},
{
"model": "openai/gpt-oss-20b",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.8871,
"date": "2026-02-24"
},
{
"model": "meta-llama/Llama-3.3-70B-Instruct",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.8607,
"date": "2026-02-24"
},
{
"model": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.8519,
"date": "2026-02-24"
},
{
"model": "Qwen/Qwen2.5-7B-Instruct",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.794,
"date": "2026-02-24"
},
{
"model": "mistralai/Mistral-Nemo-Instruct-2407",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.7599,
"date": "2026-02-24"
},
{
"model": "Qwen/Qwen2.5-1.5B-Instruct",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.6401,
"date": "2026-02-24"
},
{
"model": "meta-llama/Llama-3.2-3B-Instruct",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.5415,
"date": "2026-02-24"
},
{
"model": "CYFRAGOVPL/PLLuM-12B-chat",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.5224,
"date": "2026-02-24"
},
{
"model": "Qwen/Qwen3-0.6B",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.4983,
"date": "2026-02-24"
},
{
"model": "CYFRAGOVPL/PLLuM-12B-nc-chat",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.4044,
"date": "2026-02-24"
},
{
"model": "CYFRAGOVPL/pllum-12b-nc-chat-250715",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.3727,
"date": "2026-02-24"
},
{
"model": "meta-llama/Llama-3.2-1B-Instruct",
"type": "open-source",
"fewshots": 5,
"backend": "vllm",
"accuracy": 0.2678,
"date": "2026-02-24"
}
]
85 changes: 85 additions & 0 deletions docs/_build/html/_static/scripts/front_page.js
Original file line number Diff line number Diff line change
Expand Up @@ -48,3 +48,88 @@ if (searchInput) {
}
});
}

// Once the DOM is ready, fetch the leaderboard data and render it on pages
// that contain the #leaderboard-container placeholder.
document.addEventListener("DOMContentLoaded", async () => {
  const container = document.getElementById('leaderboard-container');
  // Pages without the placeholder skip the network request entirely.
  if (!container) return;

  try {
    const response = await fetch('_static/leaderboard.json');
    // fetch() only rejects on network failure; an HTTP error status (404, 500, ...)
    // still resolves, so it has to be turned into an error explicitly.
    if (!response.ok) {
      throw new Error(`Failed to load leaderboard: HTTP ${response.status}`);
    }
    const rows = await response.json();
    renderLeaderboard(rows);
  } catch (e) {
    // Any failure (network, HTTP status, invalid JSON, rendering) ends up here:
    // show a static message to the user and keep the details in the console.
    container.innerHTML = '<p>Error loading leaderboard 😢</p>';
    console.error(e);
  }
});

/**
 * Render the leaderboard table into the #leaderboard-container element.
 *
 * Rows are displayed in the order given; the "Rank" column is simply the
 * 1-based position of each entry in `rows`, no sorting is done here.
 * Every value taken from a row is inserted as text (never parsed as HTML).
 *
 * @param {Array<Object>} rows - Leaderboard entries. Each entry is read for
 *   `model`, `type`, `fewshots`, `backend`, `accuracy` (multiplied by 100 and
 *   shown as a percentage), `date`, and an optional `url` for the model link.
 * @returns {void} Nothing; does nothing at all when the container is absent.
 * @throws {TypeError} If `rows` is not an array.
 */
function renderLeaderboard(rows) {
  const container = document.getElementById('leaderboard-container');
  if (!container) return;
  if (!Array.isArray(rows)) {
    throw new TypeError('renderLeaderboard expects an array of rows');
  }

  // Build a cell whose content is plain text. String() mirrors what template
  // interpolation would display for numbers and missing values.
  const createTextCell = (tagName, value) => {
    const cell = document.createElement(tagName);
    cell.textContent = String(value);
    return cell;
  };

  container.innerHTML = '';

  const table = document.createElement('table');
  table.className = 'leaderboard-table';

  const thead = document.createElement('thead');
  const headerRow = document.createElement('tr');
  const headers = ['Rank', 'Model', 'Type', 'Fewshots', 'Backend', 'Accuracy', 'Date'];
  for (const label of headers) {
    headerRow.appendChild(createTextCell('th', label));
  }
  thead.appendChild(headerRow);
  table.appendChild(thead);

  const tbody = document.createElement('tbody');
  rows.forEach((row, i) => {
    const tr = document.createElement('tr');

    // Show only the part after the first slash ("org/name" -> "name").
    const modelName = row.model.includes('/') ? row.model.split('/')[1] : row.model;

    // Model cell: a link when the row provides a URL, plain text otherwise.
    const modelCell = document.createElement('td');
    if (row.url) {
      const a = document.createElement('a');
      a.href = row.url;
      a.target = "_blank";
      a.rel = "noopener";
      a.textContent = modelName;
      modelCell.appendChild(a);
    } else {
      modelCell.textContent = modelName;
    }

    // Accuracy cell: a bar whose fill width and label share one percent string.
    const percent = `${(row.accuracy * 100).toFixed(2)}%`;
    const accuracyCell = document.createElement('td');
    const barContainer = document.createElement('div');
    barContainer.className = 'accuracy-bar';
    const fill = document.createElement('div');
    fill.className = 'fill';
    fill.style.width = percent;
    const text = document.createElement('span');
    text.textContent = percent;
    barContainer.appendChild(fill);
    barContainer.appendChild(text);
    accuracyCell.appendChild(barContainer);

    // Append cells in column order. Using DOM nodes (instead of `innerHTML +=`)
    // avoids re-parsing the row on every step and keeps row data out of the
    // HTML parser.
    tr.appendChild(createTextCell('td', i + 1));
    tr.appendChild(modelCell);
    tr.appendChild(createTextCell('td', row.type));
    tr.appendChild(createTextCell('td', row.fewshots));
    tr.appendChild(createTextCell('td', row.backend));
    tr.appendChild(accuracyCell);
    tr.appendChild(createTextCell('td', row.date));

    tbody.appendChild(tr);
  });

  table.appendChild(tbody);
  container.appendChild(table);
}
67 changes: 67 additions & 0 deletions docs/_build/html/_static/styles/front_page.css
Original file line number Diff line number Diff line change
Expand Up @@ -248,3 +248,70 @@ pre span {
background: none !important;
color: inherit !important;
}

/* Leaderboard styles: card wrapper, table, and the per-row accuracy bar. */

/* Card-like wrapper (presumably placed around the leaderboard table; confirm
   against the page template). overflow-x lets wide content scroll
   horizontally inside the card. */
.leaderboard-box {
padding: 1rem;
background: #fff;
border-radius: 12px;
box-shadow: 0 6px 20px rgba(0,0,0,0.08);
overflow-x: auto;
}

/* Table created by renderLeaderboard() in front_page.js
   (className 'leaderboard-table'). */
.leaderboard-table {
width: 100%;
border-collapse: collapse;
font-family: 'Inter', 'Roboto', sans-serif;
font-size: 0.95rem;
text-align: center;
}

/* Header cells: light vertical gradient, uppercase labels, heavier bottom border. */
.leaderboard-table th {
background: linear-gradient(180deg, #f6f6f6 0%, #e9e9e9 100%);
color: #111827;
font-weight: 600;
font-size: 0.95rem;
padding: 14px 10px;
text-transform: uppercase;
letter-spacing: 0.5px;
border-bottom: 2px solid #ddd;
text-align: center;
box-shadow: inset 0 -1px 0 rgba(0,0,0,0.05);
}

/* Body cells: uniform padding with a thin separator line between rows. */
.leaderboard-table td {
padding: 10px;
border-bottom: 1px solid #e0e0e0;
}

/* Zebra striping: tint every even body row. */
.leaderboard-table tbody tr:nth-child(even) {
background-color: #f9f9f9;
}

/* Accuracy bar */
/* Track of the bar. position: relative anchors the absolutely positioned
   label below; overflow: hidden clips the fill to the rounded track. */
.accuracy-bar {
position: relative;
width: 100%;
height: 20px;
background: #e0e0e0;
border-radius: 10px;
overflow: hidden;
}

/* Filled portion; its width is set inline by front_page.js (fill.style.width). */
.accuracy-bar .fill {
height: 100%;
background: linear-gradient(90deg,#4caf50,#81c784);
border-radius: 10px 0 0 10px;
}

/* Percentage label laid over the whole track and centered; line-height equals
   the 20px track height so the text sits on one vertically centered line. */
.accuracy-bar span {
position: absolute;
width: 100%;
text-align: center;
top: 0;
left: 0;
font-size: 0.8rem;
font-weight: 600;
line-height: 20px;
color: #000;
}

31 changes: 19 additions & 12 deletions docs/_build/html/docs/evaluation.html
Original file line number Diff line number Diff line change
Expand Up @@ -5,21 +5,23 @@
<meta charset="utf-8" />
<meta name="viewport" content="width=device-width, initial-scale=1.0" /><meta name="viewport" content="width=device-width, initial-scale=1" />

<title>Evaluation API Reference &#8212; LLMSQL 0.1.14 documentation</title>
<title>Evaluation API Reference &#8212; LLMSQL 0.1.15 documentation</title>
<link rel="stylesheet" type="text/css" href="../_static/pygments.css?v=5349f25f" />
<link rel="stylesheet" type="text/css" href="../_static/basic.css?v=29da98fa" />
<link rel="stylesheet" type="text/css" href="../_static/basic.css?v=29da98fa" />
<link rel="stylesheet" type="text/css" href="../_static/copybutton.css?v=76b2166b" />
<link rel="stylesheet" type="text/css" href="../_static/styles/front_page.css?v=9e26f69c" />
<script src="../_static/documentation_options.js?v=468bc497"></script>
<link rel="stylesheet" type="text/css" href="../_static/styles/front_page.css?v=047bfc79" />
<script src="../_static/documentation_options.js?v=e2f3408e"></script>
<script src="../_static/doctools.js?v=9bcbadda"></script>
<script src="../_static/sphinx_highlight.js?v=dc90522c"></script>
<script src="../_static/clipboard.min.js?v=a7894cd8"></script>
<script src="../_static/copybutton.js?v=ccdb6887"></script>
<script src="../_static/scripts/front_page.js?v=a59558f4"></script>
<script src="../_static/scripts/front_page.js?v=0a79e239"></script>
<link rel="icon" href="../_static/favicon.png"/>
<link rel="index" title="Index" href="../genindex.html" />
<link rel="search" title="Search" href="../search.html" />
<link rel="prev" title="Inference API Reference" href="inference.html" />
<link rel="prev" title="Inference API Reference" href="inference.html" />
<link rel="prev" title="Inference API Reference" href="inference.html" />
</head><body>
<div class="related" role="navigation" aria-label="Related">
<h3>Navigation</h3>
Expand All @@ -30,17 +32,20 @@ <h3>Navigation</h3>
<li class="right" >
<a href="inference.html" title="Inference API Reference"
accesskey="P">previous</a> |</li>
<li class="nav-item nav-item-0"><a href="../index.html">LLMSQL 0.1.14 documentation</a> &#187;</li>
<li class="nav-item nav-item-0"><a href="../index.html">LLMSQL 0.1.15 documentation</a> &#187;</li>
<li class="nav-item nav-item-1"><a href="index.html" accesskey="U">LLMSQL package Documentation</a> &#187;</li>
<li class="nav-item nav-item-this"><a href="">Evaluation API Reference</a></li>
<li class="nav-item nav-item-this"><a href="">Evaluation API Reference</a></li>
<li class="nav-item nav-item-this"><a href="">Evaluation API Reference</a></li>
</ul>
</div>
</div>
</div>

<div class="document">
<div class="documentwrapper">
<div class="bodywrapper">
<div class="body" role="main">



<section id="evaluation-api-reference">
<h1>Evaluation API Reference<a class="headerlink" href="#evaluation-api-reference" title="Link to this heading">¶</a></h1>
<p>The <cite>evaluate()</cite> function allows you to benchmark Text-to-SQL model outputs
Expand Down Expand Up @@ -173,6 +178,7 @@ <h3><a href="../index.html">Table of Contents</a></h3>
<li><a class="reference internal" href="#input-format">Input Format</a></li>
<li><a class="reference internal" href="#output-metrics">Output Metrics</a></li>
<li><a class="reference internal" href="#report-saving">Report Saving</a></li>
<li><a class="reference internal" href="#report-saving">Report Saving</a></li>
</ul>
</li>
</ul>
Expand Down Expand Up @@ -213,12 +219,13 @@ <h3>Navigation</h3>
<li class="right" >
<a href="inference.html" title="Inference API Reference"
>previous</a> |</li>
<li class="nav-item nav-item-0"><a href="../index.html">LLMSQL 0.1.14 documentation</a> &#187;</li>
<li class="nav-item nav-item-0"><a href="../index.html">LLMSQL 0.1.15 documentation</a> &#187;</li>
<li class="nav-item nav-item-1"><a href="index.html" >LLMSQL package Documentation</a> &#187;</li>
<li class="nav-item nav-item-this"><a href="">Evaluation API Reference</a></li>
<li class="nav-item nav-item-this"><a href="">Evaluation API Reference</a></li>
<li class="nav-item nav-item-this"><a href="">Evaluation API Reference</a></li>
</ul>
</div>
<div class="footer" role="contentinfo">
</div>
</body>
</html>
</html>
Loading