mirror of
https://github.com/multipleof4/lynchmark.git
synced 2026-01-13 16:17:54 +00:00
150 lines
7.5 KiB
HTML
150 lines
7.5 KiB
HTML
<!DOCTYPE html>
|
||
<html lang="en">
|
||
<head>
|
||
<meta charset="UTF-8"><meta name="viewport" content="width=device-width, initial-scale=1.0">
|
||
<title>Lynchmark Debug – Test Execution Details</title>
|
||
<link href="https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&family=DM+Serif+Display:ital@0;1&family=IBM+Plex+Mono:wght@400;500&display=swap" rel="stylesheet">
|
||
<script src="https://cdn.tailwindcss.com"></script>
|
||
<style>
|
||
body{font-family:Inter,system-ui,-apple-system,Segoe UI,Roboto,Ubuntu,Cantarell,Noto Sans,sans-serif}
|
||
.mono{font-family:"IBM Plex Mono",ui-monospace,SFMono-Regular,Menlo,monospace}
|
||
pre{white-space:pre-wrap;word-break:break-word}
|
||
</style>
|
||
</head>
|
||
<body class="bg-gray-50 text-gray-800">
|
||
<main class="max-w-5xl mx-auto flex flex-col min-h-screen p-6 lg:p-8">
|
||
<header class="text-center mb-10">
|
||
<h1 class="text-4xl font-bold text-gray-900 mb-2">Lynchmark Debug</h1>
|
||
<p class="text-base text-gray-600 max-w-lg mx-auto">
|
||
Detailed test execution output showing runtime results vs expected values for each model and test.
|
||
</p>
|
||
</header>
|
||
|
||
<div id="results-container" class="flex flex-col gap-6 flex-grow">
|
||
</div>
|
||
|
||
<footer class="mt-10 flex justify-center">
|
||
<a href="/" class="inline-flex items-center gap-2 text-gray-600 hover:text-gray-900 mr-4">
|
||
<span class="mono text-xs font-medium">← Back to Results</span>
|
||
</a>
|
||
<a href="https://github.com/multipleof4/lynchmark" class="inline-flex items-center gap-2 text-gray-600 hover:text-gray-900" target="_blank" rel="noopener noreferrer">
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" aria-hidden="true" class="w-5 h-5 fill-current">
|
||
<path d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52 0-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.012 8.012 0 0 0 16 8c0-4.42-3.58-8-8-8z"/>
|
||
</svg>
|
||
<span class="mono text-xs font-medium">@multipleof4/lynchmark</span>
|
||
</a>
|
||
</footer>
|
||
</main>
|
||
<script type="module">
|
||
/**
 * Look up a DOM element by its id.
 * @param {string} elementId - Value of the element's `id` attribute.
 * @returns {HTMLElement|null} Whatever `document.getElementById` returns for that id.
 */
const get=(elementId)=>{
  return document.getElementById(elementId);
};
|
||
// Host element (id "results-container") that run() appends one result card per model to.
const container=get('results-container');
|
||
|
||
/** Upper bound, in milliseconds, for a single test run before it is reported as a timeout. */
const TEST_TIMEOUT_MS=12000;

/** Replacement entities for characters that are unsafe inside an HTML template. */
const HTML_ESCAPES={'&':'&amp;','<':'&lt;','>':'&gt;','"':'&quot;',"'":'&#39;'};

/** Escape a value so it can be interpolated into an innerHTML template as plain text. */
const escapeHtml=value=>String(value).replace(/[&<>"']/g,ch=>HTML_ESCAPES[ch]);

/** Fetch `url` and decode the body with the given Response method ('text' or 'json'); throws on non-2xx. */
const fetchChecked=async(url,kind)=>{
  const res=await fetch(url);
  if(!res.ok)throw new Error(`Failed to load ${url}: HTTP ${res.status}`);
  return res[kind]();
};

/** Extract the model names listed between the MODELS_START / MODELS_END markers of the README. */
const parseModels=readme=>{
  const block=readme.match(/<!-- MODELS_START -->\r?\n([\s\S]+?)\r?\n<!-- MODELS_END -->/);
  if(!block)throw new Error('README is missing the MODELS_START/MODELS_END block');
  return block[1].split('\n').map(line=>line.trim()).filter(Boolean);
};

/** Best-effort: pull the second argument of the first assert.strictEqual/deepStrictEqual call out of the test source. */
const extractExpected=testFn=>{
  const match=testFn.toString().match(/assert\.(strictEqual|deepStrictEqual)\(([^,]+),\s*([^,)]+)/);
  return match?match[3].trim():null;
};

/** Turn a captured return value into display text without ever throwing. */
const formatActual=value=>{
  if(value===undefined)return 'undefined';
  try{
    // JSON.stringify yields undefined for functions/symbols and throws on BigInt/cycles.
    return JSON.stringify(value,null,2)??String(value);
  }catch{
    return String(value);
  }
};

/** Await `promise`, rejecting with Error('Timeout') after `ms`; the timer is always cleared. */
const withTimeout=async(promise,ms)=>{
  let timer;
  const timeout=new Promise((_,reject)=>{
    timer=setTimeout(()=>reject(new Error('Timeout')),ms);
  });
  try{
    return await Promise.race([promise,timeout]);
  }finally{
    clearTimeout(timer);
  }
};

/**
 * Import one test and one model output, run the test against the output and
 * record what happened. Never throws: failures are logged and reported in the result.
 * @returns {Promise<{passed:boolean,error:string|null,expected:string|null,hasActual:boolean,actual:*}>}
 */
const executeTest=async(test,model,sModel)=>{
  const outcome={passed:true,error:null,expected:null,hasActual:false,actual:undefined};
  try{
    const tMod=await import(`./tests/${test}/test.js`);
    const lMod=await import(`./tests/${test}/outputs/${sModel}.js`);
    const testFn=tMod.default?.runTest;
    if(typeof testFn!=='function')throw new TypeError(`tests/${test}/test.js has no default.runTest function`);
    outcome.expected=extractExpected(testFn);

    // Hand the test a spy around the model's function so its last return value can be displayed.
    const spy=async(...args)=>{
      const result=await lMod.default(...args);
      outcome.actual=result;
      outcome.hasActual=true;
      return result;
    };
    // The async wrapper turns a synchronous throw from testFn into a rejection.
    await withTimeout((async()=>testFn(spy))(),TEST_TIMEOUT_MS);
  }catch(e){
    console.error(`${model} - ${test}:`,e);
    outcome.passed=false;
    // `||` on purpose: an empty message is as uninformative as a missing one.
    outcome.error=e?.message||String(e);
  }
  return outcome;
};

/** Markup for a test that has no recorded generation time. */
const renderSkipped=test=>`
  <div class="flex items-center gap-2 mb-2">
    <span class="text-lg">—</span>
    <span class="font-semibold text-gray-800">${escapeHtml(test)}</span>
    <span class="mono text-gray-500 ml-auto text-sm">N/A</span>
  </div>
  <p class="text-sm text-gray-600">Test not run or generation failed</p>`;

/** Markup shown while a test is executing. */
const renderRunning=test=>`
  <div class="flex items-center gap-2 mb-2">
    <svg class="animate-spin h-5 w-5 text-gray-400" xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24"><circle class="opacity-25" cx="12" cy="12" r="10" stroke="currentColor" stroke-width="4"></circle><path class="opacity-75" fill="currentColor" d="M4 12a8 8 0 018-8V0C5.373 0 0 5.373 0 12h4zm2 5.291A7.962 7.962 0 014 12H0c0 3.042 1.135 5.824 3 7.938l3-2.647z"></path></svg>
    <span class="font-semibold text-gray-800">${escapeHtml(test)}</span>
    <span class="mono text-gray-500 ml-auto text-sm">...</span>
  </div>
  <p class="text-sm text-gray-600">Running test...</p>`;

/** Markup for a finished test: status, generation time, optional error, actual vs expected. */
const renderResult=(test,time,outcome)=>{
  const status=outcome.passed?'✅':'❌';
  const statusColor=outcome.passed?'text-green-600':'text-red-600';
  const timeStr=typeof time==='number'?`${time.toFixed(3)}s`:'N/A';
  const errorBox=outcome.error===null
    ?''
    :`<div class="mb-3 p-3 bg-red-50 border border-red-200 rounded"><p class="text-sm font-medium text-red-800 mb-1">Error:</p><pre class="mono text-xs text-red-700">${escapeHtml(outcome.error)}</pre></div>`;
  const actualText=outcome.hasActual?formatActual(outcome.actual):'N/A';
  return `
  <div class="flex items-center gap-2 mb-3">
    <span class="text-lg ${statusColor}">${status}</span>
    <span class="font-semibold text-gray-800">${escapeHtml(test)}</span>
    <span class="mono text-gray-500 ml-auto text-sm">${timeStr}</span>
  </div>
  ${errorBox}
  <div class="grid grid-cols-2 gap-3">
    <div class="p-3 bg-white border border-gray-200 rounded">
      <p class="text-xs font-semibold text-gray-600 mb-2">ACTUAL OUTPUT</p>
      <pre class="mono text-xs text-gray-800">${escapeHtml(actualText)}</pre>
    </div>
    <div class="p-3 bg-white border border-gray-200 rounded">
      <p class="text-xs font-semibold text-gray-600 mb-2">EXPECTED</p>
      <pre class="mono text-xs text-gray-800">${escapeHtml(outcome.expected??'N/A')}</pre>
    </div>
  </div>`;
};

/**
 * Build the debug page: one card per model listed in the README, and inside it
 * one entry per test name found in results.json. Tests with a recorded time are
 * executed one after another in the browser and their outcome is rendered;
 * tests without one (null or missing) are shown as not run.
 *
 * Load/parse failures are logged and shown in the results container instead of
 * leaving an empty page, so the returned promise does not reject for them.
 * @returns {Promise<void>}
 */
const run=async()=>{
  try{
    const [readme,genTimes]=await Promise.all([
      fetchChecked('./README','text'),
      fetchChecked('./results.json','json'),
    ]);
    const models=parseModels(readme);
    const tests=[...new Set(Object.values(genTimes).flatMap(perModel=>Object.keys(perModel??{})))].sort();

    for(const model of models){
      // Same sanitising as the output file names: '/' and ':' become '_'.
      const sModel=model.replace(/[\/:]/g,'_');
      const card=document.createElement('section');
      card.className='rounded-2xl border border-gray-200 bg-white shadow-sm overflow-hidden mb-6';
      card.innerHTML=`
  <div class="bg-gray-50 px-5 py-3 border-b border-gray-200">
    <p class="mono text-sm text-gray-700 font-medium">${escapeHtml(model)}</p>
  </div>`;
      // Created directly (not looked up by id) so two models that sanitise to
      // the same id can never end up sharing a list.
      const list=document.createElement('div');
      list.className='p-4 space-y-4';
      list.id=`list-${sModel}`;
      card.appendChild(list);
      container.appendChild(card);

      for(const test of tests){
        const testDiv=document.createElement('div');
        testDiv.className='border border-gray-200 rounded-lg p-4 bg-gray-50';
        list.appendChild(testDiv);
        const time=genTimes[model]?.[test];

        // `== null` covers both an explicit null and a model/test absent from results.json.
        if(time==null){
          testDiv.innerHTML=renderSkipped(test);
          continue;
        }

        testDiv.innerHTML=renderRunning(test);
        const outcome=await executeTest(test,model,sModel);
        testDiv.innerHTML=renderResult(test,time,outcome);
      }
    }
  }catch(e){
    console.error('Failed to render debug results:',e);
    const notice=document.createElement('p');
    notice.className='text-sm text-red-700';
    notice.textContent=`Failed to load results: ${e?.message||String(e)}`;
    container.appendChild(notice);
  }
};
|
||
// Start rendering as soon as this module script executes; the promise returned by run() is not awaited here.
run();
|
||
</script>
|
||
</body>
|
||
</html>
|