Docs: Update benchmark results

This commit is contained in:
github-actions[bot]
2025-11-18 17:37:06 +00:00
parent 39d057f079
commit afcfd09537
84 changed files with 1086 additions and 1088 deletions

View File

@@ -1,79 +1,80 @@
{
"openai/gpt-5.1-codex": {
"1_dijkstra": 15.241279893,
"2_convex_hull": 13.933983282,
"3_lis": 3.980165064000001,
"4_determinant": 6.332550646999996,
"5_markdown_parser": 3.2380716380000014,
"6_csv_processor": 26.09038364200001,
"7_scheduler": 130.18603798900003,
"8_json_validator": 8.38715121099999,
"9_stream_visualizer": 12.031535295999987
},
"openai/gpt-5.1-chat": {
"1_dijkstra": 2.65463601799999,
"2_convex_hull": 3.1764218759999787,
"3_lis": 2.5808361240000233,
"4_determinant": 1.857067280999996,
"5_markdown_parser": 2.1500550130000047,
"6_csv_processor": 2.8134082990000024,
"7_scheduler": 6.116577822999999,
"8_json_validator": 1.477971265,
"9_stream_visualizer": 1.7076946140000073
},
"google/gemini-2.5-pro": {
"1_dijkstra": 33.989065073000006,
"2_convex_hull": 56.566219838000016,
"3_lis": 52.14045403000002,
"4_determinant": 14.913826469999972,
"5_markdown_parser": 26.86344819299999,
"6_csv_processor": 49.397067434999975,
"7_scheduler": 52.55558026300004,
"8_json_validator": 19.59284627099999,
"9_stream_visualizer": 36.41860035799991
"google/gemini-3-pro-preview": {
"10_scrypt_hash": 39.295109482,
"11_geospatial": 38.59770959899999,
"1_dijkstra": 34.202315816,
"2_convex_hull": 34.06182440299999,
"3_lis": 25.023427584999997,
"4_determinant": 28.093709440000005,
"5_markdown_parser": 28.463938538000015,
"6_csv_processor": 38.290726488999994,
"7_scheduler": 67.523956824,
"8_json_validator": 16.506907749000007,
"9_stream_visualizer": 51.923362084000026
},
"anthropic/claude-sonnet-4.5 TEMP:0.7": {
"1_dijkstra": 4.49742717099993,
"2_convex_hull": 4.570548665000009,
"3_lis": 2.375867489000084,
"4_determinant": 1.5574152070001,
"5_markdown_parser": 1.8310976730000694,
"6_csv_processor": 4.079893573999987,
"7_scheduler": 12.446870330999955,
"8_json_validator": 2.8953664760000537,
"9_stream_visualizer": 5.022439357000054
"10_scrypt_hash": 2.994402775000024,
"11_geospatial": 3.173007857000048,
"1_dijkstra": 4.721320241999987,
"2_convex_hull": 4.782739678999991,
"3_lis": 2.566319416000042,
"4_determinant": 2.087922611000016,
"5_markdown_parser": 2.1563547050000054,
"6_csv_processor": 4.368516923999996,
"7_scheduler": 10.690530350000016,
"8_json_validator": 2.9041606949999696,
"9_stream_visualizer": 4.411488517000049
},
"openai/gpt-5.1-codex": {
"10_scrypt_hash": 19.945625629000016,
"11_geospatial": 7.752952860000019,
"1_dijkstra": 18.825615109000005,
"2_convex_hull": 24.519327066999978,
"3_lis": 13.449256432000023,
"4_determinant": 3.5313777560000306,
"5_markdown_parser": 4.871686004000018,
"6_csv_processor": 31.731031262999984,
"7_scheduler": 91.32724592999998,
"8_json_validator": 11.784968072999968,
"9_stream_visualizer": 17.32446443499997
},
"moonshotai/kimi-k2-thinking": {
"1_dijkstra": 34.72660079400001,
"2_convex_hull": 42.421906253,
"3_lis": 52.291474074000014,
"4_determinant": 37.432558806,
"5_markdown_parser": 35.437114885999996,
"6_csv_processor": 91.85763109999999,
"7_scheduler": 184.65146969499997,
"8_json_validator": 81.96185510699998,
"9_stream_visualizer": 31.27018206100003
"10_scrypt_hash": 54.48318050600006,
"11_geospatial": 123.94316572699998,
"1_dijkstra": 20.75571812199999,
"2_convex_hull": 281.26114928399994,
"3_lis": 78.25152572599984,
"4_determinant": 67.81623509099987,
"5_markdown_parser": 154.2897356459999,
"6_csv_processor": 85.1170599280002,
"7_scheduler": 389.4384002489999,
"8_json_validator": 17.501368902000134,
"9_stream_visualizer": 98.03424570999994
},
"google/gemini-2.5-pro": {
"10_scrypt_hash": 33.5175050580001,
"11_geospatial": 31.009794073000318,
"1_dijkstra": 45.908529550999866,
"2_convex_hull": 85.32745476700039,
"3_lis": 32.75355649500014,
"4_determinant": 27.239392394999975,
"5_markdown_parser": 27.228569728999865,
"6_csv_processor": 69.48256337699992,
"7_scheduler": 54.015430929000026,
"8_json_validator": 29.125379850999916,
"9_stream_visualizer": 36.110917992000005
},
"openrouter/sherlock-think-alpha": {
"1_dijkstra": 34.012272204,
"2_convex_hull": 47.377176928,
"3_lis": 18.49963934400001,
"4_determinant": 20.327296623999995,
"5_markdown_parser": 34.069916891999995,
"6_csv_processor": 19.902450771000005,
"7_scheduler": 82.133111714,
"8_json_validator": 31.42142794699996,
"9_stream_visualizer": 35.74114956699999
},
"openrouter/sherlock-dash-alpha": {
"1_dijkstra": 2.7058817040000003,
"2_convex_hull": 3.9343546879999995,
"3_lis": 1.2894778209999995,
"4_determinant": 0.611742537,
"5_markdown_parser": 4.020213965999999,
"6_csv_processor": 3.107556931000001,
"7_scheduler": 7.806581231,
"8_json_validator": 1.4850442509999993,
"9_stream_visualizer": 2.5679872179999985
"10_scrypt_hash": 9.486372194000054,
"11_geospatial": 15.555460506999864,
"1_dijkstra": 21.514197755000087,
"2_convex_hull": 35.37556943300041,
"3_lis": 17.00031832400011,
"4_determinant": 8.939955472999719,
"5_markdown_parser": 15.81524256400019,
"6_csv_processor": 23.44287434099987,
"7_scheduler": 68.04158863600017,
"8_json_validator": 19.484740249000023,
"9_stream_visualizer": 28.426358369000255
}
}