Spaces:
Running
Running
Commit
·
e0290d0
1
Parent(s):
ad26110
Update: Add Verilator as a new sim
Browse files- app.py +62 -11
- results/aggregated_scores.csv +0 -28
- results/aggregated_scores_icarus.csv +29 -0
- results/aggregated_scores_verilator.csv +29 -0
- results/parse.py +9 -7
- results/results.csv +0 -30
- results/results_icarus.csv +30 -0
- results/{results.json → results_icarus.json} +0 -0
- results/results_verilator.csv +30 -0
- results/results_verilator.json +0 -0
app.py
CHANGED
@@ -171,8 +171,14 @@ function refresh() {
|
|
171 |
with gr.Blocks(
|
172 |
css=custom_css, js=js_func, theme=gr.themes.Default(primary_hue=colors.emerald)
|
173 |
) as app:
|
174 |
-
|
175 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
176 |
tasks = ["Spec-to-RTL", "Code Completion", "Line Completion"]
|
177 |
s2r_benchs = ["VerilogEval S2R", "RTLLM"]
|
178 |
cc_benchs = ["VerilogEval MC", "VeriGen"]
|
@@ -225,27 +231,35 @@ with gr.Blocks(
|
|
225 |
)
|
226 |
gr.HTML(
|
227 |
"""
|
228 |
-
|
229 |
-
|
230 |
-
|
231 |
-
|
232 |
-
|
233 |
-
|
234 |
-
|
|
|
235 |
)
|
236 |
with gr.Tabs():
|
237 |
with gr.Tab("Leaderboard"):
|
238 |
with gr.Row(equal_height=True):
|
239 |
-
with gr.Column():
|
240 |
task_radio = gr.Radio(
|
241 |
choices=tasks, label="Select Task", value="Spec-to-RTL"
|
242 |
)
|
243 |
-
with gr.Column():
|
244 |
benchmark_radio = gr.Radio(
|
245 |
choices=["All"] + s2r_benchs,
|
246 |
label="Select Benchmark",
|
247 |
value="All",
|
248 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
249 |
|
250 |
with gr.Row(equal_height=True):
|
251 |
search_box = gr.Textbox(
|
@@ -447,6 +461,28 @@ with gr.Blocks(
|
|
447 |
fig = generate_scatter_plot(benchmark, metric)
|
448 |
return gr.update(value=benchmark), fig
|
449 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
450 |
bubble_benchmark.change(
|
451 |
fn=on_benchmark_change,
|
452 |
inputs=[bubble_benchmark, bubble_metric],
|
@@ -481,6 +517,21 @@ with gr.Blocks(
|
|
481 |
""",
|
482 |
)
|
483 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
484 |
|
485 |
app.launch(
|
486 |
allowed_paths=[
|
|
|
171 |
with gr.Blocks(
|
172 |
css=custom_css, js=js_func, theme=gr.themes.Default(primary_hue=colors.emerald)
|
173 |
) as app:
|
174 |
+
df_icarus, benchmarks, metrics, default_metric = read_data(
|
175 |
+
"results/results_icarus.json"
|
176 |
+
)
|
177 |
+
df_agg_icarus = parse_agg("results/aggregated_scores_icarus.csv")
|
178 |
+
df_verilator, _, _, _ = read_data("results/results_verilator.json")
|
179 |
+
df_agg_verilator = parse_agg("results/aggregated_scores_verilator.csv")
|
180 |
+
df = df_icarus
|
181 |
+
df_agg = df_agg_icarus
|
182 |
tasks = ["Spec-to-RTL", "Code Completion", "Line Completion"]
|
183 |
s2r_benchs = ["VerilogEval S2R", "RTLLM"]
|
184 |
cc_benchs = ["VerilogEval MC", "VeriGen"]
|
|
|
231 |
)
|
232 |
gr.HTML(
|
233 |
"""
|
234 |
+
<div style=" margin-top:-10px !important;">
|
235 |
+
<p style="margin-bottom: 15px; text-align: start !important;">Welcome to the TuRTLe Model Leaderboard! TuRTLe is a <b>unified evaluation framework designed to systematically assess Large Language Models (LLMs) in RTL (Register-Transfer Level) generation</b> for hardware design.
|
236 |
+
Evaluation criteria include <b>syntax correctness, functional accuracy, synthesizability, and post-synthesis quality</b> (PPA: Power, Performance, Area). TuRTLe integrates multiple benchmarks to highlight strengths and weaknesses of available LLMs.
|
237 |
+
Use the filters below to explore different RTL benchmarks, simulators and models.</p>
|
238 |
+
<p style="margin-top:10px; text-align:start !important;"> <span style="font-variant:small-caps; font-weight:bold;">UPDATE (JULY 2025)</span>: We have added Verilator as a second simulator, the original Icarus data is still available. You can now filter the data by simulator</p>
|
239 |
+
<p style="margin-top: -6px; text-align: start !important; "><span style="font-variant: small-caps; font-weight: bold;">UPDATE (JUNE 2025)</span>: We make our framework open-source on GitHub and we add 7 new recent models! For a total of 40 base and instruct models and 5 RTL benchmarks</p>
|
240 |
+
</div>
|
241 |
+
"""
|
242 |
)
|
243 |
with gr.Tabs():
|
244 |
with gr.Tab("Leaderboard"):
|
245 |
with gr.Row(equal_height=True):
|
246 |
+
with gr.Column(scale=4):
|
247 |
task_radio = gr.Radio(
|
248 |
choices=tasks, label="Select Task", value="Spec-to-RTL"
|
249 |
)
|
250 |
+
with gr.Column(scale=3):
|
251 |
benchmark_radio = gr.Radio(
|
252 |
choices=["All"] + s2r_benchs,
|
253 |
label="Select Benchmark",
|
254 |
value="All",
|
255 |
)
|
256 |
+
with gr.Column(scale=2, min_width=180):
|
257 |
+
simulator_radio = gr.Radio(
|
258 |
+
choices=["Icarus", "Verilator"],
|
259 |
+
value="Icarus",
|
260 |
+
label="Simulator",
|
261 |
+
scale=1,
|
262 |
+
)
|
263 |
|
264 |
with gr.Row(equal_height=True):
|
265 |
search_box = gr.Textbox(
|
|
|
461 |
fig = generate_scatter_plot(benchmark, metric)
|
462 |
return gr.update(value=benchmark), fig
|
463 |
|
464 |
+
def on_simulator_change(
|
465 |
+
simulator,
|
466 |
+
task,
|
467 |
+
benchmark,
|
468 |
+
model_type,
|
469 |
+
search,
|
470 |
+
max_params,
|
471 |
+
plot_bench,
|
472 |
+
plot_metric,
|
473 |
+
):
|
474 |
+
global df, df_agg
|
475 |
+
if simulator == "Icarus":
|
476 |
+
df, df_agg = df_icarus, df_agg_icarus
|
477 |
+
else:
|
478 |
+
df, df_agg = df_verilator, df_agg_verilator
|
479 |
+
|
480 |
+
leaderboard_df = filter_leaderboard(
|
481 |
+
task, benchmark, model_type, search, max_params
|
482 |
+
)
|
483 |
+
fig = generate_scatter_plot(plot_bench, plot_metric)
|
484 |
+
return leaderboard_df, fig
|
485 |
+
|
486 |
bubble_benchmark.change(
|
487 |
fn=on_benchmark_change,
|
488 |
inputs=[bubble_benchmark, bubble_metric],
|
|
|
517 |
""",
|
518 |
)
|
519 |
|
520 |
+
simulator_radio.change(
|
521 |
+
fn=on_simulator_change,
|
522 |
+
inputs=[
|
523 |
+
simulator_radio,
|
524 |
+
task_radio,
|
525 |
+
benchmark_radio,
|
526 |
+
model_type_dropdown,
|
527 |
+
search_box,
|
528 |
+
params_slider,
|
529 |
+
bubble_benchmark,
|
530 |
+
bubble_metric,
|
531 |
+
],
|
532 |
+
outputs=[leaderboard, scatter_plot],
|
533 |
+
)
|
534 |
+
|
535 |
|
536 |
app.launch(
|
537 |
allowed_paths=[
|
results/aggregated_scores.csv
DELETED
@@ -1,28 +0,0 @@
|
|
1 |
-
Model,Agg S2R,Agg MC,Agg VerilogEval S2R,Agg VerilogEval MC,Agg RTLLM,Agg VeriGen
|
2 |
-
DeepSeek R1,75.53,72.96,77.67,77.55,68.49,57.82
|
3 |
-
Llama 3.1 405B,53.23,53.88,56.55,54.35,42.26,52.35
|
4 |
-
Qwen3 236B A22B,69.16,63.42,74.83,68.36,50.48,47.15
|
5 |
-
Llama 3.(1-3) 70B,39.48,43.29,39.47,40.83,39.53,51.42
|
6 |
-
Qwen2.5 72B,49.36,47.23,50.22,50.74,46.51,35.65
|
7 |
-
QwQ 32B,62.6,39.46,65.02,38.68,54.6,42.03
|
8 |
-
Qwen2.5 32B,50.39,38.93,50.86,41.01,48.86,32.09
|
9 |
-
StarChat2 15B v0.1,38.76,38.98,36.68,35.58,45.61,50.2
|
10 |
-
DeepSeek R1 Distill Qwen 14B,23.14,23.3,24.94,24.3,17.22,20.01
|
11 |
-
CodeLlama 70B,33.04,32.86,32.2,32.27,35.81,34.8
|
12 |
-
DeepSeek Coder 33B,27.03,36.31,22.65,37.64,41.47,31.91
|
13 |
-
QwenCoder 2.5 32B,44.02,43.75,43.68,44.05,45.15,42.76
|
14 |
-
QwenCoder 2.5 14B,37.69,38.97,35.32,40.26,45.5,34.72
|
15 |
-
DeepCoder 14B,26.4,30.75,27.32,33.18,23.38,22.75
|
16 |
-
OpenCoder 8B,30.06,35.86,26.8,34.57,40.83,40.1
|
17 |
-
SeedCoder 8B,50.89,34.05,51.71,36.52,48.2,25.89
|
18 |
-
SeedCoder 8B Reasoning,43.75,47.1,47.85,46.76,30.22,48.23
|
19 |
-
QwenCoder 2.5 7B,14.15,32.86,6.57,33.0,39.16,32.4
|
20 |
-
"DeepSeek Coder 6,7B",31.87,27.89,28.88,28.99,41.75,24.27
|
21 |
-
RTLCoder Mistral,21.82,28.65,23.71,26.34,15.58,36.27
|
22 |
-
RTLCoder DeepSeek,37.22,36.64,38.33,36.13,33.58,38.33
|
23 |
-
OriGen,52.88,51.89,53.0,50.0,52.47,58.12
|
24 |
-
CodeV R1 Distill Qwen 7B,36.12,26.84,32.35,20.56,48.57,47.55
|
25 |
-
HaVen-CodeQwen,43.58,47.13,44.67,47.23,39.98,46.8
|
26 |
-
CodeV-CL-7B,14.73,33.73,12.71,30.93,21.38,42.97
|
27 |
-
CodeV-QW-7B,20.37,50.11,18.82,50.64,25.48,48.38
|
28 |
-
CodeV-DS-6.7B,19.62,47.1,14.8,46.08,35.52,50.46
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
results/aggregated_scores_icarus.csv
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Model,Agg S2R,Agg MC,Agg VerilogEval S2R,Agg VerilogEval MC,Agg RTLLM,Agg VeriGen
|
2 |
+
DeepSeek R1-0528,76.79,77.79,78.84,79.65,70.04,71.64
|
3 |
+
DeepSeek R1,75.53,76.24,77.67,77.55,68.49,71.92
|
4 |
+
Llama 3.1 405B,53.23,55.25,56.55,54.35,42.26,58.23
|
5 |
+
Qwen3 235B A22B,69.16,66.42,74.83,68.36,50.48,60.01
|
6 |
+
Qwen2.5 72B,49.36,49.97,50.22,50.74,46.51,47.42
|
7 |
+
Llama 3.(1-3) 70B,39.48,46.29,39.47,40.83,39.53,64.29
|
8 |
+
QwQ 32B,62.6,41.92,65.02,38.68,54.6,52.6
|
9 |
+
Qwen2.5 32B,50.39,41.94,50.86,41.01,48.86,45.0
|
10 |
+
StarChat2 15B v0.1,38.76,41.72,36.68,35.58,45.61,61.96
|
11 |
+
DeepSeek R1 Distill Qwen 14B,23.14,24.94,24.94,24.3,17.22,27.07
|
12 |
+
CodeLlama 70B,33.04,35.59,32.2,32.27,35.81,46.56
|
13 |
+
DeepSeek Coder 33B,27.03,39.59,22.65,37.64,41.47,46.01
|
14 |
+
QwenCoder 2.5 32B,44.02,46.49,43.68,44.05,45.15,54.52
|
15 |
+
DeepCoder 14B,26.4,32.92,27.32,33.18,23.38,32.07
|
16 |
+
QwenCoder 2.5 14B,37.69,41.98,35.32,40.26,45.5,47.64
|
17 |
+
SeedCoder 8B,50.89,36.79,51.71,36.52,48.2,37.66
|
18 |
+
SeedCoder 8B Reasoning,43.75,49.83,47.85,46.76,30.22,59.97
|
19 |
+
OpenCoder 8B,30.06,36.95,26.8,34.57,40.83,44.8
|
20 |
+
QwenCoder 2.5 7B,14.15,34.5,6.57,33.0,39.16,39.46
|
21 |
+
DeepSeek Coder 6.7B,31.87,30.9,28.88,28.99,41.75,37.19
|
22 |
+
CodeV R1 Distill Qwen 7B,36.12,30.66,32.35,20.56,48.57,63.98
|
23 |
+
HaVen-CodeQwen,43.58,50.68,44.67,47.23,39.98,62.04
|
24 |
+
CodeV-QW-7B,20.37,52.85,18.82,50.64,25.48,60.14
|
25 |
+
RTLCoder Mistral,21.82,32.19,23.71,26.34,15.58,51.5
|
26 |
+
RTLCoder DeepSeek,37.22,40.19,38.33,36.13,33.58,53.57
|
27 |
+
OriGen,52.88,55.97,53.0,50.0,52.47,75.66
|
28 |
+
CodeV-CL-7B,14.73,35.1,12.71,30.93,21.38,48.85
|
29 |
+
CodeV-DS-6.7B,19.62,49.29,14.8,46.08,35.52,59.87
|
results/aggregated_scores_verilator.csv
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Model,Agg S2R,Agg MC,Agg VerilogEval S2R,Agg VerilogEval MC,Agg RTLLM,Agg VeriGen
|
2 |
+
DeepSeek R1-0528,75.83,77.12,77.64,78.78,69.85,71.64
|
3 |
+
DeepSeek R1,75.78,75.4,78.04,76.42,68.31,72.05
|
4 |
+
Llama 3.1 405B,52.08,55.01,54.39,55.1,44.48,54.7
|
5 |
+
Qwen3 236B A22B,69.17,65.8,74.24,67.55,52.44,60.01
|
6 |
+
Qwen2.5 72B,51.72,52.09,52.7,52.44,48.49,50.95
|
7 |
+
Llama 3.(1-3) 70B,40.06,47.44,39.84,42.69,40.79,63.12
|
8 |
+
QwQ 32B,63.76,44.52,66.09,38.64,56.06,63.91
|
9 |
+
Qwen2.5 32B,53.2,44.35,54.23,43.05,49.81,48.64
|
10 |
+
StarChat2 15B v0.1,40.2,41.91,37.97,35.85,47.54,61.91
|
11 |
+
DeepSeek R1 Distill Qwen 14B,22.93,25.34,24.44,24.43,17.96,28.33
|
12 |
+
CodeLlama 70B,34.55,38.02,33.58,33.89,37.75,51.62
|
13 |
+
DeepSeek Coder 33B,27.93,41.16,23.14,38.14,43.71,51.12
|
14 |
+
QwenCoder 2.5 32B,45.72,48.38,45.31,46.49,47.07,54.62
|
15 |
+
DeepCoder 14B,27.06,33.64,27.87,33.39,24.38,34.45
|
16 |
+
QwenCoder 2.5 14B,39.39,43.55,36.86,41.54,47.73,50.17
|
17 |
+
SeedCoder 8B,52.04,38.31,52.58,37.24,50.25,41.84
|
18 |
+
SeedCoder 8B Reasoning,43.41,50.73,47.02,47.51,31.51,61.35
|
19 |
+
OpenCoder 8B,30.45,37.27,26.96,35.34,41.96,43.63
|
20 |
+
QwenCoder 2.5 7B,14.91,37.2,7.08,34.02,40.74,47.7
|
21 |
+
DeepSeek Coder 6.7B,34.14,31.2,30.46,29.39,46.28,37.19
|
22 |
+
CodeV R1 Distill Qwen 7B,37.26,30.97,33.33,21.67,50.21,61.63
|
23 |
+
HaVen-CodeQwen,44.57,52.4,45.09,48.07,42.87,66.7
|
24 |
+
CodeV-QW-7B,21.69,52.12,19.85,50.51,27.77,57.45
|
25 |
+
RTLCoder Mistral,22.64,33.32,24.75,26.44,15.68,56.02
|
26 |
+
RTLCoder DeepSeek,38.48,39.89,39.19,35.74,36.14,53.57
|
27 |
+
OriGen,52.85,55.3,52.72,49.84,53.29,73.3
|
28 |
+
CodeV-CL-7B,15.32,35.2,13.21,31.06,22.28,48.85
|
29 |
+
CodeV-DS-6.7B,19.28,49.43,14.23,45.91,35.94,61.05
|
results/parse.py
CHANGED
@@ -111,7 +111,7 @@ model_details = {
|
|
111 |
"Coding",
|
112 |
"V1",
|
113 |
),
|
114 |
-
"DeepSeek Coder 6
|
115 |
"https://huggingface.co/deepseek-ai/deepseek-coder-6.7b-instruct",
|
116 |
6.74,
|
117 |
"Coding",
|
@@ -198,6 +198,7 @@ def parse_results(csv_path: str) -> list[dict]:
|
|
198 |
metrics, benchs = get_headers(reader)
|
199 |
for i, row in enumerate(reader):
|
200 |
model = row[0]
|
|
|
201 |
url, params, type, release = get_model_params_and_url(model)
|
202 |
models.append(model)
|
203 |
row = row[1:]
|
@@ -220,12 +221,12 @@ def parse_results(csv_path: str) -> list[dict]:
|
|
220 |
return dataset
|
221 |
|
222 |
|
223 |
-
def parse_agg(csv_path: str) ->
|
224 |
"""
|
225 |
Each row has the following format:
|
226 |
MODEL | BENCHMARK | TASK | METRIC | RESULT
|
227 |
"""
|
228 |
-
return pd.read_csv(
|
229 |
|
230 |
|
231 |
def writeJson(data: list):
|
@@ -234,15 +235,16 @@ def writeJson(data: list):
|
|
234 |
print("Done")
|
235 |
|
236 |
|
237 |
-
def read_json():
|
238 |
-
json_path = "results/results.json"
|
239 |
with open(json_path, "r", encoding="utf-8") as file:
|
240 |
data = json.load(file)
|
241 |
return data
|
242 |
|
243 |
|
244 |
-
def read_data(
|
245 |
-
|
|
|
|
|
246 |
df = pd.DataFrame(data)
|
247 |
df.rename(
|
248 |
columns={
|
|
|
111 |
"Coding",
|
112 |
"V1",
|
113 |
),
|
114 |
+
"DeepSeek Coder 6.7B": (
|
115 |
"https://huggingface.co/deepseek-ai/deepseek-coder-6.7b-instruct",
|
116 |
6.74,
|
117 |
"Coding",
|
|
|
198 |
metrics, benchs = get_headers(reader)
|
199 |
for i, row in enumerate(reader):
|
200 |
model = row[0]
|
201 |
+
print(model)
|
202 |
url, params, type, release = get_model_params_and_url(model)
|
203 |
models.append(model)
|
204 |
row = row[1:]
|
|
|
221 |
return dataset
|
222 |
|
223 |
|
224 |
+
def parse_agg(csv_path: str = "results/aggregated_scores_icarus.csv") -> pd.DataFrame:
|
225 |
"""
|
226 |
Each row has the following format:
|
227 |
MODEL | BENCHMARK | TASK | METRIC | RESULT
|
228 |
"""
|
229 |
+
return pd.read_csv(csv_path)
|
230 |
|
231 |
|
232 |
def writeJson(data: list):
|
|
|
235 |
print("Done")
|
236 |
|
237 |
|
238 |
+
def read_json(json_path: str = "results/results_icarus.json"):
|
|
|
239 |
with open(json_path, "r", encoding="utf-8") as file:
|
240 |
data = json.load(file)
|
241 |
return data
|
242 |
|
243 |
|
244 |
+
def read_data(
|
245 |
+
json_path: str = "results/results_icarus.json",
|
246 |
+
) -> tuple[pd.DataFrame, list, list, str]:
|
247 |
+
data = read_json(json_path)
|
248 |
df = pd.DataFrame(data)
|
249 |
df.rename(
|
250 |
columns={
|
results/results.csv
DELETED
@@ -1,30 +0,0 @@
|
|
1 |
-
,Syntax (STX),Syntax (STX),Functionality (FNC),Functionality (FNC),Synthesis (SYN),Synthesis (SYN),Power,Power,Performance,Performance,Area,Area,EM,Syntax (STX),Syntax (STX),Functionality (FNC),Functionality (FNC),Synthesis (SYN),Synthesis (SYN),Power,Power,Performance,Performance,Area,Area
|
2 |
-
,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,RTL-Repo,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen
|
3 |
-
DeepSeek R1-0528,96.15,86.12,81.54,64.9,81.28,64.49,79.15,73.33,78.09,65.64,79.28,71.15,-1,95.38,91.76,81.54,62.35,81.41,62.35,80.27,52.12,78.69,62.25,79.99,65.32
|
4 |
-
DeepSeek R1,97.18,89.80,79.74,65.71,79.62,63.27,78.33,71.34,76.49,64.06,78.19,70.08,-1.00,97.44,96.47,79.49,60.00,79.49,60.00,78.27,50.25,76.43,60.15,77.96,63.07
|
5 |
-
Llama 3.1 405B,87.44,77.14,58.97,45.71,58.85,41.63,57.58,50.88,55.93,32.44,56.13,43.45,34.62,88.59,95.29,56.15,52.94,55.90,52.94,55.13,49.22,53.45,52.52,54.48,55.31
|
6 |
-
Qwen3 236B A22B,91.28,73.88,76.92,51.43,76.79,48.57,75.25,54.61,73.56,46.37,75.67,50.47,41.94,82.18,87.06,69.62,49.41,69.62,49.41,69.04,41.82,66.89,49.64,69.15,49.99
|
7 |
-
Llama 3.(1-3) 70B,66.15,73.88,40.64,42.45,40.64,39.18,40.46,40.81,38.08,38.14,39.86,39.65,28.72,84.74,89.41,41.67,51.76,41.67,51.76,41.38,50.61,39.75,51.76,41.36,51.88
|
8 |
-
Qwen2.5 72B,82.18,79.59,52.44,45.31,51.92,44.08,51.83,46.47,48.75,45.40,50.09,47.65,37.44,80.90,84.71,52.95,35.29,52.69,35.29,51.66,35.82,49.37,35.20,51.18,35.94
|
9 |
-
QwQ 32B,87.95,82.45,66.41,56.73,66.41,52.24,66.15,55.83,63.80,51.91,65.12,56.07,-1.00,58.97,68.24,40.00,42.35,39.62,42.35,39.40,40.90,37.53,42.31,39.10,42.87
|
10 |
-
Qwen2.5 32B,88.59,84.08,52.56,50.20,52.18,46.12,52.32,49.73,49.43,46.43,50.82,50.43,28.93,93.21,85.88,41.54,32.94,41.54,32.94,41.31,30.65,40.48,33.11,41.23,32.50
|
11 |
-
StarChat2 15B v0.1,88.46,84.90,37.95,44.49,37.95,44.08,37.56,46.95,35.30,43.22,37.19,46.65,13.42,79.74,92.94,36.41,51.76,36.03,51.76,36.08,46.30,34.91,51.49,35.76,52.80
|
12 |
-
DeepSeek R1 Distill Qwen 14B,42.18,34.69,25.51,18.37,25.51,16.33,25.36,17.86,24.19,16.48,25.27,17.33,-1.00,45.00,44.71,25.64,21.18,25.26,21.18,24.79,17.65,23.48,21.08,24.63,21.29
|
13 |
-
CodeLlama 70B,67.05,69.80,33.08,36.33,33.08,34.29,32.69,37.19,31.46,34.29,32.44,35.95,24.33,90.77,88.24,33.33,35.29,33.33,35.29,33.02,34.03,30.80,35.15,32.99,35.21
|
14 |
-
DeepSeek Coder 33B,62.82,83.67,23.33,42.45,23.08,42.04,22.86,42.29,22.81,39.42,22.29,42.71,24.58,75.26,88.24,39.62,31.76,39.36,31.76,38.23,32.16,36.79,31.46,37.90,32.12
|
15 |
-
QwenCoder 2.5 32B,87.18,77.96,45.00,43.27,44.87,43.27,44.25,46.82,43.03,43.20,43.76,45.42,31.07,83.72,87.06,45.64,42.35,45.13,42.35,44.59,42.79,43.01,42.24,44.55,43.25
|
16 |
-
QwenCoder 2.5 14B,78.97,81.63,37.82,46.12,37.44,45.31,35.94,45.82,34.83,44.64,35.18,46.05,37.53,80.00,83.53,41.67,35.29,41.15,35.29,40.74,34.17,39.20,35.32,40.83,34.67
|
17 |
-
DeepCoder 14B,43.85,39.59,28.08,23.67,28.08,22.04,27.94,25.00,26.26,22.00,27.77,23.15,-1.00,61.92,48.24,34.10,23.53,33.72,23.53,33.70,21.18,32.17,23.43,33.67,23.65
|
18 |
-
OpenCoder 8B,78.21,75.92,28.46,42.86,27.82,40.82,27.34,41.36,25.95,39.77,27.11,41.36,16.17,80.00,95.29,35.64,41.18,35.38,41.18,35.12,37.69,33.47,41.05,35.13,41.55
|
19 |
-
SeedCoder 8B,91.41,85.31,53.46,47.35,53.33,46.53,52.86,49.42,50.62,45.60,51.65,49.59,28.23,77.44,94.12,37.31,30.59,37.31,27.06,37.32,23.53,35.35,26.92,36.89,27.23
|
20 |
-
SeedCoder 8B Reasoning,67.82,53.47,49.23,30.20,49.23,29.39,48.92,32.04,46.76,28.64,47.87,29.99,-1.00,83.33,78.82,48.21,50.59,48.08,50.59,47.78,41.74,45.44,50.02,47.06,52.92
|
21 |
-
QwenCoder 2.5 7B,20.13,76.33,6.92,38.78,6.67,37.14,6.51,40.65,6.63,37.25,6.56,39.58,28.33,74.10,90.59,33.72,32.94,33.72,32.94,33.59,30.67,31.78,33.01,33.62,33.51
|
22 |
-
"DeepSeek Coder 6,7B",82.05,78.78,29.62,41.22,29.49,38.78,29.51,42.62,27.73,39.33,29.41,43.30,24.63,67.18,84.71,31.67,24.71,29.87,24.71,29.78,23.53,27.98,24.50,29.21,24.79
|
23 |
-
RTLCoder Mistral,54.87,32.24,24.62,16.33,24.62,15.92,24.28,16.03,22.78,14.71,24.06,16.00,14.77,60.51,85.88,27.05,36.47,27.05,36.47,26.94,34.63,25.22,36.55,26.87,37.64
|
24 |
-
RTLCoder DeepSeek,84.62,73.06,39.49,37.14,39.49,34.69,38.91,34.30,37.52,32.76,38.55,33.69,19.35,77.31,85.88,36.92,40.00,36.79,40.00,36.94,35.57,34.84,39.83,36.62,39.60
|
25 |
-
OriGen,96.15,81.63,54.23,50.61,54.23,50.61,54.29,53.10,51.57,50.86,53.15,53.44,17.07,92.44,98.82,50.77,58.82,50.77,58.82,50.95,54.14,48.53,58.81,50.51,61.40
|
26 |
-
CodeV R1 Distill Qwen 7B,56.92,73.06,33.33,49.80,33.33,47.35,32.58,49.25,32.01,47.45,32.45,49.01,-1.00,92.69,89.41,21.28,49.41,21.28,49.41,21.04,43.68,19.59,49.06,21.05,49.91
|
27 |
-
HaVen-CodeQwen,93.33,80.41,47.31,42.86,46.15,41.22,45.08,40.59,44.26,38.83,44.68,40.53,25.14,93.59,100.00,50.13,47.06,49.49,47.06,47.55,46.60,47.05,47.14,47.09,46.67
|
28 |
-
CodeV-CL-7B,32.18,48.16,13.08,24.49,12.95,21.63,12.80,22.25,12.51,20.59,12.82,21.29,12.27,92.05,98.82,31.79,43.53,31.79,43.53,31.74,42.25,29.45,43.46,31.61,43.20
|
29 |
-
CodeV-QW-7B,45.38,68.16,19.62,34.29,18.97,26.53,18.91,28.14,18.71,21.80,18.85,26.50,20.94,93.33,100.00,52.31,48.24,51.54,48.24,51.69,48.14,48.79,48.18,51.45,48.81
|
30 |
-
CodeV-DS-6.7B,33.59,67.35,15.00,38.78,15.00,37.14,15.10,35.56,14.46,35.13,14.85,35.88,21.26,95.51,100.00,47.05,50.59,47.05,50.59,47.37,50.47,44.35,50.54,46.52,50.36
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
results/results_icarus.csv
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
,Syntax (STX),Syntax (STX),Functionality (FNC),Functionality (FNC),Synthesis (SYN),Synthesis (SYN),Power,Power,Performance,Performance,Area,Area,EM,Syntax (STX),Syntax (STX),Functionality (FNC),Functionality (FNC),Synthesis (SYN),Synthesis (SYN),Power,Power,Performance,Performance,Area,Area
|
2 |
+
,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,RTL-Repo,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen
|
3 |
+
DeepSeek R1-0528,96.150000000000006,86.120000000000005,81.540000000000006,64.900000000000006,81.280000000000001,64.489999999999995,79.150000000000006,73.329999999999998,78.090000000000003,65.640000000000001,79.280000000000001,71.150000000000006,-1,95.379999999999995,91.760000000000005,81.540000000000006,74.120000000000005,81.409999999999997,74.120000000000005,80.269999999999996,63.859999999999999,78.689999999999998,74.049999999999997,79.989999999999995,77.010000000000005
|
4 |
+
DeepSeek R1,97.180000000000007,89.799999999999997,79.739999999999995,65.709999999999994,79.620000000000005,63.270000000000003,78.329999999999998,71.340000000000003,76.489999999999995,64.060000000000002,78.189999999999998,70.079999999999998,-1,97.439999999999998,96.469999999999999,79.489999999999995,74.120000000000005,79.489999999999995,74.120000000000005,78.269999999999996,64.340000000000003,76.430000000000007,74.290000000000006,77.959999999999994,77.120000000000005
|
5 |
+
Llama 3.1 405B,87.439999999999998,77.140000000000001,58.969999999999999,45.710000000000001,58.850000000000001,41.630000000000003,57.579999999999998,50.880000000000003,55.93,32.439999999999998,56.130000000000003,43.450000000000003,34.619999999999997,88.590000000000003,95.290000000000006,56.149999999999999,58.82,55.899999999999999,58.82,55.130000000000003,55.100000000000001,53.450000000000003,58.399999999999999,54.479999999999997,61.200000000000003
|
6 |
+
Qwen3 236B A22B,91.280000000000001,73.879999999999995,76.920000000000002,51.43,76.790000000000006,48.57,75.25,54.609999999999999,73.560000000000002,46.369999999999997,75.670000000000002,50.469999999999999,41.939999999999998,82.180000000000007,87.060000000000002,69.620000000000005,62.350000000000001,69.620000000000005,62.350000000000001,69.040000000000006,54.630000000000003,66.890000000000001,62.630000000000003,69.150000000000006,62.780000000000001
|
7 |
+
Qwen2.5 72B,82.180000000000007,79.590000000000003,52.439999999999998,45.310000000000002,51.920000000000002,44.079999999999998,51.829999999999998,46.469999999999999,48.75,45.399999999999999,50.090000000000003,47.649999999999999,37.439999999999998,80.900000000000006,84.709999999999994,52.950000000000003,47.060000000000002,52.689999999999998,47.060000000000002,51.659999999999997,47.590000000000003,49.369999999999997,46.960000000000001,51.18,47.700000000000003
|
8 |
+
Llama 3.(1-3) 70B,66.150000000000006,73.879999999999995,40.640000000000001,42.450000000000003,40.640000000000001,39.18,40.460000000000001,40.810000000000002,38.079999999999998,38.140000000000001,39.859999999999999,39.649999999999999,28.719999999999999,84.739999999999995,89.409999999999997,41.670000000000002,65.879999999999995,41.670000000000002,64.709999999999994,41.380000000000003,63.469999999999999,39.75,64.689999999999998,41.359999999999999,64.709999999999994
|
9 |
+
QwQ 32B,87.950000000000003,82.450000000000003,66.409999999999997,56.729999999999997,66.409999999999997,52.240000000000002,66.150000000000006,55.829999999999998,63.799999999999997,51.909999999999997,65.120000000000005,56.07,-1,58.969999999999999,68.239999999999995,40,52.939999999999998,39.619999999999997,52.939999999999998,39.399999999999999,51.469999999999999,37.530000000000001,52.93,39.100000000000001,53.390000000000001
|
10 |
+
Qwen2.5 32B,88.590000000000003,84.079999999999998,52.560000000000002,50.200000000000003,52.18,46.119999999999997,52.32,49.729999999999997,49.43,46.43,50.82,50.43,28.93,93.209999999999994,85.879999999999995,41.539999999999999,45.880000000000003,41.539999999999999,45.880000000000003,41.310000000000002,43.560000000000002,40.479999999999997,46.079999999999998,41.229999999999997,45.369999999999997
|
11 |
+
StarChat2 15B v0.1,88.459999999999994,84.900000000000006,37.950000000000003,44.490000000000002,37.950000000000003,44.079999999999998,37.560000000000002,46.950000000000003,35.299999999999997,43.219999999999999,37.189999999999998,46.649999999999999,13.42,79.739999999999995,92.939999999999998,36.409999999999997,63.530000000000001,36.030000000000001,63.530000000000001,36.079999999999998,58.060000000000002,34.909999999999997,63.259999999999998,35.759999999999998,64.560000000000002
|
12 |
+
DeepSeek R1 Distill Qwen 14B,42.18,34.689999999999998,25.510000000000002,18.370000000000001,25.510000000000002,16.329999999999998,25.359999999999999,17.859999999999999,24.190000000000001,16.48,25.27,17.329999999999998,-1,45,44.710000000000001,25.640000000000001,28.239999999999998,25.260000000000002,28.239999999999998,24.789999999999999,24.710000000000001,23.48,28.140000000000001,24.629999999999999,28.350000000000001
|
13 |
+
CodeLlama 70B,67.049999999999997,69.799999999999997,33.079999999999998,36.329999999999998,33.079999999999998,34.289999999999999,32.689999999999998,37.189999999999998,31.460000000000001,34.289999999999999,32.439999999999998,35.950000000000003,24.329999999999998,90.769999999999996,88.239999999999995,33.329999999999998,47.060000000000002,33.329999999999998,47.060000000000002,33.020000000000003,45.799999999999997,30.800000000000001,46.909999999999997,32.990000000000002,46.979999999999997
|
14 |
+
DeepSeek Coder 33B,62.82,83.670000000000002,23.329999999999998,42.450000000000003,23.079999999999998,42.039999999999999,22.859999999999999,42.289999999999999,22.809999999999999,39.420000000000002,22.289999999999999,42.710000000000001,24.579999999999998,75.260000000000005,88.239999999999995,39.619999999999997,45.880000000000003,39.359999999999999,45.880000000000003,38.229999999999997,46.259999999999998,36.789999999999999,45.609999999999999,37.899999999999999,46.170000000000002
|
15 |
+
QwenCoder 2.5 32B,87.180000000000007,77.959999999999994,45,43.270000000000003,44.869999999999997,43.270000000000003,44.25,46.82,43.030000000000001,43.200000000000003,43.759999999999998,45.420000000000002,31.07,83.719999999999999,87.060000000000002,45.640000000000001,54.119999999999997,45.130000000000003,54.119999999999997,44.590000000000003,54.549999999999997,43.009999999999998,54.009999999999998,44.549999999999997,55.009999999999998
|
16 |
+
DeepCoder 14B,43.850000000000001,39.590000000000003,28.079999999999998,23.670000000000002,28.079999999999998,22.039999999999999,27.940000000000001,25,26.260000000000002,22,27.77,23.149999999999999,-1,61.920000000000002,48.240000000000002,34.100000000000001,32.939999999999998,33.719999999999999,32.939999999999998,33.700000000000003,30.469999999999999,32.170000000000002,32.840000000000003,33.670000000000002,32.909999999999997
|
17 |
+
QwenCoder 2.5 14B,78.969999999999999,81.629999999999995,37.82,46.119999999999997,37.439999999999998,45.310000000000002,35.939999999999998,45.82,34.829999999999998,44.640000000000001,35.18,46.049999999999997,37.530000000000001,80,83.530000000000001,41.670000000000002,48.240000000000002,41.149999999999999,48.240000000000002,40.740000000000002,47.090000000000003,39.200000000000003,48.289999999999999,40.829999999999998,47.539999999999999
|
18 |
+
SeedCoder 8B,91.409999999999997,85.310000000000002,53.460000000000001,47.350000000000001,53.329999999999998,46.530000000000001,52.859999999999999,49.420000000000002,50.619999999999997,45.600000000000001,51.649999999999999,49.590000000000003,28.23,77.439999999999998,94.120000000000005,37.310000000000002,42.350000000000001,37.310000000000002,38.82,37.32,35.289999999999999,35.350000000000001,38.689999999999998,36.890000000000001,38.990000000000002
|
19 |
+
SeedCoder 8B Reasoning,67.819999999999993,53.469999999999999,49.229999999999997,30.199999999999999,49.229999999999997,29.390000000000001,48.920000000000002,32.039999999999999,46.759999999999998,28.640000000000001,47.869999999999997,29.989999999999998,-1,83.329999999999998,78.819999999999993,48.210000000000001,62.350000000000001,48.079999999999998,62.350000000000001,47.780000000000001,53.479999999999997,45.439999999999998,61.810000000000002,47.060000000000002,64.620000000000005
|
20 |
+
OpenCoder 8B,78.209999999999994,75.920000000000002,28.460000000000001,42.859999999999999,27.82,40.82,27.34,41.359999999999999,25.949999999999999,39.770000000000003,27.109999999999999,41.359999999999999,16.170000000000002,80,95.290000000000006,35.640000000000001,45.880000000000003,35.380000000000003,45.880000000000003,35.119999999999997,42.399999999999999,33.469999999999999,45.75,35.130000000000003,46.259999999999998
|
21 |
+
QwenCoder 2.5 7B,20.129999999999999,76.329999999999998,6.9199999999999999,38.780000000000001,6.6699999999999999,37.140000000000001,6.5099999999999998,40.649999999999999,6.6299999999999999,37.25,6.5599999999999996,39.579999999999998,28.329999999999998,74.099999999999994,90.590000000000003,33.719999999999999,40,33.719999999999999,40,33.590000000000003,37.729999999999997,31.780000000000001,40.07,33.619999999999997,40.57
|
22 |
+
DeepSeek Coder 6.7B,82.049999999999997,78.780000000000001,29.620000000000001,41.219999999999999,29.489999999999998,38.780000000000001,29.510000000000002,42.619999999999997,27.73,39.329999999999998,29.41,43.299999999999997,24.629999999999999,67.180000000000007,84.709999999999994,31.670000000000002,37.649999999999999,29.870000000000001,37.649999999999999,29.780000000000001,36.450000000000003,27.98,37.469999999999999,29.210000000000001,37.659999999999997
|
23 |
+
CodeV R1 Distill Qwen 7B,56.920000000000002,73.060000000000002,33.329999999999998,49.799999999999997,33.329999999999998,47.350000000000001,32.579999999999998,49.25,32.009999999999998,47.450000000000003,32.450000000000003,49.009999999999998,-1,92.689999999999998,89.409999999999997,21.280000000000001,65.879999999999995,21.280000000000001,65.879999999999995,21.039999999999999,60.100000000000001,19.59,65.590000000000003,21.050000000000001,66.239999999999995
|
24 |
+
HaVen-CodeQwen,93.329999999999998,80.409999999999997,47.310000000000002,42.859999999999999,46.149999999999999,41.219999999999999,45.079999999999998,40.590000000000003,44.259999999999998,38.829999999999998,44.68,40.530000000000001,25.140000000000001,93.590000000000003,100,50.130000000000003,62.350000000000001,49.490000000000002,62.350000000000001,47.549999999999997,61.82,47.049999999999997,62.530000000000001,47.090000000000003,61.759999999999998
|
25 |
+
CodeV-QW-7B,45.380000000000003,68.159999999999997,19.620000000000001,34.289999999999999,18.969999999999999,26.530000000000001,18.91,28.140000000000001,18.710000000000001,21.800000000000001,18.850000000000001,26.5,20.940000000000001,93.329999999999998,100,52.310000000000002,60,51.539999999999999,60,51.689999999999998,59.899999999999999,48.789999999999999,59.950000000000003,51.450000000000003,60.579999999999998
|
26 |
+
RTLCoder Mistral,54.869999999999997,32.240000000000002,24.620000000000001,16.329999999999998,24.620000000000001,15.92,24.280000000000001,16.030000000000001,22.780000000000001,14.710000000000001,24.059999999999999,16,14.77,60.509999999999998,85.879999999999995,27.050000000000001,51.759999999999998,27.050000000000001,51.759999999999998,26.940000000000001,49.850000000000001,25.219999999999999,51.939999999999998,26.870000000000001,52.719999999999999
|
27 |
+
RTLCoder DeepSeek,84.620000000000005,73.060000000000002,39.490000000000002,37.140000000000001,39.490000000000002,34.689999999999998,38.909999999999997,34.299999999999997,37.520000000000003,32.759999999999998,38.549999999999997,33.689999999999998,19.350000000000001,77.310000000000002,85.879999999999995,36.920000000000002,55.289999999999999,36.789999999999999,55.289999999999999,36.939999999999998,50.789999999999999,34.840000000000003,55.219999999999999,36.619999999999997,54.689999999999998
|
28 |
+
OriGen,96.150000000000006,81.629999999999995,54.229999999999997,50.609999999999999,54.229999999999997,50.609999999999999,54.289999999999999,53.100000000000001,51.57,50.859999999999999,53.149999999999999,53.439999999999998,17.07,92.439999999999998,98.819999999999993,50.770000000000003,76.469999999999999,50.770000000000003,76.469999999999999,50.950000000000003,71.659999999999997,48.530000000000001,76.609999999999999,50.509999999999998,78.700000000000003
|
29 |
+
CodeV-CL-7B,32.18,48.159999999999997,13.08,24.489999999999998,12.949999999999999,21.629999999999999,12.800000000000001,22.25,12.51,20.59,12.82,21.289999999999999,12.27,92.049999999999997,98.819999999999993,31.789999999999999,49.409999999999997,31.789999999999999,49.409999999999997,31.739999999999998,48.130000000000003,29.449999999999999,49.340000000000003,31.609999999999999,49.079999999999998
|
30 |
+
CodeV-DS-6.7B,33.590000000000003,67.349999999999994,15,38.780000000000001,15,37.140000000000001,15.1,35.560000000000002,14.460000000000001,35.130000000000003,14.85,35.880000000000003,21.260000000000002,95.510000000000005,100,47.049999999999997,61.18,47.049999999999997,60,47.369999999999997,59.880000000000003,44.350000000000001,59.960000000000001,46.520000000000003,59.770000000000003
|
results/{results.json → results_icarus.json}
RENAMED
The diff for this file is too large to render.
See raw diff
|
|
results/results_verilator.csv
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
,Syntax (STX),Syntax (STX),Functionality (FNC),Functionality (FNC),Synthesis (SYN),Synthesis (SYN),Power,Power,Performance,Performance,Area,Area,EM,Syntax (STX),Syntax (STX),Functionality (FNC),Functionality (FNC),Synthesis (SYN),Synthesis (SYN),Power,Power,Performance,Performance,Area,Area
|
2 |
+
,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,VerilogEval S2R,RTLLM,RTL-Repo,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen,VerilogEval MC,VeriGen
|
3 |
+
DeepSeek R1-0528,96.540000000000006,89.790000000000006,79.099999999999994,67.659999999999997,78.969999999999999,64.260000000000005,78.439999999999998,73.319999999999993,76.290000000000006,65.379999999999995,78.200000000000003,70.859999999999999,-1,94.739999999999995,98.819999999999993,80,80,79.870000000000005,74.120000000000005,79.659999999999997,63.859999999999999,77.280000000000001,74.049999999999997,79.409999999999997,77.010000000000005
|
4 |
+
DeepSeek R1,97.689999999999998,93.189999999999998,79.359999999999999,67.659999999999997,79.099999999999994,62.979999999999997,79.010000000000005,71.379999999999995,76.489999999999995,63.740000000000002,78.629999999999995,69.819999999999993,-1,97.439999999999998,95.290000000000006,77.819999999999993,74.120000000000005,77.689999999999998,74.120000000000005,77.299999999999997,64.579999999999998,75.030000000000001,74.420000000000002,76.939999999999998,77.150000000000006
|
5 |
+
Llama 3.1 405B,88.209999999999994,83.400000000000006,56.789999999999999,50.210000000000001,56.409999999999997,43.829999999999998,55.159999999999997,53.869999999999997,54.009999999999998,33.829999999999998,53.990000000000002,45.729999999999997,34.619999999999997,90.510000000000005,95.290000000000006,57.689999999999998,60,56.670000000000002,55.289999999999999,55.950000000000003,51.57,54.090000000000003,54.869999999999997,55.259999999999998,57.670000000000002
|
6 |
+
Qwen3 236B A22B,93.969999999999999,78.719999999999999,75.769999999999996,56.170000000000002,75.379999999999995,50.210000000000001,75,57.009999999999998,72.939999999999998,47.850000000000001,74.780000000000001,52.450000000000003,41.939999999999998,83.719999999999999,88.239999999999995,68.969999999999999,62.350000000000001,68.459999999999994,62.350000000000001,68.299999999999997,54.630000000000003,65.989999999999995,62.630000000000003,68.349999999999994,62.780000000000001
|
7 |
+
Qwen2.5 72B,83.849999999999994,82.980000000000004,55,48.509999999999998,54.490000000000002,45.960000000000001,53.969999999999999,48.450000000000003,51.299999999999997,47.340000000000003,52.840000000000003,49.68,37.439999999999998,83.079999999999998,87.060000000000002,54.740000000000002,50.590000000000003,54.359999999999999,50.590000000000003,53.359999999999999,50.049999999999997,51.200000000000003,50.560000000000002,52.759999999999998,52.229999999999997
|
8 |
+
Llama 3.(1-3) 70B,68.329999999999998,79.150000000000006,40.899999999999999,45.960000000000001,40.899999999999999,40.43,40.770000000000003,42.119999999999997,38.329999999999998,39.340000000000003,40.420000000000002,40.920000000000002,28.719999999999999,86.030000000000001,87.060000000000002,43.719999999999999,63.530000000000001,43.590000000000003,63.530000000000001,43.549999999999997,62.289999999999999,41.57,63.520000000000003,42.939999999999998,63.539999999999999
|
9 |
+
QwQ 32B,89.230000000000004,85.959999999999994,67.560000000000002,58.299999999999997,67.180000000000007,53.619999999999997,67.040000000000006,57.289999999999999,64.780000000000001,53.340000000000003,66.439999999999998,57.560000000000002,-1,59.619999999999997,87.060000000000002,40.130000000000003,65.879999999999995,39.490000000000002,64.709999999999994,39.259999999999998,60.950000000000003,37.490000000000002,64.480000000000004,39.170000000000002,66.310000000000002
|
10 |
+
Qwen2.5 32B,90.900000000000006,87.659999999999997,55.899999999999999,50.210000000000001,55.259999999999998,46.810000000000002,55.560000000000002,50.659999999999997,53.100000000000001,47.409999999999997,54.020000000000003,51.369999999999997,28.93,95.510000000000005,85.879999999999995,45,49.409999999999997,43.719999999999999,49.409999999999997,43.719999999999999,46.409999999999997,42.490000000000002,49.890000000000001,42.950000000000003,49.609999999999999
|
11 |
+
StarChat2 15B v0.1,88.719999999999999,89.359999999999999,38.850000000000001,48.509999999999998,38.850000000000001,45.960000000000001,38.920000000000002,48.950000000000003,36.18,45.049999999999997,38.810000000000002,48.630000000000003,13.42,81.409999999999997,91.760000000000005,36.539999999999999,63.530000000000001,36.280000000000001,63.530000000000001,36.189999999999998,57.509999999999998,35.109999999999999,63.229999999999997,36.240000000000002,65
|
12 |
+
DeepSeek R1 Distill Qwen 14B,42.82,36.600000000000001,25.260000000000002,20.43,25,17.02,24.809999999999999,18.620000000000001,23.68,17.18,24.829999999999998,18.07,-1,45.640000000000001,44.710000000000001,25.379999999999999,29.41,25.260000000000002,29.41,24.98,25.920000000000002,23.609999999999999,29.43,24.690000000000001,29.649999999999999
|
13 |
+
CodeLlama 70B,67.310000000000002,77.450000000000003,34.740000000000002,38.719999999999999,34.490000000000002,36.170000000000002,34.030000000000001,39.18,32.880000000000003,36.140000000000001,33.829999999999998,37.93,24.329999999999998,92.560000000000002,88.239999999999995,35.770000000000003,52.939999999999998,35.380000000000003,51.759999999999998,34.810000000000002,50.619999999999997,32.340000000000003,51.890000000000001,34.520000000000003,52.359999999999999
|
14 |
+
DeepSeek Coder 33B,64.489999999999995,88.939999999999998,23.59,46.380000000000003,23.59,44.259999999999998,23.370000000000001,44.539999999999999,23.32,41.539999999999999,22.739999999999998,45.039999999999999,24.579999999999998,76.540000000000006,88.239999999999995,40.130000000000003,50.590000000000003,39.869999999999997,50.590000000000003,38.700000000000003,51.5,37.329999999999998,50.219999999999999,38.399999999999999,51.630000000000003
|
15 |
+
QwenCoder 2.5 32B,90.260000000000005,81.280000000000001,46.539999999999999,47.659999999999997,46.409999999999997,45.109999999999999,45.950000000000003,48.810000000000002,44.420000000000002,45.039999999999999,45.57,47.359999999999999,31.07,86.150000000000006,85.879999999999995,48.210000000000001,54.119999999999997,47.560000000000002,54.119999999999997,47.350000000000001,54.590000000000003,45.350000000000001,54.119999999999997,46.780000000000001,55.140000000000001
|
16 |
+
DeepCoder 14B,45.130000000000003,42.549999999999997,28.719999999999999,25.530000000000001,28.719999999999999,22.98,28.579999999999998,26.059999999999999,26.859999999999999,22.940000000000001,28.16,24.140000000000001,-1,63.460000000000001,49.409999999999997,34.359999999999999,37.649999999999999,34.100000000000001,35.289999999999999,34.170000000000002,32.789999999999999,32.579999999999998,35.289999999999999,33.409999999999997,35.280000000000001
|
17 |
+
QwenCoder 2.5 14B,80.900000000000006,82.980000000000004,39.869999999999997,50.640000000000001,38.969999999999999,47.659999999999997,37.490000000000002,47.82,36.369999999999997,46.979999999999997,36.729999999999997,48.399999999999999,37.530000000000001,81.409999999999997,84.709999999999994,43.079999999999998,50.590000000000003,42.439999999999998,50.590000000000003,42.020000000000003,49.509999999999998,40.479999999999997,50.859999999999999,42.109999999999999,50.149999999999999
|
18 |
+
SeedCoder 8B,96.409999999999997,89.359999999999999,54.359999999999999,51.490000000000002,54.229999999999997,48.509999999999998,53.68,51.520000000000003,51.5,47.539999999999999,52.560000000000002,51.700000000000003,28.23,78.209999999999994,91.760000000000005,38.210000000000001,47.060000000000002,38.079999999999998,43.530000000000001,38.100000000000001,37.890000000000001,36.090000000000003,43.770000000000003,37.539999999999999,43.869999999999997
|
19 |
+
SeedCoder 8B Reasoning,68.719999999999999,56.170000000000002,48.079999999999998,34.039999999999999,48.079999999999998,30.640000000000001,48.270000000000003,33.409999999999997,45.780000000000001,29.859999999999999,47,31.27,-1,84.489999999999995,80,48.969999999999999,63.530000000000001,48.850000000000001,63.530000000000001,48.68,54.979999999999997,46.32,62.969999999999999,47.530000000000001,66.099999999999994
|
20 |
+
OpenCoder 8B,80,80,27.949999999999999,43.829999999999998,27.949999999999999,42.130000000000003,27.52,42.439999999999998,26.07,40.979999999999997,27.280000000000001,42.460000000000001,16.170000000000002,81.030000000000001,94.120000000000005,36.789999999999999,49.409999999999997,36.149999999999999,44.710000000000001,35.890000000000001,41.219999999999999,34.240000000000002,44.579999999999998,35.899999999999999,45.079999999999998
|
21 |
+
QwenCoder 2.5 7B,19.23,83.400000000000006,7.1799999999999997,40.850000000000001,7.1799999999999997,38.719999999999999,7.0199999999999996,42.310000000000002,7.1500000000000004,38.710000000000001,7.0800000000000001,41.200000000000003,28.329999999999998,76.150000000000006,90.590000000000003,35,48.240000000000002,34.740000000000002,48.240000000000002,34.619999999999997,44.93,32.799999999999997,48.399999999999999,34.649999999999999,49.759999999999998
|
22 |
+
DeepSeek Coder 6.7B,86.030000000000001,89.359999999999999,31.280000000000001,45.960000000000001,31.149999999999999,42.979999999999997,31.16,47.369999999999997,29.149999999999999,43.299999999999997,31.079999999999998,48.170000000000002,24.629999999999999,69.099999999999994,83.530000000000001,31.670000000000002,37.649999999999999,30.129999999999999,37.649999999999999,30.190000000000001,36.450000000000003,28.16,37.469999999999999,29.82,37.659999999999997
|
23 |
+
CodeV R1 Distill Qwen 7B,56.409999999999997,79.150000000000006,33.969999999999999,50.640000000000001,33.850000000000001,48.939999999999998,33.799999999999997,50.920000000000002,32.490000000000002,49.039999999999999,33.710000000000001,50.670000000000002,-1,94.230000000000004,87.060000000000002,22.18,63.530000000000001,22.18,63.530000000000001,22.210000000000001,57.75,20.73,63.240000000000002,22.079999999999998,63.890000000000001
|
24 |
+
HaVen-CodeQwen,93.969999999999999,84.260000000000005,46.789999999999999,47.229999999999997,46.280000000000001,44.259999999999998,45.469999999999999,42.270000000000003,44.289999999999999,42.07,45.5,44.270000000000003,25.140000000000001,95,95.290000000000006,50,67.060000000000002,50,67.060000000000002,48.509999999999998,65.700000000000003,47.560000000000002,67.609999999999999,48.140000000000001,66.799999999999997
|
25 |
+
CodeV-QW-7B,45.259999999999998,71.489999999999995,20.640000000000001,36.170000000000002,20,29.359999999999999,19.940000000000001,30.309999999999999,19.739999999999998,24.52,19.879999999999999,28.48,20.940000000000001,92.689999999999998,96.469999999999999,51.539999999999999,57.649999999999999,51.409999999999997,57.649999999999999,51.520000000000003,56.439999999999998,48.710000000000001,57.560000000000002,51.310000000000002,58.350000000000001
|
26 |
+
RTLCoder Mistral,56.030000000000001,35.32,25.379999999999999,17.02,25.379999999999999,16.170000000000002,25.52,15.859999999999999,23.18,15.34,25.539999999999999,15.84,14.77,62.310000000000002,87.060000000000002,27.309999999999999,56.469999999999999,27.18,56.469999999999999,26.93,52.350000000000001,25.43,56.549999999999997,26.949999999999999,59.170000000000002
|
27 |
+
RTLCoder DeepSeek,84.739999999999995,76.170000000000002,40.509999999999998,42.130000000000003,40.380000000000003,37.450000000000003,39.729999999999997,36.75,38.439999999999998,35.289999999999999,39.399999999999999,36.390000000000001,19.350000000000001,79.230000000000004,85.879999999999995,36.409999999999997,55.289999999999999,36.409999999999997,55.289999999999999,36.490000000000002,50.789999999999999,34.509999999999998,55.219999999999999,36.210000000000001,54.689999999999998
|
28 |
+
OriGen,96.790000000000006,85.109999999999999,54.359999999999999,53.189999999999998,53.850000000000001,51.060000000000002,54.079999999999998,54.170000000000002,51.07,51.310000000000002,53.009999999999998,54.390000000000001,17.07,92.560000000000002,96.469999999999999,50.509999999999998,74.120000000000005,50.509999999999998,74.120000000000005,50.829999999999998,69.299999999999997,48.280000000000001,74.260000000000005,50.409999999999997,76.349999999999994
|
29 |
+
CodeV-CL-7B,32.82,54.469999999999999,13.460000000000001,29.359999999999999,13.33,22.550000000000001,13.19,23.190000000000001,13.26,21.469999999999999,13.19,22.190000000000001,12.27,92.180000000000007,98.819999999999993,31.789999999999999,49.409999999999997,31.789999999999999,49.409999999999997,31.739999999999998,48.130000000000003,29.829999999999998,49.340000000000003,31.609999999999999,49.079999999999998
|
30 |
+
CodeV-DS-6.7B,34.359999999999999,69.790000000000006,14.74,41.280000000000001,14.359999999999999,37.869999999999997,14.380000000000001,35.890000000000001,14.130000000000001,35.740000000000002,14.19,36.18,21.260000000000002,95.769999999999996,100,46.670000000000002,61.18,46.670000000000002,61.18,47.07,61.060000000000002,44.189999999999998,61.130000000000003,46.469999999999999,60.950000000000003
|
results/results_verilator.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|