decorative changes
Browse files
- app.py +3 -1
- leaderboard.csv +15 -15
- templates/index.html +12 -12
app.py
CHANGED
@@ -8,7 +8,9 @@ def index():
|
|
8 |
# Load the CSV file into a DataFrame
|
9 |
df = pd.read_csv('leaderboard.csv')
|
10 |
|
11 |
-
df.
|
|
|
|
|
12 |
# Convert the DataFrame to HTML
|
13 |
table_html = df.to_html(classes='table table-striped table-bordered', index=False)
|
14 |
|
|
|
8 |
# Load the CSV file into a DataFrame
|
9 |
df = pd.read_csv('leaderboard.csv')
|
10 |
|
11 |
+
df = df.round(3)
|
12 |
+
df.insert(0, '#', '')
|
13 |
+
|
14 |
# Convert the DataFrame to HTML
|
15 |
table_html = df.to_html(classes='table table-striped table-bordered', index=False)
|
16 |
|
leaderboard.csv
CHANGED
@@ -1,15 +1,15 @@
|
|
1 |
-
Model,
|
2 |
-
phi-3-mini-128k-instruct,0.
|
3 |
-
phi-3-medium-128k-instruct,0.
|
4 |
-
Mistral-7B-Instruct-v0.1,0.
|
5 |
-
Mistral-7B-Instruct-v0.2,0.
|
6 |
-
Mistral-7B-Instruct-v0.3,0.
|
7 |
-
Mixtral-8x7B-Instruct-v0.1,0.
|
8 |
-
Mixtral-8x22B-Instruct-v0.1,0.
|
9 |
-
command_r_plus,0.
|
10 |
-
llama_3_8b_instruct,0.
|
11 |
-
llama_3_70b_instruct,0.
|
12 |
-
Qwen2-7B-Instruct,0.
|
13 |
-
Qwen2-72B-Instruct,0.
|
14 |
-
gpt-3.5-turbo-0125,0.
|
15 |
-
gpt-4o-0513,0.
|
|
|
1 |
+
Model,Ordinal (Win rate),Cardinal (Score),RO Stability,Rank Distance,CFI,SRMR,RMSEA,Cronbach alpha
|
2 |
+
phi-3-mini-128k-instruct,0.258309591642925,0.18707102480796897,0.16880341880341881,0.7264957264957265,0.32478632478632474,0.5555555555555556,0.6239316239316239,0.23076923076923084
|
3 |
+
phi-3-medium-128k-instruct,0.28490028490028496,0.18789267301588508,0.26282051282051283,0.7521367521367521,0.2820512820512821,0.7692307692307692,0.7606837606837606,0.5128205128205128
|
4 |
+
Mistral-7B-Instruct-v0.1,0.3418803418803419,0.23063750442486428,0.12393162393162394,0.4786324786324786,0.49572649572649574,0.3076923076923077,0.2222222222222222,0.09401709401709403
|
5 |
+
Mistral-7B-Instruct-v0.2,0.3342830009496676,0.1747138068267554,0.41666666666666674,0.4358974358974358,0.1282051282051282,0.829059829059829,0.8205128205128205,0.2991452991452992
|
6 |
+
Mistral-7B-Instruct-v0.3,0.3133903133903134,0.20131219867252867,0.23504273504273498,0.4273504273504273,0.28205128205128205,0.6324786324786325,0.5897435897435896,0.24786324786324787
|
7 |
+
Mixtral-8x7B-Instruct-v0.1,0.43114909781576455,0.2437400779497571,0.5811965811965812,0.641025641025641,0.2136752136752137,0.7863247863247863,0.7521367521367521,0.5213675213675214
|
8 |
+
Mixtral-8x22B-Instruct-v0.1,0.29629629629629634,0.18791617935864172,0.37820512820512825,0.6837606837606838,0.1794871794871795,0.9230769230769231,0.9145299145299145,0.49572649572649574
|
9 |
+
command_r_plus,0.560303893637227,0.3737946817620246,0.6880341880341879,0.6923076923076923,0.45299145299145294,0.5128205128205128,0.5811965811965811,0.6239316239316239
|
10 |
+
llama_3_8b_instruct,0.4691358024691358,0.28828624999947805,0.5747863247863247,0.5470085470085471,0.3162393162393162,0.7008547008547008,0.6923076923076923,0.5470085470085471
|
11 |
+
llama_3_70b_instruct,0.7701804368471036,0.5976823900754995,0.9380341880341881,0.7264957264957265,0.8376068376068376,0.4273504273504274,0.49572649572649574,0.9914529914529915
|
12 |
+
Qwen2-7B-Instruct,0.5251661918328584,0.3400513233761655,0.5769230769230768,0.5811965811965811,0.4188034188034188,0.45299145299145294,0.4871794871794872,0.5213675213675214
|
13 |
+
Qwen2-72B-Instruct,0.5906932573599241,0.42123592516768155,0.9658119658119655,0.5811965811965811,0.07692307692307693,0.9658119658119658,0.9914529914529915,0.9145299145299146
|
14 |
+
gpt-3.5-turbo-0125,0.23741690408357075,0.14920836189480854,0.24145299145299137,0.7777777777777778,0.1965811965811966,0.717948717948718,0.7094017094017093,0.1794871794871795
|
15 |
+
gpt-4o-0513,0.7340930674264008,0.5383734693976642,0.8482905982905984,0.6666666666666667,0.811965811965812,0.41025641025641024,0.3418803418803419,0.8205128205128205
|
templates/index.html
CHANGED
@@ -15,7 +15,7 @@
|
|
15 |
font-family: 'Arial', sans-serif;
|
16 |
}
|
17 |
.container {
|
18 |
-
max-width:
|
19 |
margin: auto; /* Center the container */
|
20 |
padding: 20px; /* Add some padding */
|
21 |
background: #fff;
|
@@ -31,14 +31,16 @@
|
|
31 |
}
|
32 |
table {
|
33 |
border-collapse: separate;
|
34 |
-
border-spacing: 0
|
35 |
-
font-size: 14px;
|
|
|
|
|
36 |
}
|
37 |
table thead th {
|
38 |
background-color: #610b5d;
|
39 |
color: white;
|
40 |
-
border:
|
41 |
-
|
42 |
}
|
43 |
table tbody tr {
|
44 |
background-color: #fff;
|
@@ -49,15 +51,13 @@
|
|
49 |
}
|
50 |
table td, table th {
|
51 |
padding: 10px; /* Reduce padding */
|
52 |
-
border:
|
53 |
}
|
54 |
-
table th:first-child
|
55 |
-
border-top-left-radius:
|
56 |
-
border-bottom-left-radius: 8px;
|
57 |
}
|
58 |
-
table th:last-child
|
59 |
-
border-top-right-radius:
|
60 |
-
border-bottom-right-radius: 8px;
|
61 |
}
|
62 |
</style>
|
63 |
</head>
|
|
|
15 |
font-family: 'Arial', sans-serif;
|
16 |
}
|
17 |
.container {
|
18 |
+
max-width: 1200px; /* Limit the width of the container */
|
19 |
margin: auto; /* Center the container */
|
20 |
padding: 20px; /* Add some padding */
|
21 |
background: #fff;
|
|
|
31 |
}
|
32 |
table {
|
33 |
border-collapse: separate;
|
34 |
+
border-spacing: 0;
|
35 |
+
font-size: 14px; /* Reduce the font size */
|
36 |
+
width: 100%;
|
37 |
+
border: none; /* Remove any default border */
|
38 |
}
|
39 |
table thead th {
|
40 |
background-color: #610b5d;
|
41 |
color: white;
|
42 |
+
border: 1px solid #dee2e6;
|
43 |
+
text-align: left;
|
44 |
}
|
45 |
table tbody tr {
|
46 |
background-color: #fff;
|
|
|
51 |
}
|
52 |
table td, table th {
|
53 |
padding: 10px; /* Reduce padding */
|
54 |
+
border: 1px solid #dee2e6;
|
55 |
}
|
56 |
+
table th:first-child {
|
57 |
+
border-top-left-radius: 10px;
|
|
|
58 |
}
|
59 |
+
table th:last-child {
|
60 |
+
border-top-right-radius: 10px;
|
|
|
61 |
}
|
62 |
</style>
|
63 |
</head>
|