Upload constants.py with huggingface_hub
Browse files
- constants.py +20 -16
constants.py
CHANGED
|
@@ -1,16 +1,20 @@
|
|
| 1 |
AVBENCH_INTRODUCTION = """# AVBench Leaderboard
|
| 2 |
|
| 3 |
-
|
|
|
|
| 4 |
|
| 5 |
-
|
| 6 |
-
-
|
| 7 |
-
-
|
|
|
|
| 8 |
|
| 9 |
-
|
| 10 |
- Cross-Modal Alignment & Sync: AV, AT, VT, SyncNet
|
| 11 |
- Unimodal Generation Quality: SC, DF-Arena, NISQA, Audiobox, DOVER++, Aesthetic
|
|
|
|
| 12 |
|
| 13 |
-
|
|
|
|
| 14 |
"""
|
| 15 |
|
| 16 |
METRIC_COLUMNS = [
|
|
@@ -41,17 +45,17 @@ METRIC_WEIGHTS = {
|
|
| 41 |
}
|
| 42 |
|
| 43 |
NORMAL_ROWS = [
|
| 44 |
-
["Sora 2", 0.8713, 0.
|
| 45 |
-
["Veo 3 Fast", 0.6924, 0.
|
| 46 |
-
["Wan 2.6", 0.8207, 0.
|
| 47 |
-
["Kling 2.6", 0.7626, 0.
|
| 48 |
-
["Seedance 1.5 Pro", 0.6536, 0.
|
| 49 |
]
|
| 50 |
|
| 51 |
HARD_ROWS = [
|
| 52 |
-
["Sora 2", 0.9320, 0.
|
| 53 |
-
["Veo 3 Fast", 0.7766, 0.
|
| 54 |
-
["Wan 2.6", 0.8780, 0.
|
| 55 |
-
["Kling 2.6", 0.8813, 0.
|
| 56 |
-
["Seedance 1.5 Pro", 0.7409, 0.
|
| 57 |
]
|
|
|
|
| 1 |
AVBENCH_INTRODUCTION = """# AVBench Leaderboard
|
| 2 |
|
| 3 |
+
AVBench is a human-aligned and automated benchmark for evaluating text-to-audio-video (T2AV) generation.
|
| 4 |
+
It reports **Normal** and **Hard** splits across cross-modal alignment and unimodal quality metrics.
|
| 5 |
|
| 6 |
+
## Links
|
| 7 |
+
- Code: https://github.com/YaJialiang/AVBench
|
| 8 |
+
- Models: https://huggingface.co/iiiiii123/AVBench_model
|
| 9 |
+
- Dataset: https://huggingface.co/datasets/iiiiii123/AVBench
|
| 10 |
|
| 11 |
+
## Metrics
|
| 12 |
- Cross-Modal Alignment & Sync: AV, AT, VT, SyncNet
|
| 13 |
- Unimodal Generation Quality: SC, DF-Arena, NISQA, Audiobox, DOVER++, Aesthetic
|
| 14 |
+
- All metrics are higher-is-better.
|
| 15 |
|
| 16 |
+
## Chart
|
| 17 |
+

|
| 18 |
"""
|
| 19 |
|
| 20 |
METRIC_COLUMNS = [
|
|
|
|
| 45 |
}
|
| 46 |
|
| 47 |
NORMAL_ROWS = [
|
| 48 |
+
["Sora 2", 0.8713, 0.8675, 0.7599, 4.9057, 87.8391, 0.4328, 2.3784, 3.1759, 60.0125, 4.0704],
|
| 49 |
+
["Veo 3 Fast", 0.6924, 0.8300, 0.7235, 6.5943, 77.4950, 0.3043, 2.8191, 3.5877, 69.2275, 4.9967],
|
| 50 |
+
["Wan 2.6", 0.8207, 0.8227, 0.7556, 4.5016, 91.5568, 0.0441, 3.0289, 3.9271, 71.6473, 4.7790],
|
| 51 |
+
["Kling 2.6", 0.7626, 0.8061, 0.7501, 8.1027, 68.7844, 0.1665, 3.3141, 3.8082, 65.6786, 5.4885],
|
| 52 |
+
["Seedance 1.5 Pro", 0.6536, 0.8554, 0.7363, 5.0146, 84.9268, 0.1602, 3.6411, 4.1686, 71.7205, 4.7373],
|
| 53 |
]
|
| 54 |
|
| 55 |
HARD_ROWS = [
|
| 56 |
+
["Sora 2", 0.9320, 0.8575, 0.7190, 3.7932, 76.7905, 0.5498, 2.0564, 3.1339, 58.1538, 4.0434],
|
| 57 |
+
["Veo 3 Fast", 0.7766, 0.8117, 0.6943, 3.4535, 70.3144, 0.3827, 2.3321, 3.6113, 67.0833, 5.1438],
|
| 58 |
+
["Wan 2.6", 0.8780, 0.8418, 0.7482, 3.0488, 84.4512, 0.0498, 3.0726, 4.0924, 71.5229, 4.7721],
|
| 59 |
+
["Kling 2.6", 0.8813, 0.7602, 0.7105, 3.9844, 69.0691, 0.1469, 3.2425, 3.8912, 62.9994, 5.5033],
|
| 60 |
+
["Seedance 1.5 Pro", 0.7409, 0.8646, 0.7398, 3.3239, 80.8029, 0.2059, 3.4093, 4.1618, 69.4430, 4.7707],
|
| 61 |
]
|