Jonna Marie Matthiesen committed on
Commit ·
e36fba8
1
Parent(s): 3ba0d66
Add Qwen3.5 AGX Thor benchmarks
Browse files
- config.json +34 -0
- data/Qwen3.5.csv +82 -0
config.json
CHANGED
|
@@ -135,6 +135,40 @@
|
|
| 135 |
"agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 136 |
"orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
|
| 137 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 138 |
}
|
| 139 |
}
|
| 140 |
}
|
|
|
|
| 135 |
"agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 136 |
"orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
|
| 137 |
}
|
| 138 |
+
},
|
| 139 |
+
"Qwen3.5-0.8B": {
|
| 140 |
+
"data_file": "data/Qwen3.5.csv",
|
| 141 |
+
"table_group_by": ["res", "fps"],
|
| 142 |
+
"experiment_setup": {
|
| 143 |
+
"agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 144 |
+
"agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 145 |
+
"orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
|
| 146 |
+
}
|
| 147 |
+
},
|
| 148 |
+
"Qwen3.5-2B": {
|
| 149 |
+
"data_file": "data/Qwen3.5.csv",
|
| 150 |
+
"table_group_by": ["res", "fps"],
|
| 151 |
+
"experiment_setup": {
|
| 152 |
+
"agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 153 |
+
"agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 154 |
+
"orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
|
| 155 |
+
}
|
| 156 |
+
},
|
| 157 |
+
"Qwen3.5-4B": {
|
| 158 |
+
"data_file": "data/Qwen3.5.csv",
|
| 159 |
+
"table_group_by": ["res", "fps"],
|
| 160 |
+
"experiment_setup": {
|
| 161 |
+
"agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 162 |
+
"agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
|
| 163 |
+
}
|
| 164 |
+
},
|
| 165 |
+
"Qwen3.5-9B": {
|
| 166 |
+
"data_file": "data/Qwen3.5.csv",
|
| 167 |
+
"table_group_by": ["res", "fps"],
|
| 168 |
+
"experiment_setup": {
|
| 169 |
+
"agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
|
| 170 |
+
"agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
|
| 171 |
+
}
|
| 172 |
}
|
| 173 |
}
|
| 174 |
}
|
data/Qwen3.5.csv
ADDED
|
@@ -0,0 +1,82 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model_family,model,type,batch,device,res,fps,frames,e2e,tps,tpot,ttft
|
| 2 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,1,agx_thor,1280x720,N/A,N/A,3.1547,81.15,9.63,689.01
|
| 3 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,1,agx_thor,1920x1080,N/A,N/A,3.0482,83.98,9.52,609.01
|
| 4 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,1,agx_thor,854x480,N/A,N/A,2.9693,86.22,9.53,527.85
|
| 5 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,8,agx_thor,1280x720,N/A,N/A,6.0349,339.36,9.41,2220.21
|
| 6 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,8,agx_thor,1920x1080,N/A,N/A,5.4511,375.70,10.32,1861.66
|
| 7 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,8,agx_thor,854x480,N/A,N/A,6.0003,341.32,9.42,2261.71
|
| 8 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,text,1,agx_thor,N/A,N/A,N/A,2.4818,103.15,9.48,53.33
|
| 9 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,text,8,agx_thor,N/A,N/A,N/A,2.4017,852.74,9.01,88.37
|
| 10 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1280x720,2,6,2.8887,88.62,9.52,450.19
|
| 11 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1280x720,4,12,2.6629,96.13,8.70,435.18
|
| 12 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1920x1080,2,6,3.3747,75.86,9.72,884.67
|
| 13 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1920x1080,4,12,3.3594,76.20,9.63,892.37
|
| 14 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,854x480,2,6,2.6786,95.57,9.45,258.06
|
| 15 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,854x480,4,12,2.4043,106.48,8.43,245.77
|
| 16 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1280x720,2,6,4.7497,431.19,10.90,1235.70
|
| 17 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1280x720,4,12,4.8586,421.52,11.26,1243.70
|
| 18 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1920x1080,2,6,7.1575,286.14,12.02,2625.62
|
| 19 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1920x1080,4,12,7.1667,285.77,11.90,2639.20
|
| 20 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,854x480,2,6,3.3770,606.46,9.37,594.63
|
| 21 |
+
Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,854x480,4,12,3.6522,560.76,10.42,602.73
|
| 22 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,image,1,agx_thor,1280x720,N/A,N/A,5.3602,47.76,17.58,859.56
|
| 23 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,image,1,agx_thor,1920x1080,N/A,N/A,5.3912,47.48,17.69,861.15
|
| 24 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,image,1,agx_thor,854x480,N/A,N/A,4.9181,52.05,16.54,683.47
|
| 25 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,image,8,agx_thor,1280x720,N/A,N/A,8.7155,234.98,20.03,2253.31
|
| 26 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,image,8,agx_thor,1920x1080,N/A,N/A,8.6447,236.91,20.00,2230.21
|
| 27 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,image,8,agx_thor,854x480,N/A,N/A,8.7861,233.10,19.94,2283.97
|
| 28 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,text,1,agx_thor,N/A,N/A,N/A,4.7835,53.52,18.45,58.28
|
| 29 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,text,8,agx_thor,N/A,N/A,N/A,5.0283,407.29,19.22,99.12
|
| 30 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1280x720,2,6,5.0749,50.44,17.94,480.60
|
| 31 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1280x720,4,12,5.0026,51.17,17.67,479.12
|
| 32 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1920x1080,2,6,5.5593,46.05,17.80,1002.52
|
| 33 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1920x1080,4,12,5.5114,46.45,17.60,1004.64
|
| 34 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,854x480,2,6,4.4620,57.37,16.43,255.18
|
| 35 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,854x480,4,12,4.6379,55.20,17.09,261.74
|
| 36 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1280x720,2,6,7.1252,287.43,20.15,1253.66
|
| 37 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1280x720,4,12,7.2464,282.62,20.65,1253.71
|
| 38 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1920x1080,2,6,10.0072,204.65,23.88,2654.43
|
| 39 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1920x1080,4,12,9.9937,204.93,23.86,2650.33
|
| 40 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,854x480,2,6,5.8224,351.75,18.88,595.93
|
| 41 |
+
Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,854x480,4,12,5.8278,351.42,18.92,595.51
|
| 42 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,image,1,agx_thor,1280x720,N/A,N/A,10.9790,23.32,36.40,1660.10
|
| 43 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,image,1,agx_thor,1920x1080,N/A,N/A,10.2370,25.01,36.68,846.99
|
| 44 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,image,1,agx_thor,854x480,N/A,N/A,10.2156,25.06,36.70,818.28
|
| 45 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,1280x720,N/A,N/A,15.3444,133.47,46.04,2455.68
|
| 46 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,1280x720,N/A,N/A,14.7126,139.20,45.80,2079.04
|
| 47 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,1920x1080,N/A,N/A,15.0641,135.95,46.11,2311.00
|
| 48 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,854x480,N/A,N/A,16.0785,127.38,46.35,2541.09
|
| 49 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,text,1,agx_thor,N/A,N/A,N/A,11.5369,22.19,44.83,59.20
|
| 50 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,text,8,agx_thor,N/A,N/A,N/A,10.0954,202.86,38.90,126.17
|
| 51 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1280x720,2,6,9.9871,25.63,36.42,662.34
|
| 52 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1280x720,4,12,10.0533,25.46,36.70,656.44
|
| 53 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1920x1080,2,6,10.9197,23.44,37.17,1403.77
|
| 54 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1920x1080,4,12,10.8428,23.61,36.86,1404.92
|
| 55 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,854x480,2,6,9.7512,26.25,36.72,349.70
|
| 56 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,854x480,4,12,9.6476,26.54,36.35,340.00
|
| 57 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1280x720,2,6,13.8354,148.03,45.83,1455.86
|
| 58 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1280x720,4,12,13.7043,149.44,45.31,1458.86
|
| 59 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1920x1080,2,6,18.7536,109.21,55.61,3295.62
|
| 60 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1920x1080,4,12,18.8363,108.73,55.97,3294.32
|
| 61 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,854x480,2,6,11.7998,173.56,41.68,733.10
|
| 62 |
+
Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,854x480,4,12,11.9580,171.27,42.30,727.69
|
| 63 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,image,1,agx_thor,1280x720,N/A,N/A,19.6150,13.05,68.86,1985.85
|
| 64 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,image,1,agx_thor,1920x1080,N/A,N/A,18.7188,13.68,69.17,1009.03
|
| 65 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,image,1,agx_thor,854x480,N/A,N/A,18.5157,13.83,68.41,1002.13
|
| 66 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,image,8,agx_thor,1280x720,N/A,N/A,23.8683,85.80,80.03,2400.06
|
| 67 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,image,8,agx_thor,1920x1080,N/A,N/A,24.3279,84.18,80.66,2649.78
|
| 68 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,image,8,agx_thor,854x480,N/A,N/A,23.8917,85.72,79.30,2566.15
|
| 69 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,text,1,agx_thor,N/A,N/A,N/A,17.2797,14.82,67.16,84.25
|
| 70 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,text,8,agx_thor,N/A,N/A,N/A,18.7864,109.02,72.64,175.13
|
| 71 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1280x720,2,6,18.3248,13.97,68.31,835.77
|
| 72 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1280x720,4,12,18.0996,14.14,67.47,825.91
|
| 73 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1920x1080,2,6,19.2352,13.31,67.93,1843.14
|
| 74 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1920x1080,4,12,19.5311,13.11,69.15,1828.39
|
| 75 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,854x480,2,6,18.0794,14.16,68.98,420.49
|
| 76 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,854x480,4,12,17.9946,14.23,68.62,425.62
|
| 77 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1280x720,2,6,23.2278,88.17,78.84,2177.68
|
| 78 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1280x720,4,12,22.9413,89.27,77.75,2179.41
|
| 79 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1920x1080,2,6,30.4954,67.16,91.76,5243.04
|
| 80 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1920x1080,4,12,29.9639,68.35,89.64,5256.77
|
| 81 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,854x480,2,6,20.3426,100.68,73.19,1094.31
|
| 82 |
+
Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,854x480,4,12,20.6727,99.07,74.40,1095.14
|