Jonna Marie Matthiesen committed on
Commit
e36fba8
·
1 Parent(s): 3ba0d66

Add Qwen3.5 AGX Thor benchmarks

Browse files
Files changed (2) hide show
  1. config.json +34 -0
  2. data/Qwen3.5.csv +82 -0
config.json CHANGED
@@ -135,6 +135,40 @@
135
  "agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
136
  "orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
137
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
138
  }
139
  }
140
  }
 
135
  "agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
136
  "orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.14.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
137
  }
138
+ },
139
+ "Qwen3.5-0.8B": {
140
+ "data_file": "data/Qwen3.5.csv",
141
+ "table_group_by": ["res", "fps"],
142
+ "experiment_setup": {
143
+ "agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
144
+ "agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
145
+ "orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
146
+ }
147
+ },
148
+ "Qwen3.5-2B": {
149
+ "data_file": "data/Qwen3.5.csv",
150
+ "table_group_by": ["res", "fps"],
151
+ "experiment_setup": {
152
+ "agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
153
+ "agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
154
+ "orin_nano": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
155
+ }
156
+ },
157
+ "Qwen3.5-4B": {
158
+ "data_file": "data/Qwen3.5.csv",
159
+ "table_group_by": ["res", "fps"],
160
+ "experiment_setup": {
161
+ "agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
162
+ "agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
163
+ }
164
+ },
165
+ "Qwen3.5-9B": {
166
+ "data_file": "data/Qwen3.5.csv",
167
+ "table_group_by": ["res", "fps"],
168
+ "experiment_setup": {
169
+ "agx_thor": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 arm64, 256 tokens generated, 10 warm-up runs, averaged over 25 runs.",
170
+ "agx_orin": "Measurement setup: NVIDIA AI IoT vLLM 0.16.0 tegra, 256 tokens generated, 10 warm-up runs, averaged over 25 runs."
171
+ }
172
  }
173
  }
174
  }
data/Qwen3.5.csv ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_family,model,type,batch,device,res,fps,frames,e2e,tps,tpot,ttft
2
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,1,agx_thor,1280x720,N/A,N/A,3.1547,81.15,9.63,689.01
3
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,1,agx_thor,1920x1080,N/A,N/A,3.0482,83.98,9.52,609.01
4
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,1,agx_thor,854x480,N/A,N/A,2.9693,86.22,9.53,527.85
5
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,8,agx_thor,1280x720,N/A,N/A,6.0349,339.36,9.41,2220.21
6
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,8,agx_thor,1920x1080,N/A,N/A,5.4511,375.70,10.32,1861.66
7
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,image,8,agx_thor,854x480,N/A,N/A,6.0003,341.32,9.42,2261.71
8
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,text,1,agx_thor,N/A,N/A,N/A,2.4818,103.15,9.48,53.33
9
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,text,8,agx_thor,N/A,N/A,N/A,2.4017,852.74,9.01,88.37
10
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1280x720,2,6,2.8887,88.62,9.52,450.19
11
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1280x720,4,12,2.6629,96.13,8.70,435.18
12
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1920x1080,2,6,3.3747,75.86,9.72,884.67
13
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,1920x1080,4,12,3.3594,76.20,9.63,892.37
14
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,854x480,2,6,2.6786,95.57,9.45,258.06
15
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,1,agx_thor,854x480,4,12,2.4043,106.48,8.43,245.77
16
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1280x720,2,6,4.7497,431.19,10.90,1235.70
17
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1280x720,4,12,4.8586,421.52,11.26,1243.70
18
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1920x1080,2,6,7.1575,286.14,12.02,2625.62
19
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,1920x1080,4,12,7.1667,285.77,11.90,2639.20
20
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,854x480,2,6,3.3770,606.46,9.37,594.63
21
+ Qwen3.5-0.8B,Qwen/Qwen3.5-0.8B,video,8,agx_thor,854x480,4,12,3.6522,560.76,10.42,602.73
22
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,image,1,agx_thor,1280x720,N/A,N/A,5.3602,47.76,17.58,859.56
23
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,image,1,agx_thor,1920x1080,N/A,N/A,5.3912,47.48,17.69,861.15
24
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,image,1,agx_thor,854x480,N/A,N/A,4.9181,52.05,16.54,683.47
25
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,image,8,agx_thor,1280x720,N/A,N/A,8.7155,234.98,20.03,2253.31
26
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,image,8,agx_thor,1920x1080,N/A,N/A,8.6447,236.91,20.00,2230.21
27
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,image,8,agx_thor,854x480,N/A,N/A,8.7861,233.10,19.94,2283.97
28
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,text,1,agx_thor,N/A,N/A,N/A,4.7835,53.52,18.45,58.28
29
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,text,8,agx_thor,N/A,N/A,N/A,5.0283,407.29,19.22,99.12
30
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1280x720,2,6,5.0749,50.44,17.94,480.60
31
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1280x720,4,12,5.0026,51.17,17.67,479.12
32
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1920x1080,2,6,5.5593,46.05,17.80,1002.52
33
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,1920x1080,4,12,5.5114,46.45,17.60,1004.64
34
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,854x480,2,6,4.4620,57.37,16.43,255.18
35
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,1,agx_thor,854x480,4,12,4.6379,55.20,17.09,261.74
36
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1280x720,2,6,7.1252,287.43,20.15,1253.66
37
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1280x720,4,12,7.2464,282.62,20.65,1253.71
38
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1920x1080,2,6,10.0072,204.65,23.88,2654.43
39
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,1920x1080,4,12,9.9937,204.93,23.86,2650.33
40
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,854x480,2,6,5.8224,351.75,18.88,595.93
41
+ Qwen3.5-2B,Qwen/Qwen3.5-2B,video,8,agx_thor,854x480,4,12,5.8278,351.42,18.92,595.51
42
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,image,1,agx_thor,1280x720,N/A,N/A,10.9790,23.32,36.40,1660.10
43
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,image,1,agx_thor,1920x1080,N/A,N/A,10.2370,25.01,36.68,846.99
44
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,image,1,agx_thor,854x480,N/A,N/A,10.2156,25.06,36.70,818.28
45
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,1280x720,N/A,N/A,15.3444,133.47,46.04,2455.68
46
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,1280x720,N/A,N/A,14.7126,139.20,45.80,2079.04
47
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,1920x1080,N/A,N/A,15.0641,135.95,46.11,2311.00
48
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,image,8,agx_thor,854x480,N/A,N/A,16.0785,127.38,46.35,2541.09
49
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,text,1,agx_thor,N/A,N/A,N/A,11.5369,22.19,44.83,59.20
50
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,text,8,agx_thor,N/A,N/A,N/A,10.0954,202.86,38.90,126.17
51
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1280x720,2,6,9.9871,25.63,36.42,662.34
52
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1280x720,4,12,10.0533,25.46,36.70,656.44
53
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1920x1080,2,6,10.9197,23.44,37.17,1403.77
54
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,1920x1080,4,12,10.8428,23.61,36.86,1404.92
55
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,854x480,2,6,9.7512,26.25,36.72,349.70
56
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,1,agx_thor,854x480,4,12,9.6476,26.54,36.35,340.00
57
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1280x720,2,6,13.8354,148.03,45.83,1455.86
58
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1280x720,4,12,13.7043,149.44,45.31,1458.86
59
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1920x1080,2,6,18.7536,109.21,55.61,3295.62
60
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,1920x1080,4,12,18.8363,108.73,55.97,3294.32
61
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,854x480,2,6,11.7998,173.56,41.68,733.10
62
+ Qwen3.5-4B,Qwen/Qwen3.5-4B,video,8,agx_thor,854x480,4,12,11.9580,171.27,42.30,727.69
63
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,image,1,agx_thor,1280x720,N/A,N/A,19.6150,13.05,68.86,1985.85
64
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,image,1,agx_thor,1920x1080,N/A,N/A,18.7188,13.68,69.17,1009.03
65
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,image,1,agx_thor,854x480,N/A,N/A,18.5157,13.83,68.41,1002.13
66
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,image,8,agx_thor,1280x720,N/A,N/A,23.8683,85.80,80.03,2400.06
67
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,image,8,agx_thor,1920x1080,N/A,N/A,24.3279,84.18,80.66,2649.78
68
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,image,8,agx_thor,854x480,N/A,N/A,23.8917,85.72,79.30,2566.15
69
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,text,1,agx_thor,N/A,N/A,N/A,17.2797,14.82,67.16,84.25
70
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,text,8,agx_thor,N/A,N/A,N/A,18.7864,109.02,72.64,175.13
71
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1280x720,2,6,18.3248,13.97,68.31,835.77
72
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1280x720,4,12,18.0996,14.14,67.47,825.91
73
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1920x1080,2,6,19.2352,13.31,67.93,1843.14
74
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,1920x1080,4,12,19.5311,13.11,69.15,1828.39
75
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,854x480,2,6,18.0794,14.16,68.98,420.49
76
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,1,agx_thor,854x480,4,12,17.9946,14.23,68.62,425.62
77
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1280x720,2,6,23.2278,88.17,78.84,2177.68
78
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1280x720,4,12,22.9413,89.27,77.75,2179.41
79
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1920x1080,2,6,30.4954,67.16,91.76,5243.04
80
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,1920x1080,4,12,29.9639,68.35,89.64,5256.77
81
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,854x480,2,6,20.3426,100.68,73.19,1094.31
82
+ Qwen3.5-9B,Qwen/Qwen3.5-9B,video,8,agx_thor,854x480,4,12,20.6727,99.07,74.40,1095.14