| { |
| "NVIDIA_T4": { |
| "name": "NVIDIA T4", |
| "cuda_cores": 2560, |
| "tensor_cores": 320, |
| "memory_gb": 16, |
| "memory_bandwidth_gbps": 320, |
| "base_clock_mhz": 585, |
| "boost_clock_mhz": 1590, |
| "sm_count": 40, |
| "fp32_tflops": 8.1, |
| "fp16_tflops": 65, |
| "tdp_watts": 70, |
| "compute_capability": 7.5, |
| "l2_cache_mb": 4 |
| }, |
| "NVIDIA_V100": { |
| "name": "NVIDIA V100", |
| "cuda_cores": 5120, |
| "tensor_cores": 640, |
| "memory_gb": 32, |
| "memory_bandwidth_gbps": 900, |
| "base_clock_mhz": 1230, |
| "boost_clock_mhz": 1530, |
| "sm_count": 80, |
| "fp32_tflops": 15.7, |
| "fp16_tflops": 125, |
| "tdp_watts": 300, |
| "compute_capability": 7.0, |
| "l2_cache_mb": 6 |
| }, |
| "NVIDIA_A10G": { |
| "name": "NVIDIA A10G", |
| "cuda_cores": 9216, |
| "tensor_cores": 288, |
| "memory_gb": 24, |
| "memory_bandwidth_gbps": 600, |
| "base_clock_mhz": 885, |
| "boost_clock_mhz": 1695, |
| "sm_count": 80, |
| "fp32_tflops": 31.2, |
| "fp16_tflops": 62.5, |
| "tdp_watts": 150, |
| "compute_capability": 8.6, |
| "l2_cache_mb": 6 |
| }, |
| "NVIDIA_A100_40GB": { |
| "name": "NVIDIA A100 40GB", |
| "cuda_cores": 6912, |
| "tensor_cores": 432, |
| "memory_gb": 40, |
| "memory_bandwidth_gbps": 1555, |
| "base_clock_mhz": 765, |
| "boost_clock_mhz": 1410, |
| "sm_count": 108, |
| "fp32_tflops": 19.5, |
| "fp16_tflops": 312, |
| "tdp_watts": 400, |
| "compute_capability": 8.0, |
| "l2_cache_mb": 40 |
| }, |
| "NVIDIA_A100_80GB": { |
| "name": "NVIDIA A100 80GB", |
| "cuda_cores": 6912, |
| "tensor_cores": 432, |
| "memory_gb": 80, |
| "memory_bandwidth_gbps": 2039, |
| "base_clock_mhz": 765, |
| "boost_clock_mhz": 1410, |
| "sm_count": 108, |
| "fp32_tflops": 19.5, |
| "fp16_tflops": 312, |
| "tdp_watts": 400, |
| "compute_capability": 8.0, |
| "l2_cache_mb": 40 |
| }, |
| "NVIDIA_L4": { |
| "name": "NVIDIA L4", |
| "cuda_cores": 7424, |
| "tensor_cores": 232, |
| "memory_gb": 24, |
| "memory_bandwidth_gbps": 300, |
| "base_clock_mhz": 795, |
| "boost_clock_mhz": 2040, |
| "sm_count": 58, |
| "fp32_tflops": 30.3, |
| "fp16_tflops": 121, |
| "tdp_watts": 72, |
| "compute_capability": 8.9, |
| "l2_cache_mb": 48 |
| }, |
| "NVIDIA_L40S": { |
| "name": "NVIDIA L40S", |
| "cuda_cores": 18176, |
| "tensor_cores": 568, |
| "memory_gb": 48, |
| "memory_bandwidth_gbps": 864, |
| "base_clock_mhz": 1110, |
| "boost_clock_mhz": 2520, |
| "sm_count": 142, |
| "fp32_tflops": 91.6, |
| "fp16_tflops": 183.2, |
| "tdp_watts": 350, |
| "compute_capability": 8.9, |
| "l2_cache_mb": 96 |
| }, |
| "NVIDIA_RTX_3090": { |
| "name": "NVIDIA RTX 3090", |
| "cuda_cores": 10496, |
| "tensor_cores": 328, |
| "memory_gb": 24, |
| "memory_bandwidth_gbps": 936, |
| "base_clock_mhz": 1395, |
| "boost_clock_mhz": 1695, |
| "sm_count": 82, |
| "fp32_tflops": 35.6, |
| "fp16_tflops": 71, |
| "tdp_watts": 350, |
| "compute_capability": 8.6, |
| "l2_cache_mb": 6 |
| }, |
| "NVIDIA_RTX_4090": { |
| "name": "NVIDIA RTX 4090", |
| "cuda_cores": 16384, |
| "tensor_cores": 512, |
| "memory_gb": 24, |
| "memory_bandwidth_gbps": 1008, |
| "base_clock_mhz": 2235, |
| "boost_clock_mhz": 2520, |
| "sm_count": 128, |
| "fp32_tflops": 82.6, |
| "fp16_tflops": 165.2, |
| "tdp_watts": 450, |
| "compute_capability": 8.9, |
| "l2_cache_mb": 72 |
| }, |
| "NVIDIA_H100_SXM": { |
| "name": "NVIDIA H100 SXM", |
| "cuda_cores": 16896, |
| "tensor_cores": 528, |
| "memory_gb": 80, |
| "memory_bandwidth_gbps": 3350, |
| "base_clock_mhz": 1095, |
| "boost_clock_mhz": 1830, |
| "sm_count": 132, |
| "fp32_tflops": 67, |
| "fp16_tflops": 989, |
| "tdp_watts": 700, |
| "compute_capability": 9.0, |
| "l2_cache_mb": 50 |
| }, |
| "NVIDIA_H100_PCIe": { |
| "name": "NVIDIA H100 PCIe", |
| "cuda_cores": 14592, |
| "tensor_cores": 456, |
| "memory_gb": 80, |
| "memory_bandwidth_gbps": 2039, |
| "base_clock_mhz": 1095, |
| "boost_clock_mhz": 1620, |
| "sm_count": 114, |
| "fp32_tflops": 48, |
| "fp16_tflops": 756, |
| "tdp_watts": 350, |
| "compute_capability": 9.0, |
| "l2_cache_mb": 50 |
| }, |
| "NVIDIA_RTX_A6000": { |
| "name": "NVIDIA RTX A6000", |
| "cuda_cores": 10752, |
| "tensor_cores": 336, |
| "memory_gb": 48, |
| "memory_bandwidth_gbps": 768, |
| "base_clock_mhz": 1410, |
| "boost_clock_mhz": 1860, |
| "sm_count": 84, |
| "fp32_tflops": 38.7, |
| "fp16_tflops": 77.4, |
| "tdp_watts": 300, |
| "compute_capability": 8.6, |
| "l2_cache_mb": 6 |
| } |
| } |