Skip to content

Commit

Permalink
Merge pull request bytedance#84 from bytedance/jzs/fix_vendor_zoo
Browse files Browse the repository at this point in the history
fix vendor_zoo nvidia cards.
  • Loading branch information
suisiyuan authored Jul 9, 2024
2 parents 0dbf19b + e618946 commit d9054cb
Show file tree
Hide file tree
Showing 7 changed files with 93 additions and 40 deletions.
15 changes: 11 additions & 4 deletions vendor_zoo/NVIDIA/A10-PCIe.json
Original file line number Diff line number Diff line change
Expand Up @@ -38,20 +38,23 @@
},
"标量参数": {
"标量精度": null,
"INT8标量算力(TFLOPS)": null,
"INT8标量算力(TOPS)": null,
"FP16标量算力(TFLOPS)": null,
"FP32标量算力(TFLOPS)": null
},
"向量参数": {
"向量精度": "FP32",
"INT8量算力(TFLOPS)": null,
"INT8向量算力(TOPS)": null,
"FP16向量算力(TFLOPS)": null,
"FP32向量算力(TFLOPS)": 31.2
},
"张量参数": {
"张量精度": "TF32, FP16, BF16, INT8, INT4",
"INT8张量算力(TFLOPS)": 250.0,
"INT4张量算力(TOPS)": 500.0,
"INT8张量算力(TOPS)": 250.0,
"BF16张量算力(TFLOPS)": 125.0,
"FP16张量算力(TFLOPS)": 125.0,
"TF32张量算力(TFLOPS)": 62.5,
"FP32张量算力(TFLOPS)": null
}
},
Expand All @@ -61,5 +64,9 @@
"RDMA协议": null,
"下行带宽(GB/s)": null,
"上行带宽(GB/s)": null
}
},
"数据源": [
"https://www.nvidia.com/content/dam/en-zz/Solutions/Data-Center/a10/pdf/datasheet-new/nvidia-a10-datasheet.pdf",
"https://www.techpowerup.com/gpu-specs/a10-pcie.c3793"
]
}
20 changes: 14 additions & 6 deletions vendor_zoo/NVIDIA/A100-PCIe.json
Original file line number Diff line number Diff line change
Expand Up @@ -38,21 +38,25 @@
},
"标量参数": {
"标量精度": null,
"INT8标量算力(TFLOPS)": null,
"INT8标量算力(TOPS)": null,
"FP16标量算力(TFLOPS)": null,
"FP32标量算力(TFLOPS)": null
},
"向量参数": {
"向量精度": "FP64, FP32, TF32",
"INT8量算力(TFLOPS)": null,
"INT8向量算力(TOPS)": null,
"FP16向量算力(TFLOPS)": null,
"FP32向量算力(TFLOPS)": 19.5
"FP32向量算力(TFLOPS)": 19.5,
"FP64向量算力(TFLOPS)": 9.7
},
"张量参数": {
"张量精度": "FP64, FP32, TF32, FP16, BF16, INT8",
"INT8张量算力(TFLOPS)": 624.0,
"INT8张量算力(TOPS)": 624.0,
"BF16张量算力(TFLOPS)": 312.0,
"FP16张量算力(TFLOPS)": 312.0,
"FP32张量算力(TFLOPS)": 156.0
"TF32张量算力(TFLOPS)": 156.0,
"FP32张量算力(TFLOPS)": null,
"FP64张量算力(TFLOPS)": 19.5
}
},
"卡间通信参数": {
Expand All @@ -61,5 +65,9 @@
"RDMA协议": null,
"下行带宽(GB/s)": null,
"上行带宽(GB/s)": null
}
},
"数据源": [
"https://www.nvidia.com/content/dam/en-zz/Solutions/Data-Center/a100/pdf/nvidia-a100-datasheet-nvidia-us-2188504-web.pdf",
"https://www.techpowerup.com/gpu-specs/a100-pcie-80-gb.c3821"
]
}
22 changes: 15 additions & 7 deletions vendor_zoo/NVIDIA/A100-SXM4.json
Original file line number Diff line number Diff line change
Expand Up @@ -38,21 +38,25 @@
},
"标量参数": {
"标量精度": null,
"INT8标量算力(TFLOPS)": null,
"INT8标量算力(TOPS)": null,
"FP16标量算力(TFLOPS)": null,
"FP32标量算力(TFLOPS)": null
},
"向量参数": {
"向量精度": "FP64, FP32, TF32",
"INT8量算力(TFLOPS)": null,
"INT8向量算力(TOPS)": null,
"FP16向量算力(TFLOPS)": null,
"FP32向量算力(TFLOPS)": 19.5
"FP32向量算力(TFLOPS)": 19.5,
"FP64向量算力(TFLOPS)": 9.7
},
"张量参数": {
"张量精度": "FP64, FP16, BF16, INT8",
"INT8张量算力(TFLOPS)": 624.0,
"张量精度": "FP64, FP32, TF32, FP16, BF16, INT8",
"INT8张量算力(TOPS)": 624.0,
"BF16张量算力(TFLOPS)": 312.0,
"FP16张量算力(TFLOPS)": 312.0,
"FP32张量算力(TFLOPS)": 156.0
"TF32张量算力(TFLOPS)": 156.0,
"FP32张量算力(TFLOPS)": null,
"FP64张量算力(TFLOPS)": 19.5
}
},
"卡间通信参数": {
Expand All @@ -61,5 +65,9 @@
"RDMA协议": null,
"下行带宽(GB/s)": null,
"上行带宽(GB/s)": null
}
},
"数据源": [
"https://www.nvidia.com/content/dam/en-zz/Solutions/Data-Center/a100/pdf/nvidia-a100-datasheet-nvidia-us-2188504-web.pdf",
"https://www.techpowerup.com/gpu-specs/a100-sxm4-80-gb.c3746"
]
}
23 changes: 16 additions & 7 deletions vendor_zoo/NVIDIA/A30-PCIe.json
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@
"内存": {
"内存类型": "HBM2e",
"内存容量(GB)": 24,
"内存带宽(GB/s)": 1223
"内存带宽(GB/s)": 933.1
},
"一级缓存": {
"缓存类型": "Cache(x56)",
Expand All @@ -38,21 +38,26 @@
},
"标量参数": {
"标量精度": null,
"INT8标量算力(TFLOPS)": null,
"INT8标量算力(TOPS)": null,
"FP16标量算力(TFLOPS)": null,
"FP32标量算力(TFLOPS)": null
},
"向量参数": {
"向量精度": "FP64, FP32",
"INT8量算力(TFLOPS)": null,
"INT8向量算力(TOPS)": null,
"FP16向量算力(TFLOPS)": null,
"FP32向量算力(TFLOPS)": 10.3
"FP32向量算力(TFLOPS)": 10.3,
"FP64向量算力(TFLOPS)": 5.2
},
"张量参数": {
"张量精度": "TF32, FP16, BF16, INT8, INT4",
"INT8张量算力(TFLOPS)": 330.0,
"INT4张量算力(TOPS)": 661.0,
"INT8张量算力(TOPS)": 330.0,
"BF16张量算力(TFLOPS)": 165.0,
"FP16张量算力(TFLOPS)": 165.0,
"FP32张量算力(TFLOPS)": 82.0
"TF32张量算力(TFLOPS)": 82.0,
"FP32张量算力(TFLOPS)": null,
"FP64张量算力(TFLOPS)": 10.3
}
},
"卡间通信参数": {
Expand All @@ -61,5 +66,9 @@
"RDMA协议": null,
"下行带宽(GB/s)": null,
"上行带宽(GB/s)": null
}
},
"数据源": [
"https://www.nvidia.com/content/dam/en-zz/Solutions/data-center/products/a30-gpu/pdf/a30-datasheet.pdf",
"https://www.techpowerup.com/gpu-specs/a30-pcie.c3792"
]
}
20 changes: 14 additions & 6 deletions vendor_zoo/NVIDIA/H100-PCIe.json
Original file line number Diff line number Diff line change
Expand Up @@ -38,21 +38,25 @@
},
"标量参数": {
"标量精度": null,
"INT8标量算力(TFLOPS)": null,
"INT8标量算力(TOPS)": null,
"FP16标量算力(TFLOPS)": null,
"FP32标量算力(TFLOPS)": null
},
"向量参数": {
"向量精度": "FP64, FP32",
"INT8量算力(TFLOPS)": null,
"INT8向量算力(TOPS)": null,
"FP16向量算力(TFLOPS)": null,
"FP32向量算力(TFLOPS)": 51.0
"FP32向量算力(TFLOPS)": 51.0,
"FP64向量算力(TFLOPS)": 26.0
},
"张量参数": {
"张量精度": "FP64, TF32, FP16, BF16, FP8, INT8",
"INT8张量算力(TFLOPS)": 3026.0,
"INT8张量算力(TOPS)": 3026.0,
"FP8张量算力(TFLOPS)": 3026.0,
"BF16张量算力(TFLOPS)": 1513.0,
"FP16张量算力(TFLOPS)": 1513.0,
"FP32张量算力(TFLOPS)": 756.0
"TF32张量算力(TFLOPS)": 756.0,
"FP64张量算力(TFLOPS)": 51.0
}
},
"卡间通信参数": {
Expand All @@ -61,5 +65,9 @@
"RDMA协议": null,
"下行带宽(GB/s)": null,
"上行带宽(GB/s)": null
}
},
"数据源": [
"https://resources.nvidia.com/en-us-tensor-core/nvidia-tensor-core-gpu-datasheet?ncid=no-ncid",
"https://www.techpowerup.com/gpu-specs/h100-pcie-80-gb.c3899"
]
}
20 changes: 14 additions & 6 deletions vendor_zoo/NVIDIA/H100-SXM5.json
Original file line number Diff line number Diff line change
Expand Up @@ -38,21 +38,25 @@
},
"标量参数": {
"标量精度": null,
"INT8标量算力(TFLOPS)": null,
"INT8标量算力(TOPS)": null,
"FP16标量算力(TFLOPS)": null,
"FP32标量算力(TFLOPS)": null
},
"向量参数": {
"向量精度": "FP64, FP32",
"INT8量算力(TFLOPS)": null,
"INT8向量算力(TOPS)": null,
"FP16向量算力(TFLOPS)": null,
"FP32向量算力(TFLOPS)": 67.0
"FP32向量算力(TFLOPS)": 67.0,
"FP64向量算力(TFLOPS)": 34.0
},
"张量参数": {
"张量精度": "FP64, TF32, FP16, BF16, FP8, INT8",
"INT8张量算力(TFLOPS)": 3958.0,
"INT8张量算力(TOPS)": 3958.0,
"FP8张量算力(TFLOPS)": 3958.0,
"BF16张量算力(TFLOPS)": 1979.0,
"FP16张量算力(TFLOPS)": 1979.0,
"FP32张量算力(TFLOPS)": 989.0
"TF32张量算力(TFLOPS)": 989.0,
"FP64张量算力(TFLOPS)": 67.0
}
},
"卡间通信参数": {
Expand All @@ -61,5 +65,9 @@
"RDMA协议": null,
"下行带宽(GB/s)": null,
"上行带宽(GB/s)": null
}
},
"数据源": [
"https://resources.nvidia.com/en-us-tensor-core/nvidia-tensor-core-gpu-datasheet?ncid=no-ncid",
"https://www.techpowerup.com/gpu-specs/h100-sxm5-80-gb.c3900"
]
}
13 changes: 9 additions & 4 deletions vendor_zoo/NVIDIA/T4.json
Original file line number Diff line number Diff line change
Expand Up @@ -38,19 +38,20 @@
},
"标量参数": {
"标量精度": null,
"INT8标量算力(TFLOPS)": null,
"INT8标量算力(TOPS)": null,
"FP16标量算力(TFLOPS)": null,
"FP32标量算力(TFLOPS)": null
},
"向量参数": {
"向量精度": "FP32",
"INT8量算力(TFLOPS)": null,
"INT8向量算力(TOPS)": null,
"FP16向量算力(TFLOPS)": null,
"FP32向量算力(TFLOPS)": 8.1
},
"张量参数": {
"张量精度": "FP16, INT8, INT4",
"INT8张量算力(TFLOPS)": 130.0,
"INT4张量算力(TOPS)": 260.0,
"INT8张量算力(TOPS)": 130.0,
"FP16张量算力(TFLOPS)": 65.0,
"FP32张量算力(TFLOPS)": null
}
Expand All @@ -61,5 +62,9 @@
"RDMA协议": null,
"下行带宽(GB/s)": null,
"上行带宽(GB/s)": null
}
},
"数据源": [
"https://www.nvidia.com/en-us/data-center/tesla-t4/",
"https://www.techpowerup.com/gpu-specs/tesla-t4.c3316"
]
}

0 comments on commit d9054cb

Please sign in to comment.