# llm_perf/hardware.yaml
# Hardware matrix: one list entry per machine.
#
# Keys of each entry:
#   machine  - identifier of the machine
#   hardware - device type of the machine (`cuda` or `cpu` in this file)
#   subsets  - names of the subsets listed for this machine
#   backends - names of the backends listed for this machine
#
# NOTE(review): the nesting below was reconstructed from the repeating
# machine/hardware/subsets/backends pattern - confirm it matches the schema
# expected by the code that loads this file.

- machine: 1xA10
  hardware: cuda
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  backends:
    - pytorch

- machine: 1xA100
  hardware: cuda
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  backends:
    - pytorch

- machine: 1xT4
  hardware: cuda
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  backends:
    - pytorch

# The only CPU entry: a single subset, but three backends.
- machine: 32vCPU-C7i
  hardware: cpu
  subsets:
    - unquantized
  backends:
    - pytorch
    - openvino
    - onnxruntime