llm_perf/hardware.yaml (38 lines of code) (raw):

# Hardware matrix: a list of machine entries, each with four keys.
#   machine  - identifier of the machine
#   hardware - device type; the values used in this file are `cuda` and `cpu`
#   subsets  - list of subset names enabled for the machine
#              (presumably quantization schemes; confirm against the consumer)
#   backends - list of backend names enabled for the machine
#
# NOTE(review): how these fields are consumed is not visible from this file;
# verify against the loader before renaming or reordering anything.

# --- cuda machines: all share the same subsets and the pytorch backend ---
- machine: 1xA10
  hardware: cuda
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  backends:
    - pytorch

- machine: 1xA100
  hardware: cuda
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  backends:
    - pytorch

- machine: 1xT4
  hardware: cuda
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  backends:
    - pytorch

# --- cpu machine: unquantized subset only, three backends ---
- machine: 32vCPU-C7i
  hardware: cpu
  subsets:
    - unquantized
  backends:
    - pytorch
    - openvino
    - onnxruntime