in optimum_benchmark/backends/py_txi/backend.py [0:0]
def tgi_kwargs(self):
    """Collect the explicitly configured TGI options as keyword arguments.

    Each option listed below is read from ``self.config``. Options whose
    value is ``None`` are left out, so the returned dict only contains
    settings that were actually set.

    Returns:
        dict: Mapping of option name to its configured value, with keys
        inserted in the order the options are listed below.

    Raises:
        AttributeError: If ``self.config`` lacks one of the listed options.
    """
    # Single source of truth for the forwarded options: the dict key and the
    # config attribute share one name, so they cannot drift apart.
    option_names = (
        "dtype",
        "sharded",
        "quantize",
        "num_shard",
        "speculate",
        "cuda_graphs",
        "trust_remote_code",
        "disable_custom_kernels",
    )

    config = self.config
    kwargs = {}
    for name in option_names:
        value = getattr(config, name)
        # Only None means "not set"; falsy values such as False or 0 are
        # legitimate settings and must still be forwarded.
        if value is not None:
            kwargs[name] = value
    return kwargs