in use-cases/inferencing/benchmark/src/tasks.py [0:0]
def test1(self):
headers = {"content-type": "application/json"}
r = self.client.post(
"/v1/chat/completions",
json={
"model": self.model_id,
"messages": [{"role": "user", "content": self.message1}],
"temperature": 0.5,
"top_k": 1.0,
"top_p": 1.0,
"max_tokens": 256,
},
headers=headers,
)