in gpu-workload/triton/loadgenerator/locustfile.py [0:0]
def bert(self):
    """Send one inference request and record its outcome.

    POSTs ``self.data`` (serialized with ``json.dumps``) to
    ``self.infer_url`` through ``self.client``. A 200 status is marked as
    a success; any other status is marked as a failure whose message is
    the status code followed by the reason phrase.
    """
    # catch_response=True makes the client hand back a context manager, so
    # the success/failure verdict is decided explicitly below.
    # NOTE(review): presumably Locust's HTTP client -- confirm against the
    # enclosing user class, which is not visible here.
    pending = self.client.post(
        self.infer_url,
        data=json.dumps(self.data),
        catch_response=True,
    )
    with pending as response:
        if response.status_code != 200:
            response.failure(f'{response.status_code} {response.reason}')
            return
        response.success()