Skip to content

Commit

Permalink
update
Browse files Browse the repository at this point in the history
ZeldaHuang committed Dec 19, 2024
1 parent 1b82ce1 commit fc18695
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion benchmark/benchmark_serving.py
Original file line number Diff line number Diff line change
@@ -102,7 +102,7 @@ async def query_model_vllm(prompt, verbose, ip_ports):
if verbose:
print('Done')

- output = await resp.json()
+ output = await resp.json(content_type='text/plain')
# necessary for latency calc
output['response_len'] = expected_response_len
if verbose and 'generated_text' in output:
2 changes: 1 addition & 1 deletion tests/e2e_test/test_e2e.py
Original file line number Diff line number Diff line change
@@ -36,7 +36,7 @@ async def get_llumnix_response(prompt, sampling_params, ip_ports):

async with aiohttp.ClientSession(timeout=timeout) as session:
async with session.post(f'http://{ip_ports}/generate', json=request) as resp:
- output = await resp.json()
+ output = await resp.json('text/plain')
return output

prompts = [

0 comments on commit fc18695

Please sign in to comment.