Skip to content

Commit

Permalink
server: tests - slow inference causes timeout on the CI (ggerganov#5715)
Browse files (browse the repository at this point in the history)
* server: tests - longer inference timeout for CI
  • Loading branch information
phymbert authored and hodlen committed Apr 1, 2024
1 parent f928471 commit 31d23c9
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 2 deletions.
2 changes: 1 addition & 1 deletion common/sampling.cpp
Original file line number | Diff line number | Diff line change
Expand Up @@ -266,7 +266,7 @@ static llama_token llama_sampling_sample_impl(
// }
//}

- LOG("sampled token: %5d: '%s'\n", id, llama_token_to_piece(ctx_main, id).c_str());
+ //LOG("sampled token: %5d: '%s'\n", id, llama_token_to_piece(ctx_main, id).c_str());
}
}

Expand Down
4 changes: 3 additions & 1 deletion examples/server/tests/features/steps/steps.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -699,6 +699,8 @@ async def wait_for_health_status(context,
if context.debug:
print(f"Starting checking for health for expected_health_status={expected_health_status}")
timeout = 3 # seconds
+ if expected_health_status == 'ok':
+ timeout = 10 # CI slow inference
interval = 0.5
counter = 0
async with aiohttp.ClientSession() as session:
Expand Down Expand Up @@ -736,7 +738,7 @@ async def wait_for_health_status(context,
if n_completions > 0:
return

- assert False, 'timeout exceeded'
+ assert False, f'{expected_health_status} timeout exceeded {counter}s>={timeout}'


def assert_embeddings(embeddings):
Expand Down

0 comments on commit 31d23c9

Please sign in to comment.