Skip to content

Commit

Permalink
Try 5% fails
Browse files Browse the repository at this point in the history
  • Loading branch information
borzunov committed Oct 23, 2023
1 parent 82a97d6 commit 63282af
Show file tree
Hide file tree
Showing 2 changed files with 7 additions and 1 deletion.
2 changes: 1 addition & 1 deletion src/petals/client/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ class ClientConfig:

max_retries: Optional[int] = DEFAULT_MAX_RETRIES # max number of retries before an exception (default: inf)
min_backoff: float = 1 # after a repeated failure, sleep for this many seconds times 2 ** (num_failures - 1)
- max_backoff: float = 60 # limit maximal sleep time between retries to this value
+ max_backoff: float = 5 # limit maximal sleep time between retries to this value
ban_timeout: float = 15 # when a remote peer fails to respond, prevent routing to that peer for this many seconds
active_adapter: Optional[str] = None # name of active LoRA adapter (usually, Hugging Face repo)

Expand Down
6 changes: 6 additions & 0 deletions src/petals/client/inference_session.py
Original file line number Diff line number Diff line change
Expand Up @@ -144,6 +144,12 @@ def step(
)
)
)

+ import random
+
+ if random.random() < 0.05:
+     raise Exception("fail")

outputs = list(map(deserialize_torch_tensor, outputs_serialized.tensors))
assert (
outputs[0].shape == inputs.shape
Expand Down

0 comments on commit 63282af

Please sign in to comment.