Skip to content

Commit

Permalink
Increase time before failing a node when it is unresponsive
Browse files Browse the repository at this point in the history
  • Loading branch information
hmusum committed Nov 7, 2024
1 parent 87f170b commit c70ebbf
Showing 1 changed file with 4 additions and 1 deletion.
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,8 @@
import java.util.List;
import java.util.concurrent.CopyOnWriteArrayList;

import static com.yahoo.config.provision.CloudName.YAHOO;

/**
* A component which sets up all the node repo maintenance jobs.
*
Expand Down Expand Up @@ -144,7 +146,8 @@ private static class DefaultTimes {
hostResumeProvisionerInterval = Duration.ofMinutes(3);
diskReplacerInterval = Duration.ofMinutes(3);
failedExpirerInterval = Duration.ofMinutes(10);
failGrace = Duration.ofMinutes(10);
// Nodes in the Yahoo cloud take longer to start (more than 10 minutes), so give them a longer grace period before failing them
failGrace = zone.cloud().name() == YAHOO ? Duration.ofMinutes(20) : Duration.ofMinutes(10);
infrastructureProvisionInterval = Duration.ofMinutes(3);
loadBalancerExpirerInterval = Duration.ofMinutes(5);
loadBalancerPreProvisionerInterval = Duration.ofMinutes(1);
Expand Down

0 comments on commit c70ebbf

Please sign in to comment.