increase default healthCheckTimeout to 120s and gracefulStopTimeout to 10s

mostlygeek · mostlygeek · commit 02ee29d8813f · 2025-05-26T09:57:53.000-07:00
diff --git a/README.md b/README.md
@@ -63,9 +63,10 @@ models:
 <summary>But also very powerful ...</summary>
 
 ```yaml
-# Seconds to wait for llama.cpp to load and be ready to serve requests
-# Default (and minimum) is 15 seconds
-healthCheckTimeout: 60
+# Seconds to wait for upstream to load and be ready to serve requests
+# Minimum is 15 seconds; smaller non-zero values are raised to 15
+# Default is 120 seconds, used when the setting is omitted or 0
+healthCheckTimeout: 500
 
 # Valid log levels: debug, info (default), warn, error
 logLevel: info
diff --git a/proxy/config.go b/proxy/config.go
@@ -113,7 +113,12 @@ func LoadConfigFromReader(r io.Reader) (Config, error) {
 		return Config{}, err
 	}
 
-	if config.HealthCheckTimeout < 15 {
+	if config.HealthCheckTimeout == 0 {
+		// this high default timeout helps avoid failing health checks
+		// for configurations that wait for docker or have slower startup
+		config.HealthCheckTimeout = 120
+	} else if config.HealthCheckTimeout < 15 {
+		// set a minimum of 15 seconds
 		config.HealthCheckTimeout = 15
 	}
 
diff --git a/proxy/process.go b/proxy/process.go
@@ -100,7 +100,7 @@ func NewProcess(ID string, healthCheckTimeout int, config ModelConfig, processLo
 		concurrencyLimitSemaphore: make(chan struct{}, concurrentLimit),
 
 		// stop timeout
-		gracefulStopTimeout:        5 * time.Second,
+		gracefulStopTimeout:        10 * time.Second,
 		upstreamWasStoppedWithKill: false,
 	}
 }

Original file line number	Diff line number	Diff line change
`@@ -113,7 +113,12 @@ func LoadConfigFromReader(r io.Reader) (Config, error) {`
`113`	`113`	`return Config{}, err`
`114`	`114`	`}`
`115`	`115`
`116`		`- if config.HealthCheckTimeout < 15 {`
	`116`	`+ if config.HealthCheckTimeout == 0 {`
	`117`	`+ // this high default timeout helps avoid failing health checks`
	`118`	`+ // for configurations that wait for docker or have slower startup`
	`119`	`+ config.HealthCheckTimeout = 120`
	`120`	`+ } else if config.HealthCheckTimeout < 15 {`
	`121`	`+ // set a minimum of 15 seconds`
`117`	`122`	`config.HealthCheckTimeout = 15`
`118`	`123`	`}`
`119`	`124`
Original file line number	Diff line number	Diff line change
`@@ -100,7 +100,7 @@ func NewProcess(ID string, healthCheckTimeout int, config ModelConfig, processLo`
`100`	`100`	`concurrencyLimitSemaphore: make(chan struct{}, concurrentLimit),`
`101`	`101`
`102`	`102`	`// stop timeout`
`103`		`- gracefulStopTimeout: 5 * time.Second,`
	`103`	`+ gracefulStopTimeout: 10 * time.Second,`
`104`	`104`	`upstreamWasStoppedWithKill: false,`
`105`	`105`	`}`
`106`	`106`	`}`