Merge pull request #3566 from dhiltgen/more_time

Handle very slow model loads
This commit is contained in:
Daniel Hiltgen 2024-04-09 16:53:49 -07:00 committed by GitHub
commit 4c7db6b7e9
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -383,7 +383,8 @@ func (s *LlamaServer) Ping(ctx context.Context) error {
func (s *LlamaServer) waitUntilRunning() error {
start := time.Now()
-expiresAt := time.Now().Add(3 * time.Minute) // be generous with timeout, large models can take a while to load
+// TODO we need to wire up a better way to detect hangs during model load and startup of the server
+expiresAt := time.Now().Add(10 * time.Minute) // be generous with timeout, large models can take a while to load
ticker := time.NewTicker(50 * time.Millisecond)
defer ticker.Stop()