diff --git a/llama/runner/runner.go b/llama/runner/runner.go index c0bc8b6a..43a70f30 100644 --- a/llama/runner/runner.go +++ b/llama/runner/runner.go @@ -184,6 +184,10 @@ func (s *Server) run(ctx context.Context) { seq.iBatch = batch.NumTokens() - 1 } + if batch.NumTokens() == 0 { + continue + } + err := s.lc.Decode(batch) if err != nil { slog.Error("failed to decode batch", "error", err)