diff --git a/docs/api.md b/docs/api.md index 65aefc25..7415101b 100644 --- a/docs/api.md +++ b/docs/api.md @@ -23,6 +23,10 @@ Model names follow a `model:tag` format. Some examples are `orca-mini:3b-q4_1` a All durations are returned in nanoseconds. +### Streaming responses + +Certain endpoints stream responses as JSON objects delimited with the newline (`\n`) character. + ## Generate a completion ```shell diff --git a/server/routes.go b/server/routes.go index 6ca7b428..c68011df 100644 --- a/server/routes.go +++ b/server/routes.go @@ -610,6 +610,7 @@ func streamResponse(c *gin.Context, ch chan any) { return false } + // Delineate chunks with new-line delimiter bts = append(bts, '\n') if _, err := w.Write(bts); err != nil { log.Printf("streamResponse: w.Write failed with %s", err)