ollama/server/upload.go

182 lines
4.3 KiB
Go
Raw Normal View History

2023-08-22 11:50:21 -04:00
package server
import (
"context"
"errors"
"fmt"
"io"
"log"
"net/http"
"net/url"
"os"
"strconv"
"github.com/jmorganca/ollama/api"
)
// startUpload opens a blob upload session on the registry and returns the URL
// that the upload must be sent to.
//
// It issues a POST to <base>/v2/<namespace/repository>/blobs/uploads/. When
// layer.From is non-empty, the query parameters mount=<layer.Digest> and
// from=<layer.From> are appended to the request URL. The returned URL is parsed
// from the Location header of the response; a response without that header is
// reported as an error.
func startUpload(ctx context.Context, mp ModelPath, layer *Layer, regOpts *RegistryOptions) (*url.URL, error) {
	uploadURL := mp.BaseURL().JoinPath("v2", mp.GetNamespaceRepository(), "blobs/uploads/")

	if layer.From != "" {
		query := uploadURL.Query()
		query.Add("mount", layer.Digest)
		query.Add("from", layer.From)
		uploadURL.RawQuery = query.Encode()
	}

	resp, err := makeRequestWithRetry(ctx, "POST", uploadURL, nil, nil, regOpts)
	if err != nil {
		log.Printf("couldn't start upload: %v", err)
		return nil, err
	}
	defer resp.Body.Close()

	// The upload session URL is carried in the Location header.
	if location := resp.Header.Get("Location"); location != "" {
		return url.Parse(location)
	}

	return nil, fmt.Errorf("location header is missing in response")
}
2023-08-28 18:35:18 -04:00
func uploadBlobChunked(ctx context.Context, requestURL *url.URL, layer *Layer, regOpts *RegistryOptions, fn func(api.ProgressResponse)) error {
2023-08-22 11:50:21 -04:00
// TODO allow resumability
// TODO allow canceling uploads via DELETE
fp, err := GetBlobsPath(layer.Digest)
if err != nil {
return err
}
f, err := os.Open(fp)
if err != nil {
return err
}
defer f.Close()
2023-08-25 18:38:39 -04:00
// 95MB chunk size
chunkSize := 95 * 1024 * 1024
2023-09-14 12:54:05 -04:00
pw := ProgressWriter{
status: fmt.Sprintf("uploading %s", layer.Digest),
digest: layer.Digest,
total: layer.Size,
fn: fn,
}
2023-08-22 11:50:21 -04:00
2023-08-26 11:28:35 -04:00
for offset := int64(0); offset < int64(layer.Size); {
chunk := int64(layer.Size) - offset
2023-08-22 11:50:21 -04:00
if chunk > int64(chunkSize) {
chunk = int64(chunkSize)
}
2023-08-26 11:28:35 -04:00
sectionReader := io.NewSectionReader(f, int64(offset), chunk)
2023-09-14 12:54:05 -04:00
var errStatus error
2023-08-26 11:28:35 -04:00
for try := 0; try < MaxRetries; try++ {
2023-09-14 12:54:05 -04:00
errStatus = nil
2023-08-26 11:28:35 -04:00
headers := make(http.Header)
headers.Set("Content-Type", "application/octet-stream")
headers.Set("Content-Length", strconv.Itoa(int(chunk)))
headers.Set("Content-Range", fmt.Sprintf("%d-%d", offset, offset+sectionReader.Size()-1))
2023-09-14 12:54:05 -04:00
resp, err := makeRequest(ctx, "PATCH", requestURL, headers, io.TeeReader(sectionReader, &pw), regOpts)
2023-08-26 11:28:35 -04:00
if err != nil && !errors.Is(err, io.EOF) {
fn(api.ProgressResponse{
Status: fmt.Sprintf("error uploading chunk: %v", err),
Digest: layer.Digest,
Total: layer.Size,
Completed: int(offset),
})
return err
}
defer resp.Body.Close()
2023-08-27 00:55:21 -04:00
switch {
case resp.StatusCode == http.StatusUnauthorized:
2023-09-14 12:54:05 -04:00
errStatus = errors.New("unauthorized")
2023-09-07 15:01:50 -04:00
2023-08-26 11:28:35 -04:00
auth := resp.Header.Get("www-authenticate")
authRedir := ParseAuthRedirectString(auth)
2023-09-13 14:46:29 -04:00
token, err := getAuthToken(ctx, authRedir)
2023-08-26 11:28:35 -04:00
if err != nil {
return err
}
regOpts.Token = token
2023-09-14 12:54:05 -04:00
pw.completed = int(offset)
sectionReader = io.NewSectionReader(f, offset, chunk)
2023-08-26 11:28:35 -04:00
continue
2023-08-27 00:55:21 -04:00
case resp.StatusCode >= http.StatusBadRequest:
2023-08-26 11:28:35 -04:00
body, _ := io.ReadAll(resp.Body)
return fmt.Errorf("on upload registry responded with code %d: %s", resp.StatusCode, body)
}
offset += sectionReader.Size()
requestURL, err = url.Parse(resp.Header.Get("Location"))
if err != nil {
return err
}
2023-08-22 11:50:21 -04:00
break
}
2023-09-14 12:54:05 -04:00
if errStatus != nil {
return fmt.Errorf("max retries exceeded: %w", errStatus)
}
2023-08-22 11:50:21 -04:00
}
values := requestURL.Query()
values.Add("digest", layer.Digest)
requestURL.RawQuery = values.Encode()
headers := make(http.Header)
headers.Set("Content-Type", "application/octet-stream")
headers.Set("Content-Length", "0")
// finish the upload
resp, err := makeRequest(ctx, "PUT", requestURL, headers, nil, regOpts)
if err != nil {
log.Printf("couldn't finish upload: %v", err)
return err
}
defer resp.Body.Close()
2023-08-27 00:55:21 -04:00
if resp.StatusCode >= http.StatusBadRequest {
2023-08-22 11:50:21 -04:00
body, _ := io.ReadAll(resp.Body)
return fmt.Errorf("on finish upload registry responded with code %d: %v", resp.StatusCode, string(body))
}
return nil
}
2023-09-14 12:54:05 -04:00
// ProgressWriter counts the bytes passed to its Write method and forwards
// throttled progress updates to fn.
type ProgressWriter struct {
	// status and digest are copied into every progress update.
	status, digest string

	// bucket is the number of bytes written since the last update was sent,
	// completed is the running count of bytes written, and total is the value
	// reported as Total and compared against completed to detect the end.
	bucket, completed, total int

	// fn receives each progress update.
	fn func(api.ProgressResponse)
}
// Write accounts for len(b) bytes and always reports them as written with a
// nil error; the contents of b are not inspected.
//
// To avoid spamming the client, an update is sent to pw.fn only once at least
// 1024*1024 bytes have accumulated since the previous update, or once the
// completed count has reached pw.total. Sending an update resets the
// accumulator.
func (pw *ProgressWriter) Write(b []byte) (int, error) {
	written := len(b)
	pw.bucket += written
	pw.completed += written

	// Not enough new data yet and the transfer is not finished: stay quiet.
	if pw.bucket < 1024*1024 && pw.completed < pw.total {
		return written, nil
	}

	update := api.ProgressResponse{
		Status:    pw.status,
		Digest:    pw.digest,
		Total:     pw.total,
		Completed: pw.completed,
	}
	pw.fn(update)
	pw.bucket = 0

	return written, nil
}