474 lines
11 KiB
Go
474 lines
11 KiB
Go
package registry
|
|
|
|
import (
|
|
"bufio"
|
|
"bytes"
|
|
"cmp"
|
|
"context"
|
|
"crypto/sha256"
|
|
"encoding/json"
|
|
"errors"
|
|
"fmt"
|
|
"io"
|
|
"net"
|
|
"net/http/httptest"
|
|
"net/url"
|
|
"os"
|
|
"os/exec"
|
|
"strconv"
|
|
"syscall"
|
|
"testing"
|
|
"time"
|
|
|
|
"github.com/minio/minio-go/v7"
|
|
"github.com/minio/minio-go/v7/pkg/credentials"
|
|
"github.com/ollama/ollama/x/registry/apitype"
|
|
"github.com/ollama/ollama/x/utils/backoff"
|
|
"github.com/ollama/ollama/x/utils/upload"
|
|
"kr.dev/diff"
|
|
)
|
|
|
|
// const ref = "registry.ollama.ai/x/y:latest+Z"
|
|
// const manifest = `{
|
|
// "layers": [
|
|
// {"digest": "sha256-1", "size": 1},
|
|
// {"digest": "sha256-2", "size": 2},
|
|
// {"digest": "sha256-3", "size": 3}
|
|
// ]
|
|
// }`
|
|
|
|
// ts := newTestServer(t)
|
|
// ts.pushNotOK(ref, `{}`, &ollama.Error{
|
|
// Status: 400,
|
|
// Code: "invalid",
|
|
// Message: "name must be fully qualified",
|
|
// })
|
|
|
|
// ts.push(ref, `{
|
|
// "layers": [
|
|
// {"digest": "sha256-1", "size": 1},
|
|
// {"digest": "sha256-2", "size": 2},
|
|
// {"digest": "sha256-3", "size": 3}
|
|
// ]
|
|
// }`)
|
|
|
|
type tWriter struct {
|
|
t *testing.T
|
|
}
|
|
|
|
func (w tWriter) Write(p []byte) (n int, err error) {
|
|
w.t.Logf("%s", p)
|
|
return len(p), nil
|
|
}
|
|
|
|
func TestPushBasic(t *testing.T) {
|
|
const MB = 1024 * 1024
|
|
|
|
mc := startMinio(t, true)
|
|
|
|
defer func() {
|
|
mcc := &minio.Core{Client: mc}
|
|
// fail if there are any incomplete uploads
|
|
for x := range mcc.ListIncompleteUploads(context.Background(), "test", "theKey", true) {
|
|
t.Errorf("incomplete: %v", x)
|
|
}
|
|
}()
|
|
|
|
const ref = "registry.ollama.ai/x/y:latest+Z"
|
|
|
|
// Upload two small layers and one large layer that will
|
|
// trigger a multipart upload.
|
|
manifest := []byte(`{
|
|
"layers": [
|
|
{"digest": "sha256-1", "size": 1},
|
|
{"digest": "sha256-2", "size": 2},
|
|
{"digest": "sha256-3", "size": 11000000}
|
|
]
|
|
}`)
|
|
|
|
hs := httptest.NewServer(&Server{
|
|
minioClient: mc,
|
|
UploadChunkSize: 5 * MB,
|
|
})
|
|
t.Cleanup(hs.Close)
|
|
c := &Client{BaseURL: hs.URL}
|
|
|
|
requirements, err := c.Push(context.Background(), ref, manifest, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if len(requirements) < 3 {
|
|
t.Errorf("expected at least 3 requirements; got %d", len(requirements))
|
|
t.Logf("requirements: %v", requirements)
|
|
}
|
|
|
|
var uploaded []apitype.CompletePart
|
|
for i, r := range requirements {
|
|
t.Logf("[%d] pushing layer: offset=%d size=%d", i, r.Offset, r.Size)
|
|
|
|
cp, err := PushLayer(context.Background(), &abcReader{}, r.URL, r.Offset, r.Size)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
uploaded = append(uploaded, cp)
|
|
}
|
|
|
|
requirements, err = c.Push(context.Background(), ref, manifest, &PushParams{
|
|
CompleteParts: uploaded,
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if len(requirements) != 0 {
|
|
t.Errorf("unexpected requirements: %v", requirements)
|
|
}
|
|
|
|
var paths []string
|
|
keys := mc.ListObjects(context.Background(), "test", minio.ListObjectsOptions{
|
|
Recursive: true,
|
|
})
|
|
for k := range keys {
|
|
paths = append(paths, k.Key)
|
|
}
|
|
|
|
t.Logf("paths: %v", paths)
|
|
|
|
diff.Test(t, t.Errorf, paths, []string{
|
|
"blobs/sha256-1",
|
|
"blobs/sha256-2",
|
|
"blobs/sha256-3",
|
|
"manifests/registry.ollama.ai/x/y/latest/Z",
|
|
})
|
|
|
|
obj, err := mc.GetObject(context.Background(), "test", "manifests/registry.ollama.ai/x/y/latest/Z", minio.GetObjectOptions{})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer obj.Close()
|
|
|
|
var gotM apitype.Manifest
|
|
if err := json.NewDecoder(obj).Decode(&gotM); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
diff.Test(t, t.Errorf, gotM, apitype.Manifest{
|
|
Layers: []apitype.Layer{
|
|
{Digest: "sha256-1", Size: 1},
|
|
{Digest: "sha256-2", Size: 2},
|
|
{Digest: "sha256-3", Size: 3},
|
|
},
|
|
})
|
|
|
|
// checksum the blobs
|
|
for i, l := range gotM.Layers {
|
|
obj, err := mc.GetObject(context.Background(), "test", "blobs/"+l.Digest, minio.GetObjectOptions{})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer obj.Close()
|
|
|
|
info, err := obj.Stat()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
t.Logf("[%d] layer info: name=%q l.Size=%d size=%d", i, info.Key, l.Size, info.Size)
|
|
|
|
if msg := checkABCs(obj, int(l.Size)); msg != "" {
|
|
t.Errorf("[%d] %s", i, msg)
|
|
}
|
|
}
|
|
}
|
|
|
|
// TestBasicPresignS3MultipartReferenceDoNotDelete tests the basic flow of
|
|
// presigning a multipart upload, uploading the parts, and completing the
|
|
// upload. It is for future reference and should not be deleted. This flow
|
|
// is tricky and if we get it wrong in our server, we can refer back to this
|
|
// as a "back to basics" test/reference.
|
|
func TestBasicPresignS3MultipartReferenceDoNotDelete(t *testing.T) {
|
|
t.Skip("skipping reference test; unskip when needed")
|
|
|
|
mc := startMinio(t, true)
|
|
mcc := &minio.Core{Client: mc}
|
|
|
|
uploadID, err := mcc.NewMultipartUpload(context.Background(), "test", "theKey", minio.PutObjectOptions{})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
var completed []minio.CompletePart
|
|
const size int64 = 10 * 1024 * 1024
|
|
const chunkSize = 5 * 1024 * 1024
|
|
|
|
for partNumber, c := range upload.Chunks(size, chunkSize) {
|
|
u, err := mcc.Presign(context.Background(), "PUT", "test", "theKey", 15*time.Minute, url.Values{
|
|
"partNumber": {strconv.Itoa(partNumber)},
|
|
"uploadId": {uploadID},
|
|
})
|
|
if err != nil {
|
|
t.Fatalf("[partNumber=%d]: %v", partNumber, err)
|
|
}
|
|
t.Logf("[partNumber=%d]: %v", partNumber, u)
|
|
|
|
var body abcReader
|
|
cp, err := PushLayer(context.Background(), &body, u.String(), c.Offset, c.N)
|
|
if err != nil {
|
|
t.Fatalf("[partNumber=%d]: %v", partNumber, err)
|
|
}
|
|
t.Logf("completed part: %v", cp)
|
|
|
|
// behave like server here (don't cheat and use partNumber)
|
|
// instead get partNumber from the URL
|
|
retPartNumber, err := strconv.Atoi(u.Query().Get("partNumber"))
|
|
if err != nil {
|
|
t.Fatalf("[partNumber=%d]: %v", partNumber, err)
|
|
}
|
|
|
|
completed = append(completed, minio.CompletePart{
|
|
PartNumber: retPartNumber,
|
|
ETag: cp.ETag,
|
|
})
|
|
}
|
|
|
|
defer func() {
|
|
// fail if there are any incomplete uploads
|
|
for x := range mcc.ListIncompleteUploads(context.Background(), "test", "theKey", true) {
|
|
t.Errorf("incomplete: %v", x)
|
|
}
|
|
}()
|
|
|
|
info, err := mcc.CompleteMultipartUpload(context.Background(), "test", "theKey", uploadID, completed, minio.PutObjectOptions{})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
t.Logf("completed: %v", info)
|
|
|
|
// Check key in bucket
|
|
obj, err := mc.GetObject(context.Background(), "test", "theKey", minio.GetObjectOptions{})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer obj.Close()
|
|
|
|
h := sha256.New()
|
|
if _, err := io.Copy(h, obj); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
gotSum := h.Sum(nil)
|
|
|
|
h.Reset()
|
|
var body abcReader
|
|
if _, err := io.CopyN(h, &body, size); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
wantSum := h.Sum(nil)
|
|
|
|
if !bytes.Equal(gotSum, wantSum) {
|
|
t.Errorf("got sum = %x; want %x", gotSum, wantSum)
|
|
}
|
|
}
|
|
|
|
func availableAddr() string {
|
|
l, err := net.Listen("tcp", "localhost:0")
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
defer l.Close()
|
|
return l.Addr().String()
|
|
}
|
|
|
|
// tracing is "experimental" and may be removed in the future, I can't get it to
|
|
// work consistently, but I'm leaving it in for now.
|
|
func startMinio(t *testing.T, trace bool) *minio.Client {
|
|
t.Helper()
|
|
|
|
// Trace is enabled by setting the OLLAMA_MINIO_TRACE environment or
|
|
// explicitly setting trace to true.
|
|
trace = cmp.Or(trace, os.Getenv("OLLAMA_MINIO_TRACE") != "")
|
|
|
|
dir := t.TempDir()
|
|
|
|
t.Cleanup(func() {
|
|
// TODO(bmizerany): trim temp dir based on dates so that
|
|
// future runs may be able to inspect results for some time.
|
|
})
|
|
|
|
waitAndMaybeLogError := func(cmd *exec.Cmd) {
|
|
if err := cmd.Wait(); err != nil {
|
|
var e *exec.ExitError
|
|
if errors.As(err, &e) {
|
|
if e.Exited() {
|
|
return
|
|
}
|
|
t.Logf("startMinio: %s stderr: %s", cmd.Path, e.Stderr)
|
|
t.Logf("startMinio: %s exit status: %v", cmd.Path, e.ExitCode())
|
|
t.Logf("startMinio: %s exited: %v", cmd.Path, e.Exited())
|
|
t.Logf("startMinio: %s stderr: %s", cmd.Path, e.Stderr)
|
|
} else {
|
|
if errors.Is(err, context.Canceled) {
|
|
return
|
|
}
|
|
t.Logf("startMinio: %s exit error: %v", cmd.Path, err)
|
|
}
|
|
}
|
|
}
|
|
|
|
// Cancel must be called first so do wait to add to Cleanup
|
|
// stack as last cleanup.
|
|
ctx, cancel := context.WithCancel(context.Background())
|
|
deadline, ok := t.Deadline()
|
|
if ok {
|
|
ctx, cancel = context.WithDeadline(ctx, deadline.Add(-100*time.Millisecond))
|
|
}
|
|
|
|
t.Logf(">> minio: minio server %s", dir)
|
|
|
|
addr := availableAddr()
|
|
cmd := exec.CommandContext(ctx, "minio", "server", "--address", addr, dir)
|
|
cmd.Env = os.Environ()
|
|
cmd.WaitDelay = 3 * time.Second
|
|
cmd.Cancel = func() error {
|
|
return cmd.Process.Signal(syscall.SIGQUIT)
|
|
}
|
|
if err := cmd.Start(); err != nil {
|
|
t.Fatalf("startMinio: %v", err)
|
|
}
|
|
t.Cleanup(func() {
|
|
cancel()
|
|
waitAndMaybeLogError(cmd)
|
|
})
|
|
|
|
mc, err := minio.New(addr, &minio.Options{
|
|
Creds: credentials.NewStaticV4("minioadmin", "minioadmin", ""),
|
|
Secure: false,
|
|
})
|
|
if err != nil {
|
|
t.Fatalf("startMinio: %v", err)
|
|
}
|
|
|
|
// wait for server to start with exponential backoff
|
|
for _, err := range backoff.Upto(ctx, 1*time.Second) {
|
|
if err != nil {
|
|
t.Fatalf("startMinio: %v", err)
|
|
}
|
|
// try list buckets to see if server is up
|
|
if _, err := mc.ListBuckets(ctx); err == nil {
|
|
break
|
|
}
|
|
t.Logf("startMinio: server is offline; retrying")
|
|
}
|
|
|
|
if trace {
|
|
cmd := exec.CommandContext(ctx, "mc", "admin", "trace", "--verbose", "test")
|
|
cmd.Env = append(os.Environ(),
|
|
"MC_HOST_test=http://minioadmin:minioadmin@"+addr,
|
|
)
|
|
cmd.WaitDelay = 3 * time.Second
|
|
cmd.Cancel = func() error {
|
|
return cmd.Process.Signal(syscall.SIGQUIT)
|
|
}
|
|
|
|
stdout, err := cmd.StdoutPipe()
|
|
if err != nil {
|
|
t.Fatalf("startMinio: %v", err)
|
|
}
|
|
if err := cmd.Start(); err != nil {
|
|
t.Fatalf("startMinio: %v", err)
|
|
}
|
|
|
|
doneLogging := make(chan struct{})
|
|
sc := bufio.NewScanner(stdout)
|
|
go func() {
|
|
defer close(doneLogging)
|
|
|
|
// Scan lines until the process exits.
|
|
for sc.Scan() {
|
|
t.Logf("startMinio: mc trace: %s", sc.Text())
|
|
}
|
|
_ = sc.Err() // ignore (not important)
|
|
}()
|
|
t.Cleanup(func() {
|
|
cancel()
|
|
waitAndMaybeLogError(cmd)
|
|
|
|
// Make sure we do not log after test exists to
|
|
// avoid panic.
|
|
<-doneLogging
|
|
})
|
|
}
|
|
|
|
if err := mc.MakeBucket(context.Background(), "test", minio.MakeBucketOptions{}); err != nil {
|
|
t.Fatalf("startMinio: %v", err)
|
|
}
|
|
return mc
|
|
}
|
|
|
|
// contextForTest returns a context that is canceled when the test deadline,
|
|
// if any, is reached. The returned doneLogging function should be called
|
|
// after all Log/Error/Fatalf calls are done before the test returns.
|
|
func contextForTest(t *testing.T) (_ context.Context, doneLogging func()) {
|
|
done := make(chan struct{})
|
|
deadline, ok := t.Deadline()
|
|
if !ok {
|
|
return context.Background(), func() {}
|
|
}
|
|
|
|
ctx, cancel := context.WithDeadline(context.Background(), deadline.Add(-100*time.Millisecond))
|
|
t.Cleanup(func() {
|
|
cancel()
|
|
<-done
|
|
})
|
|
return ctx, func() { close(done) }
|
|
}
|
|
|
|
// abcReader repeats the string s infinitely.
|
|
type abcReader struct {
|
|
pos int
|
|
}
|
|
|
|
const theABCs = "abcdefghijklmnopqrstuvwxyz"
|
|
|
|
func (r *abcReader) Read(p []byte) (n int, err error) {
|
|
for i := range p {
|
|
p[i] = theABCs[r.pos]
|
|
r.pos++
|
|
if r.pos == len(theABCs) {
|
|
r.pos = 0
|
|
}
|
|
}
|
|
return len(p), nil
|
|
}
|
|
|
|
func (r *abcReader) ReadAt(p []byte, off int64) (n int, err error) {
|
|
for i := range p {
|
|
p[i] = theABCs[(off+int64(i))%int64(len(theABCs))]
|
|
}
|
|
return len(p), nil
|
|
}
|
|
|
|
func checkABCs(r io.Reader, size int) (reason string) {
|
|
h := sha256.New()
|
|
n, err := io.CopyN(h, &abcReader{}, int64(size))
|
|
if err != nil {
|
|
return err.Error()
|
|
}
|
|
if n != int64(size) {
|
|
panic("short read; should not happen")
|
|
}
|
|
want := h.Sum(nil)
|
|
h = sha256.New()
|
|
n, err = io.Copy(h, r)
|
|
if err != nil {
|
|
return err.Error()
|
|
}
|
|
if n != int64(size) {
|
|
return fmt.Sprintf("got len(r) = %d; want %d", n, size)
|
|
}
|
|
got := h.Sum(nil)
|
|
if !bytes.Equal(got, want) {
|
|
return fmt.Sprintf("got sum = %x; want %x", got, want)
|
|
}
|
|
return ""
|
|
}
|