-
Notifications
You must be signed in to change notification settings - Fork 191
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
This commit introduces a BucketProvider interface for fetch operations against object storage provider buckets, allowing for easier introduction of new provider implementations. The algorithm for conditionally downloading object files is the same, whether you are using GCP storage or an S3/Minio-compatible bucket. The only thing that differs is how the respective clients handle enumerating through the objects in the bucket; by implementing just that in each provider, I can have the select-and-fetch code in one place. The client implementations do now include safeguards to ensure the fetched object is the same as the one metadata has been collected for. In addition, minor changes have been made to the object fetch operation to take into account that: - Etags can change between composition of index and actual fetch, in which case the etag is now updated. - Objects can disappear between composition of index and actual fetch, in which case the item is removed from the index. Lastly, the requirement for authentication has been removed (and not referring to a Secret at all is thus allowed), to provide support for e.g. public buckets. Co-authored-by: Hidde Beydals <hello@hidde.co> Co-authored-by: Michael Bridgen <michael@weave.works> Signed-off-by: pa250194 <pa250194@ncr.com>
- Loading branch information
Showing
10 changed files
with
1,769 additions
and
938 deletions.
There are no files selected for viewing
Large diffs are not rendered by default.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,322 @@ | ||
/* | ||
Copyright 2022 The Flux authors | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
*/ | ||
|
||
package controllers | ||
|
||
import ( | ||
"context" | ||
"fmt" | ||
"os" | ||
"path/filepath" | ||
"testing" | ||
"time" | ||
|
||
"gotest.tools/assert" | ||
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" | ||
|
||
sourcev1 "github.com/fluxcd/source-controller/api/v1beta2" | ||
) | ||
|
||
// mockBucketObject is the in-memory representation of a single object held by
// mockBucketClient: etag is the value reported for the object, and data is the
// content written to disk when the object is fetched.
type mockBucketObject struct {
	etag, data string
}
|
||
type mockBucketClient struct { | ||
bucketName string | ||
objects map[string]mockBucketObject | ||
} | ||
|
||
// mockNotFound is the sentinel error the mock client returns from FGetObject
// when the requested key is not present; ObjectIsNotFound recognises it.
var mockNotFound = fmt.Errorf("not found")
|
||
func (m mockBucketClient) BucketExists(_ context.Context, name string) (bool, error) { | ||
return name == m.bucketName, nil | ||
} | ||
|
||
func (m mockBucketClient) FGetObject(_ context.Context, bucket, obj, path string) (string, error) { | ||
if bucket != m.bucketName { | ||
return "", fmt.Errorf("bucket does not exist") | ||
} | ||
// tiny bit of protocol, for convenience: if asked for an object "error", then return an error. | ||
if obj == "error" { | ||
return "", fmt.Errorf("I was asked to report an error") | ||
} | ||
object, ok := m.objects[obj] | ||
if !ok { | ||
return "", mockNotFound | ||
} | ||
if err := os.WriteFile(path, []byte(object.data), os.FileMode(0660)); err != nil { | ||
return "", err | ||
} | ||
return object.etag, nil | ||
} | ||
|
||
func (m mockBucketClient) ObjectIsNotFound(e error) bool { | ||
return e == mockNotFound | ||
} | ||
|
||
func (m mockBucketClient) VisitObjects(_ context.Context, _ string, f func(key, etag string) error) error { | ||
for key, obj := range m.objects { | ||
if err := f(key, obj.etag); err != nil { | ||
return err | ||
} | ||
} | ||
return nil | ||
} | ||
|
||
func (m mockBucketClient) Close(_ context.Context) { | ||
return | ||
} | ||
|
||
func (m *mockBucketClient) addObject(key string, object mockBucketObject) { | ||
if m.objects == nil { | ||
m.objects = make(map[string]mockBucketObject) | ||
} | ||
m.objects[key] = object | ||
} | ||
|
||
func (m *mockBucketClient) objectsToEtagIndex() *etagIndex { | ||
i := newEtagIndex() | ||
for k, v := range m.objects { | ||
i.Add(k, v.etag) | ||
} | ||
return i | ||
} | ||
|
||
func Test_fetchEtagIndex(t *testing.T) { | ||
bucketName := "all-my-config" | ||
|
||
bucket := sourcev1.Bucket{ | ||
Spec: sourcev1.BucketSpec{ | ||
BucketName: bucketName, | ||
Timeout: &metav1.Duration{Duration: 1 * time.Hour}, | ||
}, | ||
} | ||
|
||
t.Run("fetches etag index", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName} | ||
client.addObject("foo.yaml", mockBucketObject{data: "foo.yaml", etag: "etag1"}) | ||
client.addObject("bar.yaml", mockBucketObject{data: "bar.yaml", etag: "etag2"}) | ||
client.addObject("baz.yaml", mockBucketObject{data: "baz.yaml", etag: "etag3"}) | ||
|
||
index := newEtagIndex() | ||
err = fetchEtagIndex(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
|
||
assert.Equal(t, index.Len(), 3) | ||
}) | ||
|
||
t.Run("an error while bucket does not exist", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: "other-bucket-name"} | ||
|
||
index := newEtagIndex() | ||
err = fetchEtagIndex(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
assert.ErrorContains(t, err, "not found") | ||
}) | ||
|
||
t.Run("filters with .sourceignore rules", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName} | ||
client.addObject(".sourceignore", mockBucketObject{etag: "sourceignore1", data: `*.txt`}) | ||
client.addObject("foo.yaml", mockBucketObject{etag: "etag1", data: "foo.yaml"}) | ||
client.addObject("foo.txt", mockBucketObject{etag: "etag2", data: "foo.txt"}) | ||
|
||
index := newEtagIndex() | ||
err = fetchEtagIndex(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
|
||
if _, err := os.Stat(filepath.Join(tmp, ".sourceignore")); err != nil { | ||
t.Error(err) | ||
} | ||
|
||
if ok := index.Has("foo.txt"); ok { | ||
t.Error(fmt.Errorf("expected 'foo.txt' index item to not exist")) | ||
} | ||
assert.Equal(t, index.Len(), 1) | ||
}) | ||
|
||
t.Run("filters with ignore rules from object", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName} | ||
client.addObject(".sourceignore", mockBucketObject{etag: "sourceignore1", data: `*.txt`}) | ||
client.addObject("foo.txt", mockBucketObject{etag: "etag1", data: "foo.txt"}) | ||
|
||
ignore := "!*.txt" | ||
bucket := bucket.DeepCopy() | ||
bucket.Spec.Ignore = &ignore | ||
|
||
index := newEtagIndex() | ||
err = fetchEtagIndex(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
|
||
if _, err := os.Stat(filepath.Join(tmp, ".sourceignore")); err != nil { | ||
t.Error(err) | ||
} | ||
|
||
assert.Equal(t, index.Len(), 1) | ||
if ok := index.Has("foo.txt"); !ok { | ||
t.Error(fmt.Errorf("expected 'foo.txt' index item to exist")) | ||
} | ||
}) | ||
} | ||
|
||
func Test_fetchFiles(t *testing.T) { | ||
bucketName := "all-my-config" | ||
|
||
bucket := sourcev1.Bucket{ | ||
Spec: sourcev1.BucketSpec{ | ||
BucketName: bucketName, | ||
Timeout: &metav1.Duration{Duration: 1 * time.Hour}, | ||
}, | ||
} | ||
|
||
t.Run("fetches files", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName} | ||
client.addObject("foo.yaml", mockBucketObject{data: "foo.yaml", etag: "etag1"}) | ||
client.addObject("bar.yaml", mockBucketObject{data: "bar.yaml", etag: "etag2"}) | ||
client.addObject("baz.yaml", mockBucketObject{data: "baz.yaml", etag: "etag3"}) | ||
|
||
index := client.objectsToEtagIndex() | ||
|
||
err = fetchIndexFiles(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
|
||
for path := range index.Index() { | ||
p := filepath.Join(tmp, path) | ||
_, err := os.Stat(p) | ||
if err != nil { | ||
t.Error(err) | ||
} | ||
} | ||
}) | ||
|
||
t.Run("an error while fetching returns an error for the whole procedure", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName, objects: map[string]mockBucketObject{}} | ||
client.objects["error"] = mockBucketObject{} | ||
|
||
err = fetchIndexFiles(context.TODO(), client, bucket.DeepCopy(), client.objectsToEtagIndex(), tmp) | ||
if err == nil { | ||
t.Fatal("expected error but got nil") | ||
} | ||
}) | ||
|
||
t.Run("a changed etag updates the index", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName} | ||
client.addObject("foo.yaml", mockBucketObject{data: "foo.yaml", etag: "etag2"}) | ||
|
||
index := newEtagIndex() | ||
index.Add("foo.yaml", "etag1") | ||
err = fetchIndexFiles(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
f := index.Get("foo.yaml") | ||
assert.Equal(t, f, "etag2") | ||
}) | ||
|
||
t.Run("a disappeared index entry is removed from the index", func(t *testing.T) { | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName} | ||
client.addObject("foo.yaml", mockBucketObject{data: "foo.yaml", etag: "etag1"}) | ||
|
||
index := newEtagIndex() | ||
index.Add("foo.yaml", "etag1") | ||
// Does not exist on server | ||
index.Add("bar.yaml", "etag2") | ||
|
||
err = fetchIndexFiles(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
f := index.Get("foo.yaml") | ||
assert.Equal(t, f, "etag1") | ||
assert.Check(t, !index.Has("bar.yaml")) | ||
}) | ||
|
||
t.Run("can fetch more than maxConcurrentFetches", func(t *testing.T) { | ||
// this will fail if, for example, the semaphore is not used correctly and blocks | ||
tmp, err := os.MkdirTemp("", "test-bucket") | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
defer os.RemoveAll(tmp) | ||
|
||
client := mockBucketClient{bucketName: bucketName} | ||
for i := 0; i < 2*maxConcurrentBucketFetches; i++ { | ||
f := fmt.Sprintf("file-%d", i) | ||
client.addObject(f, mockBucketObject{etag: f, data: f}) | ||
} | ||
index := client.objectsToEtagIndex() | ||
|
||
err = fetchIndexFiles(context.TODO(), client, bucket.DeepCopy(), index, tmp) | ||
if err != nil { | ||
t.Fatal(err) | ||
} | ||
}) | ||
} |
Oops, something went wrong.