mirror of
https://github.com/minio/minio.git
synced 2025-01-24 21:23:15 -05:00
a982baff27
Design: https://gist.github.com/klauspost/025c09b48ed4a1293c917cecfabdf21c Gist of improvements: * Cross-server caching and listing will use the same data across servers and requests. * Lists can be arbitrarily resumed at a constant speed. * Metadata for all files scanned is stored for streaming retrieval. * The existing bloom filters controlled by the crawler is used for validating caches. * Concurrent requests for the same data (or parts of it) will not spawn additional walkers. * Listing a subdirectory of an existing recursive cache will use the cache. * All listing operations are fully streamable so the number of objects in a bucket no longer dictates the amount of memory. * Listings can be handled by any server within the cluster. * Caches are cleaned up when out of date or superseded by a more recent one.
266 lines
17 KiB
Go
266 lines
17 KiB
Go
/*
|
|
* MinIO Cloud Storage, (C) 2020 MinIO, Inc.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
package cmd
|
|
|
|
import (
|
|
"bytes"
|
|
"reflect"
|
|
"sort"
|
|
"testing"
|
|
)
|
|
|
|
func Test_metaCacheEntries_sort(t *testing.T) {
|
|
entries := loadMetacacheSampleEntries(t)
|
|
|
|
o := entries.entries()
|
|
if !o.isSorted() {
|
|
t.Fatal("Expected sorted objects")
|
|
}
|
|
|
|
// Swap first and last
|
|
o[0], o[len(o)-1] = o[len(o)-1], o[0]
|
|
if o.isSorted() {
|
|
t.Fatal("Expected unsorted objects")
|
|
}
|
|
|
|
sorted := o.sort()
|
|
if !o.isSorted() {
|
|
t.Fatal("Expected sorted o objects")
|
|
}
|
|
if !sorted.entries().isSorted() {
|
|
t.Fatal("Expected sorted wrapped objects")
|
|
}
|
|
want := loadMetacacheSampleNames
|
|
for i, got := range o {
|
|
if got.name != want[i] {
|
|
t.Errorf("entry %d, want %q, got %q", i, want[i], got.name)
|
|
}
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_forwardTo(t *testing.T) {
|
|
org := loadMetacacheSampleEntries(t)
|
|
entries := org
|
|
want := []string{"src/compress/zlib/reader_test.go", "src/compress/zlib/writer.go", "src/compress/zlib/writer_test.go"}
|
|
entries.forwardTo("src/compress/zlib/reader_test.go")
|
|
got := entries.entries().names()
|
|
if !reflect.DeepEqual(got, want) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
|
|
// Try with prefix
|
|
entries = org
|
|
entries.forwardTo("src/compress/zlib/reader_t")
|
|
got = entries.entries().names()
|
|
if !reflect.DeepEqual(got, want) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_merge(t *testing.T) {
|
|
org := loadMetacacheSampleEntries(t)
|
|
a, b := org.shallowClone(), org.shallowClone()
|
|
be := b.entries()
|
|
for i := range be {
|
|
// Modify b so it isn't deduplicated.
|
|
be[i].metadata = []byte("something-else")
|
|
}
|
|
// Merge b into a
|
|
a.merge(b, -1)
|
|
want := append(loadMetacacheSampleNames, loadMetacacheSampleNames...)
|
|
sort.Strings(want)
|
|
got := a.entries().names()
|
|
if len(got) != len(want) {
|
|
t.Errorf("unexpected count, want %v, got %v", len(want), len(got))
|
|
}
|
|
|
|
for i, name := range got {
|
|
if want[i] != name {
|
|
t.Errorf("unexpected name, want %q, got %q", want[i], name)
|
|
}
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_dedupe(t *testing.T) {
|
|
org := loadMetacacheSampleEntries(t)
|
|
a, b := org.shallowClone(), org.shallowClone()
|
|
|
|
// Merge b into a
|
|
a.merge(b, -1)
|
|
if a.deduplicate(nil) {
|
|
t.Fatal("deduplicate returned duplicate entries left")
|
|
}
|
|
want := loadMetacacheSampleNames
|
|
got := a.entries().names()
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_dedupe2(t *testing.T) {
|
|
org := loadMetacacheSampleEntries(t)
|
|
a, b := org.shallowClone(), org.shallowClone()
|
|
|
|
// Replace metadata in b
|
|
testMarker := []byte("sampleset")
|
|
for i := range b.o {
|
|
b.o[i].metadata = testMarker
|
|
}
|
|
|
|
// Merge b into a
|
|
a.merge(b, -1)
|
|
if a.deduplicate(func(existing, other *metaCacheEntry) (replace bool) {
|
|
a := bytes.Equal(existing.metadata, testMarker)
|
|
b := bytes.Equal(other.metadata, testMarker)
|
|
if a == b {
|
|
t.Fatal("got same number of testmarkers, only one should be given", a, b)
|
|
}
|
|
return b
|
|
}) {
|
|
t.Fatal("deduplicate returned duplicate entries left, we should always resolve")
|
|
}
|
|
want := loadMetacacheSampleNames
|
|
got := a.entries().names()
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_filterObjects(t *testing.T) {
|
|
data := loadMetacacheSampleEntries(t)
|
|
data.filterObjectsOnly()
|
|
got := data.entries().names()
|
|
want := []string{"src/compress/bzip2/bit_reader.go", "src/compress/bzip2/bzip2.go", "src/compress/bzip2/bzip2_test.go", "src/compress/bzip2/huffman.go", "src/compress/bzip2/move_to_front.go", "src/compress/bzip2/testdata/Isaac.Newton-Opticks.txt.bz2", "src/compress/bzip2/testdata/e.txt.bz2", "src/compress/bzip2/testdata/fail-issue5747.bz2", "src/compress/bzip2/testdata/pass-random1.bin", "src/compress/bzip2/testdata/pass-random1.bz2", "src/compress/bzip2/testdata/pass-random2.bin", "src/compress/bzip2/testdata/pass-random2.bz2", "src/compress/bzip2/testdata/pass-sawtooth.bz2", "src/compress/bzip2/testdata/random.data.bz2", "src/compress/flate/deflate.go", "src/compress/flate/deflate_test.go", "src/compress/flate/deflatefast.go", "src/compress/flate/dict_decoder.go", "src/compress/flate/dict_decoder_test.go", "src/compress/flate/example_test.go", "src/compress/flate/flate_test.go", "src/compress/flate/huffman_bit_writer.go", "src/compress/flate/huffman_bit_writer_test.go", "src/compress/flate/huffman_code.go", "src/compress/flate/inflate.go", "src/compress/flate/inflate_test.go", "src/compress/flate/reader_test.go", "src/compress/flate/testdata/huffman-null-max.dyn.expect", "src/compress/flate/testdata/huffman-null-max.dyn.expect-noinput", "src/compress/flate/testdata/huffman-null-max.golden", "src/compress/flate/testdata/huffman-null-max.in", "src/compress/flate/testdata/huffman-null-max.wb.expect", "src/compress/flate/testdata/huffman-null-max.wb.expect-noinput", "src/compress/flate/testdata/huffman-pi.dyn.expect", "src/compress/flate/testdata/huffman-pi.dyn.expect-noinput", "src/compress/flate/testdata/huffman-pi.golden", "src/compress/flate/testdata/huffman-pi.in", "src/compress/flate/testdata/huffman-pi.wb.expect", "src/compress/flate/testdata/huffman-pi.wb.expect-noinput", "src/compress/flate/testdata/huffman-rand-1k.dyn.expect", "src/compress/flate/testdata/huffman-rand-1k.dyn.expect-noinput", "src/compress/flate/testdata/huffman-rand-1k.golden", "src/compress/flate/testdata/huffman-rand-1k.in", "src/compress/flate/testdata/huffman-rand-1k.wb.expect", "src/compress/flate/testdata/huffman-rand-1k.wb.expect-noinput", "src/compress/flate/testdata/huffman-rand-limit.dyn.expect", "src/compress/flate/testdata/huffman-rand-limit.dyn.expect-noinput", "src/compress/flate/testdata/huffman-rand-limit.golden", "src/compress/flate/testdata/huffman-rand-limit.in", "src/compress/flate/testdata/huffman-rand-limit.wb.expect", "src/compress/flate/testdata/huffman-rand-limit.wb.expect-noinput", "src/compress/flate/testdata/huffman-rand-max.golden", "src/compress/flate/testdata/huffman-rand-max.in", "src/compress/flate/testdata/huffman-shifts.dyn.expect", "src/compress/flate/testdata/huffman-shifts.dyn.expect-noinput", "src/compress/flate/testdata/huffman-shifts.golden", "src/compress/flate/testdata/huffman-shifts.in", "src/compress/flate/testdata/huffman-shifts.wb.expect", "src/compress/flate/testdata/huffman-shifts.wb.expect-noinput", "src/compress/flate/testdata/huffman-text-shift.dyn.expect", "src/compress/flate/testdata/huffman-text-shift.dyn.expect-noinput", "src/compress/flate/testdata/huffman-text-shift.golden", "src/compress/flate/testdata/huffman-text-shift.in", "src/compress/flate/testdata/huffman-text-shift.wb.expect", "src/compress/flate/testdata/huffman-text-shift.wb.expect-noinput", "src/compress/flate/testdata/huffman-text.dyn.expect", "src/compress/flate/testdata/huffman-text.dyn.expect-noinput", "src/compress/flate/testdata/huffman-text.golden", "src/compress/flate/testdata/huffman-text.in", "src/compress/flate/testdata/huffman-text.wb.expect", "src/compress/flate/testdata/huffman-text.wb.expect-noinput", "src/compress/flate/testdata/huffman-zero.dyn.expect", "src/compress/flate/testdata/huffman-zero.dyn.expect-noinput", "src/compress/flate/testdata/huffman-zero.golden", "src/compress/flate/testdata/huffman-zero.in", "src/compress/flate/testdata/huffman-zero.wb.expect", "src/compress/flate/testdata/huffman-zero.wb.expect-noinput", "src/compress/flate/testdata/null-long-match.dyn.expect-noinput", "src/compress/flate/testdata/null-long-match.wb.expect-noinput", "src/compress/flate/token.go", "src/compress/flate/writer_test.go", "src/compress/gzip/example_test.go", "src/compress/gzip/gunzip.go", "src/compress/gzip/gunzip_test.go", "src/compress/gzip/gzip.go", "src/compress/gzip/gzip_test.go", "src/compress/gzip/issue14937_test.go", "src/compress/gzip/testdata/issue6550.gz.base64", "src/compress/lzw/reader.go", "src/compress/lzw/reader_test.go", "src/compress/lzw/writer.go", "src/compress/lzw/writer_test.go", "src/compress/testdata/e.txt", "src/compress/testdata/gettysburg.txt", "src/compress/testdata/pi.txt", "src/compress/zlib/example_test.go", "src/compress/zlib/reader.go", "src/compress/zlib/reader_test.go", "src/compress/zlib/writer.go", "src/compress/zlib/writer_test.go"}
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_filterPrefixes(t *testing.T) {
|
|
data := loadMetacacheSampleEntries(t)
|
|
data.filterPrefixesOnly()
|
|
got := data.entries().names()
|
|
want := []string{"src/compress/bzip2/", "src/compress/bzip2/testdata/", "src/compress/flate/", "src/compress/flate/testdata/", "src/compress/gzip/", "src/compress/gzip/testdata/", "src/compress/lzw/", "src/compress/testdata/", "src/compress/zlib/"}
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_filterRecursive(t *testing.T) {
|
|
data := loadMetacacheSampleEntries(t)
|
|
data.filterRecursiveEntries("src/compress/bzip2/", slashSeparator)
|
|
got := data.entries().names()
|
|
want := []string{"src/compress/bzip2/", "src/compress/bzip2/bit_reader.go", "src/compress/bzip2/bzip2.go", "src/compress/bzip2/bzip2_test.go", "src/compress/bzip2/huffman.go", "src/compress/bzip2/move_to_front.go"}
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_filterRecursiveRoot(t *testing.T) {
|
|
data := loadMetacacheSampleEntries(t)
|
|
data.filterRecursiveEntries("", slashSeparator)
|
|
got := data.entries().names()
|
|
want := []string{}
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_filterRecursiveRootSep(t *testing.T) {
|
|
data := loadMetacacheSampleEntries(t)
|
|
// This will remove anything with "bzip2/" in the path since it is separator
|
|
data.filterRecursiveEntries("", "bzip2/")
|
|
got := data.entries().names()
|
|
want := []string{"src/compress/flate/", "src/compress/flate/deflate.go", "src/compress/flate/deflate_test.go", "src/compress/flate/deflatefast.go", "src/compress/flate/dict_decoder.go", "src/compress/flate/dict_decoder_test.go", "src/compress/flate/example_test.go", "src/compress/flate/flate_test.go", "src/compress/flate/huffman_bit_writer.go", "src/compress/flate/huffman_bit_writer_test.go", "src/compress/flate/huffman_code.go", "src/compress/flate/inflate.go", "src/compress/flate/inflate_test.go", "src/compress/flate/reader_test.go", "src/compress/flate/testdata/", "src/compress/flate/testdata/huffman-null-max.dyn.expect", "src/compress/flate/testdata/huffman-null-max.dyn.expect-noinput", "src/compress/flate/testdata/huffman-null-max.golden", "src/compress/flate/testdata/huffman-null-max.in", "src/compress/flate/testdata/huffman-null-max.wb.expect", "src/compress/flate/testdata/huffman-null-max.wb.expect-noinput", "src/compress/flate/testdata/huffman-pi.dyn.expect", "src/compress/flate/testdata/huffman-pi.dyn.expect-noinput", "src/compress/flate/testdata/huffman-pi.golden", "src/compress/flate/testdata/huffman-pi.in", "src/compress/flate/testdata/huffman-pi.wb.expect", "src/compress/flate/testdata/huffman-pi.wb.expect-noinput", "src/compress/flate/testdata/huffman-rand-1k.dyn.expect", "src/compress/flate/testdata/huffman-rand-1k.dyn.expect-noinput", "src/compress/flate/testdata/huffman-rand-1k.golden", "src/compress/flate/testdata/huffman-rand-1k.in", "src/compress/flate/testdata/huffman-rand-1k.wb.expect", "src/compress/flate/testdata/huffman-rand-1k.wb.expect-noinput", "src/compress/flate/testdata/huffman-rand-limit.dyn.expect", "src/compress/flate/testdata/huffman-rand-limit.dyn.expect-noinput", "src/compress/flate/testdata/huffman-rand-limit.golden", "src/compress/flate/testdata/huffman-rand-limit.in", "src/compress/flate/testdata/huffman-rand-limit.wb.expect", "src/compress/flate/testdata/huffman-rand-limit.wb.expect-noinput", "src/compress/flate/testdata/huffman-rand-max.golden", "src/compress/flate/testdata/huffman-rand-max.in", "src/compress/flate/testdata/huffman-shifts.dyn.expect", "src/compress/flate/testdata/huffman-shifts.dyn.expect-noinput", "src/compress/flate/testdata/huffman-shifts.golden", "src/compress/flate/testdata/huffman-shifts.in", "src/compress/flate/testdata/huffman-shifts.wb.expect", "src/compress/flate/testdata/huffman-shifts.wb.expect-noinput", "src/compress/flate/testdata/huffman-text-shift.dyn.expect", "src/compress/flate/testdata/huffman-text-shift.dyn.expect-noinput", "src/compress/flate/testdata/huffman-text-shift.golden", "src/compress/flate/testdata/huffman-text-shift.in", "src/compress/flate/testdata/huffman-text-shift.wb.expect", "src/compress/flate/testdata/huffman-text-shift.wb.expect-noinput", "src/compress/flate/testdata/huffman-text.dyn.expect", "src/compress/flate/testdata/huffman-text.dyn.expect-noinput", "src/compress/flate/testdata/huffman-text.golden", "src/compress/flate/testdata/huffman-text.in", "src/compress/flate/testdata/huffman-text.wb.expect", "src/compress/flate/testdata/huffman-text.wb.expect-noinput", "src/compress/flate/testdata/huffman-zero.dyn.expect", "src/compress/flate/testdata/huffman-zero.dyn.expect-noinput", "src/compress/flate/testdata/huffman-zero.golden", "src/compress/flate/testdata/huffman-zero.in", "src/compress/flate/testdata/huffman-zero.wb.expect", "src/compress/flate/testdata/huffman-zero.wb.expect-noinput", "src/compress/flate/testdata/null-long-match.dyn.expect-noinput", "src/compress/flate/testdata/null-long-match.wb.expect-noinput", "src/compress/flate/token.go", "src/compress/flate/writer_test.go", "src/compress/gzip/", "src/compress/gzip/example_test.go", "src/compress/gzip/gunzip.go", "src/compress/gzip/gunzip_test.go", "src/compress/gzip/gzip.go", "src/compress/gzip/gzip_test.go", "src/compress/gzip/issue14937_test.go", "src/compress/gzip/testdata/", "src/compress/gzip/testdata/issue6550.gz.base64", "src/compress/lzw/", "src/compress/lzw/reader.go", "src/compress/lzw/reader_test.go", "src/compress/lzw/writer.go", "src/compress/lzw/writer_test.go", "src/compress/testdata/", "src/compress/testdata/e.txt", "src/compress/testdata/gettysburg.txt", "src/compress/testdata/pi.txt", "src/compress/zlib/", "src/compress/zlib/example_test.go", "src/compress/zlib/reader.go", "src/compress/zlib/reader_test.go", "src/compress/zlib/writer.go", "src/compress/zlib/writer_test.go"}
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntries_filterPrefix(t *testing.T) {
|
|
data := loadMetacacheSampleEntries(t)
|
|
data.filterPrefix("src/compress/bzip2/")
|
|
got := data.entries().names()
|
|
want := []string{"src/compress/bzip2/", "src/compress/bzip2/bit_reader.go", "src/compress/bzip2/bzip2.go", "src/compress/bzip2/bzip2_test.go", "src/compress/bzip2/huffman.go", "src/compress/bzip2/move_to_front.go", "src/compress/bzip2/testdata/", "src/compress/bzip2/testdata/Isaac.Newton-Opticks.txt.bz2", "src/compress/bzip2/testdata/e.txt.bz2", "src/compress/bzip2/testdata/fail-issue5747.bz2", "src/compress/bzip2/testdata/pass-random1.bin", "src/compress/bzip2/testdata/pass-random1.bz2", "src/compress/bzip2/testdata/pass-random2.bin", "src/compress/bzip2/testdata/pass-random2.bz2", "src/compress/bzip2/testdata/pass-sawtooth.bz2", "src/compress/bzip2/testdata/random.data.bz2"}
|
|
if !reflect.DeepEqual(want, got) {
|
|
t.Errorf("got unexpected result: %#v", got)
|
|
}
|
|
}
|
|
|
|
func Test_metaCacheEntry_isInDir(t *testing.T) {
|
|
tests := []struct {
|
|
testName string
|
|
entry string
|
|
dir string
|
|
sep string
|
|
want bool
|
|
}{
|
|
{
|
|
testName: "basic-file",
|
|
entry: "src/file",
|
|
dir: "src/",
|
|
sep: slashSeparator,
|
|
want: true,
|
|
},
|
|
{
|
|
testName: "basic-dir",
|
|
entry: "src/dir/",
|
|
dir: "src/",
|
|
sep: slashSeparator,
|
|
want: true,
|
|
},
|
|
{
|
|
testName: "deeper-file",
|
|
entry: "src/dir/somewhere.ext",
|
|
dir: "src/",
|
|
sep: slashSeparator,
|
|
want: false,
|
|
},
|
|
{
|
|
testName: "deeper-dir",
|
|
entry: "src/dir/somewhere/",
|
|
dir: "src/",
|
|
sep: slashSeparator,
|
|
want: false,
|
|
},
|
|
{
|
|
testName: "root-dir",
|
|
entry: "doc/",
|
|
dir: "",
|
|
sep: slashSeparator,
|
|
want: true,
|
|
},
|
|
{
|
|
testName: "root-file",
|
|
entry: "word.doc",
|
|
dir: "",
|
|
sep: slashSeparator,
|
|
want: true,
|
|
},
|
|
}
|
|
for _, tt := range tests {
|
|
t.Run(tt.testName, func(t *testing.T) {
|
|
e := metaCacheEntry{
|
|
name: tt.entry,
|
|
}
|
|
if got := e.isInDir(tt.dir, tt.sep); got != tt.want {
|
|
t.Errorf("isInDir() = %v, want %v", got, tt.want)
|
|
}
|
|
})
|
|
}
|
|
}
|