mirror of
https://github.com/minio/minio.git
synced 2024-12-26 23:25:54 -05:00
dca7cf7200
Pass schema to parser to support dates. Fixes #11926
1369 lines
57 KiB
Go
1369 lines
57 KiB
Go
/*
|
|
* MinIO Cloud Storage, (C) 2019 MinIO, Inc.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
package s3select
|
|
|
|
import (
|
|
"bytes"
|
|
"encoding/xml"
|
|
"fmt"
|
|
"io"
|
|
"io/ioutil"
|
|
"net/http"
|
|
"os"
|
|
"reflect"
|
|
"strings"
|
|
"testing"
|
|
|
|
"github.com/klauspost/cpuid/v2"
|
|
"github.com/minio/minio-go/v7"
|
|
"github.com/minio/simdjson-go"
|
|
)
|
|
|
|
type testResponseWriter struct {
|
|
statusCode int
|
|
response []byte
|
|
}
|
|
|
|
func (w *testResponseWriter) Header() http.Header {
|
|
return nil
|
|
}
|
|
|
|
func (w *testResponseWriter) Write(p []byte) (int, error) {
|
|
w.response = append(w.response, p...)
|
|
return len(p), nil
|
|
}
|
|
|
|
func (w *testResponseWriter) WriteHeader(statusCode int) {
|
|
w.statusCode = statusCode
|
|
}
|
|
|
|
func (w *testResponseWriter) Flush() {
|
|
}
|
|
|
|
func TestJSONQueries(t *testing.T) {
|
|
input := `{"id": 0,"title": "Test Record","desc": "Some text","synonyms": ["foo", "bar", "whatever"]}
|
|
{"id": 1,"title": "Second Record","desc": "another text","synonyms": ["some", "synonym", "value"]}
|
|
{"id": 2,"title": "Second Record","desc": "another text","numbers": [2, 3.0, 4]}
|
|
{"id": 3,"title": "Second Record","desc": "another text","nested": [[2, 3.0, 4], [7, 8.5, 9]]}`
|
|
|
|
var testTable = []struct {
|
|
name string
|
|
query string
|
|
requestXML []byte // override request XML
|
|
wantResult string
|
|
withJSON string // Override JSON input
|
|
}{
|
|
{
|
|
name: "select-in-array-full",
|
|
query: `SELECT * from s3object s WHERE 'bar' IN s.synonyms[*]`,
|
|
wantResult: `{"id":0,"title":"Test Record","desc":"Some text","synonyms":["foo","bar","whatever"]}`,
|
|
},
|
|
{
|
|
name: "simple-in-array",
|
|
query: `SELECT * from s3object s WHERE s.id IN (1,3)`,
|
|
wantResult: `{"id":1,"title":"Second Record","desc":"another text","synonyms":["some","synonym","value"]}
|
|
{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "select-in-array-single",
|
|
query: `SELECT synonyms from s3object s WHERE 'bar' IN s.synonyms[*] `,
|
|
wantResult: `{"synonyms":["foo","bar","whatever"]}`,
|
|
},
|
|
{
|
|
name: "donatello-1",
|
|
query: `SELECT * from s3object s WHERE 'bar' in s.synonyms`,
|
|
wantResult: `{"id":0,"title":"Test Record","desc":"Some text","synonyms":["foo","bar","whatever"]}`,
|
|
},
|
|
{
|
|
name: "donatello-2",
|
|
query: `SELECT * from s3object s WHERE 'bar' in s.synonyms[*]`,
|
|
wantResult: `{"id":0,"title":"Test Record","desc":"Some text","synonyms":["foo","bar","whatever"]}`,
|
|
},
|
|
{
|
|
name: "bignum-1",
|
|
query: `SELECT id from s3object s WHERE s.id <= 9223372036854775807`,
|
|
wantResult: `{"id":0}
|
|
{"id":1}
|
|
{"id":2}
|
|
{"id":3}`},
|
|
{
|
|
name: "bignum-2",
|
|
query: `SELECT id from s3object s WHERE s.id >= -9223372036854775808`,
|
|
wantResult: `{"id":0}
|
|
{"id":1}
|
|
{"id":2}
|
|
{"id":3}`},
|
|
{
|
|
name: "donatello-3",
|
|
query: `SELECT * from s3object s WHERE 'value' IN s.synonyms[*]`,
|
|
wantResult: `{"id":1,"title":"Second Record","desc":"another text","synonyms":["some","synonym","value"]}`,
|
|
},
|
|
{
|
|
name: "select-in-number",
|
|
query: `SELECT * from s3object s WHERE 4 in s.numbers[*]`,
|
|
wantResult: `{"id":2,"title":"Second Record","desc":"another text","numbers":[2,3,4]}`,
|
|
},
|
|
{
|
|
name: "select-in-number-float",
|
|
query: `SELECT * from s3object s WHERE 3 in s.numbers[*]`,
|
|
wantResult: `{"id":2,"title":"Second Record","desc":"another text","numbers":[2,3,4]}`,
|
|
},
|
|
{
|
|
name: "select-in-number-float-in-sql",
|
|
query: `SELECT * from s3object s WHERE 3.0 in s.numbers[*]`,
|
|
wantResult: `{"id":2,"title":"Second Record","desc":"another text","numbers":[2,3,4]}`,
|
|
},
|
|
{
|
|
name: "select-in-list-match",
|
|
query: `SELECT * from s3object s WHERE (2,3,4) IN s.nested[*]`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "select-in-nested-float",
|
|
query: `SELECT s.nested from s3object s WHERE 8.5 IN s.nested[*][*]`,
|
|
wantResult: `{"nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "select-in-combine-and",
|
|
query: `SELECT s.nested from s3object s WHERE (8.5 IN s.nested[*][*]) AND (s.id > 0)`,
|
|
wantResult: `{"nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "select-in-combine-and-no",
|
|
query: `SELECT s.nested from s3object s WHERE (8.5 IN s.nested[*][*]) AND (s.id = 0)`,
|
|
wantResult: ``,
|
|
},
|
|
{
|
|
name: "select-in-nested-float-no-flat",
|
|
query: `SELECT s.nested from s3object s WHERE 8.5 IN s.nested[*]`,
|
|
wantResult: ``,
|
|
},
|
|
{
|
|
name: "select-empty-field-result",
|
|
query: `SELECT * from s3object s WHERE s.nested[0][0] = 2`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "select-arrays-specific",
|
|
query: `SELECT * from s3object s WHERE s.nested[1][0] = 7`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "wrong-index-no-result",
|
|
query: `SELECT * from s3object s WHERE s.nested[0][0] = 7`,
|
|
wantResult: ``,
|
|
},
|
|
{
|
|
name: "not-equal-result",
|
|
query: `SELECT * from s3object s WHERE s.nested[1][0] != 7`,
|
|
wantResult: `{"id":0,"title":"Test Record","desc":"Some text","synonyms":["foo","bar","whatever"]}
|
|
{"id":1,"title":"Second Record","desc":"another text","synonyms":["some","synonym","value"]}
|
|
{"id":2,"title":"Second Record","desc":"another text","numbers":[2,3,4]}`,
|
|
},
|
|
{
|
|
name: "indexed-list-match",
|
|
query: `SELECT * from s3object s WHERE (7,8.5,9) IN s.nested[1]`,
|
|
wantResult: ``,
|
|
},
|
|
{
|
|
name: "indexed-list-match-equals",
|
|
query: `SELECT * from s3object s WHERE (7,8.5,9) = s.nested[1]`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "indexed-list-match-equals-s-star",
|
|
query: `SELECT s.* from s3object s WHERE (7,8.5,9) = s.nested[1]`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "indexed-list-match-equals-s-index",
|
|
query: `SELECT s.nested[1], s.nested[0] from s3object s WHERE (7,8.5,9) = s.nested[1]`,
|
|
wantResult: `{"_1":[7,8.5,9],"_2":[2,3,4]}`,
|
|
},
|
|
{
|
|
name: "indexed-list-match-not-equals",
|
|
query: `SELECT * from s3object s WHERE (7,8.5,9) != s.nested[1]`,
|
|
wantResult: `{"id":0,"title":"Test Record","desc":"Some text","synonyms":["foo","bar","whatever"]}
|
|
{"id":1,"title":"Second Record","desc":"another text","synonyms":["some","synonym","value"]}
|
|
{"id":2,"title":"Second Record","desc":"another text","numbers":[2,3,4]}`,
|
|
},
|
|
{
|
|
name: "indexed-list-square-bracket",
|
|
query: `SELECT * from s3object s WHERE [7,8.5,9] = s.nested[1]`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "indexed-list-square-bracket",
|
|
query: `SELECT * from s3object s WHERE [7,8.5,9] IN s.nested`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "indexed-list-square-bracket",
|
|
query: `SELECT * from s3object s WHERE id IN [3,2]`,
|
|
wantResult: `{"id":2,"title":"Second Record","desc":"another text","numbers":[2,3,4]}
|
|
{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "index-wildcard-in",
|
|
query: `SELECT * from s3object s WHERE (8.5) IN s.nested[1][*]`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "index-wildcard-in",
|
|
query: `SELECT * from s3object s WHERE (8.0+0.5) IN s.nested[1][*]`,
|
|
wantResult: `{"id":3,"title":"Second Record","desc":"another text","nested":[[2,3,4],[7,8.5,9]]}`,
|
|
},
|
|
{
|
|
name: "compare-mixed",
|
|
query: `SELECT id from s3object s WHERE value = true`,
|
|
wantResult: `{"id":1}`,
|
|
withJSON: `{"id":0, "value": false}
|
|
{"id":1, "value": true}
|
|
{"id":2, "value": 42}
|
|
{"id":3, "value": "true"}
|
|
`,
|
|
},
|
|
{
|
|
name: "compare-mixed-not",
|
|
query: `SELECT COUNT(id) as n from s3object s WHERE value != true`,
|
|
wantResult: `{"n":3}`,
|
|
withJSON: `{"id":0, "value": false}
|
|
{"id":1, "value": true}
|
|
{"id":2, "value": 42}
|
|
{"id":3, "value": "true"}
|
|
`,
|
|
},
|
|
{
|
|
name: "index-wildcard-in",
|
|
query: `SELECT * from s3object s WHERE title = 'Test Record'`,
|
|
wantResult: `{"id":0,"title":"Test Record","desc":"Some text","synonyms":["foo","bar","whatever"]}`,
|
|
},
|
|
{
|
|
name: "select-output-field-as-csv",
|
|
requestXML: []byte(`<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT s.synonyms from s3object s WHERE 'whatever' IN s.synonyms</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<JSON>
|
|
<Type>DOCUMENT</Type>
|
|
</JSON>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
<QuoteCharacter>"</QuoteCharacter>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>`),
|
|
wantResult: `"[""foo"",""bar"",""whatever""]"`,
|
|
},
|
|
{
|
|
name: "document",
|
|
query: "",
|
|
requestXML: []byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>select * from s3object[*].elements[*] s where s.element_type = '__elem__merfu'</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<JSON>
|
|
<Type>DOCUMENT</Type>
|
|
</JSON>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<JSON>
|
|
</JSON>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>`),
|
|
withJSON: `
|
|
{
|
|
"name": "small_pdf1.pdf",
|
|
"lume_id": "9507193e-572d-4f95-bcf1-e9226d96be65",
|
|
"elements": [
|
|
{
|
|
"element_type": "__elem__image",
|
|
"element_id": "859d09c4-7cf1-4a37-9674-3a7de8b56abc",
|
|
"attributes": {
|
|
"__attr__image_dpi": 300,
|
|
"__attr__image_size": [
|
|
2550,
|
|
3299
|
|
],
|
|
"__attr__image_index": 1,
|
|
"__attr__image_format": "JPEG",
|
|
"__attr__file_extension": "jpg",
|
|
"__attr__data": null
|
|
}
|
|
},
|
|
{
|
|
"element_type": "__elem__merfu",
|
|
"element_id": "d868aefe-ef9a-4be2-b9b2-c9fd89cc43eb",
|
|
"attributes": {
|
|
"__attr__image_dpi": 300,
|
|
"__attr__image_size": [
|
|
2550,
|
|
3299
|
|
],
|
|
"__attr__image_index": 2,
|
|
"__attr__image_format": "JPEG",
|
|
"__attr__file_extension": "jpg",
|
|
"__attr__data": null
|
|
}
|
|
}
|
|
],
|
|
"data": "asdascasdc1234e123erdasdas"
|
|
}`,
|
|
wantResult: `{"element_type":"__elem__merfu","element_id":"d868aefe-ef9a-4be2-b9b2-c9fd89cc43eb","attributes":{"__attr__image_dpi":300,"__attr__image_size":[2550,3299],"__attr__image_index":2,"__attr__image_format":"JPEG","__attr__file_extension":"jpg","__attr__data":null}}`,
|
|
},
|
|
{
|
|
name: "date_diff_month",
|
|
query: `SELECT date_diff(MONTH, '2019-10-20T', '2020-01-20T') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":3}`,
|
|
},
|
|
{
|
|
name: "date_diff_month_neg",
|
|
query: `SELECT date_diff(MONTH, '2020-01-20T', '2019-10-20T') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":-3}`,
|
|
},
|
|
// Examples from https://docs.aws.amazon.com/AmazonS3/latest/userguide/s3-glacier-select-sql-reference-date.html#s3-glacier-select-sql-reference-date-diff
|
|
{
|
|
name: "date_diff_year",
|
|
query: `SELECT date_diff(year, '2010-01-01T', '2011-01-01T') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":1}`,
|
|
},
|
|
{
|
|
name: "date_diff_year",
|
|
query: `SELECT date_diff(month, '2010-01-01T', '2010-05T') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":4}`,
|
|
},
|
|
{
|
|
name: "date_diff_month_oney",
|
|
query: `SELECT date_diff(month, '2010T', '2011T') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":12}`,
|
|
},
|
|
{
|
|
name: "date_diff_month_neg",
|
|
query: `SELECT date_diff(month, '2011T', '2010T') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":-12}`,
|
|
},
|
|
{
|
|
name: "date_diff_days",
|
|
query: `SELECT date_diff(day, '2010-01-01T23:00:00Z', '2010-01-02T01:00:00Z') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":0}`,
|
|
},
|
|
{
|
|
name: "date_diff_days_one",
|
|
query: `SELECT date_diff(day, '2010-01-01T23:00:00Z', '2010-01-02T23:00:00Z') FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":1}`,
|
|
},
|
|
{
|
|
name: "cast_from_int_to_float",
|
|
query: `SELECT cast(1 as float) FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":1}`,
|
|
},
|
|
{
|
|
name: "cast_from_float_to_float",
|
|
query: `SELECT cast(1.0 as float) FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":1}`,
|
|
},
|
|
{
|
|
name: "arithmetic_integer_operand",
|
|
query: `SELECT 1 / 2 FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":0}`,
|
|
},
|
|
{
|
|
name: "arithmetic_float_operand",
|
|
query: `SELECT 1.0 / 2.0 * .3 FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":0.15}`,
|
|
},
|
|
{
|
|
name: "arithmetic_integer_float_operand",
|
|
query: `SELECT 3.0 / 2, 5 / 2.0 FROM S3Object LIMIT 1`,
|
|
wantResult: `{"_1":1.5,"_2":2.5}`,
|
|
},
|
|
}
|
|
|
|
defRequest := `<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>%s</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<JSON>
|
|
<Type>LINES</Type>
|
|
</JSON>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<JSON>
|
|
</JSON>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>`
|
|
|
|
for _, testCase := range testTable {
|
|
t.Run(testCase.name, func(t *testing.T) {
|
|
// Hack cpuid to the CPU doesn't appear to support AVX2.
|
|
// Restore whatever happens.
|
|
if cpuid.CPU.Supports(cpuid.AVX2) {
|
|
cpuid.CPU.Disable(cpuid.AVX2)
|
|
defer cpuid.CPU.Enable(cpuid.AVX2)
|
|
}
|
|
if simdjson.SupportedCPU() {
|
|
t.Fatal("setup error: expected cpu to be unsupported")
|
|
}
|
|
testReq := testCase.requestXML
|
|
if len(testReq) == 0 {
|
|
var escaped bytes.Buffer
|
|
xml.EscapeText(&escaped, []byte(testCase.query))
|
|
testReq = []byte(fmt.Sprintf(defRequest, escaped.String()))
|
|
}
|
|
s3Select, err := NewS3Select(bytes.NewReader(testReq))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) {
|
|
in := input
|
|
if len(testCase.withJSON) > 0 {
|
|
in = testCase.withJSON
|
|
}
|
|
return ioutil.NopCloser(bytes.NewBufferString(in)), nil
|
|
}); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
gotS := strings.TrimSpace(string(got))
|
|
if !reflect.DeepEqual(gotS, testCase.wantResult) {
|
|
t.Errorf("received response does not match with expected reply. Query: %s\ngot: %s\nwant:%s", testCase.query, gotS, testCase.wantResult)
|
|
}
|
|
})
|
|
t.Run("simd-"+testCase.name, func(t *testing.T) {
|
|
if !simdjson.SupportedCPU() {
|
|
t.Skip("No CPU support")
|
|
}
|
|
testReq := testCase.requestXML
|
|
if len(testReq) == 0 {
|
|
var escaped bytes.Buffer
|
|
xml.EscapeText(&escaped, []byte(testCase.query))
|
|
testReq = []byte(fmt.Sprintf(defRequest, escaped.String()))
|
|
}
|
|
s3Select, err := NewS3Select(bytes.NewReader(testReq))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) {
|
|
in := input
|
|
if len(testCase.withJSON) > 0 {
|
|
in = testCase.withJSON
|
|
}
|
|
return ioutil.NopCloser(bytes.NewBufferString(in)), nil
|
|
}); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
gotS := strings.TrimSpace(string(got))
|
|
if !reflect.DeepEqual(gotS, testCase.wantResult) {
|
|
t.Errorf("received response does not match with expected reply. Query: %s\ngot: %s\nwant:%s", testCase.query, gotS, testCase.wantResult)
|
|
}
|
|
})
|
|
}
|
|
}
|
|
|
|
func TestCSVQueries(t *testing.T) {
|
|
input := `index,ID,CaseNumber,Date,Day,Month,Year,Block,IUCR,PrimaryType,Description,LocationDescription,Arrest,Domestic,Beat,District,Ward,CommunityArea,FBI Code,XCoordinate,YCoordinate,UpdatedOn,Latitude,Longitude,Location
|
|
2700763,7732229,,2010-05-26 00:00:00,26,May,2010,113XX S HALSTED ST,1150,,CREDIT CARD FRAUD,,False,False,2233,22.0,34.0,,11,,,,41.688043288,-87.6422444,"(41.688043288, -87.6422444)"`
|
|
|
|
var testTable = []struct {
|
|
name string
|
|
query string
|
|
requestXML []byte
|
|
wantResult string
|
|
}{
|
|
{
|
|
name: "select-in-text-simple",
|
|
query: `SELECT index FROM s3Object s WHERE "Month"='May'`,
|
|
wantResult: `2700763`,
|
|
},
|
|
}
|
|
|
|
defRequest := `<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>%s</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<CSV>
|
|
<FieldDelimiter>,</FieldDelimiter>
|
|
<FileHeaderInfo>USE</FileHeaderInfo>
|
|
<QuoteCharacter>"</QuoteCharacter>
|
|
<QuoteEscapeCharacter>"</QuoteEscapeCharacter>
|
|
<RecordDelimiter>\n</RecordDelimiter>
|
|
</CSV>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>`
|
|
|
|
for _, testCase := range testTable {
|
|
t.Run(testCase.name, func(t *testing.T) {
|
|
testReq := testCase.requestXML
|
|
if len(testReq) == 0 {
|
|
testReq = []byte(fmt.Sprintf(defRequest, testCase.query))
|
|
}
|
|
s3Select, err := NewS3Select(bytes.NewReader(testReq))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) {
|
|
return ioutil.NopCloser(bytes.NewBufferString(input)), nil
|
|
}); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
gotS := strings.TrimSpace(string(got))
|
|
if !reflect.DeepEqual(gotS, testCase.wantResult) {
|
|
t.Errorf("received response does not match with expected reply. Query: %s\ngot: %s\nwant:%s", testCase.query, gotS, testCase.wantResult)
|
|
}
|
|
})
|
|
}
|
|
}
|
|
|
|
func TestCSVQueries2(t *testing.T) {
|
|
input := `id,time,num,num2,text
|
|
1,2010-01-01T,7867786,4565.908123,"a text, with comma"
|
|
2,2017-01-02T03:04Z,-5, 0.765111,
|
|
`
|
|
var testTable = []struct {
|
|
name string
|
|
query string
|
|
requestXML []byte // override request XML
|
|
wantResult string
|
|
}{
|
|
{
|
|
name: "select-all",
|
|
query: `SELECT * from s3object AS s WHERE id = '1'`,
|
|
wantResult: `{"id":"1","time":"2010-01-01T","num":"7867786","num2":"4565.908123","text":"a text, with comma"}`,
|
|
},
|
|
{
|
|
name: "select-all-2",
|
|
query: `SELECT * from s3object s WHERE id = 2`,
|
|
wantResult: `{"id":"2","time":"2017-01-02T03:04Z","num":"-5","num2":" 0.765111","text":""}`,
|
|
},
|
|
{
|
|
name: "select-text-convert",
|
|
query: `SELECT CAST(text AS STRING) AS text from s3object s WHERE id = 1`,
|
|
wantResult: `{"text":"a text, with comma"}`,
|
|
},
|
|
{
|
|
name: "select-text-direct",
|
|
query: `SELECT text from s3object s WHERE id = 1`,
|
|
wantResult: `{"text":"a text, with comma"}`,
|
|
},
|
|
{
|
|
name: "select-time-direct",
|
|
query: `SELECT time from s3object s WHERE id = 2`,
|
|
wantResult: `{"time":"2017-01-02T03:04Z"}`,
|
|
},
|
|
{
|
|
name: "select-int-direct",
|
|
query: `SELECT num from s3object s WHERE id = 2`,
|
|
wantResult: `{"num":"-5"}`,
|
|
},
|
|
{
|
|
name: "select-float-direct",
|
|
query: `SELECT num2 from s3object s WHERE id = 2`,
|
|
wantResult: `{"num2":" 0.765111"}`,
|
|
},
|
|
{
|
|
name: "select-in-array",
|
|
query: `select id from S3Object s WHERE id in [1,3]`,
|
|
wantResult: `{"id":"1"}`,
|
|
},
|
|
{
|
|
name: "select-in-array-matchnone",
|
|
query: `select id from S3Object s WHERE s.id in [4,3]`,
|
|
wantResult: ``,
|
|
},
|
|
{
|
|
name: "select-float-by-val",
|
|
query: `SELECT num2 from s3object s WHERE num2 = 0.765111`,
|
|
wantResult: `{"num2":" 0.765111"}`,
|
|
},
|
|
}
|
|
|
|
defRequest := `<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>%s</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<CSV>
|
|
<FileHeaderInfo>USE</FileHeaderInfo>
|
|
<QuoteCharacter>"</QuoteCharacter>
|
|
</CSV>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<JSON>
|
|
</JSON>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>`
|
|
|
|
for _, testCase := range testTable {
|
|
t.Run(testCase.name, func(t *testing.T) {
|
|
testReq := testCase.requestXML
|
|
if len(testReq) == 0 {
|
|
testReq = []byte(fmt.Sprintf(defRequest, testCase.query))
|
|
}
|
|
s3Select, err := NewS3Select(bytes.NewReader(testReq))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) {
|
|
return ioutil.NopCloser(bytes.NewBufferString(input)), nil
|
|
}); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
gotS := strings.TrimSpace(string(got))
|
|
if !reflect.DeepEqual(gotS, testCase.wantResult) {
|
|
t.Errorf("received response does not match with expected reply. Query: %s\ngot: %s\nwant:%s", testCase.query, gotS, testCase.wantResult)
|
|
}
|
|
})
|
|
}
|
|
}
|
|
|
|
func TestCSVInput(t *testing.T) {
|
|
var testTable = []struct {
|
|
requestXML []byte
|
|
expectedResult []byte
|
|
}{
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT one, two, three from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<CSV>
|
|
<FileHeaderInfo>USE</FileHeaderInfo>
|
|
</CSV>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{
|
|
0, 0, 0, 137, 0, 0, 0, 85, 194, 213, 168, 241, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 24, 97, 112, 112, 108, 105, 99, 97, 116, 105, 111, 110, 47, 111, 99, 116, 101, 116, 45, 115, 116, 114, 101, 97, 109, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 7, 82, 101, 99, 111, 114, 100, 115, 45, 49, 44, 102, 111, 111, 44, 116, 114, 117, 101, 10, 44, 98, 97, 114, 44, 102, 97, 108, 115, 101, 10, 50, 46, 53, 44, 98, 97, 122, 44, 116, 114, 117, 101, 10, 75, 182, 193, 80, 0, 0, 0, 235, 0, 0, 0, 67, 213, 243, 57, 141, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 8, 116, 101, 120, 116, 47, 120, 109, 108, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 5, 83, 116, 97, 116, 115, 60, 63, 120, 109, 108, 32, 118, 101, 114, 115, 105, 111, 110, 61, 34, 49, 46, 48, 34, 32, 101, 110, 99, 111, 100, 105, 110, 103, 61, 34, 85, 84, 70, 45, 56, 34, 63, 62, 60, 83, 116, 97, 116, 115, 62, 60, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 53, 48, 60, 47, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 60, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 53, 48, 60, 47, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 60, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 51, 54, 60, 47, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 60, 47, 83, 116, 97, 116, 115, 62, 253, 105, 8, 216, 0, 0, 0, 56, 0, 0, 0, 40, 193, 198, 132, 212, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 3, 69, 110, 100, 207, 151, 211, 146,
|
|
},
|
|
},
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT COUNT(*) AS total_record_count from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<CSV>
|
|
<FileHeaderInfo>USE</FileHeaderInfo>
|
|
</CSV>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<JSON>
|
|
</JSON>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{
|
|
0, 0, 0, 126, 0, 0, 0, 85, 56, 193, 36, 188, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 24, 97, 112, 112, 108, 105, 99, 97, 116, 105, 111, 110, 47, 111, 99, 116, 101, 116, 45, 115, 116, 114, 101, 97, 109, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 7, 82, 101, 99, 111, 114, 100, 115, 123, 34, 116, 111, 116, 97, 108, 95, 114, 101, 99, 111, 114, 100, 95, 99, 111, 117, 110, 116, 34, 58, 51, 125, 10, 196, 183, 134, 242, 0, 0, 0, 235, 0, 0, 0, 67, 213, 243, 57, 141, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 8, 116, 101, 120, 116, 47, 120, 109, 108, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 5, 83, 116, 97, 116, 115, 60, 63, 120, 109, 108, 32, 118, 101, 114, 115, 105, 111, 110, 61, 34, 49, 46, 48, 34, 32, 101, 110, 99, 111, 100, 105, 110, 103, 61, 34, 85, 84, 70, 45, 56, 34, 63, 62, 60, 83, 116, 97, 116, 115, 62, 60, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 53, 48, 60, 47, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 60, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 53, 48, 60, 47, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 60, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 50, 53, 60, 47, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 60, 47, 83, 116, 97, 116, 115, 62, 47, 153, 24, 28, 0, 0, 0, 56, 0, 0, 0, 40, 193, 198, 132, 212, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 3, 69, 110, 100, 207, 151, 211, 146,
|
|
},
|
|
},
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT * from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<CSV>
|
|
<FileHeaderInfo>USE</FileHeaderInfo>
|
|
</CSV>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<JSON>
|
|
</JSON>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{0x0, 0x0, 0x0, 0xdd, 0x0, 0x0, 0x0, 0x55, 0xf, 0x46, 0xc1, 0xfa, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xd, 0x3a, 0x63, 0x6f, 0x6e, 0x74, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x18, 0x61, 0x70, 0x70, 0x6c, 0x69, 0x63, 0x61, 0x74, 0x69, 0x6f, 0x6e, 0x2f, 0x6f, 0x63, 0x74, 0x65, 0x74, 0x2d, 0x73, 0x74, 0x72, 0x65, 0x61, 0x6d, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x7, 0x52, 0x65, 0x63, 0x6f, 0x72, 0x64, 0x73, 0x7b, 0x22, 0x6f, 0x6e, 0x65, 0x22, 0x3a, 0x22, 0x2d, 0x31, 0x22, 0x2c, 0x22, 0x74, 0x77, 0x6f, 0x22, 0x3a, 0x22, 0x66, 0x6f, 0x6f, 0x22, 0x2c, 0x22, 0x74, 0x68, 0x72, 0x65, 0x65, 0x22, 0x3a, 0x22, 0x74, 0x72, 0x75, 0x65, 0x22, 0x7d, 0xa, 0x7b, 0x22, 0x6f, 0x6e, 0x65, 0x22, 0x3a, 0x22, 0x22, 0x2c, 0x22, 0x74, 0x77, 0x6f, 0x22, 0x3a, 0x22, 0x62, 0x61, 0x72, 0x22, 0x2c, 0x22, 0x74, 0x68, 0x72, 0x65, 0x65, 0x22, 0x3a, 0x22, 0x66, 0x61, 0x6c, 0x73, 0x65, 0x22, 0x7d, 0xa, 0x7b, 0x22, 0x6f, 0x6e, 0x65, 0x22, 0x3a, 0x22, 0x32, 0x2e, 0x35, 0x22, 0x2c, 0x22, 0x74, 0x77, 0x6f, 0x22, 0x3a, 0x22, 0x62, 0x61, 0x7a, 0x22, 0x2c, 0x22, 0x74, 0x68, 0x72, 0x65, 0x65, 0x22, 0x3a, 0x22, 0x74, 0x72, 0x75, 0x65, 0x22, 0x7d, 0xa, 0x7e, 0xb5, 0x99, 0xfb, 0x0, 0x0, 0x0, 0xec, 0x0, 0x0, 0x0, 0x43, 0x67, 0xd3, 0xe5, 0x9d, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xd, 0x3a, 0x63, 0x6f, 0x6e, 0x74, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x8, 0x74, 0x65, 0x78, 0x74, 0x2f, 0x78, 0x6d, 0x6c, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3c, 0x3f, 0x78, 0x6d, 0x6c, 0x20, 0x76, 0x65, 0x72, 0x73, 0x69, 0x6f, 0x6e, 0x3d, 0x22, 0x31, 0x2e, 0x30, 0x22, 0x20, 0x65, 0x6e, 0x63, 0x6f, 0x64, 0x69, 0x6e, 0x67, 0x3d, 0x22, 0x55, 0x54, 0x46, 0x2d, 0x38, 0x22, 0x3f, 0x3e, 0x3c, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x53, 0x63, 0x61, 0x6e, 0x6e, 0x65, 0x64, 0x3e, 0x35, 0x30, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x53, 0x63, 0x61, 0x6e, 0x6e, 0x65, 0x64, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x50, 0x72, 0x6f, 0x63, 0x65, 0x73, 0x73, 0x65, 0x64, 0x3e, 0x35, 0x30, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x50, 0x72, 0x6f, 0x63, 0x65, 0x73, 0x73, 0x65, 0x64, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x52, 0x65, 0x74, 0x75, 0x72, 0x6e, 0x65, 0x64, 0x3e, 0x31, 0x32, 0x30, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x52, 0x65, 0x74, 0x75, 0x72, 0x6e, 0x65, 0x64, 0x3e, 0x3c, 0x2f, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3e, 0x5a, 0xe5, 0xd, 0x84, 0x0, 0x0, 0x0, 0x38, 0x0, 0x0, 0x0, 0x28, 0xc1, 0xc6, 0x84, 0xd4, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x3, 0x45, 0x6e, 0x64, 0xcf, 0x97, 0xd3, 0x92},
|
|
},
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT one from S3Object limit 1</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<CSV>
|
|
<FileHeaderInfo>USE</FileHeaderInfo>
|
|
</CSV>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{
|
|
0x0, 0x0, 0x0, 0x68, 0x0, 0x0, 0x0, 0x55, 0xd7, 0x61, 0x46, 0x9e, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xd, 0x3a, 0x63, 0x6f, 0x6e, 0x74, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x18, 0x61, 0x70, 0x70, 0x6c, 0x69, 0x63, 0x61, 0x74, 0x69, 0x6f, 0x6e, 0x2f, 0x6f, 0x63, 0x74, 0x65, 0x74, 0x2d, 0x73, 0x74, 0x72, 0x65, 0x61, 0x6d, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x7, 0x52, 0x65, 0x63, 0x6f, 0x72, 0x64, 0x73, 0x2d, 0x31, 0xa, 0x17, 0xfb, 0x1, 0x90, 0x0, 0x0, 0x0, 0xea, 0x0, 0x0, 0x0, 0x43, 0xe8, 0x93, 0x10, 0x3d, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xd, 0x3a, 0x63, 0x6f, 0x6e, 0x74, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x8, 0x74, 0x65, 0x78, 0x74, 0x2f, 0x78, 0x6d, 0x6c, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3c, 0x3f, 0x78, 0x6d, 0x6c, 0x20, 0x76, 0x65, 0x72, 0x73, 0x69, 0x6f, 0x6e, 0x3d, 0x22, 0x31, 0x2e, 0x30, 0x22, 0x20, 0x65, 0x6e, 0x63, 0x6f, 0x64, 0x69, 0x6e, 0x67, 0x3d, 0x22, 0x55, 0x54, 0x46, 0x2d, 0x38, 0x22, 0x3f, 0x3e, 0x3c, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x53, 0x63, 0x61, 0x6e, 0x6e, 0x65, 0x64, 0x3e, 0x35, 0x30, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x53, 0x63, 0x61, 0x6e, 0x6e, 0x65, 0x64, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x50, 0x72, 0x6f, 0x63, 0x65, 0x73, 0x73, 0x65, 0x64, 0x3e, 0x35, 0x30, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x50, 0x72, 0x6f, 0x63, 0x65, 0x73, 0x73, 0x65, 0x64, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x52, 0x65, 0x74, 0x75, 0x72, 0x6e, 0x65, 0x64, 0x3e, 0x33, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x52, 0x65, 0x74, 0x75, 0x72, 0x6e, 0x65, 0x64, 0x3e, 0x3c, 0x2f, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3e, 0x15, 0x72, 0x19, 0x94, 0x0, 0x0, 0x0, 0x38, 0x0, 0x0, 0x0, 0x28, 0xc1, 0xc6, 0x84, 0xd4, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x3, 0x45, 0x6e, 0x64, 0xcf, 0x97, 0xd3, 0x92,
|
|
},
|
|
},
|
|
}
|
|
|
|
var csvData = []byte(`one,two,three
|
|
-1,foo,true
|
|
,bar,false
|
|
2.5,baz,true
|
|
`)
|
|
|
|
for i, testCase := range testTable {
|
|
t.Run(fmt.Sprint(i), func(t *testing.T) {
|
|
s3Select, err := NewS3Select(bytes.NewReader(testCase.requestXML))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) {
|
|
return ioutil.NopCloser(bytes.NewReader(csvData)), nil
|
|
}); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
|
|
if !reflect.DeepEqual(w.response, testCase.expectedResult) {
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
|
|
t.Errorf("received response does not match with expected reply\ngot: %#v\nwant:%#v\ndecoded:%s", w.response, testCase.expectedResult, string(got))
|
|
}
|
|
})
|
|
}
|
|
|
|
}
|
|
|
|
func TestJSONInput(t *testing.T) {
|
|
|
|
var testTable = []struct {
|
|
requestXML []byte
|
|
expectedResult []byte
|
|
}{
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT one, two, three from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<JSON>
|
|
<Type>DOCUMENT</Type>
|
|
</JSON>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{
|
|
0, 0, 0, 137, 0, 0, 0, 85, 194, 213, 168, 241, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 24, 97, 112, 112, 108, 105, 99, 97, 116, 105, 111, 110, 47, 111, 99, 116, 101, 116, 45, 115, 116, 114, 101, 97, 109, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 7, 82, 101, 99, 111, 114, 100, 115, 45, 49, 44, 102, 111, 111, 44, 116, 114, 117, 101, 10, 44, 98, 97, 114, 44, 102, 97, 108, 115, 101, 10, 50, 46, 53, 44, 98, 97, 122, 44, 116, 114, 117, 101, 10, 75, 182, 193, 80, 0, 0, 0, 237, 0, 0, 0, 67, 90, 179, 204, 45, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 8, 116, 101, 120, 116, 47, 120, 109, 108, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 5, 83, 116, 97, 116, 115, 60, 63, 120, 109, 108, 32, 118, 101, 114, 115, 105, 111, 110, 61, 34, 49, 46, 48, 34, 32, 101, 110, 99, 111, 100, 105, 110, 103, 61, 34, 85, 84, 70, 45, 56, 34, 63, 62, 60, 83, 116, 97, 116, 115, 62, 60, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 49, 49, 50, 60, 47, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 60, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 49, 49, 50, 60, 47, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 60, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 51, 54, 60, 47, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 60, 47, 83, 116, 97, 116, 115, 62, 181, 40, 50, 250, 0, 0, 0, 56, 0, 0, 0, 40, 193, 198, 132, 212, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 3, 69, 110, 100, 207, 151, 211, 146,
|
|
},
|
|
},
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT COUNT(*) AS total_record_count from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<JSON>
|
|
<Type>DOCUMENT</Type>
|
|
</JSON>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{
|
|
0, 0, 0, 103, 0, 0, 0, 85, 85, 49, 209, 79, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 24, 97, 112, 112, 108, 105, 99, 97, 116, 105, 111, 110, 47, 111, 99, 116, 101, 116, 45, 115, 116, 114, 101, 97, 109, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 7, 82, 101, 99, 111, 114, 100, 115, 51, 10, 175, 58, 213, 152, 0, 0, 0, 236, 0, 0, 0, 67, 103, 211, 229, 157, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 8, 116, 101, 120, 116, 47, 120, 109, 108, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 5, 83, 116, 97, 116, 115, 60, 63, 120, 109, 108, 32, 118, 101, 114, 115, 105, 111, 110, 61, 34, 49, 46, 48, 34, 32, 101, 110, 99, 111, 100, 105, 110, 103, 61, 34, 85, 84, 70, 45, 56, 34, 63, 62, 60, 83, 116, 97, 116, 115, 62, 60, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 49, 49, 50, 60, 47, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 60, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 49, 49, 50, 60, 47, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 60, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 50, 60, 47, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 60, 47, 83, 116, 97, 116, 115, 62, 52, 192, 77, 114, 0, 0, 0, 56, 0, 0, 0, 40, 193, 198, 132, 212, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 3, 69, 110, 100, 207, 151, 211, 146,
|
|
},
|
|
},
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT * from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<JSON>
|
|
<Type>DOCUMENT</Type>
|
|
</JSON>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{0x0, 0x0, 0x0, 0x89, 0x0, 0x0, 0x0, 0x55, 0xc2, 0xd5, 0xa8, 0xf1, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xd, 0x3a, 0x63, 0x6f, 0x6e, 0x74, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x18, 0x61, 0x70, 0x70, 0x6c, 0x69, 0x63, 0x61, 0x74, 0x69, 0x6f, 0x6e, 0x2f, 0x6f, 0x63, 0x74, 0x65, 0x74, 0x2d, 0x73, 0x74, 0x72, 0x65, 0x61, 0x6d, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x7, 0x52, 0x65, 0x63, 0x6f, 0x72, 0x64, 0x73, 0x74, 0x72, 0x75, 0x65, 0x2c, 0x66, 0x6f, 0x6f, 0x2c, 0x2d, 0x31, 0xa, 0x66, 0x61, 0x6c, 0x73, 0x65, 0x2c, 0x62, 0x61, 0x72, 0x2c, 0xa, 0x74, 0x72, 0x75, 0x65, 0x2c, 0x62, 0x61, 0x7a, 0x2c, 0x32, 0x2e, 0x35, 0xa, 0xef, 0x22, 0x13, 0xa3, 0x0, 0x0, 0x0, 0xed, 0x0, 0x0, 0x0, 0x43, 0x5a, 0xb3, 0xcc, 0x2d, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xd, 0x3a, 0x63, 0x6f, 0x6e, 0x74, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x8, 0x74, 0x65, 0x78, 0x74, 0x2f, 0x78, 0x6d, 0x6c, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3c, 0x3f, 0x78, 0x6d, 0x6c, 0x20, 0x76, 0x65, 0x72, 0x73, 0x69, 0x6f, 0x6e, 0x3d, 0x22, 0x31, 0x2e, 0x30, 0x22, 0x20, 0x65, 0x6e, 0x63, 0x6f, 0x64, 0x69, 0x6e, 0x67, 0x3d, 0x22, 0x55, 0x54, 0x46, 0x2d, 0x38, 0x22, 0x3f, 0x3e, 0x3c, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x53, 0x63, 0x61, 0x6e, 0x6e, 0x65, 0x64, 0x3e, 0x31, 0x31, 0x32, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x53, 0x63, 0x61, 0x6e, 0x6e, 0x65, 0x64, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x50, 0x72, 0x6f, 0x63, 0x65, 0x73, 0x73, 0x65, 0x64, 0x3e, 0x31, 0x31, 0x32, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x50, 0x72, 0x6f, 0x63, 0x65, 0x73, 0x73, 0x65, 0x64, 0x3e, 0x3c, 0x42, 0x79, 0x74, 0x65, 0x73, 0x52, 0x65, 0x74, 0x75, 0x72, 0x6e, 0x65, 0x64, 0x3e, 0x33, 0x36, 0x3c, 0x2f, 0x42, 0x79, 0x74, 0x65, 0x73, 0x52, 0x65, 0x74, 0x75, 0x72, 0x6e, 0x65, 0x64, 0x3e, 0x3c, 0x2f, 0x53, 0x74, 0x61, 0x74, 0x73, 0x3e, 0xb5, 0x28, 0x32, 0xfa, 0x0, 0x0, 0x0, 0x38, 0x0, 0x0, 0x0, 0x28, 0xc1, 0xc6, 0x84, 0xd4, 0xd, 0x3a, 0x6d, 0x65, 0x73, 0x73, 0x61, 0x67, 0x65, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x5, 0x65, 0x76, 0x65, 0x6e, 0x74, 0xb, 0x3a, 0x65, 0x76, 0x65, 0x6e, 0x74, 0x2d, 0x74, 0x79, 0x70, 0x65, 0x7, 0x0, 0x3, 0x45, 0x6e, 0x64, 0xcf, 0x97, 0xd3, 0x92},
|
|
},
|
|
}
|
|
|
|
var jsonData = []byte(`{"three":true,"two":"foo","one":-1}
|
|
{"three":false,"two":"bar","one":null}
|
|
{"three":true,"two":"baz","one":2.5}
|
|
`)
|
|
|
|
for i, testCase := range testTable {
|
|
t.Run(fmt.Sprint(i), func(t *testing.T) {
|
|
s3Select, err := NewS3Select(bytes.NewReader(testCase.requestXML))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) {
|
|
return ioutil.NopCloser(bytes.NewReader(jsonData)), nil
|
|
}); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
|
|
if !reflect.DeepEqual(w.response, testCase.expectedResult) {
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
|
|
t.Errorf("received response does not match with expected reply\ngot: %#v\nwant:%#v\ndecoded:%s", w.response, testCase.expectedResult, string(got))
|
|
}
|
|
})
|
|
}
|
|
}
|
|
|
|
func TestParquetInput(t *testing.T) {
|
|
os.Setenv("MINIO_API_SELECT_PARQUET", "on")
|
|
defer os.Setenv("MINIO_API_SELECT_PARQUET", "off")
|
|
|
|
var testTable = []struct {
|
|
requestXML []byte
|
|
expectedResult []byte
|
|
}{
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT one, two, three from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<Parquet>
|
|
</Parquet>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{
|
|
0, 0, 0, 137, 0, 0, 0, 85, 194, 213, 168, 241, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 24, 97, 112, 112, 108, 105, 99, 97, 116, 105, 111, 110, 47, 111, 99, 116, 101, 116, 45, 115, 116, 114, 101, 97, 109, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 7, 82, 101, 99, 111, 114, 100, 115, 45, 49, 44, 102, 111, 111, 44, 116, 114, 117, 101, 10, 44, 98, 97, 114, 44, 102, 97, 108, 115, 101, 10, 50, 46, 53, 44, 98, 97, 122, 44, 116, 114, 117, 101, 10, 75, 182, 193, 80, 0, 0, 0, 235, 0, 0, 0, 67, 213, 243, 57, 141, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 8, 116, 101, 120, 116, 47, 120, 109, 108, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 5, 83, 116, 97, 116, 115, 60, 63, 120, 109, 108, 32, 118, 101, 114, 115, 105, 111, 110, 61, 34, 49, 46, 48, 34, 32, 101, 110, 99, 111, 100, 105, 110, 103, 61, 34, 85, 84, 70, 45, 56, 34, 63, 62, 60, 83, 116, 97, 116, 115, 62, 60, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 45, 49, 60, 47, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 60, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 45, 49, 60, 47, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 60, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 51, 54, 60, 47, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 60, 47, 83, 116, 97, 116, 115, 62, 128, 96, 253, 66, 0, 0, 0, 56, 0, 0, 0, 40, 193, 198, 132, 212, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 3, 69, 110, 100, 207, 151, 211, 146,
|
|
},
|
|
},
|
|
{
|
|
[]byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT COUNT(*) AS total_record_count from S3Object</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<Parquet>
|
|
</Parquet>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV>
|
|
</CSV>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), []byte{
|
|
0, 0, 0, 103, 0, 0, 0, 85, 85, 49, 209, 79, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 24, 97, 112, 112, 108, 105, 99, 97, 116, 105, 111, 110, 47, 111, 99, 116, 101, 116, 45, 115, 116, 114, 101, 97, 109, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 7, 82, 101, 99, 111, 114, 100, 115, 51, 10, 175, 58, 213, 152, 0, 0, 0, 234, 0, 0, 0, 67, 232, 147, 16, 61, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 13, 58, 99, 111, 110, 116, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 8, 116, 101, 120, 116, 47, 120, 109, 108, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 5, 83, 116, 97, 116, 115, 60, 63, 120, 109, 108, 32, 118, 101, 114, 115, 105, 111, 110, 61, 34, 49, 46, 48, 34, 32, 101, 110, 99, 111, 100, 105, 110, 103, 61, 34, 85, 84, 70, 45, 56, 34, 63, 62, 60, 83, 116, 97, 116, 115, 62, 60, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 45, 49, 60, 47, 66, 121, 116, 101, 115, 83, 99, 97, 110, 110, 101, 100, 62, 60, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 45, 49, 60, 47, 66, 121, 116, 101, 115, 80, 114, 111, 99, 101, 115, 115, 101, 100, 62, 60, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 50, 60, 47, 66, 121, 116, 101, 115, 82, 101, 116, 117, 114, 110, 101, 100, 62, 60, 47, 83, 116, 97, 116, 115, 62, 190, 146, 162, 21, 0, 0, 0, 56, 0, 0, 0, 40, 193, 198, 132, 212, 13, 58, 109, 101, 115, 115, 97, 103, 101, 45, 116, 121, 112, 101, 7, 0, 5, 101, 118, 101, 110, 116, 11, 58, 101, 118, 101, 110, 116, 45, 116, 121, 112, 101, 7, 0, 3, 69, 110, 100, 207, 151, 211, 146,
|
|
},
|
|
},
|
|
}
|
|
|
|
for i, testCase := range testTable {
|
|
t.Run(fmt.Sprint(i), func(t *testing.T) {
|
|
getReader := func(offset int64, length int64) (io.ReadCloser, error) {
|
|
testdataFile := "testdata/testdata.parquet"
|
|
file, err := os.Open(testdataFile)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
fi, err := file.Stat()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if offset < 0 {
|
|
offset = fi.Size() + offset
|
|
}
|
|
|
|
if _, err = file.Seek(offset, io.SeekStart); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return file, nil
|
|
}
|
|
|
|
s3Select, err := NewS3Select(bytes.NewReader(testCase.requestXML))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(getReader); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
|
|
if !reflect.DeepEqual(w.response, testCase.expectedResult) {
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
|
|
t.Errorf("received response does not match with expected reply\ngot: %#v\nwant:%#v\ndecoded:%s", w.response, testCase.expectedResult, string(got))
|
|
}
|
|
})
|
|
}
|
|
}
|
|
|
|
func TestParquetInputSchema(t *testing.T) {
|
|
os.Setenv("MINIO_API_SELECT_PARQUET", "on")
|
|
defer os.Setenv("MINIO_API_SELECT_PARQUET", "off")
|
|
|
|
var testTable = []struct {
|
|
requestXML []byte
|
|
wantResult string
|
|
}{
|
|
{
|
|
requestXML: []byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT * FROM S3Object LIMIT 5</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<Parquet>
|
|
</Parquet>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<JSON>
|
|
</JSON>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), wantResult: `{"shipdate":"1996-03-13T"}
|
|
{"shipdate":"1996-04-12T"}
|
|
{"shipdate":"1996-01-29T"}
|
|
{"shipdate":"1996-04-21T"}
|
|
{"shipdate":"1996-03-30T"}`,
|
|
},
|
|
{
|
|
requestXML: []byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT DATE_ADD(day, 2, shipdate) as shipdate FROM S3Object LIMIT 5</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<Parquet>
|
|
</Parquet>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<JSON>
|
|
</JSON>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), wantResult: `{"shipdate":"1996-03-15T"}
|
|
{"shipdate":"1996-04-14T"}
|
|
{"shipdate":"1996-01-31T"}
|
|
{"shipdate":"1996-04-23T"}
|
|
{"shipdate":"1996-04T"}`,
|
|
},
|
|
}
|
|
|
|
for i, testCase := range testTable {
|
|
t.Run(fmt.Sprint(i), func(t *testing.T) {
|
|
getReader := func(offset int64, length int64) (io.ReadCloser, error) {
|
|
testdataFile := "testdata/lineitem_shipdate.parquet"
|
|
file, err := os.Open(testdataFile)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
fi, err := file.Stat()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if offset < 0 {
|
|
offset = fi.Size() + offset
|
|
}
|
|
|
|
if _, err = file.Seek(offset, io.SeekStart); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return file, nil
|
|
}
|
|
|
|
s3Select, err := NewS3Select(bytes.NewReader(testCase.requestXML))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(getReader); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
gotS := strings.TrimSpace(string(got))
|
|
if !reflect.DeepEqual(gotS, testCase.wantResult) {
|
|
t.Errorf("received response does not match with expected reply. Query: %s\ngot: %s\nwant:%s", testCase.requestXML, gotS, testCase.wantResult)
|
|
}
|
|
|
|
})
|
|
}
|
|
}
|
|
|
|
func TestParquetInputSchemaCSV(t *testing.T) {
|
|
os.Setenv("MINIO_API_SELECT_PARQUET", "on")
|
|
defer os.Setenv("MINIO_API_SELECT_PARQUET", "off")
|
|
|
|
var testTable = []struct {
|
|
requestXML []byte
|
|
wantResult string
|
|
}{
|
|
{
|
|
requestXML: []byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT * FROM S3Object LIMIT 5</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<Parquet>
|
|
</Parquet>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV/>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), wantResult: `1996-03-13T
|
|
1996-04-12T
|
|
1996-01-29T
|
|
1996-04-21T
|
|
1996-03-30T`,
|
|
},
|
|
{
|
|
requestXML: []byte(`
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
<SelectObjectContentRequest>
|
|
<Expression>SELECT DATE_ADD(day, 2, shipdate) as shipdate FROM S3Object LIMIT 5</Expression>
|
|
<ExpressionType>SQL</ExpressionType>
|
|
<InputSerialization>
|
|
<CompressionType>NONE</CompressionType>
|
|
<Parquet>
|
|
</Parquet>
|
|
</InputSerialization>
|
|
<OutputSerialization>
|
|
<CSV/>
|
|
</OutputSerialization>
|
|
<RequestProgress>
|
|
<Enabled>FALSE</Enabled>
|
|
</RequestProgress>
|
|
</SelectObjectContentRequest>
|
|
`), wantResult: `1996-03-15T
|
|
1996-04-14T
|
|
1996-01-31T
|
|
1996-04-23T
|
|
1996-04T`,
|
|
},
|
|
}
|
|
|
|
for i, testCase := range testTable {
|
|
t.Run(fmt.Sprint(i), func(t *testing.T) {
|
|
getReader := func(offset int64, length int64) (io.ReadCloser, error) {
|
|
testdataFile := "testdata/lineitem_shipdate.parquet"
|
|
file, err := os.Open(testdataFile)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
fi, err := file.Stat()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if offset < 0 {
|
|
offset = fi.Size() + offset
|
|
}
|
|
|
|
if _, err = file.Seek(offset, io.SeekStart); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return file, nil
|
|
}
|
|
|
|
s3Select, err := NewS3Select(bytes.NewReader(testCase.requestXML))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err = s3Select.Open(getReader); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
w := &testResponseWriter{}
|
|
s3Select.Evaluate(w)
|
|
s3Select.Close()
|
|
resp := http.Response{
|
|
StatusCode: http.StatusOK,
|
|
Body: ioutil.NopCloser(bytes.NewReader(w.response)),
|
|
ContentLength: int64(len(w.response)),
|
|
}
|
|
res, err := minio.NewSelectResults(&resp, "testbucket")
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
got, err := ioutil.ReadAll(res)
|
|
if err != nil {
|
|
t.Error(err)
|
|
return
|
|
}
|
|
gotS := strings.TrimSpace(string(got))
|
|
if !reflect.DeepEqual(gotS, testCase.wantResult) {
|
|
t.Errorf("received response does not match with expected reply. Query: %s\ngot: %s\nwant:%s", testCase.requestXML, gotS, testCase.wantResult)
|
|
}
|
|
|
|
})
|
|
}
|
|
}
|