2021-04-18 15:41:13 -04:00
|
|
|
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2020-06-25 10:31:16 -04:00
|
|
|
|
|
|
|
package data
|
|
|
|
|
|
|
|
import (
|
|
|
|
"reflect"
|
|
|
|
"testing"
|
|
|
|
|
|
|
|
"github.com/minio/minio/pkg/s3select/internal/parquet-go/gen-go/parquet"
|
|
|
|
"github.com/minio/minio/pkg/s3select/internal/parquet-go/schema"
|
|
|
|
)
|
|
|
|
|
|
|
|
var (
|
|
|
|
v10 = int32(10)
|
|
|
|
v20 = int32(20)
|
|
|
|
v30 = int32(30)
|
|
|
|
ten = []byte("ten")
|
|
|
|
foo = []byte("foo")
|
|
|
|
bar = []byte("bar")
|
|
|
|
phone1 = []byte("1-234-567-8901")
|
|
|
|
phone2 = []byte("1-234-567-1098")
|
|
|
|
phone3 = []byte("1-111-222-3333")
|
|
|
|
)
|
|
|
|
|
|
|
|
func TestAddressBookExample(t *testing.T) {
|
|
|
|
// message AddressBook {
|
|
|
|
// required string owner;
|
|
|
|
// repeated string ownerPhoneNumbers;
|
|
|
|
// repeated group contacts {
|
|
|
|
// required string name;
|
|
|
|
// optional string phoneNumber;
|
|
|
|
// }
|
|
|
|
// }
|
|
|
|
t.Skip("Broken")
|
|
|
|
|
|
|
|
addressBook := schema.NewTree()
|
|
|
|
{
|
|
|
|
owner, err := schema.NewElement("owner", parquet.FieldRepetitionType_REQUIRED,
|
|
|
|
parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
ownerPhoneNumbers, err := schema.NewElement("ownerPhoneNumbers", parquet.FieldRepetitionType_OPTIONAL,
|
|
|
|
nil, parquet.ConvertedTypePtr(parquet.ConvertedType_LIST),
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
ownerPhoneNumbersList, err := schema.NewElement("list", parquet.FieldRepetitionType_REPEATED,
|
|
|
|
nil, nil,
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
ownerPhoneNumbersElement, err := schema.NewElement("element", parquet.FieldRepetitionType_REQUIRED,
|
|
|
|
parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
contacts, err := schema.NewElement("contacts", parquet.FieldRepetitionType_OPTIONAL,
|
|
|
|
nil, parquet.ConvertedTypePtr(parquet.ConvertedType_LIST),
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
contactsList, err := schema.NewElement("list", parquet.FieldRepetitionType_REPEATED,
|
|
|
|
nil, nil,
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
contactsElement, err := schema.NewElement("element", parquet.FieldRepetitionType_REQUIRED,
|
|
|
|
nil, nil,
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
contactName, err := schema.NewElement("name", parquet.FieldRepetitionType_REQUIRED,
|
|
|
|
parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
contactPhoneNumber, err := schema.NewElement("phoneNumber", parquet.FieldRepetitionType_OPTIONAL,
|
|
|
|
parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
|
|
|
|
nil, nil, nil)
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
if err = addressBook.Set("owner", owner); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = addressBook.Set("ownerPhoneNumbers", ownerPhoneNumbers); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
if err = addressBook.Set("ownerPhoneNumbers.list", ownerPhoneNumbersList); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
if err = addressBook.Set("ownerPhoneNumbers.list.element", ownerPhoneNumbersElement); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = addressBook.Set("contacts", contacts); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
if err = addressBook.Set("contacts.list", contactsList); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
if err = addressBook.Set("contacts.list.element", contactsElement); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
if err = addressBook.Set("contacts.list.element.name", contactName); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
if err = addressBook.Set("contacts.list.element.phoneNumber", contactPhoneNumber); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if _, _, err := addressBook.ToParquetSchema(); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
case2Data := `{
|
|
|
|
"owner": "foo"
|
|
|
|
}`
|
|
|
|
result2 := map[string]*Column{
|
|
|
|
"owner": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{foo},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"ownerPhoneNumbers.list.element": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{nil},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"contacts.list.element.name": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{nil},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
case3Data := `{
|
|
|
|
"owner": "foo",
|
|
|
|
"ownerPhoneNumbers": [
|
|
|
|
"1-234-567-8901"
|
|
|
|
]
|
|
|
|
}
|
|
|
|
`
|
|
|
|
result3 := map[string]*Column{
|
|
|
|
"owner": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{foo},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"ownerPhoneNumbers.list.element": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{phone1},
|
|
|
|
definitionLevels: []int64{2},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"contacts.list.element.name": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{nil},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
case4Data := `{
|
|
|
|
"owner": "foo",
|
|
|
|
"ownerPhoneNumbers": [
|
|
|
|
"1-234-567-8901",
|
|
|
|
"1-234-567-1098"
|
|
|
|
]
|
|
|
|
}
|
|
|
|
`
|
|
|
|
result4 := map[string]*Column{
|
|
|
|
"owner": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{foo},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"ownerPhoneNumbers.list.element": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{phone1, phone2},
|
|
|
|
definitionLevels: []int64{2, 2},
|
|
|
|
repetitionLevels: []int64{0, 1},
|
|
|
|
},
|
|
|
|
"contacts.list.element.name": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{nil},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
case5Data := `{
|
|
|
|
"contacts": [
|
|
|
|
{
|
|
|
|
"name": "bar"
|
|
|
|
}
|
|
|
|
],
|
|
|
|
"owner": "foo"
|
|
|
|
}`
|
|
|
|
result5 := map[string]*Column{
|
|
|
|
"owner": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{foo},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"ownerPhoneNumbers.list.element": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{nil},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"contacts.list.element.name": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{bar},
|
|
|
|
definitionLevels: []int64{2},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"contacts.list.element.phoneNumber": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{nil},
|
|
|
|
definitionLevels: []int64{2},
|
|
|
|
repetitionLevels: []int64{1},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
case6Data := `{
|
|
|
|
"contacts": [
|
|
|
|
{
|
|
|
|
"name": "bar",
|
|
|
|
"phoneNumber": "1-111-222-3333"
|
|
|
|
}
|
|
|
|
],
|
|
|
|
"owner": "foo"
|
|
|
|
}`
|
|
|
|
result6 := map[string]*Column{
|
|
|
|
"owner": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{foo},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"ownerPhoneNumbers.list.element": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{nil},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"contacts.list.element.name": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{bar},
|
|
|
|
definitionLevels: []int64{2},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"contacts.list.element.phoneNumber": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{phone3},
|
|
|
|
definitionLevels: []int64{3},
|
|
|
|
repetitionLevels: []int64{1},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
case7Data := `{
|
|
|
|
"contacts": [
|
|
|
|
{
|
|
|
|
"name": "bar",
|
|
|
|
"phoneNumber": "1-111-222-3333"
|
|
|
|
}
|
|
|
|
],
|
|
|
|
"owner": "foo",
|
|
|
|
"ownerPhoneNumbers": [
|
|
|
|
"1-234-567-8901",
|
|
|
|
"1-234-567-1098"
|
|
|
|
]
|
|
|
|
}`
|
|
|
|
result7 := map[string]*Column{
|
|
|
|
"owner": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{foo},
|
|
|
|
definitionLevels: []int64{0},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"ownerPhoneNumbers.list.element": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{phone1, phone2},
|
|
|
|
definitionLevels: []int64{2, 2},
|
|
|
|
repetitionLevels: []int64{0, 1},
|
|
|
|
},
|
|
|
|
"contacts.list.element.name": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{bar},
|
|
|
|
definitionLevels: []int64{2},
|
|
|
|
repetitionLevels: []int64{0},
|
|
|
|
},
|
|
|
|
"contacts.list.element.phoneNumber": {
|
|
|
|
parquetType: parquet.Type_BYTE_ARRAY,
|
|
|
|
values: []interface{}{phone3},
|
|
|
|
definitionLevels: []int64{3},
|
|
|
|
repetitionLevels: []int64{1},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
testCases := []struct {
|
|
|
|
data string
|
|
|
|
expectedResult map[string]*Column
|
|
|
|
expectErr bool
|
|
|
|
}{
|
|
|
|
{`{}`, nil, true}, // err: owner: nil value for required field
|
|
|
|
{case2Data, result2, false},
|
|
|
|
{case3Data, result3, false},
|
|
|
|
{case4Data, result4, false},
|
|
|
|
{case5Data, result5, false},
|
|
|
|
{case6Data, result6, false},
|
|
|
|
{case7Data, result7, false},
|
|
|
|
}
|
|
|
|
|
|
|
|
for i, testCase := range testCases {
|
|
|
|
result, err := UnmarshalJSON([]byte(testCase.data), addressBook)
|
|
|
|
expectErr := (err != nil)
|
|
|
|
|
|
|
|
if testCase.expectErr != expectErr {
|
|
|
|
t.Fatalf("case %v: error: expected: %v, got: %v", i+1, testCase.expectErr, expectErr)
|
|
|
|
}
|
|
|
|
|
|
|
|
if !testCase.expectErr {
|
|
|
|
if !reflect.DeepEqual(result, testCase.expectedResult) {
|
|
|
|
t.Errorf("case %v: result: expected: %v, got: %v", i+1, testCase.expectedResult, result)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|