minio/pkg/s3select/internal/parquet-go/writer_test.go

153 lines
3.7 KiB
Go

/*
* Minio Cloud Storage, (C) 2019 Minio, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package parquet
import (
"os"
"testing"
"github.com/minio/minio/pkg/s3select/internal/parquet-go/data"
"github.com/minio/minio/pkg/s3select/internal/parquet-go/gen-go/parquet"
"github.com/minio/minio/pkg/s3select/internal/parquet-go/schema"
)
// TestWriterWrite builds a three-column schema, writes one record supplied as
// pre-built data columns through a Writer backed by an on-disk file, and
// checks that neither Write nor Close reports an error. The bytes written are
// not read back or inspected.
func TestWriterWrite(t *testing.T) {
	schemaTree := schema.NewTree()
	{
		// Three REQUIRED leaf elements: an INT32 annotated as INT_16, a
		// BYTE_ARRAY annotated as UTF8, and a BOOLEAN without a converted type.
		one, err := schema.NewElement("one", parquet.FieldRepetitionType_REQUIRED,
			parquet.TypePtr(parquet.Type_INT32), parquet.ConvertedTypePtr(parquet.ConvertedType_INT_16),
			nil, nil, nil)
		if err != nil {
			t.Fatal(err)
		}

		two, err := schema.NewElement("two", parquet.FieldRepetitionType_REQUIRED,
			parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
			nil, nil, nil)
		if err != nil {
			t.Fatal(err)
		}

		three, err := schema.NewElement("three", parquet.FieldRepetitionType_REQUIRED,
			parquet.TypePtr(parquet.Type_BOOLEAN), nil, nil, nil, nil)
		if err != nil {
			t.Fatal(err)
		}

		if err := schemaTree.Set("one", one); err != nil {
			t.Fatal(err)
		}
		if err := schemaTree.Set("two", two); err != nil {
			t.Fatal(err)
		}
		if err := schemaTree.Set("three", three); err != nil {
			t.Fatal(err)
		}
	}

	file, err := os.Create("test.parquet")
	if err != nil {
		t.Fatal(err)
	}
	defer func() {
		// Best-effort cleanup so the test neither leaks the handle on a
		// t.Fatal path nor leaves test.parquet behind in the package
		// directory. Errors are deliberately ignored: the writer may already
		// have closed the file (NOTE(review): confirm against Writer.Close),
		// in which case this Close simply fails, and a failed Remove must not
		// mask the real test outcome. Close comes first because an open file
		// cannot be removed on every platform.
		_ = file.Close()
		_ = os.Remove(file.Name())
	}()

	writer, err := NewWriter(file, schemaTree, 100)
	if err != nil {
		t.Fatal(err)
	}

	// One value per column. The trailing (0, 0) arguments are presumably the
	// definition and repetition levels — TODO confirm against data.Column.
	oneColumn := data.NewColumn(parquet.Type_INT32)
	oneColumn.AddInt32(100, 0, 0)

	twoColumn := data.NewColumn(parquet.Type_BYTE_ARRAY)
	twoColumn.AddByteArray([]byte("foo"), 0, 0)

	threeColumn := data.NewColumn(parquet.Type_BOOLEAN)
	threeColumn.AddBoolean(true, 0, 0)

	// The map keys match the names registered in the schema tree above.
	record := map[string]*data.Column{
		"one":   oneColumn,
		"two":   twoColumn,
		"three": threeColumn,
	}

	if err := writer.Write(record); err != nil {
		t.Fatal(err)
	}

	if err := writer.Close(); err != nil {
		t.Fatal(err)
	}
}
// TestWriterWriteJSON builds a three-column schema, writes one record supplied
// as a JSON document through a Writer backed by an on-disk file, and checks
// that neither WriteJSON nor Close reports an error. The bytes written are not
// read back or inspected.
func TestWriterWriteJSON(t *testing.T) {
	schemaTree := schema.NewTree()
	{
		// Three REQUIRED leaf elements: an INT32 annotated as INT_16, a
		// BYTE_ARRAY annotated as UTF8, and a BOOLEAN without a converted type.
		one, err := schema.NewElement("one", parquet.FieldRepetitionType_REQUIRED,
			parquet.TypePtr(parquet.Type_INT32), parquet.ConvertedTypePtr(parquet.ConvertedType_INT_16),
			nil, nil, nil)
		if err != nil {
			t.Fatal(err)
		}

		two, err := schema.NewElement("two", parquet.FieldRepetitionType_REQUIRED,
			parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
			nil, nil, nil)
		if err != nil {
			t.Fatal(err)
		}

		three, err := schema.NewElement("three", parquet.FieldRepetitionType_REQUIRED,
			parquet.TypePtr(parquet.Type_BOOLEAN), nil, nil, nil, nil)
		if err != nil {
			t.Fatal(err)
		}

		if err := schemaTree.Set("one", one); err != nil {
			t.Fatal(err)
		}
		if err := schemaTree.Set("two", two); err != nil {
			t.Fatal(err)
		}
		if err := schemaTree.Set("three", three); err != nil {
			t.Fatal(err)
		}
	}

	file, err := os.Create("test.parquet")
	if err != nil {
		t.Fatal(err)
	}
	defer func() {
		// Best-effort cleanup so the test neither leaks the handle on a
		// t.Fatal path nor leaves test.parquet behind in the package
		// directory. Errors are deliberately ignored: the writer may already
		// have closed the file (NOTE(review): confirm against Writer.Close),
		// in which case this Close simply fails, and a failed Remove must not
		// mask the real test outcome. Close comes first because an open file
		// cannot be removed on every platform.
		_ = file.Close()
		_ = os.Remove(file.Name())
	}()

	writer, err := NewWriter(file, schemaTree, 100)
	if err != nil {
		t.Fatal(err)
	}

	// The JSON object's keys match the names registered in the schema tree.
	record := `{"one": 100, "two": "foo", "three": true}`
	if err := writer.WriteJSON([]byte(record)); err != nil {
		t.Fatal(err)
	}

	if err := writer.Close(); err != nil {
		t.Fatal(err)
	}
}