mirror of
https://github.com/minio/minio.git
synced 2024-12-26 23:25:54 -05:00
2d0f65a5e3
Since github.com/minio/parquet-go is archived add it as internal package.
153 lines
3.7 KiB
Go
153 lines
3.7 KiB
Go
/*
 * Minio Cloud Storage, (C) 2019 Minio, Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
|
|
package parquet
|
|
|
|
import (
|
|
"os"
|
|
"testing"
|
|
|
|
"github.com/minio/minio/pkg/s3select/internal/parquet-go/data"
|
|
"github.com/minio/minio/pkg/s3select/internal/parquet-go/gen-go/parquet"
|
|
"github.com/minio/minio/pkg/s3select/internal/parquet-go/schema"
|
|
)
|
|
|
|
func TestWriterWrite(t *testing.T) {
|
|
schemaTree := schema.NewTree()
|
|
{
|
|
one, err := schema.NewElement("one", parquet.FieldRepetitionType_REQUIRED,
|
|
parquet.TypePtr(parquet.Type_INT32), parquet.ConvertedTypePtr(parquet.ConvertedType_INT_16),
|
|
nil, nil, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
two, err := schema.NewElement("two", parquet.FieldRepetitionType_REQUIRED,
|
|
parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
|
|
nil, nil, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
three, err := schema.NewElement("three", parquet.FieldRepetitionType_REQUIRED,
|
|
parquet.TypePtr(parquet.Type_BOOLEAN), nil, nil, nil, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err := schemaTree.Set("one", one); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if err := schemaTree.Set("two", two); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if err := schemaTree.Set("three", three); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
file, err := os.Create("test.parquet")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
writer, err := NewWriter(file, schemaTree, 100)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
oneColumn := data.NewColumn(parquet.Type_INT32)
|
|
oneColumn.AddInt32(100, 0, 0)
|
|
|
|
twoColumn := data.NewColumn(parquet.Type_BYTE_ARRAY)
|
|
twoColumn.AddByteArray([]byte("foo"), 0, 0)
|
|
|
|
threeColumn := data.NewColumn(parquet.Type_BOOLEAN)
|
|
threeColumn.AddBoolean(true, 0, 0)
|
|
|
|
record := map[string]*data.Column{
|
|
"one": oneColumn,
|
|
"two": twoColumn,
|
|
"three": threeColumn,
|
|
}
|
|
|
|
err = writer.Write(record)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
err = writer.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestWriterWriteJSON(t *testing.T) {
|
|
schemaTree := schema.NewTree()
|
|
{
|
|
one, err := schema.NewElement("one", parquet.FieldRepetitionType_REQUIRED,
|
|
parquet.TypePtr(parquet.Type_INT32), parquet.ConvertedTypePtr(parquet.ConvertedType_INT_16),
|
|
nil, nil, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
two, err := schema.NewElement("two", parquet.FieldRepetitionType_REQUIRED,
|
|
parquet.TypePtr(parquet.Type_BYTE_ARRAY), parquet.ConvertedTypePtr(parquet.ConvertedType_UTF8),
|
|
nil, nil, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
three, err := schema.NewElement("three", parquet.FieldRepetitionType_REQUIRED,
|
|
parquet.TypePtr(parquet.Type_BOOLEAN), nil, nil, nil, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if err := schemaTree.Set("one", one); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if err := schemaTree.Set("two", two); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if err := schemaTree.Set("three", three); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
file, err := os.Create("test.parquet")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
writer, err := NewWriter(file, schemaTree, 100)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
record := `{"one": 100, "two": "foo", "three": true}`
|
|
err = writer.WriteJSON([]byte(record))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
err = writer.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|