2021-04-18 12:41:13 -07:00
|
|
|
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2019-01-09 06:23:04 +05:30
|
|
|
|
|
|
|
package csv
|
|
|
|
|
|
|
|
import (
|
2019-03-07 00:20:10 -08:00
|
|
|
"encoding/json"
|
2019-03-09 08:13:37 -08:00
|
|
|
"errors"
|
2019-01-09 06:23:04 +05:30
|
|
|
"fmt"
|
2019-08-31 15:07:40 +08:00
|
|
|
"io"
|
2019-01-09 06:23:04 +05:30
|
|
|
|
2019-03-07 00:20:10 -08:00
|
|
|
"github.com/bcicen/jstream"
|
2021-04-27 09:49:26 -07:00
|
|
|
csv "github.com/minio/csvparser"
|
2019-01-09 06:23:04 +05:30
|
|
|
"github.com/minio/minio/pkg/s3select/sql"
|
|
|
|
)
|
|
|
|
|
2019-09-13 14:18:35 -07:00
|
|
|
// Record - is a CSV record: the column names, the field values of a single
// row, and a lookup table from column name to field position.
type Record struct {
	// columnNames lists the column names; Set appends to it in step with
	// csvRecord.
	columnNames []string
	// csvRecord holds the row's field values as strings.
	csvRecord []string
	// nameIndexMap maps a column name to the position of its value in
	// csvRecord; Get resolves lookups through it.
	nameIndexMap map[string]int64
}
|
|
|
|
|
2019-01-28 17:59:48 -08:00
|
|
|
// Get - gets the value for a column name. CSV fields do not have any
|
|
|
|
// defined type (other than the default string). So this function
|
|
|
|
// always returns fields using sql.FromBytes so that the type
|
|
|
|
// specified/implied by the query can be used, or can be automatically
|
|
|
|
// converted based on the query.
|
2019-01-09 06:23:04 +05:30
|
|
|
func (r *Record) Get(name string) (*sql.Value, error) {
|
|
|
|
index, found := r.nameIndexMap[name]
|
|
|
|
if !found {
|
|
|
|
return nil, fmt.Errorf("column %v not found", name)
|
|
|
|
}
|
|
|
|
|
|
|
|
if index >= int64(len(r.csvRecord)) {
|
2019-01-28 17:59:48 -08:00
|
|
|
// No value found for column 'name', hence return null
|
|
|
|
// value
|
|
|
|
return sql.FromNull(), nil
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
|
|
|
|
2019-01-28 17:59:48 -08:00
|
|
|
return sql.FromBytes([]byte(r.csvRecord[index])), nil
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
// Set - sets the value for a column name.
|
2020-02-13 14:03:52 -08:00
|
|
|
func (r *Record) Set(name string, value *sql.Value) (sql.Record, error) {
|
2019-01-09 06:23:04 +05:30
|
|
|
r.columnNames = append(r.columnNames, name)
|
|
|
|
r.csvRecord = append(r.csvRecord, value.CSVString())
|
2020-02-13 14:03:52 -08:00
|
|
|
return r, nil
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
|
|
|
|
2019-09-16 17:26:27 -07:00
|
|
|
// Reset data in record.
|
|
|
|
func (r *Record) Reset() {
|
|
|
|
if len(r.columnNames) > 0 {
|
|
|
|
r.columnNames = r.columnNames[:0]
|
|
|
|
}
|
|
|
|
if len(r.csvRecord) > 0 {
|
|
|
|
r.csvRecord = r.csvRecord[:0]
|
|
|
|
}
|
|
|
|
for k := range r.nameIndexMap {
|
|
|
|
delete(r.nameIndexMap, k)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-09-27 12:33:14 -07:00
|
|
|
// Clone the record.
|
|
|
|
func (r *Record) Clone(dst sql.Record) sql.Record {
|
|
|
|
other, ok := dst.(*Record)
|
2019-09-16 17:26:27 -07:00
|
|
|
if !ok {
|
2019-09-27 12:33:14 -07:00
|
|
|
other = &Record{}
|
2019-09-16 17:26:27 -07:00
|
|
|
}
|
2019-09-27 12:33:14 -07:00
|
|
|
if len(other.columnNames) > 0 {
|
|
|
|
other.columnNames = other.columnNames[:0]
|
|
|
|
}
|
|
|
|
if len(other.csvRecord) > 0 {
|
|
|
|
other.csvRecord = other.csvRecord[:0]
|
|
|
|
}
|
|
|
|
other.columnNames = append(other.columnNames, r.columnNames...)
|
|
|
|
other.csvRecord = append(other.csvRecord, r.csvRecord...)
|
|
|
|
return other
|
2019-09-16 17:26:27 -07:00
|
|
|
}
|
|
|
|
|
2019-08-31 15:07:40 +08:00
|
|
|
// WriteCSV - encodes to CSV data.
|
2020-04-01 23:39:34 +01:00
|
|
|
func (r *Record) WriteCSV(writer io.Writer, opts sql.WriteCSVOpts) error {
|
2019-08-31 15:07:40 +08:00
|
|
|
w := csv.NewWriter(writer)
|
2020-04-01 23:39:34 +01:00
|
|
|
w.Comma = opts.FieldDelimiter
|
|
|
|
w.AlwaysQuote = opts.AlwaysQuote
|
|
|
|
w.Quote = opts.Quote
|
|
|
|
w.QuoteEscape = opts.QuoteEscape
|
2019-01-09 06:23:04 +05:30
|
|
|
if err := w.Write(r.csvRecord); err != nil {
|
2019-08-31 15:07:40 +08:00
|
|
|
return err
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
|
|
|
w.Flush()
|
2021-05-25 14:17:33 -07:00
|
|
|
return w.Error()
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
|
|
|
|
2019-08-31 15:07:40 +08:00
|
|
|
// WriteJSON - encodes to JSON data.
|
|
|
|
func (r *Record) WriteJSON(writer io.Writer) error {
|
2019-03-07 00:20:10 -08:00
|
|
|
var kvs jstream.KVS = make([]jstream.KV, len(r.columnNames))
|
|
|
|
for i := 0; i < len(r.columnNames); i++ {
|
|
|
|
kvs[i] = jstream.KV{Key: r.columnNames[i], Value: r.csvRecord[i]}
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
2019-08-31 15:07:40 +08:00
|
|
|
return json.NewEncoder(writer).Encode(kvs)
|
2019-01-09 06:23:04 +05:30
|
|
|
}
|
|
|
|
|
2019-03-09 08:13:37 -08:00
|
|
|
// Raw - returns the underlying data with format info.
|
|
|
|
func (r *Record) Raw() (sql.SelectObjectFormat, interface{}) {
|
|
|
|
return sql.SelectFmtCSV, r
|
|
|
|
}
|
|
|
|
|
|
|
|
// Replace - is not supported for CSV
|
2020-02-13 14:03:52 -08:00
|
|
|
func (r *Record) Replace(_ interface{}) error {
|
2019-03-09 08:13:37 -08:00
|
|
|
return errors.New("Replace is not supported for CSV")
|
|
|
|
}
|
|
|
|
|
2019-01-09 06:23:04 +05:30
|
|
|
// NewRecord - creates new CSV record.
|
|
|
|
func NewRecord() *Record {
|
|
|
|
return &Record{}
|
|
|
|
}
|