2021-04-18 12:41:13 -07:00
|
|
|
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2019-01-28 17:59:48 -08:00
|
|
|
|
|
|
|
package sql
|
|
|
|
|
|
|
|
import (
|
|
|
|
"errors"
|
|
|
|
"fmt"
|
|
|
|
"strings"
|
2019-03-09 08:13:37 -08:00
|
|
|
|
|
|
|
"github.com/bcicen/jstream"
|
2020-02-13 14:03:52 -08:00
|
|
|
"github.com/minio/simdjson-go"
|
2019-01-28 17:59:48 -08:00
|
|
|
)
|
|
|
|
|
2022-01-02 09:15:06 -08:00
|
|
|
// errBadLimitSpecified is returned by parseLimit when the LIMIT value
// is not an integer literal or is negative.
var errBadLimitSpecified = errors.New("Limit value must be a positive integer")
|
2019-01-28 17:59:48 -08:00
|
|
|
|
2019-03-09 08:13:37 -08:00
|
|
|
// baseTableName is the table name a query must select from; it is
// compared case-insensitively by validateTableName.
const baseTableName = "s3object"
|
|
|
|
|
2019-01-28 17:59:48 -08:00
|
|
|
// SelectStatement is the top level parsed and analyzed structure
|
|
|
|
type SelectStatement struct {
|
|
|
|
selectAST *Select
|
|
|
|
|
|
|
|
// Analysis result of the statement
|
|
|
|
selectQProp qProp
|
|
|
|
|
|
|
|
// Result of parsing the limit clause if one is present
|
|
|
|
// (otherwise -1)
|
|
|
|
limitValue int64
|
|
|
|
|
|
|
|
// Count of rows that have been output.
|
|
|
|
outputCount int64
|
2021-04-06 08:49:04 -07:00
|
|
|
|
|
|
|
// Table alias
|
|
|
|
tableAlias string
|
2019-01-28 17:59:48 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// ParseSelectStatement - parses a select query from the given string
|
|
|
|
// and analyzes it.
|
|
|
|
func ParseSelectStatement(s string) (stmt SelectStatement, err error) {
|
|
|
|
var selectAST Select
|
|
|
|
err = SQLParser.ParseString(s, &selectAST)
|
|
|
|
if err != nil {
|
|
|
|
err = errQueryParseFailure(err)
|
|
|
|
return
|
|
|
|
}
|
2019-10-30 09:16:55 +01:00
|
|
|
|
|
|
|
// Check if select is "SELECT s.* from S3Object s"
|
|
|
|
if !selectAST.Expression.All &&
|
|
|
|
len(selectAST.Expression.Expressions) == 1 &&
|
|
|
|
len(selectAST.Expression.Expressions[0].Expression.And) == 1 &&
|
|
|
|
len(selectAST.Expression.Expressions[0].Expression.And[0].Condition) == 1 &&
|
|
|
|
selectAST.Expression.Expressions[0].Expression.And[0].Condition[0].Operand != nil &&
|
|
|
|
selectAST.Expression.Expressions[0].Expression.And[0].Condition[0].Operand.Operand.Left != nil &&
|
|
|
|
selectAST.Expression.Expressions[0].Expression.And[0].Condition[0].Operand.Operand.Left.Left != nil &&
|
|
|
|
selectAST.Expression.Expressions[0].Expression.And[0].Condition[0].Operand.Operand.Left.Left.Primary != nil &&
|
|
|
|
selectAST.Expression.Expressions[0].Expression.And[0].Condition[0].Operand.Operand.Left.Left.Primary.JPathExpr != nil {
|
|
|
|
if selectAST.Expression.Expressions[0].Expression.And[0].Condition[0].Operand.Operand.Left.Left.Primary.JPathExpr.String() == selectAST.From.As+".*" {
|
|
|
|
selectAST.Expression.All = true
|
|
|
|
}
|
|
|
|
}
|
2019-01-28 17:59:48 -08:00
|
|
|
stmt.selectAST = &selectAST
|
|
|
|
|
|
|
|
// Check the parsed limit value
|
|
|
|
stmt.limitValue, err = parseLimit(selectAST.Limit)
|
|
|
|
if err != nil {
|
|
|
|
err = errQueryAnalysisFailure(err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Analyze where clause
|
|
|
|
if selectAST.Where != nil {
|
|
|
|
whereQProp := selectAST.Where.analyze(&selectAST)
|
|
|
|
if whereQProp.err != nil {
|
2019-12-02 09:28:01 -08:00
|
|
|
err = errQueryAnalysisFailure(fmt.Errorf("Where clause error: %w", whereQProp.err))
|
2019-01-28 17:59:48 -08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
if whereQProp.isAggregation {
|
|
|
|
err = errQueryAnalysisFailure(errors.New("WHERE clause cannot have an aggregation"))
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Validate table name
|
2019-03-09 08:13:37 -08:00
|
|
|
err = validateTableName(selectAST.From)
|
|
|
|
if err != nil {
|
2019-01-28 17:59:48 -08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Analyze main select expression
|
|
|
|
stmt.selectQProp = selectAST.Expression.analyze(&selectAST)
|
|
|
|
err = stmt.selectQProp.err
|
|
|
|
if err != nil {
|
|
|
|
err = errQueryAnalysisFailure(err)
|
|
|
|
}
|
2021-04-06 08:49:04 -07:00
|
|
|
|
|
|
|
// Set table alias
|
|
|
|
stmt.tableAlias = selectAST.From.As
|
2024-01-10 01:19:11 +08:00
|
|
|
// Remove quotes from column aliases
|
|
|
|
if selectAST.Expression != nil {
|
|
|
|
for _, exp := range selectAST.Expression.Expressions {
|
|
|
|
if strings.HasSuffix(exp.As, "'") && strings.HasPrefix(exp.As, "'") && len(exp.As) >= 2 {
|
|
|
|
exp.As = exp.As[1 : len(exp.As)-1]
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2019-01-28 17:59:48 -08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-03-09 08:13:37 -08:00
|
|
|
func validateTableName(from *TableExpression) error {
|
2021-11-10 08:12:50 -08:00
|
|
|
if !strings.EqualFold(from.Table.BaseKey.String(), baseTableName) {
|
2019-03-09 08:13:37 -08:00
|
|
|
return errBadTableName(errors.New("table name must be `s3object`"))
|
|
|
|
}
|
|
|
|
|
|
|
|
if len(from.Table.PathExpr) > 0 {
|
|
|
|
if !from.Table.PathExpr[0].ArrayWildcard {
|
|
|
|
return errBadTableName(errors.New("keypath table name is invalid - please check the service documentation"))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2019-01-28 17:59:48 -08:00
|
|
|
func parseLimit(v *LitValue) (int64, error) {
|
|
|
|
switch {
|
|
|
|
case v == nil:
|
|
|
|
return -1, nil
|
2021-03-19 23:14:38 +07:00
|
|
|
case v.Int == nil:
|
2019-01-28 17:59:48 -08:00
|
|
|
return -1, errBadLimitSpecified
|
|
|
|
default:
|
2021-03-19 23:14:38 +07:00
|
|
|
r := int64(*v.Int)
|
2019-01-28 17:59:48 -08:00
|
|
|
if r < 0 {
|
|
|
|
return -1, errBadLimitSpecified
|
|
|
|
}
|
|
|
|
return r, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-03-09 08:13:37 -08:00
|
|
|
// EvalFrom evaluates the From clause on the input record. It only
|
|
|
|
// applies to JSON input data format (currently).
|
2020-03-10 22:34:58 -07:00
|
|
|
func (e *SelectStatement) EvalFrom(format string, input Record) ([]*Record, error) {
|
2020-02-13 14:03:52 -08:00
|
|
|
if !e.selectAST.From.HasKeypath() {
|
2020-03-10 22:34:58 -07:00
|
|
|
return []*Record{&input}, nil
|
2020-02-13 14:03:52 -08:00
|
|
|
}
|
|
|
|
_, rawVal := input.Raw()
|
|
|
|
|
|
|
|
if format != "json" {
|
|
|
|
return nil, errDataSource(errors.New("path not supported"))
|
|
|
|
}
|
|
|
|
switch rec := rawVal.(type) {
|
|
|
|
case jstream.KVS:
|
|
|
|
txedRec, _, err := jsonpathEval(e.selectAST.From.Table.PathExpr[1:], rec)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2019-03-09 08:13:37 -08:00
|
|
|
|
2020-02-13 14:03:52 -08:00
|
|
|
var kvs jstream.KVS
|
|
|
|
switch v := txedRec.(type) {
|
|
|
|
case jstream.KVS:
|
|
|
|
kvs = v
|
2020-03-10 22:34:58 -07:00
|
|
|
|
|
|
|
case []interface{}:
|
|
|
|
recs := make([]*Record, len(v))
|
|
|
|
for i, val := range v {
|
|
|
|
tmpRec := input.Clone(nil)
|
|
|
|
if err = tmpRec.Replace(val); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
recs[i] = &tmpRec
|
|
|
|
}
|
|
|
|
return recs, nil
|
|
|
|
|
2020-02-13 14:03:52 -08:00
|
|
|
default:
|
|
|
|
kvs = jstream.KVS{jstream.KV{Key: "_1", Value: v}}
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = input.Replace(kvs); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-03-10 22:34:58 -07:00
|
|
|
return []*Record{&input}, nil
|
2020-02-13 14:03:52 -08:00
|
|
|
case simdjson.Object:
|
|
|
|
txedRec, _, err := jsonpathEval(e.selectAST.From.Table.PathExpr[1:], rec)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
switch v := txedRec.(type) {
|
|
|
|
case simdjson.Object:
|
|
|
|
err := input.Replace(v)
|
2019-03-09 08:13:37 -08:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2020-03-10 22:34:58 -07:00
|
|
|
|
|
|
|
case []interface{}:
|
|
|
|
recs := make([]*Record, len(v))
|
|
|
|
for i, val := range v {
|
|
|
|
tmpRec := input.Clone(nil)
|
|
|
|
if err = tmpRec.Replace(val); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
recs[i] = &tmpRec
|
|
|
|
}
|
|
|
|
return recs, nil
|
|
|
|
|
2020-02-13 14:03:52 -08:00
|
|
|
default:
|
|
|
|
input.Reset()
|
|
|
|
input, err = input.Set("_1", &Value{value: v})
|
|
|
|
if err != nil {
|
2019-03-09 08:13:37 -08:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
}
|
2020-03-10 22:34:58 -07:00
|
|
|
return []*Record{&input}, nil
|
2019-03-09 08:13:37 -08:00
|
|
|
}
|
2020-02-13 14:03:52 -08:00
|
|
|
return nil, errDataSource(errors.New("unexpected non JSON input"))
|
2019-03-09 08:13:37 -08:00
|
|
|
}
|
|
|
|
|
2019-01-28 17:59:48 -08:00
|
|
|
// IsAggregated returns if the statement involves SQL aggregation
|
|
|
|
func (e *SelectStatement) IsAggregated() bool {
|
|
|
|
return e.selectQProp.isAggregation
|
|
|
|
}
|
|
|
|
|
|
|
|
// AggregateResult - returns the aggregated result after all input
|
|
|
|
// records have been processed. Applies only to aggregation queries.
|
|
|
|
func (e *SelectStatement) AggregateResult(output Record) error {
|
|
|
|
for i, expr := range e.selectAST.Expression.Expressions {
|
2021-04-06 08:49:04 -07:00
|
|
|
v, err := expr.evalNode(nil, e.tableAlias)
|
2019-01-28 17:59:48 -08:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2019-07-04 00:34:54 +01:00
|
|
|
if expr.As != "" {
|
2020-02-13 14:03:52 -08:00
|
|
|
output, err = output.Set(expr.As, v)
|
2019-07-04 00:34:54 +01:00
|
|
|
} else {
|
2020-02-13 14:03:52 -08:00
|
|
|
output, err = output.Set(fmt.Sprintf("_%d", i+1), v)
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2019-07-04 00:34:54 +01:00
|
|
|
}
|
2019-01-28 17:59:48 -08:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2019-02-12 13:54:26 -08:00
|
|
|
func (e *SelectStatement) isPassingWhereClause(input Record) (bool, error) {
|
|
|
|
if e.selectAST.Where == nil {
|
|
|
|
return true, nil
|
|
|
|
}
|
2021-04-06 08:49:04 -07:00
|
|
|
value, err := e.selectAST.Where.evalNode(input, e.tableAlias)
|
2019-02-12 13:54:26 -08:00
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
b, ok := value.ToBool()
|
|
|
|
if !ok {
|
|
|
|
err = fmt.Errorf("WHERE expression did not return bool")
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return b, nil
|
|
|
|
}
|
|
|
|
|
2019-01-28 17:59:48 -08:00
|
|
|
// AggregateRow - aggregates the input record. Applies only to
|
|
|
|
// aggregation queries.
|
|
|
|
func (e *SelectStatement) AggregateRow(input Record) error {
|
2019-02-12 13:54:26 -08:00
|
|
|
ok, err := e.isPassingWhereClause(input)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if !ok {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2019-01-28 17:59:48 -08:00
|
|
|
for _, expr := range e.selectAST.Expression.Expressions {
|
2021-04-06 08:49:04 -07:00
|
|
|
err := expr.aggregateRow(input, e.tableAlias)
|
2019-01-28 17:59:48 -08:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Eval - evaluates the Select statement for the given record. It
|
|
|
|
// applies only to non-aggregation queries.
|
2019-09-17 17:21:23 -07:00
|
|
|
// The function returns whether the statement passed the WHERE clause and should be outputted.
|
2019-09-27 12:33:14 -07:00
|
|
|
func (e *SelectStatement) Eval(input, output Record) (Record, error) {
|
2019-02-12 13:54:26 -08:00
|
|
|
ok, err := e.isPassingWhereClause(input)
|
2019-03-09 08:13:37 -08:00
|
|
|
if err != nil || !ok {
|
|
|
|
// Either error or row did not pass where clause
|
2019-09-27 12:33:14 -07:00
|
|
|
return nil, err
|
2019-02-12 13:54:26 -08:00
|
|
|
}
|
2019-01-28 17:59:48 -08:00
|
|
|
|
|
|
|
if e.selectAST.Expression.All {
|
|
|
|
// Return the input record for `SELECT * FROM
|
|
|
|
// .. WHERE ..`
|
|
|
|
|
|
|
|
// Update count of records output.
|
2021-11-02 19:14:46 -07:00
|
|
|
e.outputCount++
|
|
|
|
|
2020-02-13 14:03:52 -08:00
|
|
|
return input.Clone(output), nil
|
2019-01-28 17:59:48 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
for i, expr := range e.selectAST.Expression.Expressions {
|
2021-04-06 08:49:04 -07:00
|
|
|
v, err := expr.evalNode(input, e.tableAlias)
|
2019-01-28 17:59:48 -08:00
|
|
|
if err != nil {
|
2019-09-27 12:33:14 -07:00
|
|
|
return nil, err
|
2019-01-28 17:59:48 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Pick output column names
|
|
|
|
if expr.As != "" {
|
2020-02-13 14:03:52 -08:00
|
|
|
output, err = output.Set(expr.As, v)
|
2019-01-28 17:59:48 -08:00
|
|
|
} else if comp, ok := getLastKeypathComponent(expr.Expression); ok {
|
2020-02-13 14:03:52 -08:00
|
|
|
output, err = output.Set(comp, v)
|
2019-01-28 17:59:48 -08:00
|
|
|
} else {
|
2020-02-13 14:03:52 -08:00
|
|
|
output, err = output.Set(fmt.Sprintf("_%d", i+1), v)
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
2019-01-28 17:59:48 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Update count of records output.
|
2021-11-02 19:14:46 -07:00
|
|
|
e.outputCount++
|
2019-01-28 17:59:48 -08:00
|
|
|
|
2019-09-27 12:33:14 -07:00
|
|
|
return output, nil
|
2019-01-28 17:59:48 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// LimitReached - returns true if the number of records output has
|
|
|
|
// reached the value of the `LIMIT` clause.
|
|
|
|
func (e *SelectStatement) LimitReached() bool {
|
|
|
|
if e.limitValue == -1 {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
return e.outputCount >= e.limitValue
|
|
|
|
}
|