select: Add IS (NOT) operators (#13906)

Add `IS` and `IS NOT` as comparison operators.

This may be a bit wider than the S3 spec, but we can rather 
easily remove the forwarding.
This commit is contained in:
Klaus Post 2021-12-14 09:54:50 -08:00 committed by GitHub
parent 44a9339c0a
commit a8d4042853
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 74 additions and 16 deletions

View File

@ -683,71 +683,117 @@ func TestCSVQueries(t *testing.T) {
} }
func TestCSVQueries2(t *testing.T) { func TestCSVQueries2(t *testing.T) {
input := `id,time,num,num2,text testInput := []byte(`id,time,num,num2,text
1,2010-01-01T,7867786,4565.908123,"a text, with comma" 1,2010-01-01T,7867786,4565.908123,"a text, with comma"
2,2017-01-02T03:04Z,-5, 0.765111, 2,2017-01-02T03:04Z,-5, 0.765111,
` `)
var testTable = []struct { var testTable = []struct {
name string name string
query string query string
input []byte
requestXML []byte // override request XML requestXML []byte // override request XML
wantResult string wantResult string
}{ }{
{ {
name: "select-all", name: "select-all",
input: testInput,
query: `SELECT * from s3object AS s WHERE id = '1'`, query: `SELECT * from s3object AS s WHERE id = '1'`,
wantResult: `{"id":"1","time":"2010-01-01T","num":"7867786","num2":"4565.908123","text":"a text, with comma"}`, wantResult: `{"id":"1","time":"2010-01-01T","num":"7867786","num2":"4565.908123","text":"a text, with comma"}`,
}, },
{ {
name: "select-all-2", name: "select-all-2",
input: testInput,
query: `SELECT * from s3object s WHERE id = 2`, query: `SELECT * from s3object s WHERE id = 2`,
wantResult: `{"id":"2","time":"2017-01-02T03:04Z","num":"-5","num2":" 0.765111","text":""}`, wantResult: `{"id":"2","time":"2017-01-02T03:04Z","num":"-5","num2":" 0.765111","text":""}`,
}, },
{ {
name: "select-text-convert", name: "select-text-convert",
input: testInput,
query: `SELECT CAST(text AS STRING) AS text from s3object s WHERE id = 1`, query: `SELECT CAST(text AS STRING) AS text from s3object s WHERE id = 1`,
wantResult: `{"text":"a text, with comma"}`, wantResult: `{"text":"a text, with comma"}`,
}, },
{ {
name: "select-text-direct", name: "select-text-direct",
input: testInput,
query: `SELECT text from s3object s WHERE id = 1`, query: `SELECT text from s3object s WHERE id = 1`,
wantResult: `{"text":"a text, with comma"}`, wantResult: `{"text":"a text, with comma"}`,
}, },
{ {
name: "select-time-direct", name: "select-time-direct",
input: testInput,
query: `SELECT time from s3object s WHERE id = 2`, query: `SELECT time from s3object s WHERE id = 2`,
wantResult: `{"time":"2017-01-02T03:04Z"}`, wantResult: `{"time":"2017-01-02T03:04Z"}`,
}, },
{ {
name: "select-int-direct", name: "select-int-direct",
input: testInput,
query: `SELECT num from s3object s WHERE id = 2`, query: `SELECT num from s3object s WHERE id = 2`,
wantResult: `{"num":"-5"}`, wantResult: `{"num":"-5"}`,
}, },
{ {
name: "select-float-direct", name: "select-float-direct",
input: testInput,
query: `SELECT num2 from s3object s WHERE id = 2`, query: `SELECT num2 from s3object s WHERE id = 2`,
wantResult: `{"num2":" 0.765111"}`, wantResult: `{"num2":" 0.765111"}`,
}, },
{ {
name: "select-in-array", name: "select-in-array",
input: testInput,
query: `select id from S3Object s WHERE id in [1,3]`, query: `select id from S3Object s WHERE id in [1,3]`,
wantResult: `{"id":"1"}`, wantResult: `{"id":"1"}`,
}, },
{ {
name: "select-in-array-matchnone", name: "select-in-array-matchnone",
input: testInput,
query: `select id from S3Object s WHERE s.id in [4,3]`, query: `select id from S3Object s WHERE s.id in [4,3]`,
wantResult: ``, wantResult: ``,
}, },
{ {
name: "select-float-by-val", name: "select-float-by-val",
input: testInput,
query: `SELECT num2 from s3object s WHERE num2 = 0.765111`, query: `SELECT num2 from s3object s WHERE num2 = 0.765111`,
wantResult: `{"num2":" 0.765111"}`, wantResult: `{"num2":" 0.765111"}`,
}, },
{ {
name: "select-non_exiting_values", name: "select-non_exiting_values",
input: testInput,
query: `SELECT _1 as first, s._100 from s3object s LIMIT 1`, query: `SELECT _1 as first, s._100 from s3object s LIMIT 1`,
wantResult: `{"first":"1","_100":null}`, wantResult: `{"first":"1","_100":null}`,
}, },
{
name: "select-is_null_noresults",
input: testInput,
query: `select _2 from S3object where _2 IS NULL`,
wantResult: ``,
},
{
name: "select-is_null_results",
input: testInput,
query: `select _2 from S3object WHERE _100 IS NULL`,
wantResult: `{"_2":"2010-01-01T"}
{"_2":"2017-01-02T03:04Z"}`,
},
{
name: "select-is_not_null_results",
input: testInput,
query: `select _2 from S3object where _2 IS NOT NULL`,
wantResult: `{"_2":"2010-01-01T"}
{"_2":"2017-01-02T03:04Z"}`,
},
{
name: "select-is_not_null_noresults",
input: testInput,
query: `select _2 from S3object WHERE _100 IS NOT NULL`,
wantResult: ``,
},
{
name: "select-is_not_string",
input: []byte(`c1,c2,c3
1,2,3
1,,3`),
query: `select * from S3object where _2 IS NOT ''`,
wantResult: `{"c1":"1","c2":"2","c3":"3"}`,
},
} }
defRequest := `<?xml version="1.0" encoding="UTF-8"?> defRequest := `<?xml version="1.0" encoding="UTF-8"?>
@ -782,7 +828,7 @@ func TestCSVQueries2(t *testing.T) {
} }
if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) { if err = s3Select.Open(func(offset, length int64) (io.ReadCloser, error) {
return ioutil.NopCloser(bytes.NewBufferString(input)), nil return ioutil.NopCloser(bytes.NewBuffer(testCase.input)), nil
}); err != nil { }); err != nil {
t.Fatal(err) t.Fatal(err)
} }

View File

@ -184,7 +184,7 @@ type ConditionRHS struct {
// Compare represents the RHS of a comparison expression // Compare represents the RHS of a comparison expression
type Compare struct { type Compare struct {
Operator string `parser:"@( \"<>\" | \"<=\" | \">=\" | \"=\" | \"<\" | \">\" | \"!=\" )"` Operator string `parser:"@( \"<>\" | \"<=\" | \">=\" | \"=\" | \"<\" | \">\" | \"!=\" | \"IS\" \"NOT\" | \"IS\")"`
Operand *Operand `parser:" @@"` Operand *Operand `parser:" @@"`
} }

View File

@ -326,12 +326,14 @@ func (v *Value) negate() {
// Supported comparison operators // Supported comparison operators
const ( const (
opLt = "<" opLt = "<"
opLte = "<=" opLte = "<="
opGt = ">" opGt = ">"
opGte = ">=" opGte = ">="
opEq = "=" opEq = "="
opIneq = "!=" opIneq = "!="
opIs = "IS"
opIsNot = "ISNOT"
) )
// InferBytesType will attempt to infer the data type of bytes. // InferBytesType will attempt to infer the data type of bytes.
@ -385,6 +387,21 @@ func (v *Value) compareOp(op string, a *Value) (res bool, err error) {
if !isValidComparisonOperator(op) { if !isValidComparisonOperator(op) {
return false, errArithInvalidOperator return false, errArithInvalidOperator
} }
switch op {
case opIs:
if a.IsNull() {
return v.IsNull(), nil
}
// Forward to Equal
op = opEq
case opIsNot:
if a.IsNull() {
return !v.IsNull(), nil
}
// Forward to not equal.
op = opIneq
default:
}
// Check if type conversion/inference is needed - it is needed // Check if type conversion/inference is needed - it is needed
// if the Value is a byte-slice. // if the Value is a byte-slice.
@ -747,12 +764,7 @@ func inferTypeAsString(v *Value) {
func isValidComparisonOperator(op string) bool { func isValidComparisonOperator(op string) bool {
switch op { switch op {
case opLt: case opLt, opLte, opGt, opGte, opEq, opIneq, opIs, opIsNot:
case opLte:
case opGt:
case opGte:
case opEq:
case opIneq:
default: default:
return false return false
} }