mint: Add more SQL tests (#9540)
parent
d348ec0f6c
commit
dfadf70a7f
@ -0,0 +1,172 @@ |
||||
#!/usr/bin/env python |
||||
# -*- coding: utf-8 -*- |
||||
# MinIO Python Library for Amazon S3 Compatible Cloud Storage, |
||||
# (C) 2015-2020 MinIO, Inc. |
||||
# |
||||
# Licensed under the Apache License, Version 2.0 (the "License"); |
||||
# you may not use this file except in compliance with the License. |
||||
# You may obtain a copy of the License at |
||||
# |
||||
# http://www.apache.org/licenses/LICENSE-2.0 |
||||
# |
||||
# Unless required by applicable law or agreed to in writing, software |
||||
# distributed under the License is distributed on an "AS IS" BASIS, |
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
||||
# See the License for the specific language governing permissions and |
||||
# limitations under the License. |
||||
|
||||
import os |
||||
import io |
||||
|
||||
from minio import Minio |
||||
from minio.select.options import (SelectObjectOptions, CSVInput, |
||||
RequestProgress, InputSerialization, |
||||
OutputSerialization, CSVOutput, JsonOutput) |
||||
|
||||
from utils import * |
||||
|
||||
def test_sql_api(test_name, client, bucket_name, input_data, sql_opts, expected_output): |
||||
""" Test if the passed SQL request has the output equal to the passed execpted one""" |
||||
object_name = generate_object_name() |
||||
got_output = b'' |
||||
try: |
||||
bytes_content = io.BytesIO(input_data) |
||||
client.put_object(bucket_name, object_name, io.BytesIO(input_data), len(input_data)) |
||||
data = client.select_object_content(bucket_name, object_name, sql_opts) |
||||
# Get the records |
||||
records = io.BytesIO() |
||||
for d in data.stream(10*1024): |
||||
records.write(d.encode('utf-8')) |
||||
got_output = records.getvalue() |
||||
except Exception as select_err: |
||||
if not isinstance(expected_output, Exception): |
||||
raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
else: |
||||
if isinstance(expected_output, Exception): |
||||
raise ValueError('Test {}: expected an exception, got {}'.format(test_name, got_output)) |
||||
if got_output != expected_output: |
||||
raise ValueError('Test {}: data mismatch. Expected : {}, Received {}'.format(test_name, expected_output, got_output)) |
||||
finally: |
||||
client.remove_object(bucket_name, object_name) |
||||
|
||||
|
||||
def test_csv_input_custom_quote_char(client, log_output): |
||||
# Get a unique bucket_name and object_name |
||||
log_output.args['bucket_name'] = bucket_name = generate_bucket_name() |
||||
|
||||
tests = [ |
||||
# Invalid quote character, should fail |
||||
('""', '"', b'col1,col2,col3\n', Exception()), |
||||
# UTF-8 quote character |
||||
('ع', '"', 'عcol1ع,عcol2ع,عcol3ع\n'.encode(), b'{"_1":"col1","_2":"col2","_3":"col3"}\n'), |
||||
# Only one field is quoted |
||||
('"', '"', b'"col1",col2,col3\n', b'{"_1":"col1","_2":"col2","_3":"col3"}\n'), |
||||
('"', '"', b'"col1,col2,col3"\n', b'{"_1":"col1,col2,col3"}\n'), |
||||
('\'', '"', b'"col1",col2,col3\n', b'{"_1":"\\"col1\\"","_2":"col2","_3":"col3"}\n'), |
||||
('', '"', b'"col1",col2,col3\n', b'{"_1":"\\"col1\\"","_2":"col2","_3":"col3"}\n'), |
||||
('', '"', b'"col1",col2,col3\n', b'{"_1":"\\"col1\\"","_2":"col2","_3":"col3"}\n'), |
||||
('', '"', b'"col1","col2","col3"\n', b'{"_1":"\\"col1\\"","_2":"\\"col2\\"","_3":"\\"col3\\""}\n'), |
||||
('"', '"', b'""""""\n', b'{"_1":"\\"\\""}\n'), |
||||
('"', '"', b'A",B\n', b'{"_1":"A\\"","_2":"B"}\n'), |
||||
('"', '"', b'A"",B\n', b'{"_1":"A\\"\\"","_2":"B"}\n'), |
||||
('"', '\\', b'A\\B,C\n', b'{"_1":"A\\\\B","_2":"C"}\n'), |
||||
('"', '"', b'"A""B","CD"\n', b'{"_1":"A\\"B","_2":"CD"}\n'), |
||||
('"', '\\', b'"A\\B","CD"\n', b'{"_1":"AB","_2":"CD"}\n'), |
||||
('"', '\\', b'"A\\,","CD"\n', b'{"_1":"A,","_2":"CD"}\n'), |
||||
('"', '\\', b'"A\\"B","CD"\n', b'{"_1":"A\\"B","_2":"CD"}\n'), |
||||
('"', '\\', b'"A\\""\n', b'{"_1":"A\\""}\n'), |
||||
('"', '\\', b'"A\\"\\"B"\n', b'{"_1":"A\\"\\"B"}\n'), |
||||
('"', '\\', b'"A\\"","\\"B"\n', b'{"_1":"A\\"","_2":"\\"B"}\n'), |
||||
] |
||||
|
||||
client.make_bucket(bucket_name) |
||||
|
||||
try: |
||||
for idx, (quote_char, escape_char, data, expected_output) in enumerate(tests): |
||||
sql_opts = SelectObjectOptions( |
||||
expression="select * from s3object", |
||||
input_serialization=InputSerialization( |
||||
compression_type="NONE", |
||||
csv=CSVInput(FileHeaderInfo="NONE", |
||||
RecordDelimiter="\n", |
||||
FieldDelimiter=",", |
||||
QuoteCharacter=quote_char, |
||||
QuoteEscapeCharacter=escape_char, |
||||
Comments="#", |
||||
AllowQuotedRecordDelimiter="FALSE",), |
||||
), |
||||
output_serialization=OutputSerialization( |
||||
json = JsonOutput( |
||||
RecordDelimiter="\n", |
||||
) |
||||
), |
||||
request_progress=RequestProgress( |
||||
enabled="False" |
||||
) |
||||
) |
||||
|
||||
test_sql_api(f'test_{idx}', client, bucket_name, data, sql_opts, expected_output) |
||||
finally: |
||||
client.remove_bucket(bucket_name) |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
def test_csv_output_custom_quote_char(client, log_output): |
||||
# Get a unique bucket_name and object_name |
||||
log_output.args['bucket_name'] = bucket_name = generate_bucket_name() |
||||
|
||||
tests = [ |
||||
# UTF-8 quote character |
||||
("''", "''", b'col1,col2,col3\n', Exception()), |
||||
("'", "'", b'col1,col2,col3\n', b"'col1','col2','col3'\n"), |
||||
("", '"', b'col1,col2,col3\n', b'\x00col1\x00,\x00col2\x00,\x00col3\x00\n'), |
||||
('"', '"', b'col1,col2,col3\n', b'"col1","col2","col3"\n'), |
||||
('"', '"', b'col"1,col2,col3\n', b'"col""1","col2","col3"\n'), |
||||
('"', '"', b'""""\n', b'""""\n'), |
||||
('"', '"', b'\n', b''), |
||||
("'", "\\", b'col1,col2,col3\n', b"'col1','col2','col3'\n"), |
||||
("'", "\\", b'col""1,col2,col3\n', b"'col\"\"1','col2','col3'\n"), |
||||
("'", "\\", b'col\'1,col2,col3\n', b"'col\\'1','col2','col3'\n"), |
||||
("'", "\\", b'"col\'1","col2","col3"\n', b"'col\\'1','col2','col3'\n"), |
||||
("'", "\\", b'col\'\n', b"'col\\''\n"), |
||||
# Two consecutive escaped quotes |
||||
("'", "\\", b'"a"""""\n', b"'a\"\"'\n"), |
||||
] |
||||
|
||||
client.make_bucket(bucket_name) |
||||
|
||||
try: |
||||
for idx, (quote_char, escape_char, input_data, expected_output) in enumerate(tests): |
||||
sql_opts = SelectObjectOptions( |
||||
expression="select * from s3object", |
||||
input_serialization=InputSerialization( |
||||
compression_type="NONE", |
||||
csv=CSVInput(FileHeaderInfo="NONE", |
||||
RecordDelimiter="\n", |
||||
FieldDelimiter=",", |
||||
QuoteCharacter='"', |
||||
QuoteEscapeCharacter='"', |
||||
Comments="#", |
||||
AllowQuotedRecordDelimiter="FALSE",), |
||||
), |
||||
output_serialization=OutputSerialization( |
||||
csv=CSVOutput(QuoteFields="ALWAYS", |
||||
RecordDelimiter="\n", |
||||
FieldDelimiter=",", |
||||
QuoteCharacter=quote_char, |
||||
QuoteEscapeCharacter=escape_char,) |
||||
), |
||||
request_progress=RequestProgress( |
||||
enabled="False" |
||||
) |
||||
) |
||||
|
||||
test_sql_api(f'test_{idx}', client, bucket_name, input_data, sql_opts, expected_output) |
||||
finally: |
||||
client.remove_bucket(bucket_name) |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
@ -0,0 +1,399 @@ |
||||
#!/usr/bin/env python |
||||
# -*- coding: utf-8 -*- |
||||
# MinIO Python Library for Amazon S3 Compatible Cloud Storage, |
||||
# (C) 2020 MinIO, Inc. |
||||
# |
||||
# Licensed under the Apache License, Version 2.0 (the "License"); |
||||
# you may not use this file except in compliance with the License. |
||||
# You may obtain a copy of the License at |
||||
# |
||||
# http://www.apache.org/licenses/LICENSE-2.0 |
||||
# |
||||
# Unless required by applicable law or agreed to in writing, software |
||||
# distributed under the License is distributed on an "AS IS" BASIS, |
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
||||
# See the License for the specific language governing permissions and |
||||
# limitations under the License. |
||||
|
||||
import io |
||||
from datetime import datetime |
||||
|
||||
from minio import Minio |
||||
from minio.select.options import (SelectObjectOptions, CSVInput, JSONInput, |
||||
RequestProgress, InputSerialization, |
||||
OutputSerialization, CSVOutput, JsonOutput) |
||||
|
||||
from utils import * |
||||
|
||||
def test_sql_expressions_custom_input_output(client, input_bytes, sql_input, sql_output, tests, log_output): |
||||
bucket_name = generate_bucket_name() |
||||
object_name = generate_object_name() |
||||
|
||||
log_output.args['total_tests'] = 0 |
||||
log_output.args['total_success'] = 0 |
||||
|
||||
client.make_bucket(bucket_name) |
||||
try: |
||||
content = io.BytesIO(bytes(input_bytes, 'utf-8')) |
||||
client.put_object(bucket_name, object_name, content, len(input_bytes)) |
||||
|
||||
for idx, (test_name, select_expression, expected_output) in enumerate(tests): |
||||
if select_expression == '': |
||||
continue |
||||
try: |
||||
log_output.args['total_tests'] += 1 |
||||
options = SelectObjectOptions( |
||||
expression=select_expression, |
||||
input_serialization=sql_input, |
||||
output_serialization=sql_output, |
||||
request_progress=RequestProgress( |
||||
enabled="False" |
||||
) |
||||
) |
||||
|
||||
data = client.select_object_content(bucket_name, object_name, options) |
||||
|
||||
# Get the records |
||||
records = io.BytesIO() |
||||
for d in data.stream(10*1024): |
||||
records.write(d.encode('utf-8')) |
||||
got_output = records.getvalue() |
||||
|
||||
if got_output != expected_output: |
||||
if type(expected_output) == datetime: |
||||
# Attempt to parse the date which will throw an exception for any issue |
||||
datetime.strptime(got_output.decode("utf-8").strip(), '%Y-%m-%dT%H:%M:%S.%f%z') |
||||
else: |
||||
raise ValueError('Test {}: data mismatch. Expected : {}. Received: {}.'.format(idx+1, expected_output, got_output)) |
||||
|
||||
log_output.args['total_success'] += 1 |
||||
except Exception as err: |
||||
continue ## TODO, raise instead |
||||
# raise Exception(err) |
||||
finally: |
||||
client.remove_object(bucket_name, object_name) |
||||
client.remove_bucket(bucket_name) |
||||
|
||||
|
||||
def test_sql_expressions(client, input_json_bytes, tests, log_output): |
||||
input_serialization = InputSerialization( |
||||
compression_type="NONE", |
||||
json=JSONInput(Type="DOCUMENT"), |
||||
) |
||||
|
||||
output_serialization=OutputSerialization( |
||||
csv=CSVOutput(QuoteFields="ASNEEDED") |
||||
) |
||||
|
||||
test_sql_expressions_custom_input_output(client, input_json_bytes, |
||||
input_serialization, output_serialization, tests, log_output) |
||||
|
||||
|
||||
def test_sql_operators(client, log_output): |
||||
|
||||
json_testfile = """{"id": 1, "name": "John", "age": 3} |
||||
{"id": 2, "name": "Elliot", "age": 4} |
||||
{"id": 3, "name": "Yves", "age": 5} |
||||
{"id": 4, "name": null, "age": 0} |
||||
""" |
||||
|
||||
tests = [ |
||||
# Logical operators |
||||
("AND", "select * from S3Object s where s.id = 1 AND s.name = 'John'", b'1,John,3\n'), |
||||
("NOT", "select * from S3Object s where NOT s.id = 1", b'2,Elliot,4\n3,Yves,5\n4,,0\n'), |
||||
("OR", "select * from S3Object s where s.id = 1 OR s.id = 3", b'1,John,3\n3,Yves,5\n'), |
||||
# Comparison Operators |
||||
("<", "select * from S3Object s where s.age < 4", b'1,John,3\n4,,0\n'), |
||||
(">", "select * from S3Object s where s.age > 4", b'3,Yves,5\n'), |
||||
("<=", "select * from S3Object s where s.age <= 4", b'1,John,3\n2,Elliot,4\n4,,0\n'), |
||||
(">=", "select * from S3Object s where s.age >= 4", b'2,Elliot,4\n3,Yves,5\n'), |
||||
("=", "select * from S3Object s where s.age = 4", b'2,Elliot,4\n'), |
||||
("<>", "select * from S3Object s where s.age <> 4", b'1,John,3\n3,Yves,5\n4,,0\n'), |
||||
("!=", "select * from S3Object s where s.age != 4", b'1,John,3\n3,Yves,5\n4,,0\n'), |
||||
("BETWEEN", "select * from S3Object s where s.age BETWEEN 4 AND 5", b'2,Elliot,4\n3,Yves,5\n'), |
||||
("IN", "select * from S3Object s where s.age IN (3,5)", b'1,John,3\n3,Yves,5\n'), |
||||
# Pattern Matching Operators |
||||
("LIKE_", "select * from S3Object s where s.name LIKE '_ves'", b'3,Yves,5\n'), |
||||
("LIKE%", "select * from S3Object s where s.name LIKE 'Ell%t'", b'2,Elliot,4\n'), |
||||
# Unitary Operators |
||||
("NULL", "select * from S3Object s where s.name IS NULL", b'4,,0\n'), |
||||
("NOT_NULL", "select * from S3Object s where s.age IS NOT NULL", b'1,John,3\n2,Elliot,4\n3,Yves,5\n4,,0\n'), |
||||
# Math Operators |
||||
("+", "select * from S3Object s where s.age = 1+3 ", b'2,Elliot,4\n'), |
||||
("-", "select * from S3Object s where s.age = 5-1 ", b'2,Elliot,4\n'), |
||||
("*", "select * from S3Object s where s.age = 2*2 ", b'2,Elliot,4\n'), |
||||
("%", "select * from S3Object s where s.age = 10%6 ", b'2,Elliot,4\n'), |
||||
] |
||||
|
||||
try: |
||||
test_sql_expressions(client, json_testfile, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
||||
def test_sql_operators_precedence(client, log_output): |
||||
|
||||
json_testfile = """{"id": 1, "name": "Eric"}""" |
||||
|
||||
tests = [ |
||||
("-_1", "select -3*3 from S3Object", b'-9\n'), |
||||
("*", "select 10-3*2 from S3Object", b'4\n'), |
||||
("/", "select 13-10/5 from S3Object", b'11\n'), |
||||
("%", "select 13-10%5 from S3Object", b'13\n'), |
||||
("+", "select 1+1*3 from S3Object", b'4\n'), |
||||
("-_2", "select 1-1*3 from S3Object", b'-2\n'), |
||||
("=", "select * from S3Object as s where s.id = 13-12", b'1,Eric\n'), |
||||
("<>", "select * from S3Object as s where s.id <> 1-1", b'1,Eric\n'), |
||||
("NOT", "select * from S3Object where false OR NOT false", b'1,Eric\n'), |
||||
("AND", "select * from S3Object where true AND true OR false ", b'1,Eric\n'), |
||||
("OR", "select * from S3Object where false OR NOT false", b'1,Eric\n'), |
||||
("IN", "select * from S3Object as s where s.id <> -1 AND s.id IN (1,2,3)", b'1,Eric\n'), |
||||
("BETWEEN", "select * from S3Object as s where s.id <> -1 AND s.id BETWEEN -1 AND 3", b'1,Eric\n'), |
||||
("LIKE", "select * from S3Object as s where s.id <> -1 AND s.name LIKE 'E%'", b'1,Eric\n'), |
||||
] |
||||
|
||||
try: |
||||
test_sql_expressions(client, json_testfile, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
||||
|
||||
def test_sql_functions_agg_cond_conv(client, log_output): |
||||
|
||||
json_testfile = """{"id": 1, "name": "John", "age": 3} |
||||
{"id": 2, "name": "Elliot", "age": 4} |
||||
{"id": 3, "name": "Yves", "age": 5} |
||||
{"id": 4, "name": "Christine", "age": null} |
||||
{"id": 5, "name": "Eric", "age": 0} |
||||
""" |
||||
tests = [ |
||||
# Aggregate functions |
||||
("COUNT", "select count(*) from S3Object s", b'5\n'), |
||||
("AVG", "select avg(s.age) from S3Object s", b'3\n'), |
||||
("MAX", "select max(s.age) from S3Object s", b'5\n'), |
||||
("MIN", "select min(s.age) from S3Object s", b'0\n'), |
||||
("SUM", "select sum(s.age) from S3Object s", b'12\n'), |
||||
# Conditional functions |
||||
("COALESCE", "SELECT COALESCE(s.age, 99) FROM S3Object s", b'3\n4\n5\n99\n0\n'), |
||||
("NULLIF", "SELECT NULLIF(s.age, 0) FROM S3Object s", b'3\n4\n5\n\n\n'), |
||||
## Conversion functions |
||||
("CAST", "SELECT CAST(s.age AS FLOAT) FROM S3Object s", b'3.0\n4.0\n5.0\n\n0.0\n'), |
||||
|
||||
] |
||||
|
||||
try: |
||||
test_sql_expressions(client, json_testfile, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
||||
def test_sql_functions_date(client, log_output): |
||||
|
||||
json_testfile = """ |
||||
{"id": 1, "name": "John", "datez": "2017-01-02T03:04:05.006+07:30"} |
||||
""" |
||||
|
||||
tests = [ |
||||
# DATE_ADD |
||||
("DATE_ADD_1", "select DATE_ADD(year, 5, TO_TIMESTAMP(s.datez)) from S3Object as s", b'2022-01-02T03:04:05.006+07:30\n'), |
||||
("DATE_ADD_2", "select DATE_ADD(month, 1, TO_TIMESTAMP(s.datez)) from S3Object as s", b'2017-02-02T03:04:05.006+07:30\n'), |
||||
("DATE_ADD_3", "select DATE_ADD(day, -1, TO_TIMESTAMP(s.datez)) from S3Object as s", b'2017-01-01T03:04:05.006+07:30\n'), |
||||
("DATE_ADD_4", "select DATE_ADD(hour, 1, TO_TIMESTAMP(s.datez)) from S3Object as s", b'2017-01-02T04:04:05.006+07:30\n'), |
||||
("DATE_ADD_5", "select DATE_ADD(minute, 5, TO_TIMESTAMP(s.datez)) from S3Object as s", b'2017-01-02T03:09:05.006+07:30\n'), |
||||
("DATE_ADD_6", "select DATE_ADD(second, 5, TO_TIMESTAMP(s.datez)) from S3Object as s", b'2017-01-02T03:04:10.006+07:30\n'), |
||||
# DATE_DIFF |
||||
("DATE_DIFF_1", "select DATE_DIFF(year, TO_TIMESTAMP(s.datez), TO_TIMESTAMP('2011-01-01T')) from S3Object as s", b'-6\n'), |
||||
("DATE_DIFF_2", "select DATE_DIFF(month, TO_TIMESTAMP(s.datez), TO_TIMESTAMP('2011T')) from S3Object as s", b'-72\n'), |
||||
("DATE_DIFF_3", "select DATE_DIFF(day, TO_TIMESTAMP(s.datez), TO_TIMESTAMP('2010-01-02T')) from S3Object as s", b'-2556\n'), |
||||
# EXTRACT |
||||
("EXTRACT_1", "select EXTRACT(year FROM TO_TIMESTAMP(s.datez)) from S3Object as s", b'2017\n'), |
||||
("EXTRACT_2", "select EXTRACT(month FROM TO_TIMESTAMP(s.datez)) from S3Object as s", b'1\n'), |
||||
("EXTRACT_3", "select EXTRACT(hour FROM TO_TIMESTAMP(s.datez)) from S3Object as s", b'3\n'), |
||||
("EXTRACT_4", "select EXTRACT(minute FROM TO_TIMESTAMP(s.datez)) from S3Object as s", b'4\n'), |
||||
("EXTRACT_5", "select EXTRACT(timezone_hour FROM TO_TIMESTAMP(s.datez)) from S3Object as s", b'7\n'), |
||||
("EXTRACT_6", "select EXTRACT(timezone_minute FROM TO_TIMESTAMP(s.datez)) from S3Object as s", b'30\n'), |
||||
# TO_STRING |
||||
("TO_STRING_1", "select TO_STRING(TO_TIMESTAMP(s.datez), 'MMMM d, y') from S3Object as s", b'"January 2, 2017"\n'), |
||||
("TO_STRING_2", "select TO_STRING(TO_TIMESTAMP(s.datez), 'MMM d, yyyy') from S3Object as s", b'"Jan 2, 2017"\n'), |
||||
("TO_STRING_3", "select TO_STRING(TO_TIMESTAMP(s.datez), 'M-d-yy') from S3Object as s", b'1-2-17\n'), |
||||
("TO_STRING_4", "select TO_STRING(TO_TIMESTAMP(s.datez), 'MM-d-y') from S3Object as s", b'01-2-2017\n'), |
||||
("TO_STRING_5", "select TO_STRING(TO_TIMESTAMP(s.datez), 'MMMM d, y h:m a') from S3Object as s", b'"January 2, 2017 3:4 AM"\n'), |
||||
("TO_STRING_6", "select TO_STRING(TO_TIMESTAMP(s.datez), 'y-MM-dd''T''H:m:ssX') from S3Object as s", b'2017-01-02T3:4:05+0730\n'), |
||||
("TO_STRING_7", "select TO_STRING(TO_TIMESTAMP(s.datez), 'y-MM-dd''T''H:m:ssX') from S3Object as s", b'2017-01-02T3:4:05+0730\n'), |
||||
("TO_STRING_8", "select TO_STRING(TO_TIMESTAMP(s.datez), 'y-MM-dd''T''H:m:ssXXXX') from S3Object as s", b'2017-01-02T3:4:05+0730\n'), |
||||
("TO_STRING_9", "select TO_STRING(TO_TIMESTAMP(s.datez), 'y-MM-dd''T''H:m:ssXXXXX') from S3Object as s", b'2017-01-02T3:4:05+07:30\n'), |
||||
("TO_TIMESTAMP", "select TO_TIMESTAMP(s.datez) from S3Object as s", b'2017-01-02T03:04:05.006+07:30\n'), |
||||
("UTCNOW", "select UTCNOW() from S3Object", datetime(1,1,1)), |
||||
|
||||
] |
||||
|
||||
try: |
||||
test_sql_expressions(client, json_testfile, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
def test_sql_functions_string(client, log_output): |
||||
|
||||
json_testfile = """ |
||||
{"id": 1, "name": "John"} |
||||
{"id": 2, "name": " \tfoobar\t "} |
||||
{"id": 3, "name": "1112211foobar22211122"} |
||||
""" |
||||
|
||||
tests = [ |
||||
# CHAR_LENGTH |
||||
("CHAR_LENGTH", "select CHAR_LENGTH(s.name) from S3Object as s", b'4\n24\n21\n'), |
||||
("CHARACTER_LENGTH", "select CHARACTER_LENGTH(s.name) from S3Object as s", b'4\n24\n21\n'), |
||||
# LOWER |
||||
("LOWER", "select LOWER(s.name) from S3Object as s where s.id= 1", b'john\n'), |
||||
# SUBSTRING |
||||
("SUBSTRING_1", "select SUBSTRING(s.name FROM 2) from S3Object as s where s.id = 1", b'ohn\n'), |
||||
("SUBSTRING_2", "select SUBSTRING(s.name FROM 2 FOR 2) from S3Object as s where s.id = 1", b'oh\n'), |
||||
("SUBSTRING_3", "select SUBSTRING(s.name FROM -1 FOR 2) from S3Object as s where s.id = 1", b'\n'), |
||||
# TRIM |
||||
("TRIM_1", "select TRIM(s.name) from S3Object as s where s.id = 2", b'\tfoobar\t\n'), |
||||
("TRIM_2", "select TRIM(LEADING FROM s.name) from S3Object as s where s.id = 2", b'\tfoobar\t \n'), |
||||
("TRIM_3", "select TRIM(TRAILING FROM s.name) from S3Object as s where s.id = 2", b' \tfoobar\t\n'), |
||||
("TRIM_4", "select TRIM(BOTH FROM s.name) from S3Object as s where s.id = 2", b'\tfoobar\t\n'), |
||||
("TRIM_5", "select TRIM(BOTH '12' FROM s.name) from S3Object as s where s.id = 3", b'foobar\n'), |
||||
# UPPER |
||||
("UPPER", "select UPPER(s.name) from S3Object as s where s.id= 1", b'JOHN\n'), |
||||
] |
||||
|
||||
try: |
||||
test_sql_expressions(client, json_testfile, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
||||
def test_sql_datatypes(client, log_output): |
||||
json_testfile = """ |
||||
{"name": "John"} |
||||
""" |
||||
tests = [ |
||||
("bool", "select CAST('true' AS BOOL) from S3Object", b'true\n'), |
||||
("int", "select CAST('13' AS INT) from S3Object", b'13\n'), |
||||
("integer", "select CAST('13' AS INTEGER) from S3Object", b'13\n'), |
||||
("string", "select CAST(true AS STRING) from S3Object", b'true\n'), |
||||
("float", "select CAST('13.3' AS FLOAT) from S3Object", b'13.3\n'), |
||||
("decimal", "select CAST('14.3' AS FLOAT) from S3Object", b'14.3\n'), |
||||
("numeric", "select CAST('14.3' AS FLOAT) from S3Object", b'14.3\n'), |
||||
("timestamp", "select CAST('2007-04-05T14:30Z' AS TIMESTAMP) from S3Object", b'2007-04-05T14:30Z\n'), |
||||
] |
||||
|
||||
try: |
||||
test_sql_expressions(client, json_testfile, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
||||
def test_sql_select(client, log_output): |
||||
|
||||
json_testfile = """{"id": 1, "created": "June 27", "modified": "July 6" } |
||||
{"id": 2, "Created": "June 28", "Modified": "July 7", "Cast": "Random Date" }""" |
||||
tests = [ |
||||
("select_1", "select * from S3Object", b'1,June 27,July 6\n2,June 28,July 7,Random Date\n'), |
||||
("select_2", "select * from S3Object s", b'1,June 27,July 6\n2,June 28,July 7,Random Date\n'), |
||||
("select_3", "select * from S3Object as s", b'1,June 27,July 6\n2,June 28,July 7,Random Date\n'), |
||||
("select_4", "select s.line from S3Object as s", b'\n\n'), |
||||
("select_5", 'select s."Created" from S3Object as s', b'\nJune 28\n'), |
||||
("select_5", 'select s."Cast" from S3Object as s', b'\nRandom Date\n'), |
||||
("where", 'select s.created from S3Object as s', b'June 27\nJune 28\n'), |
||||
("limit", 'select * from S3Object as s LIMIT 1', b'1,June 27,July 6\n'), |
||||
] |
||||
|
||||
try: |
||||
test_sql_expressions(client, json_testfile, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
def test_sql_select_json(client, log_output): |
||||
json_testcontent = """{ "Rules": [ {"id": "1"}, {"expr": "y > x"}, {"id": "2", "expr": "z = DEBUG"} ]} |
||||
{ "created": "June 27", "modified": "July 6" } |
||||
""" |
||||
tests = [ |
||||
("select_1", "SELECT id FROM S3Object[*].Rules[*].id", b'{"id":"1"}\n{}\n{"id":"2"}\n{}\n'), |
||||
("select_2", "SELECT id FROM S3Object[*].Rules[*].id WHERE id IS NOT MISSING", b'{"id":"1"}\n{"id":"2"}\n'), |
||||
("select_3", "SELECT d.created, d.modified FROM S3Object[*] d", b'{}\n{"created":"June 27","modified":"July 6"}\n'), |
||||
("select_4", "SELECT _1.created, _1.modified FROM S3Object[*]", b'{}\n{"created":"June 27","modified":"July 6"}\n'), |
||||
("select_5", "Select s.rules[1].expr from S3Object s", b'{"expr":"y > x"}\n{}\n'), |
||||
] |
||||
|
||||
input_serialization = InputSerialization(json=JSONInput(Type="DOCUMENT")) |
||||
output_serialization = OutputSerialization(json=JsonOutput()) |
||||
try: |
||||
test_sql_expressions_custom_input_output(client, json_testcontent, |
||||
input_serialization, output_serialization, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
||||
def test_sql_select_csv_no_header(client, log_output): |
||||
json_testcontent = """val1,val2,val3 |
||||
val4,val5,val6 |
||||
""" |
||||
tests = [ |
||||
("select_1", "SELECT s._2 FROM S3Object as s", b'val2\nval5\n'), |
||||
] |
||||
|
||||
input_serialization=InputSerialization( |
||||
csv=CSVInput( |
||||
FileHeaderInfo="NONE", |
||||
AllowQuotedRecordDelimiter="FALSE", |
||||
), |
||||
) |
||||
|
||||
output_serialization=OutputSerialization(csv=CSVOutput()) |
||||
try: |
||||
test_sql_expressions_custom_input_output(client, json_testcontent, |
||||
input_serialization, output_serialization, tests, log_output) |
||||
except Exception as select_err: |
||||
raise select_err |
||||
# raise ValueError('Test {} unexpectedly failed with: {}'.format(test_name, select_err)) |
||||
# pass |
||||
|
||||
# Test passes |
||||
print(log_output.json_report()) |
||||
|
||||
|
@ -0,0 +1,106 @@ |
||||
#!/usr/bin/env python |
||||
# -*- coding: utf-8 -*- |
||||
# MinIO Python Library for Amazon S3 Compatible Cloud Storage, |
||||
# (C) 2015-2020 MinIO, Inc. |
||||
# |
||||
# Licensed under the Apache License, Version 2.0 (the "License"); |
||||
# you may not use this file except in compliance with the License. |
||||
# You may obtain a copy of the License at |
||||
# |
||||
# http://www.apache.org/licenses/LICENSE-2.0 |
||||
# |
||||
# Unless required by applicable law or agreed to in writing, software |
||||
# distributed under the License is distributed on an "AS IS" BASIS, |
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
||||
# See the License for the specific language governing permissions and |
||||
# limitations under the License. |
||||
|
||||
import uuid |
||||
import inspect |
||||
import json |
||||
import time |
||||
import traceback |
||||
|
||||
class LogOutput(object): |
||||
""" |
||||
LogOutput is the class for log output. It is required standard for all |
||||
SDK tests controlled by mint. |
||||
Here are its attributes: |
||||
'name': name of the SDK under test, e.g. 's3select' |
||||
'function': name of the method/api under test with its signature |
||||
The following python code can be used to |
||||
pull args information of a <method> and to |
||||
put together with the method name: |
||||
<method>.__name__+'('+', '.join(args_list)+')' |
||||
e.g. 'remove_object(bucket_name, object_name)' |
||||
'args': method/api arguments with their values, in |
||||
dictionary form: {'arg1': val1, 'arg2': val2, ...} |
||||
'duration': duration of the whole test in milliseconds, |
||||
defaults to 0 |
||||
'alert': any extra information user is needed to be alerted about, |
||||
like whether this is a Blocker/Gateway/Server related |
||||
issue, etc., defaults to None |
||||
'message': descriptive error message, defaults to None |
||||
'error': stack-trace/exception message(only in case of failure), |
||||
actual low level exception/error thrown by the program, |
||||
defaults to None |
||||
'status': exit status, possible values are 'PASS', 'FAIL', 'NA', |
||||
defaults to 'PASS' |
||||
""" |
||||
|
||||
PASS = 'PASS' |
||||
FAIL = 'FAIL' |
||||
NA = 'NA' |
||||
|
||||
def __init__(self, meth, test_name): |
||||
self.__args_list = inspect.getargspec(meth).args[1:] |
||||
self.__name = 's3select:'+test_name |
||||
self.__function = meth.__name__+'('+', '.join(self.__args_list)+')' |
||||
self.__args = {} |
||||
self.__duration = 0 |
||||
self.__alert = '' |
||||
self.__message = None |
||||
self.__error = None |
||||
self.__status = self.PASS |
||||
self.__start_time = time.time() |
||||
|
||||
@property |
||||
def name(self): return self.__name |
||||
|
||||
@property |
||||
def function(self): return self.__function |
||||
|
||||
@property |
||||
def args(self): return self.__args |
||||
|
||||
@name.setter |
||||
def name(self, val): self.__name = val |
||||
|
||||
@function.setter |
||||
def function(self, val): self.__function = val |
||||
|
||||
@args.setter |
||||
def args(self, val): self.__args = val |
||||
|
||||
def json_report(self, err_msg='', alert='', status=''): |
||||
self.__args = {k: v for k, v in self.__args.items() if v and v != ''} |
||||
entry = {'name': self.__name, |
||||
'function': self.__function, |
||||
'args': self.__args, |
||||
'duration': int(round((time.time() - self.__start_time)*1000)), |
||||
'alert': str(alert), |
||||
'message': str(err_msg), |
||||
'error': traceback.format_exc() if err_msg and err_msg != '' else '', |
||||
'status': status if status and status != '' else |
||||
self.FAIL if err_msg and err_msg != '' else self.PASS |
||||
} |
||||
return json.dumps({k: v for k, v in entry.items() if v and v != ''}) |
||||
|
||||
|
||||
def generate_bucket_name(): |
||||
return "s3select-test-" + str(uuid.uuid4()) |
||||
|
||||
def generate_object_name(): |
||||
return str(uuid.uuid4()) |
||||
|
||||
|
Loading…
Reference in new issue