;;
centos|fedora|rhel|ol|virtuozzo)
- packages=(which python3-virtualenv python36-devel libevent-devel libffi-devel libxml2-devel libxslt-devel zlib-devel arrow-devel parquet-devel)
+ packages=(which python3-virtualenv python36-devel libevent-devel libffi-devel libxml2-devel libxslt-devel zlib-devel)
for package in ${packages[@]}; do
# When the package is python36-devel we change it to python3-devel on Fedora
if [[ ${package} == "python36-devel" && -f /etc/fedora-release ]]; then
import logging
logging.basicConfig(level=logging.INFO)
-#import numpy as np
-import pandas as pd
-import pyarrow as pa
-import pyarrow.parquet as pq
-
region_name = ''
# recurssion function for generating arithmetical expression
response = c2.get_object(Bucket=bucket_name, Key=new_key)
eq(response['Body'].read().decode('utf-8'), obj, 's3select error[ downloaded object not equal to uploaded objecy')
-def parquet_generator():
-
- parquet_size = 1000000
- a=[]
- for i in range(parquet_size):
- a.append(int(random.randint(1,10000)))
-
- b=[]
- for i in range(parquet_size):
- b.append(int(random.randint(1,10000)))
-
- c=[]
- for i in range(parquet_size):
- c.append(int(random.randint(1,10000)))
-
- d=[]
- for i in range(parquet_size):
- d.append(int(random.randint(1,10000)))
-
- df3 = pd.DataFrame({'a': a,
- 'b': b,
- 'c': c,
- 'd': d}
- )
-
-
- table = pa.Table.from_pandas(df3,preserve_index=False)
-
- print (table)
-
- pq.write_table(table,version='1.0',where='/tmp/3col_int_10k.parquet')
-
def run_s3select(bucket,key,query,column_delim=",",row_delim="\n",quot_char='"',esc_char='\\',csv_header_info="NONE", progress = False):
s3 = get_client()
s3select_assert_result( res_s3select_quot, res_s3select_final )
-@attr('s3select')
-def test_parqueet():
-
- parquet_generator()
-
-