File tree Expand file tree Collapse file tree 3 files changed +31
-13
lines changed Expand file tree Collapse file tree 3 files changed +31
-13
lines changed Original file line number Diff line number Diff line change 1+ #!python3
2+ import os
3+ import pyarrow as pa
4+ import chdb
5+
# Directory containing this script; the test data path is resolved relative
# to it so the example works regardless of the current working directory.
current_dir = os.path.dirname(os.path.abspath(__file__))
test_parquet = current_dir + "/../contrib/arrow/cpp/submodules/parquet-testing/data/alltypes_dictionary.parquet"

# Run SQL on the parquet file and ask chdb for the result in Arrow format.
# The path is interpolated with no padding inside the quotes: a stray space
# before the closing quote would become part of the file name passed to
# file() and the lookup would fail.
res = chdb.query(f"select * from file('{test_parquet}', Parquet)", "Arrow")
print("\n result from chdb:")
# Dump the raw result buffer as bytes.
print(res.get_memview().tobytes())
14+
def to_arrowTable(res):
    """Decode an Arrow-format chdb query result into a pyarrow table.

    Args:
        res: Query result object exposing ``get_memview()``; its buffer is
            handed directly to ``pa.RecordBatchFileReader``.

    Returns:
        The object produced by ``RecordBatchFileReader.read_all()``.
    """
    reader = pa.RecordBatchFileReader(res.get_memview())
    return reader.read_all()
19+
def to_df(res):
    """Convert an Arrow-format chdb query result into a pandas DataFrame.

    The result is first decoded with ``to_arrowTable`` and the resulting
    table is then converted via ``to_pandas(use_threads=True)``.

    Args:
        res: Query result object accepted by ``to_arrowTable``.

    Returns:
        The value returned by the arrow table's ``to_pandas`` call.
    """
    return to_arrowTable(res).to_pandas(use_threads=True)
25+
# Show the query result decoded as a pyarrow table.
print("\n result from chdb to pyarrow:")
arrow_table = to_arrowTable(res)
print(arrow_table)

# Show the same query result converted to a pandas dataframe.
print("\n result from chdb to pandas:")
data_frame = to_df(res)
print(data_frame)
Load Diff This file was deleted.
Load Diff This file was deleted.
You can’t perform that action at this time.
0 commit comments