Details
-
Bug
-
Status: Resolved
-
Blocker
-
Resolution: Fixed
-
None
Description
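Two pyarrow Substrait tests, test_run_serialized_query and test_binary_conversion_with_json_options, fail on the Windows build with "pyarrow.lib.ArrowInvalid: Cannot parse URI". In the error message, the temporary file path appears in the "file://" URI with its backslashes missing. See https://github.com/ursacomputing/crossbow/actions/runs/3240936478/jobs/5312200303#step:7:341 for the full log; the relevant excerpt follows.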
2022-10-13T09:42:51.5203618Z __________________________ test_run_serialized_query __________________________ 2022-10-13T09:42:51.5203890Z 2022-10-13T09:42:51.5204391Z tmpdir = local('C:\\Users\\ContainerAdministrator\\AppData\\Local\\Temp\\pytest-of-ContainerAdministrator\\pytest-0\\test_run_serialized_query0') 2022-10-13T09:42:51.5205282Z 2022-10-13T09:42:51.5205769Z def test_run_serialized_query(tmpdir): 2022-10-13T09:42:51.5206172Z substrait_query = """ 2022-10-13T09:42:51.5206505Z { 2022-10-13T09:42:51.5206828Z "relations": [ 2022-10-13T09:42:51.5207175Z {"rel": { 2022-10-13T09:42:51.5207501Z "read": { 2022-10-13T09:42:51.5207800Z "base_schema": { 2022-10-13T09:42:51.5208155Z "struct": { 2022-10-13T09:42:51.5208491Z "types": [ 2022-10-13T09:42:51.5208841Z {"i64": {}} 2022-10-13T09:42:51.5209182Z ] 2022-10-13T09:42:51.5209501Z }, 2022-10-13T09:42:51.5209829Z "names": [ 2022-10-13T09:42:51.5210168Z "foo" 2022-10-13T09:42:51.5210611Z ] 2022-10-13T09:42:51.5211097Z }, 2022-10-13T09:42:51.5211453Z "local_files": { 2022-10-13T09:42:51.5211747Z "items": [ 2022-10-13T09:42:51.5212083Z { 2022-10-13T09:42:51.5212530Z "uri_file": "file://FILENAME_PLACEHOLDER", 2022-10-13T09:42:51.5212930Z "arrow": {} 2022-10-13T09:42:51.5213261Z } 2022-10-13T09:42:51.5213579Z ] 2022-10-13T09:42:51.5213885Z } 2022-10-13T09:42:51.5214188Z } 2022-10-13T09:42:51.5214491Z }} 2022-10-13T09:42:51.5214795Z ] 2022-10-13T09:42:51.5215053Z } 2022-10-13T09:42:51.5215399Z """ 2022-10-13T09:42:51.5215708Z 2022-10-13T09:42:51.5355345Z file_name = "read_data.arrow" 2022-10-13T09:42:51.5356563Z table = pa.table([[1, 2, 3, 4, 5]], names=['foo']) 2022-10-13T09:42:51.5360922Z path = _write_dummy_data_to_disk(tmpdir, file_name, table) 2022-10-13T09:42:51.5361743Z query = tobytes(substrait_query.replace("FILENAME_PLACEHOLDER", path)) 2022-10-13T09:42:51.5362170Z 2022-10-13T09:42:51.5362589Z buf = pa._substrait._parse_json_plan(query) 2022-10-13T09:42:51.5362990Z 2022-10-13T09:42:51.5363388Z > reader = 
substrait.run_query(buf) 2022-10-13T09:42:51.5363692Z 2022-10-13T09:42:51.5364018Z Python\lib\site-packages\pyarrow\tests\test_substrait.py:79: 2022-10-13T09:42:51.5364520Z _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 2022-10-13T09:42:51.5365008Z pyarrow\_substrait.pyx:146: in pyarrow._substrait.run_query 2022-10-13T09:42:51.5365444Z ??? 2022-10-13T09:42:51.5365903Z pyarrow\error.pxi:144: in pyarrow.lib.pyarrow_internal_check_status 2022-10-13T09:42:51.5366352Z ??? 2022-10-13T09:42:51.5366746Z _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 2022-10-13T09:42:51.5367047Z 2022-10-13T09:42:51.5367246Z > ??? 2022-10-13T09:42:51.5376405Z E pyarrow.lib.ArrowInvalid: Cannot parse URI: 'file://C:UsersContainerAdministratorAppDataLocalTemppytest-of-ContainerAdministratorpytest-0 est_run_serialized_query0 2022-10-13T09:42:51.5377196Z ead_data.arrow' 2022-10-13T09:42:51.5377363Z 2022-10-13T09:42:51.5377519Z pyarrow\error.pxi:100: ArrowInvalid 2022-10-13T09:42:51.5377857Z __________________ test_binary_conversion_with_json_options ___________________ 2022-10-13T09:42:51.5378087Z 2022-10-13T09:42:51.5378488Z tmpdir = local('C:\\Users\\ContainerAdministrator\\AppData\\Local\\Temp\\pytest-of-ContainerAdministrator\\pytest-0\\test_binary_conversion_with_js0') 2022-10-13T09:42:51.5378905Z 2022-10-13T09:42:51.5379091Z def test_binary_conversion_with_json_options(tmpdir): 2022-10-13T09:42:51.5379432Z substrait_query = """ 2022-10-13T09:42:51.5379695Z { 2022-10-13T09:42:51.5379951Z "relations": [ 2022-10-13T09:42:51.5380229Z {"rel": { 2022-10-13T09:42:51.5380492Z "read": { 2022-10-13T09:42:51.5380954Z "base_schema": { 2022-10-13T09:42:51.5381237Z "struct": { 2022-10-13T09:42:51.5381473Z "types": [ 2022-10-13T09:42:51.5381760Z {"i64": {}} 2022-10-13T09:42:51.5382039Z ] 2022-10-13T09:42:51.5382300Z }, 2022-10-13T09:42:51.5382564Z "names": [ 2022-10-13T09:42:51.5382841Z "bar" 2022-10-13T09:42:51.5383116Z ] 
2022-10-13T09:42:51.5383331Z }, 2022-10-13T09:42:51.5383604Z "local_files": { 2022-10-13T09:42:51.5383878Z "items": [ 2022-10-13T09:42:51.5384142Z { 2022-10-13T09:42:51.5384478Z "uri_file": "file://FILENAME_PLACEHOLDER", 2022-10-13T09:42:51.5384817Z "arrow": {}, 2022-10-13T09:42:51.5385109Z "metadata" : { 2022-10-13T09:42:51.5385416Z "created_by" : {}, 2022-10-13T09:42:51.5385662Z } 2022-10-13T09:42:51.5385919Z } 2022-10-13T09:42:51.5386538Z ] 2022-10-13T09:42:51.5386915Z } 2022-10-13T09:42:51.5387308Z } 2022-10-13T09:42:51.5387681Z }} 2022-10-13T09:42:51.5388028Z ] 2022-10-13T09:42:51.5388376Z } 2022-10-13T09:42:51.5388783Z """ 2022-10-13T09:42:51.5389130Z 2022-10-13T09:42:51.5389529Z file_name = "binary_json_data.arrow" 2022-10-13T09:42:51.5389993Z table = pa.table([[1, 2, 3, 4, 5]], names=['bar']) 2022-10-13T09:42:51.5390483Z path = _write_dummy_data_to_disk(tmpdir, file_name, table) 2022-10-13T09:42:51.5391031Z query = tobytes(substrait_query.replace("FILENAME_PLACEHOLDER", path)) 2022-10-13T09:42:51.5392363Z buf = pa._substrait._parse_json_plan(tobytes(query)) 2022-10-13T09:42:51.5392817Z 2022-10-13T09:42:51.5393218Z > reader = substrait.run_query(buf) 2022-10-13T09:42:51.5393520Z 2022-10-13T09:42:51.5393849Z Python\lib\site-packages\pyarrow\tests\test_substrait.py:153: 2022-10-13T09:42:51.5394315Z _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 2022-10-13T09:42:51.5394796Z pyarrow\_substrait.pyx:146: in pyarrow._substrait.run_query 2022-10-13T09:42:51.5395221Z ??? 2022-10-13T09:42:51.5395674Z pyarrow\error.pxi:144: in pyarrow.lib.pyarrow_internal_check_status 2022-10-13T09:42:51.5396125Z ??? 2022-10-13T09:42:51.5396520Z _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 2022-10-13T09:42:51.5396809Z 2022-10-13T09:42:51.5397008Z > ??? 
2022-10-13T09:42:51.5398062Z E pyarrow.lib.ArrowInvalid: Cannot parse URI: 'file://C:UsersContainerAdministratorAppDataLocalTemppytest-of-ContainerAdministratorpytest-0 est_binary_conversion_with_js0inary_json_data.arrow' 2022-10-13T09:42:51.5398770Z 2022-10-13T09:42:51.5399026Z pyarrow\error.pxi:100: ArrowInvalid
Attachments
Issue Links
- is caused by
-
ARROW-16424 [C++] Update uri_path parsing in FromProto
- Resolved
- links to