@@ -180,7 +180,7 @@ def test_register_parquet_partitioned(ctx, tmp_path, path_to_str):
180180 ctx .register_parquet (
181181 "datapp" ,
182182 dir_root ,
183- table_partition_cols = [("grp" , " string" )],
183+ table_partition_cols = [("grp" , pa . string () )],
184184 parquet_pruning = True ,
185185 file_extension = ".parquet" ,
186186 )
@@ -488,9 +488,9 @@ def test_register_listing_table(
488488):
489489 dir_root = tmp_path / "dataset_parquet_partitioned"
490490 dir_root .mkdir (exist_ok = False )
491- (dir_root / "grp=a/date_id=20201005 " ).mkdir (exist_ok = False , parents = True )
492- (dir_root / "grp=a/date_id=20211005 " ).mkdir (exist_ok = False , parents = True )
493- (dir_root / "grp=b/date_id=20201005 " ).mkdir (exist_ok = False , parents = True )
491+ (dir_root / "grp=a/date=2020-10-05 " ).mkdir (exist_ok = False , parents = True )
492+ (dir_root / "grp=a/date=2021-10-05 " ).mkdir (exist_ok = False , parents = True )
493+ (dir_root / "grp=b/date=2020-10-05 " ).mkdir (exist_ok = False , parents = True )
494494
495495 table = pa .Table .from_arrays (
496496 [
@@ -501,21 +501,21 @@ def test_register_listing_table(
501501 names = ["int" , "str" , "float" ],
502502 )
503503 pa .parquet .write_table (
504- table .slice (0 , 3 ), dir_root / "grp=a/date_id=20201005 /file.parquet"
504+ table .slice (0 , 3 ), dir_root / "grp=a/date=2020-10-05 /file.parquet"
505505 )
506506 pa .parquet .write_table (
507- table .slice (3 , 2 ), dir_root / "grp=a/date_id=20211005 /file.parquet"
507+ table .slice (3 , 2 ), dir_root / "grp=a/date=2021-10-05 /file.parquet"
508508 )
509509 pa .parquet .write_table (
510- table .slice (5 , 10 ), dir_root / "grp=b/date_id=20201005 /file.parquet"
510+ table .slice (5 , 10 ), dir_root / "grp=b/date=2020-10-05 /file.parquet"
511511 )
512512
513513 dir_root = f"file://{ dir_root } /" if path_to_str else dir_root
514514
515515 ctx .register_listing_table (
516516 "my_table" ,
517517 dir_root ,
518- table_partition_cols = [("grp" , " string" ) , ("date_id " , "int" )],
518+ table_partition_cols = [("grp" , pa . string ()) , ("date " , pa . date64 () )],
519519 file_extension = ".parquet" ,
520520 schema = table .schema if pass_schema else None ,
521521 file_sort_order = file_sort_order ,
@@ -531,7 +531,7 @@ def test_register_listing_table(
531531 assert dict (zip (rd ["grp" ], rd ["count" ])) == {"a" : 5 , "b" : 2 }
532532
533533 result = ctx .sql (
534- "SELECT grp, COUNT(*) AS count FROM my_table WHERE date_id=20201005 GROUP BY grp" # noqa: E501
534+ "SELECT grp, COUNT(*) AS count FROM my_table WHERE date='2020-10-05' GROUP BY grp" # noqa: E501
535535 ).collect ()
536536 result = pa .Table .from_batches (result )
537537
0 commit comments