@@ -1178,7 +1178,7 @@ def metadata_location_gz(tmp_path_factory: pytest.TempPathFactory) -> str:
11781178 "data_file" : {
11791179 "file_path" : "/home/iceberg/warehouse/nyc/taxis_partitioned/data/VendorID=null/00000-633-d8a4223e-dc97-45a1-86e1-adaba6e8abd7-00001.parquet" ,
11801180 "file_format" : "PARQUET" ,
1181- "partition" : {"VendorID" : 1 , "tpep_pickup_datetime " : 1925 },
1181+ "partition" : {"VendorID" : 1 , "tpep_pickup_day " : 1925 },
11821182 "record_count" : 19513 ,
11831183 "file_size_in_bytes" : 388872 ,
11841184 "block_size_in_bytes" : 67108864 ,
@@ -1298,7 +1298,7 @@ def metadata_location_gz(tmp_path_factory: pytest.TempPathFactory) -> str:
12981298 "data_file" : {
12991299 "file_path" : "/home/iceberg/warehouse/nyc/taxis_partitioned/data/VendorID=1/00000-633-d8a4223e-dc97-45a1-86e1-adaba6e8abd7-00002.parquet" ,
13001300 "file_format" : "PARQUET" ,
1301- "partition" : {"VendorID" : 1 , "tpep_pickup_datetime " : None },
1301+ "partition" : {"VendorID" : 1 , "tpep_pickup_day " : None },
13021302 "record_count" : 95050 ,
13031303 "file_size_in_bytes" : 1265950 ,
13041304 "block_size_in_bytes" : 67108864 ,
@@ -1383,7 +1383,7 @@ def metadata_location_gz(tmp_path_factory: pytest.TempPathFactory) -> str:
13831383 {"key" : 3 , "value" : b"\x01 \x00 \x00 \x00 \x00 \x00 \x00 \x00 " },
13841384 {"key" : 4 , "value" : b"\x00 \x00 \x00 \x00 " },
13851385 {"key" : 5 , "value" : b"\x01 \x00 \x00 \x00 " },
1386- {"key" : 6 , "value" : b"N " },
1386+ {"key" : 6 , "value" : b"\x01 \x00 \x00 \x00 " },
13871387 {"key" : 7 , "value" : b"\x01 \x00 \x00 \x00 " },
13881388 {"key" : 8 , "value" : b"\x01 \x00 \x00 \x00 " },
13891389 {"key" : 9 , "value" : b"\x01 \x00 \x00 \x00 " },
@@ -1403,7 +1403,7 @@ def metadata_location_gz(tmp_path_factory: pytest.TempPathFactory) -> str:
14031403 {"key" : 3 , "value" : b"\x06 \x00 \x00 \x00 \x00 \x00 \x00 \x00 " },
14041404 {"key" : 4 , "value" : b"\x06 \x00 \x00 \x00 " },
14051405 {"key" : 5 , "value" : b"c\x00 \x00 \x00 " },
1406- {"key" : 6 , "value" : b"Y " },
1406+ {"key" : 6 , "value" : b"c \x00 \x00 \x00 " },
14071407 {"key" : 7 , "value" : b"\t \x01 \x00 \x00 " },
14081408 {"key" : 8 , "value" : b"\t \x01 \x00 \x00 " },
14091409 {"key" : 9 , "value" : b"\x04 \x00 \x00 \x00 " },
@@ -1677,7 +1677,7 @@ def avro_schema_manifest_entry() -> Dict[str, Any]:
16771677 {
16781678 "field-id" : 1001 ,
16791679 "default" : None ,
1680- "name" : "tpep_pickup_datetime " ,
1680+ "name" : "tpep_pickup_day " ,
16811681 "type" : ["null" , {"type" : "int" , "logicalType" : "date" }],
16821682 },
16831683 ],
@@ -1863,7 +1863,25 @@ def simple_map() -> MapType:
18631863@pytest .fixture (scope = "session" )
18641864def test_schema () -> Schema :
18651865 return Schema (
1866- NestedField (1 , "VendorID" , IntegerType (), False ), NestedField (2 , "tpep_pickup_datetime" , TimestampType (), False )
1866+ NestedField (1 , "VendorID" , IntegerType (), False ),
1867+ NestedField (2 , "tpep_pickup_datetime" , TimestampType (), False ),
1868+ NestedField (3 , "tpep_dropoff_datetime" , TimestampType (), False ),
1869+ NestedField (4 , "passenger_count" , LongType (), False ),
1870+ NestedField (5 , "trip_distance" , DoubleType (), False ),
1871+ NestedField (6 , "RatecodeID" , DoubleType (), False ),
1872+ NestedField (7 , "store_and_fwd_flag" , StringType (), False ),
1873+ NestedField (8 , "PULocationID" , IntegerType (), False ),
1874+ NestedField (9 , "DOLocationID" , IntegerType (), False ),
1875+ NestedField (10 , "payment_type" , LongType (), False ),
1876+ NestedField (11 , "fare_amount" , DoubleType (), False ),
1877+ NestedField (12 , "extra" , DoubleType (), False ),
1878+ NestedField (13 , "mta_tax" , DoubleType (), False ),
1879+ NestedField (14 , "tip_amount" , DoubleType (), False ),
1880+ NestedField (15 , "tolls_amount" , DoubleType (), False ),
1881+ NestedField (16 , "improvement_surcharge" , DoubleType (), False ),
1882+ NestedField (17 , "total_amount" , DoubleType (), False ),
1883+ NestedField (18 , "congestion_surcharge" , DoubleType (), False ),
1884+ NestedField (19 , "Airport_fee" , DoubleType (), False ),
18671885 )
18681886
18691887
@@ -1969,7 +1987,7 @@ def iceberg_manifest_entry_schema() -> Schema:
19691987 ),
19701988 NestedField (
19711989 field_id = 1001 ,
1972- name = "tpep_pickup_datetime " ,
1990+ name = "tpep_pickup_day " ,
19731991 field_type = DateType (),
19741992 required = False ,
19751993 ),
0 commit comments