@@ -700,6 +700,137 @@ parent_id: [[null,4358109269873137077,null,4358109269873137077]]
700
700
is_current_ancestor: [[true,false,true,true]]
701
701
```
702
702
703
+ ### Files
704
+
705
+ Inspect the data files in the current snapshot of the table:
706
+
707
+ ``` python
708
+ table.inspect.files()
709
+ ```
710
+
711
+ ```
712
+ pyarrow.Table
713
+ content: int8 not null
714
+ file_path: string not null
715
+ file_format: dictionary<values=string, indices=int32, ordered=0> not null
716
+ spec_id: int32 not null
717
+ record_count: int64 not null
718
+ file_size_in_bytes: int64 not null
719
+ column_sizes: map<int32, int64>
720
+ child 0, entries: struct<key: int32 not null, value: int64> not null
721
+ child 0, key: int32 not null
722
+ child 1, value: int64
723
+ value_counts: map<int32, int64>
724
+ child 0, entries: struct<key: int32 not null, value: int64> not null
725
+ child 0, key: int32 not null
726
+ child 1, value: int64
727
+ null_value_counts: map<int32, int64>
728
+ child 0, entries: struct<key: int32 not null, value: int64> not null
729
+ child 0, key: int32 not null
730
+ child 1, value: int64
731
+ nan_value_counts: map<int32, int64>
732
+ child 0, entries: struct<key: int32 not null, value: int64> not null
733
+ child 0, key: int32 not null
734
+ child 1, value: int64
735
+ lower_bounds: map<int32, binary>
736
+ child 0, entries: struct<key: int32 not null, value: binary> not null
737
+ child 0, key: int32 not null
738
+ child 1, value: binary
739
+ upper_bounds: map<int32, binary>
740
+ child 0, entries: struct<key: int32 not null, value: binary> not null
741
+ child 0, key: int32 not null
742
+ child 1, value: binary
743
+ key_metadata: binary
744
+ split_offsets: list<item: int64>
745
+ child 0, item: int64
746
+ equality_ids: list<item: int32>
747
+ child 0, item: int32
748
+ sort_order_id: int32
749
+ readable_metrics: struct<city: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: large_string, upper_bound: large_string> not null, lat: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: double, upper_bound: double> not null, long: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: double, upper_bound: double> not null>
750
+ child 0, city: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: large_string, upper_bound: large_string> not null
751
+ child 0, column_size: int64
752
+ child 1, value_count: int64
753
+ child 2, null_value_count: int64
754
+ child 3, nan_value_count: int64
755
+ child 4, lower_bound: large_string
756
+ child 5, upper_bound: large_string
757
+ child 1, lat: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: double, upper_bound: double> not null
758
+ child 0, column_size: int64
759
+ child 1, value_count: int64
760
+ child 2, null_value_count: int64
761
+ child 3, nan_value_count: int64
762
+ child 4, lower_bound: double
763
+ child 5, upper_bound: double
764
+ child 2, long: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: double, upper_bound: double> not null
765
+ child 0, column_size: int64
766
+ child 1, value_count: int64
767
+ child 2, null_value_count: int64
768
+ child 3, nan_value_count: int64
769
+ child 4, lower_bound: double
770
+ child 5, upper_bound: double
771
+ ----
772
+ content: [[0,0]]
773
+ file_path: [["s3://warehouse/default/table_metadata_files/data/00000-0-9ea7d222-6457-467f-bad5-6fb125c9aa5f.parquet","s3://warehouse/default/table_metadata_files/data/00000-0-afa8893c-de71-4710-97c9-6b01590d0c44.parquet"]]
774
+ file_format: [["PARQUET","PARQUET"]]
775
+ spec_id: [[0,0]]
776
+ record_count: [[3,3]]
777
+ file_size_in_bytes: [[5459,5459]]
778
+ column_sizes: [[keys:[1,2,3,4,5,...,8,9,10,11,12]values:[49,78,128,94,118,...,118,118,94,78,109],keys:[1,2,3,4,5,...,8,9,10,11,12]values:[49,78,128,94,118,...,118,118,94,78,109]]]
779
+ value_counts: [[keys:[1,2,3,4,5,...,8,9,10,11,12]values:[3,3,3,3,3,...,3,3,3,3,3],keys:[1,2,3,4,5,...,8,9,10,11,12]values:[3,3,3,3,3,...,3,3,3,3,3]]]
780
+ null_value_counts: [[keys:[1,2,3,4,5,...,8,9,10,11,12]values:[1,1,1,1,1,...,1,1,1,1,1],keys:[1,2,3,4,5,...,8,9,10,11,12]values:[1,1,1,1,1,...,1,1,1,1,1]]]
781
+ nan_value_counts: [[keys:[]values:[],keys:[]values:[]]]
782
+ lower_bounds: [[keys:[1,2,3,4,5,...,8,9,10,11,12]values:[00,61,61616161616161616161616161616161,01000000,0100000000000000,...,009B6ACA38F10500,009B6ACA38F10500,9E4B0000,01,00000000000000000000000000000000],keys:[1,2,3,4,5,...,8,9,10,11,12]values:[00,61,61616161616161616161616161616161,01000000,0100000000000000,...,009B6ACA38F10500,009B6ACA38F10500,9E4B0000,01,00000000000000000000000000000000]]]
783
+ upper_bounds: [[keys:[1,2,3,4,5,...,8,9,10,11,12]values:[00,61,61616161616161616161616161616161,01000000,0100000000000000,...,009B6ACA38F10500,009B6ACA38F10500,9E4B0000,01,00000000000000000000000000000000],keys:[1,2,3,4,5,...,8,9,10,11,12]values:[00,61,61616161616161616161616161616161,01000000,0100000000000000,...,009B6ACA38F10500,009B6ACA38F10500,9E4B0000,01,00000000000000000000000000000000]]]
784
+ key_metadata: [[0100,0100]]
785
+ split_offsets: [[[],[]]]
786
+ equality_ids: [[[],[]]]
787
+ sort_order_id: [[null,null]]
788
+ readable_metrics: [
789
+ -- is_valid: all not null
790
+ -- child 0 type: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: large_string, upper_bound: large_string>
791
+ -- is_valid: all not null
792
+ -- child 0 type: int64
793
+ [140]
794
+ -- child 1 type: int64
795
+ [4]
796
+ -- child 2 type: int64
797
+ [0]
798
+ -- child 3 type: int64
799
+ [null]
800
+ -- child 4 type: large_string
801
+ ["Amsterdam"]
802
+ -- child 5 type: large_string
803
+ ["San Francisco"]
804
+ -- child 1 type: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: double, upper_bound: double>
805
+ -- is_valid: all not null
806
+ -- child 0 type: int64
807
+ [135]
808
+ -- child 1 type: int64
809
+ [4]
810
+ -- child 2 type: int64
811
+ [0]
812
+ -- child 3 type: int64
813
+ [null]
814
+ -- child 4 type: double
815
+ [37.773972]
816
+ -- child 5 type: double
817
+ [53.11254]
818
+ -- child 2 type: struct<column_size: int64, value_count: int64, null_value_count: int64, nan_value_count: int64, lower_bound: double, upper_bound: double>
819
+ -- is_valid: all not null
820
+ -- child 0 type: int64
821
+ [135]
822
+ -- child 1 type: int64
823
+ [4]
824
+ -- child 2 type: int64
825
+ [0]
826
+ -- child 3 type: int64
827
+ [null]
828
+ -- child 4 type: double
829
+ [-122.431297]
830
+ -- child 5 type: double
831
+ [6.0989]]
832
+ ```
833
+
703
834
## Add Files
704
835
705
836
Expert Iceberg users may choose to commit existing Parquet files to the Iceberg table as data files, without rewriting them.
0 commit comments