|
# Polars I/O and interoperability walkthrough.
#
# Writes one small frame to disk as CSV, newline-delimited JSON and Parquet,
# reads each file back both eagerly (read_*) and lazily (scan_*), and then
# converts the same sample data between polars, pandas and NumPy.
import numpy as np
import pandas as pd
import polars as pl

# Column data shared by every sample frame built below.
SAMPLE_COLUMNS = {"A": [1, 2, 3, 4, 5], "B": [6, 7, 8, 9, 10]}

# Output files; the names are relative, so they land in the current
# working directory.
CSV_PATH = "data.csv"
NDJSON_PATH = "data.json"  # written with write_ndjson despite the .json suffix
PARQUET_PATH = "data.parquet"

data = pl.DataFrame(SAMPLE_COLUMNS)

# ---------------------------------------------------------------------------
# Write the frame out once per format.
# ---------------------------------------------------------------------------
data.write_csv(CSV_PATH)
data.write_ndjson(NDJSON_PATH)
data.write_parquet(PARQUET_PATH)

# ---------------------------------------------------------------------------
# Read each file back: an eager read, then a lazy scan whose schema is printed.
# ---------------------------------------------------------------------------
data_csv = pl.read_csv(CSV_PATH)
data_csv_lazy = pl.scan_csv(CSV_PATH)
print(data_csv_lazy.schema)

data_json = pl.read_ndjson(NDJSON_PATH)
data_json_lazy = pl.scan_ndjson(NDJSON_PATH)
print(data_json_lazy.schema)

data_parquet = pl.read_parquet(PARQUET_PATH)
data_parquet_lazy = pl.scan_parquet(PARQUET_PATH)
print(data_parquet_lazy.schema)

# ---------------------------------------------------------------------------
# The same sample data held by three different libraries.
# ---------------------------------------------------------------------------
polars_data = pl.DataFrame(SAMPLE_COLUMNS)
pandas_data = pd.DataFrame(SAMPLE_COLUMNS)

# Built as two rows and transposed, giving five rows of two values so the
# two columns line up with "A" and "B" in the schema passed to from_numpy.
numpy_data = np.array(
    [
        [1, 2, 3, 4, 5],
        [6, 7, 8, 9, 10],
    ]
).T

# ---------------------------------------------------------------------------
# Conversions into polars ...
# ---------------------------------------------------------------------------
print(pl.from_pandas(pandas_data))

print(
    pl.from_numpy(
        numpy_data,
        schema={"A": pl.Int64, "B": pl.Int64},
    )
)

# ---------------------------------------------------------------------------
# ... and back out of polars.
# ---------------------------------------------------------------------------
print(polars_data.to_pandas())

print(polars_data.to_numpy())
0 commit comments