Extract data from Parquet files. Parquet is a columnar storage format optimized for analytical workloads, offering efficient compression and fast read performance for large datasets.
Examples
Data frame
Description
Documentation
Code
<?php
declare(strict_types=1);
use function Flow\ETL\Adapter\Parquet\from_parquet;
use function Flow\ETL\DSL\{data_frame, to_output};
require __DIR__ . '/vendor/autoload.php';
// Location of the Parquet file, resolved relative to this script's directory.
$parquetPath = __DIR__ . '/input/dataset.parquet';

// Start a new data frame and register the Parquet extractor as its source.
$frame = data_frame()->read(from_parquet($parquetPath));

// NOTE(review): collect() presumably gathers all extracted rows into a single
// batch before they are written — confirm against the Flow documentation.
$collected = $frame->collect();

// Register the output writer with truncation switched off, then execute the pipeline.
$collected
    ->write(to_output(truncate: false))
    ->run();