API

parquetranger Package

Read and write Parquet files.

Classes

DfBatchWriter(trepo, record_limit, ...)

HashPartitioner([col, num_groups])

ObjIngestor(root[, root_id_key, force_key, ...])

RecordWriter(trepo, record_limit, ...)

TableRepo(root_path[, max_records, ...])

Helps with storing, extending, and reading tabular data in Parquet format.

Class Inheritance Diagram

digraph inheritance114b48ec0a { bgcolor=transparent; rankdir=LR; size="8.0, 12.0"; "DfBatchWriter" [URL="api/parquetranger.DfBatchWriter.html#parquetranger.DfBatchWriter",fillcolor=white,fontname="Vera Sans, DejaVu Sans, Liberation Sans, Arial, Helvetica, sans",fontsize=10,height=0.25,shape=box,style="setlinewidth(0.5),filled",target="_top",tooltip="DfBatchWriter(trepo: parquetranger.core.TableRepo, record_limit: int = 1000000, writer_function: Callable = <function TableRepo.extend at 0x7f2e2bef2dd0>, batch: list = <factory>)"]; "RecordWriter" -> "DfBatchWriter" [arrowsize=0.5,style="setlinewidth(0.5)"]; "HashPartitioner" [URL="api/parquetranger.HashPartitioner.html#parquetranger.HashPartitioner",fillcolor=white,fontname="Vera Sans, DejaVu Sans, Liberation Sans, Arial, Helvetica, sans",fontsize=10,height=0.25,shape=box,style="setlinewidth(0.5),filled",target="_top",tooltip="HashPartitioner(col: str | None = None, num_groups: int = 128)"]; "ObjIngestor" [URL="api/parquetranger.ObjIngestor.html#parquetranger.ObjIngestor",fillcolor=white,fontname="Vera Sans, DejaVu Sans, Liberation Sans, Arial, Helvetica, sans",fontsize=10,height=0.25,shape=box,style="setlinewidth(0.5),filled",target="_top",tooltip="ObjIngestor(root: pathlib.Path, root_id_key: Optional[str] = None, force_key: bool = False, forward_uuids: bool = False, total_atoms: int = 0, largest_size: int = 0)"]; "RecordWriter" [URL="api/parquetranger.RecordWriter.html#parquetranger.RecordWriter",fillcolor=white,fontname="Vera Sans, DejaVu Sans, Liberation Sans, Arial, Helvetica, sans",fontsize=10,height=0.25,shape=box,style="setlinewidth(0.5),filled",target="_top",tooltip="RecordWriter(trepo: parquetranger.core.TableRepo, record_limit: int = 1000000, writer_function: Callable = <function TableRepo.extend at 0x7f2e2bef2dd0>, batch: list = <factory>)"]; "TableRepo" [URL="api/parquetranger.TableRepo.html#parquetranger.TableRepo",fillcolor=white,fontname="Vera Sans, DejaVu Sans, Liberation Sans, Arial, Helvetica, sans",fontsize=10,height=0.25,shape=box,style="setlinewidth(0.5),filled",target="_top",tooltip="helps with storing, extending and reading tabular data in parquet format"]; }