in tools/pq.py [0:0]
def __iter__(self):
    """Yield batches from ``self._ds`` until the row cap is reached.

    Batches come from ``self._ds.to_batches`` using ``self._batch_size``
    and ``self._columns``. When ``self._num`` is truthy it acts as a row
    cap: iteration stops once the rows counted so far reach it. Batches
    are always yielded whole, so the total number of rows produced may
    exceed ``self._num`` by up to one batch. A falsy ``self._num``
    (``None`` or ``0``) disables the cap.

    Each batch is expected to expose its row count as ``data.num_rows``.
    """
    batches = self._ds.to_batches(
        batch_size=self._batch_size, columns=self._columns
    )
    # Read the cap once per iteration pass.
    limit = self._num
    rows_seen = 0

    # A non-positive but truthy cap (e.g. a negative number) is already
    # satisfied with zero rows, so nothing is yielded.
    if limit and rows_seen >= limit:
        return

    for record in batches:
        yield record
        rows_seen += record.data.num_rows
        # Check the cap *before* asking for the next batch so that no
        # batch is read from the dataset only to be thrown away.
        if limit and rows_seen >= limit:
            break