File: test_thrift_structures.py

package info (click to toggle)
python-fastparquet 2024.2.0-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 120,180 kB
  • sloc: python: 8,181; makefile: 187
file content (28 lines) | stat: -rw-r--r-- 686 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
import copy
import os
import pickle

from fastparquet import ParquetFile
from .util import TEST_DATA
from fastparquet.schema import schema_tree

# Module-level fixture shared by the tests below: the path to the
# "nation.impala.parquet" sample under TEST_DATA, and a ParquetFile opened on
# it once at import time.
fn = os.path.join(TEST_DATA, "nation.impala.parquet")
pf = ParquetFile(fn)


def test_serialize():
    """Check that file metadata and a row group survive a pickle round trip."""

    def roundtrip(obj):
        # Serialize and immediately deserialize through pickle.
        return pickle.loads(pickle.dumps(obj))

    restored_fmd = roundtrip(pf.fmd)
    # The restored schema names are decoded by hand here, mirroring what
    # would have been done during ParquetFile instantiation.
    for element in restored_fmd.schema:
        element.name = element.name.decode()
    assert str(restored_fmd) == str(pf.fmd)

    first_group = pf.row_groups[0]
    restored_group = roundtrip(first_group)
    assert first_group == restored_group


def test_copy():
    """Check that copy.copy of the file metadata gives a distinct, equal-content object."""
    duplicate = copy.copy(pf.fmd)
    # Must be a new object, not merely another reference to the original.
    assert duplicate is not pf.fmd
    # The row groups of the duplicate must still compare equal to the original's.
    assert duplicate.row_groups == pf.fmd.row_groups