File: test_3154_parquet_subcolumn_select.py

package info (click to toggle)
python-awkward 2.8.9-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 24,932 kB
  • sloc: python: 178,875; cpp: 33,828; sh: 432; makefile: 21; javascript: 8
file content (39 lines) | stat: -rw-r--r-- 1,109 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
# BSD 3-Clause License; see https://github.com/scikit-hep/awkward/blob/main/LICENSE

from __future__ import annotations

import os

import pytest

import awkward as ak

pa = pytest.importorskip("pyarrow")
pq = pytest.importorskip("pyarrow.parquet")


def test_parquet_subcolumn_select(tmp_path):
    ak_tbl = ak.Array(
        {
            "a": [
                {"lbl": "item 1", "idx": 11, "ids": [1, 2, 3]},
                {"lbl": "item 2", "idx": 12, "ids": [51, 52]},
                {"lbl": "item 3", "idx": 13, "ids": [61, 62, 63, 64]},
            ],
            "b": [
                [[111, 112], [121, 122]],
                [[211, 212], [221, 222]],
                [[311, 312], [321, 322]],
            ],
        }
    )
    parquet_file = os.path.join(tmp_path, "test_3514.parquet")
    ak.to_parquet(ak_tbl, parquet_file)

    selection = ak.from_parquet(parquet_file, columns=["a.ids", "b"])
    assert selection["a"].to_list() == [
        {"ids": [1, 2, 3]},
        {"ids": [51, 52]},
        {"ids": [61, 62, 63, 64]},
    ]
    assert selection["b"].to_list() == ak_tbl["b"].to_list()