File: gen_interop_data.py

package info (click to toggle)
python-avro 1.10.1%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 1,624 kB
  • sloc: python: 11,437; xml: 4,061; sh: 752; java: 386; makefile: 21
file content (73 lines) | stat: -rw-r--r-- 2,324 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
#!/usr/bin/env python

##
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#     https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#
# See the License for the specific language governing permissions and
# limitations under the License.

from __future__ import absolute_import, division, print_function

import os
import sys

import avro.datafile
import avro.io
import avro.schema
from avro.codecs import Codecs

# Python 2/3 compatibility shim: evaluating the bare name raises NameError
# when no ``unicode`` builtin exists, in which case ``str`` is used instead.
try:
    unicode
except NameError:
    unicode = str

# Codec name for which generate() writes to the caller-supplied output path
# unchanged; every other codec gets a "_<codec>" suffix before the extension.
NULL_CODEC = 'null'
# Codec names generate() iterates over, as reported by the avro library.
CODECS_TO_VALIDATE = Codecs.supported_codec_names()

# The single record that generate() appends to every output file.
# NOTE(review): keys presumably mirror the field names of the interop schema
# passed to generate() -- confirm against the schema file.
DATUM = {
    # Scalar values.
    'intField': 12,
    'longField': 15234324,
    'stringField': unicode('hey'),
    'boolField': True,
    'floatField': 1234.0,
    'doubleField': -1234.0,
    'bytesField': b'12312adf',
    'nullField': None,
    # Container values.
    'arrayField': [5.0, 0.0, 12.0],
    'mapField': {
        unicode('a'): {'label': unicode('a')},
        unicode('bee'): {'label': unicode('cee')},
    },
    # Union, enum and fixed values.
    'unionField': 12.0,
    'enumField': 'C',
    'fixedField': b'1019181716151413',
    # Nested record with one child that itself has no children.
    'recordField': {
        'label': unicode('blah'),
        'children': [
            {'label': unicode('inner'), 'children': []},
        ],
    },
}


def generate(schema_path, output_path):
    """Write one Avro data file containing ``DATUM`` per codec to validate.

    The schema is parsed from the text of ``schema_path``. For the null codec
    the data file is written to ``output_path`` itself; for every other codec
    in ``CODECS_TO_VALIDATE`` the codec name is inserted before the extension
    (``out.avro`` becomes ``out_<codec>.avro``).

    :param schema_path: path of the schema file whose contents are handed to
        ``avro.schema.parse``.
    :param output_path: path used for the null-codec file and as the template
        for the other codecs' file names.
    """
    with open(schema_path, 'r') as schema_file:
        interop_schema = avro.schema.parse(schema_file.read())
    # The split does not depend on the codec, so do it once up front.
    base, ext = os.path.splitext(output_path)
    for codec in CODECS_TO_VALIDATE:
        filename = output_path
        if codec != NULL_CODEC:
            filename = base + "_" + codec + ext
        # Give the file its own ``with`` so the handle is released even if
        # constructing the DataFileWriter raises. If the writer also closes
        # the file on exit, the second close of a file object is a no-op.
        with open(filename, 'wb') as output_file:
            with avro.datafile.DataFileWriter(output_file, avro.io.DatumWriter(),
                                              interop_schema, codec=codec) as dfw:
                dfw.append(DATUM)


if __name__ == "__main__":
    # Usage: gen_interop_data.py <schema_path> <output_path>
    schema_arg = sys.argv[1]
    output_arg = sys.argv[2]
    generate(schema_arg, output_arg)