File: av_bench.py

package info (click to toggle)
avro-java 1.8.2-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, bullseye, forky, sid, trixie
  • size: 12,784 kB
  • sloc: java: 58,236; ansic: 27,618; cpp: 15,332; cs: 12,876; python: 10,443; xml: 6,338; php: 3,836; ruby: 3,158; perl: 1,656; sh: 733; lex: 203; yacc: 140; makefile: 7
file content (119 lines) | stat: -rw-r--r-- 3,194 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
#!/usr/bin/env python3
# -*- mode: python -*-
# -*- coding: utf-8 -*-

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import logging
import random
import string
import sys
import time

import avro.datafile
import avro.io
import avro.schema


# Name of the Avro data file that Write() creates and Read() reads back.
FILENAME = 'datafile.avr'

# Values that Write() picks from at random for each record's 'type' field.
TYPES = ('A', 'CNAME')


def GenerateRandomName():
  """Returns a random 15-character lowercase name.

  The characters are sampled without replacement from the 26 lowercase ASCII
  letters, so no letter appears twice in the result.
  """
  letters = random.sample(string.ascii_lowercase, k=15)
  return ''.join(letters)


def GenerateRandomIP():
  """Returns a random dotted-quad address string such as '10.0.255.3'.

  Each of the four parts is an independent random integer in [0, 255].
  """
  octets = [str(random.randint(0, 255)) for _ in range(4)]
  return '.'.join(octets)


def Write(nrecords):
  """Writes FILENAME as an Avro data file holding random 'Query' records.

  Every record carries three string fields: a random 'query' name, a random
  'response' address and a 'type' chosen at random from TYPES.

  Args:
    nrecords: Number of records to write.
  """
  schema_json = """
  {
    "type": "record",
    "name": "Query",
    "fields" : [
      {"name": "query", "type": "string"},
      {"name": "response", "type": "string"},
      {"name": "type", "type": "string", "default": "A"}
    ]
  }
  """
  query_schema = avro.schema.Parse(schema_json)
  datum_writer = avro.io.DatumWriter(query_schema)

  # No codec argument is passed (codec='deflate' is left disabled), so the
  # data file writer uses its default codec.
  with open(FILENAME, 'wb') as out_file, avro.datafile.DataFileWriter(
      out_file, datum_writer, query_schema) as data_writer:
    for _ in range(nrecords):
      # Draw order (address, name, type) is kept so the random number stream
      # is consumed exactly as before.
      response = GenerateRandomIP()
      query = GenerateRandomName()
      record_type = random.choice(TYPES)
      record = {
          'query': query,
          'response': response,
          'type': record_type,
      }
      data_writer.append(record)


def Read(expect_nrecords):
  """Reads the data file generated by Write() and checks its record count.

  Every record in FILENAME is decoded; only the number of records is kept.

  Args:
    expect_nrecords: Number of records the file is expected to contain.

  Raises:
    AssertionError: If the number of records read differs from
      expect_nrecords.
  """
  with open(FILENAME, 'rb') as f:
    reader = avro.io.DatumReader()
    with avro.datafile.DataFileReader(f, reader) as file_reader:
      # Iterating decodes each record; the records themselves are not needed.
      nrecords = sum(1 for _ in file_reader)

  # Raised explicitly (not via `assert`) so the check also runs under
  # `python -O`. The message previously referenced an undefined name, which
  # turned every count mismatch into a NameError.
  if nrecords != expect_nrecords:
    raise AssertionError(
        'Expecting %d records, got %d.' % (expect_nrecords, nrecords))


def Timing(f, *args):
  """Calls f(*args) once and returns how long the call took.

  Args:
    f: Callable to time.
    *args: Positional arguments forwarded to f.

  Returns:
    Elapsed time in seconds as a float. The return value of f is discarded.
  """
  # perf_counter() is a monotonic, high-resolution clock, so the measurement
  # cannot go negative or be skewed by wall-clock adjustments the way
  # time.time() can.
  start = time.perf_counter()
  f(*args)
  return time.perf_counter() - start


def Main(args):
  """Runs the write benchmark, then the read benchmark, printing both times.

  Args:
    args: Command-line arguments in sys.argv form. args[1] is the number of
      records to write and read back; any further arguments are ignored.

  Raises:
    SystemExit: If the record count is missing, is not an integer, or is
      negative. The exit message explains the problem.
  """
  if len(args) < 2:
    program = args[0] if args else 'av_bench.py'
    raise SystemExit('Usage: %s NRECORDS' % program)
  try:
    nrecords = int(args[1])
  except ValueError:
    raise SystemExit(
        'NRECORDS must be an integer, got %r' % (args[1],)) from None
  if nrecords < 0:
    # A negative count would write nothing and then fail the read check.
    raise SystemExit('NRECORDS must be non-negative, got %d' % nrecords)

  print('Write %0.4f' % Timing(Write, nrecords))
  print('Read %0.4f' % Timing(Read, nrecords))


if __name__ == '__main__':
  # Send every log record (DEBUG and above) through a stream handler, tagged
  # with timestamp, level and source location, before running the benchmark.
  handler = logging.StreamHandler()
  handler.setLevel(logging.DEBUG)
  handler.setFormatter(logging.Formatter(
      '%(asctime)s %(levelname)s %(filename)s:%(lineno)s : %(message)s'))

  root_logger = logging.root
  root_logger.setLevel(logging.DEBUG)
  root_logger.addHandler(handler)

  Main(sys.argv)