File: compare.collation.benchmark.tables.pl

package info (click to toggle)
lucene-solr 3.6.2%2Bdfsg-24
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 91,200 kB
  • sloc: java: 465,555; xml: 24,939; javascript: 5,291; ruby: 3,453; jsp: 2,637; python: 1,619; sh: 1,556; perl: 1,407; cpp: 305; makefile: 39
file content (91 lines) | stat: -rw-r--r-- 3,591 bytes parent folder | download | duplicates (19)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
#!/usr/bin/perl
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements.  See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License.  You may obtain a copy of the License at
# 
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# ------------------------------------------
# compare.collation.benchmark.jira.tables.pl
#
# Takes as cmdline parameters two JIRA-formatted benchmark results, as produced
# by bm2jira.pl (located in the same directory as this script), and outputs a
# third JIRA-formatted comparison table, showing the differences between two
# benchmarking runs' java.text and ICU4J columns, after accounting for the
# KeywordAnalyzer column; the "ICU4J Improvement" column is ignored.
#
# The difference is calculated as a percentage:
#
#   100 * (patched-rate - unpatched-rate / unpatched-rate)
#
# where the (un)patched-rate is:
#
#   1 / ( elapsed-(un)patched-time - elapsed-KeywordAnalyzer-time)
#

use strict;
use warnings;

my $usage = "Usage: $0 <unpatched-file> <patched-file>\n";

die $usage unless ($#ARGV == 1 && -f $ARGV[0] && -f $ARGV[1]);

my %stats = ();

open UNPATCHED, "<$ARGV[0]" || die "ERROR opening '$ARGV[0]': $!";
while (<UNPATCHED>) {
  # ||Language||java.text||ICU4J||KeywordAnalyzer||ICU4J Improvement||
  # |English|4.51s|2.47s|1.47s|204%|
  next unless (/^\|([^|]+)\|([^|s]+)s\|([^|s]+)s\|([^|s]+)s/);
  my ($lang, $jdk_elapsed, $icu_elapsed, $keyword_analyzer_elapsed)
    = ($1, $2, $3, $4);
  $stats{unpatched}{$lang}{jdk} = $jdk_elapsed;
  $stats{unpatched}{$lang}{icu} = $icu_elapsed;
  $stats{unpatched}{$lang}{keyword_analyzer} = $keyword_analyzer_elapsed;
}
close UNPATCHED;

open PATCHED, "<$ARGV[1]" || die "ERROR opening '$ARGV[1]': $!";
while (<PATCHED>) {
  # ||Language||java.text||ICU4J||KeywordAnalyzer||ICU4J Improvement||
  # |English|4.51s|2.47s|1.47s|204%|
  next unless (/^\|([^|]+)\|([^|s]+)s\|([^|s]+)s\|([^|s]+)s/);
  my ($lang, $jdk_elapsed, $icu_elapsed, $keyword_analyzer_elapsed)
    = ($1, $2, $3, $4);
  $stats{patched}{$lang}{jdk} = $jdk_elapsed;
  $stats{patched}{$lang}{icu} = $icu_elapsed;
  $stats{patched}{$lang}{keyword_analyzer} = $keyword_analyzer_elapsed;
}
close PATCHED;

print "||Language||java.text improvement||ICU4J improvement||\n";
for my $lang (sort keys %{$stats{unpatched}}) {
  my $keyword_analyzer1 = $stats{unpatched}{$lang}{keyword_analyzer};
  my $jdk1 = $stats{unpatched}{$lang}{jdk};
  my $jdk_diff1 = $jdk1 - $keyword_analyzer1;
  my $icu1 = $stats{unpatched}{$lang}{icu};
  my $icu_diff1 = $icu1 - $keyword_analyzer1;

  my $keyword_analyzer2 = $stats{patched}{$lang}{keyword_analyzer};
  my $jdk2 = $stats{patched}{$lang}{jdk};
  my $jdk_diff2 = $jdk2 - $keyword_analyzer2;
  my $icu2 = $stats{patched}{$lang}{icu};
  my $icu_diff2 = $icu2 - $keyword_analyzer2;

  my $jdk_impr 
    = int((1./$jdk_diff2 - 1./$jdk_diff1) / (1./$jdk_diff1) * 1000 + 5) / 10;
  my $icu_impr
    = int((1./$icu_diff2 - 1./$icu_diff1) / (1./$icu_diff1) * 1000 + 5) / 10;

  printf "|$lang|%2.1f%%|%2.1f%%|\n", $jdk_impr, $icu_impr;
}