File: rainbow-pr.pl

package info (click to toggle)
bow 19991122-4
  • links: PTS
  • area: main
  • in suites: woody
  • size: 2,544 kB
  • ctags: 2,987
  • sloc: ansic: 38,660; lisp: 1,072; makefile: 594; perl: 492; yacc: 149; sh: 91
file content (119 lines) | stat: -rwxr-xr-x 3,393 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
#!/usr/bin/perl
# The above line is modified by ./Makefile to match the system's
# installed location for Perl.

# Usage summary printed by usage_msg() when the command line is unusable.
$usage = <<USAGE;
USAGE: pr [-bins] interval class < andrew-files
USAGE

# An optional leading -bins flag selects the per-bin report.
if (@ARGV && $ARGV[0] eq '-bins')
{
    $bins = 1;
    shift @ARGV;
}

# Remaining positional arguments: the reporting step, in percent, and the
# class whose predictions are evaluated.
($interval, $class) = @ARGV;

# The interval is repeatedly added to a percentage threshold, so it has to
# be a positive number.  A non-numeric string numifies to 0 and a negative
# value moves the threshold backwards; either would keep the threshold
# from ever passing the current coverage.  The class only has to be a
# non-empty string, which also admits a class literally named "0".
usage_msg()
    unless defined $interval && $interval > 0
        && defined $class && length $class;

# Collect, for every input line, the score that was assigned to $class.
#
# A usable line has the shape
#     <field> <actual-class> <class>:<score> <class>:<score> ...
# Lines that do not match are skipped.  Only the first <class>:<score>
# pair whose class equals $class is kept for a line; it is stored in
# @predictions as [ score, predicted class, actual class ].
print STDERR "Reading...\n";

LINE: while (defined($line = <STDIN>))
{
    # A list assignment in boolean context is true only if the match
    # produced captures.
    next LINE
        unless ($actual_class, $predicted) = $line =~ /^\S+\s+(\S+)\s+(.*)/;

    PAIR: foreach $pred (split(/\s+/, $predicted))
    {
        next PAIR
            unless ($predicted_class, $confidence) = $pred =~ /([^:]+):(.*)/;
        next PAIR
            unless $predicted_class eq $class;

        push(@predictions, [ $confidence, $predicted_class, $actual_class ]);
        last PAIR;
    }
}

print STDERR "Sorting...\n";

# Rank the collected entries by score, highest first (numeric comparison).
@predictions = sort { $b->[0] <=> $a->[0] } @predictions;

# Report how accurate the predictions for $class are, walking @predictions
# in its current order.  Each entry of @predictions is
# [ score, predicted class, actual class ].
#
# Every report row uses the same layout: coverage %, accuracy %, number
# correct, number predicted, and the score of the prediction at which the
# row was emitted.
my $row_format = "%6.2f  %8.2f (%3d correct of %3d predicted, %7f confidence)\n";

if ($bins)
{
    # This caveat is a diagnostic, so it goes to STDERR like the other
    # progress messages and ends with a newline; otherwise the first
    # report row would be appended to it on the same STDOUT line.
    print STDERR "The -bins option does not take care of predictions with identical scores properly. Look at the code and see if you want to fix it :).\n";

    my $example_count = @predictions;
    my $at_interval   = $interval;
    my ($predicted_count, $bin_count, $correct_count) = (0, 0, 0);

    for my $prediction (@predictions)
    {
        ++$predicted_count;
        ++$bin_count;
        ++$correct_count if $prediction->[2] eq $class;

        # Here coverage is the share of all collected predictions
        # consumed so far.
        my $cov_percent = 100 * $predicted_count / $example_count;

        if ($cov_percent >= $at_interval)
        {
            # Accuracy is computed over the current bin only; both bin
            # counters restart after each row.
            my $acc_percent = 100 * $correct_count / $bin_count;
            $at_interval += $interval;
            printf($row_format, $cov_percent, $acc_percent,
                   $correct_count, $bin_count, $prediction->[0]);
            $bin_count     = 0;
            $correct_count = 0;
        }
    }

    # NOTE: predictions that follow the last threshold reached (a trailing
    # partial bin) are not reported.
}
else
{
    my $at_interval = $interval;

    print STDERR "Coverage  Accuracy\n";

    # Number of collected entries whose actual class is $class; this is
    # the denominator of the coverage figure.
    my $seen_count = grep { $_->[2] eq $class } @predictions;

    # Without any such entry (which includes an empty @predictions) both
    # percentages below would divide by zero, so stop with a clear message.
    die "No examples whose actual class is '$class' were found; nothing to report.\n"
        unless $seen_count;

    my ($predicted_count, $correct_count) = (0, 0);
    my ($cov_percent, $acc_percent);

    for my $index (0 .. $#predictions)
    {
        my $prediction = $predictions[$index];

        ++$predicted_count;
        ++$correct_count if $prediction->[2] eq $class;

        $cov_percent = 100 * $correct_count / $seen_count;

        # Emit a row once coverage has reached the current threshold, but
        # never between two predictions with the same score, and never for
        # the last prediction (the summary row after the loop covers it).
        if (($cov_percent >= $at_interval) &&
            ($index < $#predictions) &&
            ($prediction->[0] != $predictions[$index + 1]->[0]))
        {
            $acc_percent = 100 * $correct_count / $predicted_count;
            printf($row_format, $cov_percent, $acc_percent,
                   $correct_count, $predicted_count, $prediction->[0]);

            # Move the threshold to the first step above the coverage
            # already reached, so one row cannot satisfy several steps.
            $at_interval += $interval;
            while ($at_interval <= $cov_percent) {
                $at_interval += $interval;
            }
        }
    }

    # Final row: cumulative figures over every collected prediction.
    $acc_percent = 100 * $correct_count / $predicted_count;
    printf($row_format, $cov_percent, $acc_percent,
           $correct_count, $predicted_count, $predictions[-1]->[0]);
}

# Write the usage summary held in $usage to STDERR and end the script
# with exit status 1.  Does not return.
sub usage_msg
{
    print {*STDERR} $usage;
    exit(1);
}