File: rainbow-ac.pl

package info (click to toggle)
bow 19991122-4
  • links: PTS
  • area: main
  • in suites: woody
  • size: 2,544 kB
  • ctags: 2,987
  • sloc: ansic: 38,660; lisp: 1,072; makefile: 594; perl: 492; yacc: 149; sh: 91
file content (104 lines) | stat: -rwxr-xr-x 2,737 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
#!/usr/bin/perl
# The above line is modified by ./Makefile to match the system's
# installed location for Perl.

# Usage synopsis printed by usage_msg() when the command line is invalid.
$usage = <<USAGE;
USAGE: ac [-bins] interval classes|'all' < andrew-files
USAGE

# Optional leading -bins flag.  When set, the reporting loop resets its
# correct/predicted counters after every output line, so each line
# describes one bin instead of a running total.
if (@ARGV && $ARGV[0] eq '-bins')
{
    $bins = 1;
    shift @ARGV;
}

# Remaining arguments: the coverage step (in percent) between output
# points, followed by the class names to evaluate (or the word 'all').
($interval, @classes) = @ARGV;

# The interval must have a strictly positive numeric value.  A zero,
# negative or non-numeric interval would never let the reporting loop
# advance past the current coverage, so reject it here together with a
# missing class list.
usage_msg() unless defined($interval) && $interval > 0 && @classes;


if (@classes == 1 && $classes[0] eq 'all')
{
    # A single class argument of 'all' selects every class.
    $all_classes = 1;
}
else
{
    # Otherwise build a lookup set of the requested class names.
    for (@classes) { $classes{$_} = 1 }
}


# Read classification results from STDIN into @predictions.
#
# Each usable line has at least three whitespace-separated fields: the
# first is ignored, the second is the actual class, and the third has the
# form "predicted_class:confidence".  Lines that do not match are skipped
# silently.  Every accepted line is stored as the array reference
#     [ confidence, predicted_class, actual_class ]
print STDERR "Reading...\n";

while (defined(my $line = <STDIN>))
{
    next unless $line =~ /^\S+\s+(\S+)\s+(\S+)/;
    my ($actual_class, $predicted) = ($1, $2);

    next unless $predicted =~ /([^:]+):(.*)/;
    my ($predicted_class, $confidence) = ($1, $2);

    push(@predictions,
         [ $confidence, $predicted_class, $actual_class ]);
}

# Report the number of records read.  The array must be evaluated in
# scalar context to get its length; the scalar $predictions is never set.
print STDERR "Got ", scalar(@predictions), " records.\nSorting...\n";

# Comparator: order prediction records by their confidence (element 0),
# highest first, comparing numerically.
sub by_descending_confidence { $b->[0] <=> $a->[0] }

# First coverage percentage at which a result line will be printed.
$at_interval = $interval;

@predictions = sort by_descending_confidence @predictions;

print STDERR "Coverage  Accuracy\n";

# Count the records whose actual class (element 2) is one of the selected
# classes; this total is the denominator of the coverage percentage.
foreach my $record (@predictions)
{
    my $actual = $record->[2];
    next unless $all_classes || $classes{$actual};
    $seen_count++;
}


# Walk @predictions in array order (sorted by descending confidence
# earlier in the script) and print one result line to STDOUT each time
# the coverage reaches the next reporting point.
#
# Each record is [ confidence, predicted_class, actual_class ].
#
#   coverage = 100 * (correct predictions for selected classes so far)
#                  / $seen_count
#   accuracy = 100 * $correct_count / $predicted_count
#
# When $bins is set, $correct_count and $predicted_count are reset after
# every line, so accuracy is per bin; otherwise it is cumulative.
#
# Both divisions are guarded: a zero denominator yields 0 instead of
# aborting the script with "Illegal division by zero".
my $report_format =
    "%6.2f  %8.2f (%3d correct of %3d predicted, %7f confidence)\n";

$correct_count = $predicted_count = $all_correct_count = 0;
$cov_percent = 0;
$final_confidence = 0;

for ($index = 0; $index < @predictions; $index++)
{
    $prediction = $predictions[$index];

    # Only predictions whose predicted class is selected are counted.
    if ($all_classes || $classes{$prediction->[1]})
    {
        ++$predicted_count;
        ++$correct_count, ++$all_correct_count
            if $prediction->[1] eq $prediction->[2];
    }

    # $seen_count is zero when no record's actual class is selected.
    $cov_percent = $seen_count
        ? 100 * $all_correct_count / $seen_count
        : 0;

    # If we've come to a reporting point and there are more predictions
    # left, and the score of this prediction is not the same as the
    # score of the next one, then we can output a point here.
    if (($cov_percent >= $at_interval) &&
        ($index < (@predictions - 1)) &&
        ($prediction->[0] != $predictions[$index + 1]->[0]))
    {
        $acc_percent = $predicted_count
            ? 100 * $correct_count / $predicted_count
            : 0;
        $at_interval += $interval;
        printf($report_format, $cov_percent, $acc_percent,
               $correct_count, $predicted_count, $prediction->[0]);
#       print $cov_percent, ' ', $acc_percent, "\n";
        $correct_count = $predicted_count = 0 if $bins;

        # Figure out what our next output point should be.  The step
        # must be positive, otherwise this loop could never terminate.
        while ($interval > 0 && $at_interval <= $cov_percent) {
            $at_interval += $interval;
        }
    }

#    print $seen_count, ' ', $predicted_count, ' ', $correct_count, "\n";
    $final_confidence = $prediction->[0];
}

# Final line: whatever has accumulated since the last report (or over the
# whole run when not binning).  $predicted_count may legitimately be zero
# here, e.g. for empty input or an empty last bin.
$acc_percent = $predicted_count
    ? 100 * $correct_count / $predicted_count
    : 0;
printf($report_format, $cov_percent, $acc_percent,
       $correct_count, $predicted_count, $final_confidence);

# Write the usage synopsis held in $usage to STDERR and terminate the
# script with exit status 1.  Does not return to the caller.
sub usage_msg {
    print {*STDERR} $usage;
    exit(1);
}