CS-Score-MASTER.pl

#!/usr/bin/perl

use warnings;
use strict;
use utf8;
use Carp;

binmode(STDOUT, ":utf8");
binmode(STDERR, ":utf8");

### DO NOT INCLUDE
use ColdStartLib;

### DO INCLUDE
##################################################################################### 
# This program scores Cold Start 2015 submissions. It takes as input
# the evaluation queries, the appropriate assessment files, and a
# submission file. The submission file is either a Slot Filling
# variant submission file, or the result of applying the evaluation
# queries to a submitted knowledge base (typically obtained by running
# CS-ResolveQueries.pl)
#
# Authors: James Mayfield, Shahzad Rajput
# Please send questions or comments to jamesmayfield "at" gmail "dot" com
#
# For usage, run with no arguments
##################################################################################### 

### DO NOT INCLUDE
# Shahzad: I have not upped any version numbers. We should up them all just prior to
# the release of the new code
### DO INCLUDE
# Version string of this scoring program.
my $version = "2017.2.0";

# Filehandles for program and error output.
# @output_postfix lists the names of the individual output streams;
# %program_output is keyed by those names (the printer packages below write
# to $program_output{AP}, {DEBUG}, {SAMPLE}, {SAMPLESCORES} and {CONFIDENCE}).
# NOTE(review): the handles are opened outside the part of the file shown
# here -- presumably one output file per postfix; confirm in the main program.
my @output_postfix = qw(DEBUG AP SF LDCMAX LDCMEAN SUMMARY SAMPLE SAMPLESCORES CONFIDENCE PARAMS);
my %program_output;
my $error_output;

# The default sequence of output fields
### DO NOT INCLUDE
# Shahzad: I've omitted some of our agreed upon default fields just to get it working.
# Something like the following is what we had discussed:
#my $default_fields = "EC:GT:CORRECT:INCORRECT:INEXACT:RIGHT:WRONG:REDUNDANT:IGNORED:P:R:F";
### DO INCLUDE
# Colon-separated list of output columns; every name is a key of
# ScoresPrinter's %printable_fields, and the order given here is the column order.
my $default_fields = "EC:RUNID:LEVEL:GT:SUBMITTED:CORRECT:INCORRECT:INEXACT:INCORRECT_PARENT:UNASSESSED:REDUNDANT:RIGHT:WRONG:IGNORED:P:R:F";
# Default post-policy categorization. Each name is a key of ScoresPrinter's
# %policy_options whose CHOICES entry permits the corresponding category.
my $default_right = "CORRECT";
my $default_wrong = "INCORRECT:INCORRECT_PARENT:INEXACT";
my $default_ignore = "UNASSESSED:DUPLICATE";

### DO NOT INCLUDE
##################################################################################### 
# Library inclusions
##################################################################################### 
### DO INCLUDE
### DO INCLUDE Utils                  ColdStartLib.pm
### DO INCLUDE Patterns               ColdStartLib.pm
### DO INCLUDE Logger                 ColdStartLib.pm
### DO INCLUDE Provenance             ColdStartLib.pm
### DO INCLUDE Predicates             ColdStartLib.pm
### DO INCLUDE Query                  ColdStartLib.pm
### DO INCLUDE QuerySet               ColdStartLib.pm
### DO INCLUDE EvaluationQueryOutput  ColdStartLib.pm
### DO INCLUDE Scoring                ColdStartLib.pm
### DO INCLUDE Switches               ColdStartLib.pm

### DO NOT INCLUDE
# Hush up perl worrywart module. FIXME: Not sure this is still needed.
# NOTE(review): this reads $main::comment_pattern into a lexical that is not
# used anywhere in the visible part of the file -- presumably only to avoid a
# "used only once" warning for that package variable; confirm before removing.
my $pattern = $main::comment_pattern;
### DO INCLUDE

package SamplesScoresPrinter;

# This package prepares sample summary scores given the samples and scores_printer

# Maps the long names used as keys in the summary statistics (entry-point
# projection, score variant, metric, hop level, aggregate type) to the short
# codes that are joined with "_" to form the column headers of the sample
# scores output, e.g. ALLEP_SLOTFLG_Ma_A_F.
my %code = (
                  ALL_ENTRYPOINT => "ALLEP",
                  ONE_ENTRYPOINT => "ONEEP",
                  LDCMAX => "LDCMAXI",
                  LDCMEAN => "LDCMEAN",
                  SF => "SLOTFLG",
                  F1 => "F",
                  PRECISION => "P",
                  RECALL => "R",
                  0 => "0",
                  1 => "1",
                  ALL => "A",
                  "ALL-Macro" => "Ma",
                  "ALL-Micro" => "Mi"
            );

# Short code => long name; used by get_ORIGINAL_SCORE to decode a header.
# The inversion is lossless only because all values of %code are distinct.
my %inverse_code = reverse %code;

# Constructor.
#   $logger         - logger object (stored, not used here)
#   $samples        - samples object (stored as SAMPLES)
#   $scores_printer - printer whose summary statistics are sampled
# The printer's current summary statistics are captured as ORIGINAL_STATS, and
# a duplicate of each of the printer's scores is kept in SCORES so that the
# printer's own score list can later be overwritten per sample.
sub new {
  my ($class, $logger, $samples, $scores_printer) = @_;
  my %original_stats = $scores_printer->get_summary_stats();
  my $self = bless({}, $class);
  $self->{LOGGER} = $logger;
  $self->{SAMPLES} = $samples;
  $self->{SCORES_PRINTER} = $scores_printer;
  $self->{ORIGINAL_STATS} = {%original_stats};
  foreach my $printer_score (@{$scores_printer->{SCORES}}) {
    push(@{$self->{SCORES}}, scalar $printer_score->duplicate());
  }
  return $self;
}

# Generic accessor. Returns the value stored under $field when it is defined;
# otherwise dispatches to a method named "get_$field" (passing @args) if this
# object has one.
sub get {
  my ($self, $field, @args) = @_;
  my $stored = $self->{$field};
  return $stored if defined $stored;
  my $getter = $self->can("get_$field");
  return $getter->($self, @args) if $getter;
}

# Getter reached through get("QUERIES_TO_SCORE", ...): forwards the request
# for sample $sample_num and projection $projection_type to the samples object.
sub get_QUERIES_TO_SCORE {
  my ($self, $sample_num, $projection_type) = @_;
  my $samples = $self->{SAMPLES};
  return $samples->get("QUERIES_TO_SCORE", $sample_num, $projection_type);
}

# Getter reached through get("ORIGINAL_SCORE", $field_code).
# $field_code is a column header built from %code, i.e. five codes joined
# with "_" (entry-point type, score variant, aggregate type, level, metric).
# Returns the score recorded in ORIGINAL_STATS formatted with "%0.4f", or a
# right-aligned "-" when no score is available. Scores are only looked up for
# the ALL_ENTRYPOINT projection.
sub get_ORIGINAL_SCORE {
  my ($self, $field_code) = @_;

  my ($ep, $type, $aggregate_type, $level, $metric) = map {$inverse_code{$_}} split("_", $field_code);

  my $score;
  # Guard against an unknown entry-point code, which decodes to undef.
  $score = $self->{ORIGINAL_STATS}{$type}{$aggregate_type}{$level}{$metric}
    if defined $ep && $ep eq "ALL_ENTRYPOINT";

  # Only a missing (undefined or empty) score is shown as "-". A plain truth
  # test would also replace a legitimate numeric score of 0.
  my $has_score = defined $score && $score ne "";
  return $has_score ? sprintf("%0.4f", $score) : sprintf("%6s","-");
}

# Replaces the contents of the scores printer's SCORES array with the scores
# that make up one sample. The samples object supplies, for sample
# $sample_num and projection $projection_type, a hash from query id to the
# number of copies wanted; every stored score whose QUERY_ID_BASE is in that
# hash is duplicated that many times.
sub manage_duplicates {
  my ($self, $sample_num, $projection_type) = @_;

  my %copies_wanted = $self->{SAMPLES}->get("QUERIES_TO_SCORE", $sample_num, $projection_type);

  my @expanded;
  foreach my $score (@{$self->{SCORES}}) {
    my $query_id = $score->{QUERY_ID_BASE};
    next unless exists $copies_wanted{$query_id};
    foreach my $copy_num (1..$copies_wanted{$query_id}) {
      push(@expanded, scalar $score->duplicate());
    }
  }

  # Assign in place so that the printer keeps the same array reference.
  @{$self->{SCORES_PRINTER}{SCORES}} = @expanded;
}

# Computes the summary statistics of every sample under both entry-point
# projections. For each sample and projection the scores printer is pointed at
# that sample's queries and scores, and its summary statistics are recorded.
# Returns a hash: sample number => projection type => statistics hash.
sub get_samples_summary_evals {
  my ($self) = @_;
  my %samples_summary_evals;
  foreach my $sample_num (sort keys %{$self->{SAMPLES}{SAMPLES}}) {
    foreach my $projection_type (qw(ALL_ENTRYPOINT ONE_ENTRYPOINT)) {
      %{$self->{SCORES_PRINTER}{QUERIES_TO_SCORE}} = $self->get("QUERIES_TO_SCORE", $sample_num, $projection_type);
      $self->manage_duplicates($sample_num, $projection_type);
      my %stats = $self->{SCORES_PRINTER}->get_summary_stats();
      $samples_summary_evals{$sample_num}{$projection_type} = {%stats};
    }
  }

  %samples_summary_evals;
}

# Writes the three sample-related outputs:
#   SAMPLE       - one line per sample listing its LDC:SF query id pairs
#   SAMPLESCORES - a header line, then one line of scores per sample
#   CONFIDENCE   - per score column: the lower bounds of the 99/95/90%
#                  intervals, the mean over samples, the original score and
#                  the upper bounds of the 90/95/99% intervals
sub print_lines {
  my ($self) = @_;

  my $runid = $self->{SCORES_PRINTER}{RUNID};

  my %samples_summary_evals = $self->get_samples_summary_evals();

  # Composition of each sample
  foreach my $sample_num (sort {$a<=>$b} keys %{$self->{SAMPLES}{SAMPLES}}) {
    my $members = $self->{SAMPLES}{SAMPLES}{$sample_num};
    print {$program_output{SAMPLE}} "$sample_num";
    foreach my $query_num (sort {$a<=>$b} keys %{$members}) {
      my $ldc_queryid = $members->{$query_num}{LDC_QUERY_ID};
      my $sf_queryid = $members->{$query_num}{SF_QUERY_ID_FULL}{0};
      print {$program_output{SAMPLE}} " $ldc_queryid:$sf_queryid";
    }
    print {$program_output{SAMPLE}} "\n";
  }

  # Columns whose header matches this pattern are not reported
  my $skip = qr/^...EP_LDCMEAN_Mi|^ONEEP_LDCMAXI|^ONEEP_LDCMEAN_Ma/;

  # Work out the reported columns once, in output order. Each entry holds the
  # header followed by the path into the per-sample statistics.
  my @columns;
  foreach my $ep_type (qw(ONE_ENTRYPOINT ALL_ENTRYPOINT)) {
    foreach my $ev_type (qw(LDCMAX LDCMEAN SF)) {
      foreach my $ag_type (qw(ALL-Micro ALL-Macro)) {
        foreach my $level (qw(0 1 ALL)) {
          foreach my $metric (qw(PRECISION RECALL F1)) {
            my @path = ($ep_type, $ev_type, $ag_type, $level, $metric);
            my $header = join "_", map {$code{$_}} @path;
            push(@columns, [$header, @path]) unless $header =~ $skip;
          }
        }
      }
    }
  }

  # Print header
  print {$program_output{SAMPLESCORES}} "Sample#";
  foreach my $column (@columns) {
    my $header = $column->[0];
    print {$program_output{SAMPLESCORES}} " $header";
  }
  print {$program_output{SAMPLESCORES}} " #RUNID\n";

  # Print lines, remembering every score by column and sample
  my %scores_by_header;
  foreach my $sample_num (sort {$a<=>$b} keys %samples_summary_evals) {
    print {$program_output{SAMPLESCORES}} sprintf("%6d", $sample_num);
    foreach my $column (@columns) {
      my ($header, $ep_type, $ev_type, $ag_type, $level, $metric) = @{$column};
      my $score = $samples_summary_evals{$sample_num}{$ep_type}{$ev_type}{$ag_type}{$level}{$metric};
      $scores_by_header{$header}{$sample_num} = $score;
      print {$program_output{SAMPLESCORES}} sprintf("               %0.4f", $score);
    }
    print {$program_output{SAMPLESCORES}} " #$runid\n";
  }

  # Print confidence intervals
  print {$program_output{CONFIDENCE}} " "x22, "99%(   95%(   90%(   mean   scr.   )90%   )95%   )99%\n";

  foreach my $header (sort keys %scores_by_header) {
    my @sample_scores = values %{$scores_by_header{$header}};
    my $mean = $self->{SAMPLES}->mean(@sample_scores);
    my $original_score = $self->get("ORIGINAL_SCORE", $header);
    my ($low99, $high99) = $self->{SAMPLES}->get_confidence_interval(99, @sample_scores);
    my ($low95, $high95) = $self->{SAMPLES}->get_confidence_interval(95, @sample_scores);
    my ($low90, $high90) = $self->{SAMPLES}->get_confidence_interval(90, @sample_scores);
    print {$program_output{CONFIDENCE}} "$header $low99 $low95 $low90 $mean $original_score $high90 $high95 $high99\n";
  }
}

package APScoresPrinter;

# Columns that the AP printer can output, keyed by the name used in a
# colon-separated field specification (see get_fields_to_print). Per entry:
#   NAME        - key under which get_line stores the formatted text and
#                 under which column widths are tracked
#   DESCRIPTION - human-readable explanation of the column
#   HEADER      - column heading (printed by print_line when no line is given)
#   FORMAT      - sprintf format applied to the value
#   JUSTIFY     - 'L' or 'R': the side on which print_line pads the column
#   FN          - code ref that extracts the raw value from a score object
our %printable_fields = (
  EC => {
  	NAME => 'EC',
    DESCRIPTION => "Query or equivalence class name",
    HEADER => 'QID/EC',
    FORMAT => '%s',
    JUSTIFY => 'L',
    FN => sub { $_[0]{EC} },
  },
  RUNID => {
  	NAME => 'RUNID',
    DESCRIPTION => "Run ID",
    HEADER => 'RunID',
    FORMAT => '%s',
    JUSTIFY => 'L',
    FN => sub { $_[0]{RUNID} },
  },
  LEVEL => {
  	NAME => 'LEVEL',
    DESCRIPTION => "Hop level",
    HEADER => 'Hop',
    FORMAT => '%s',
    JUSTIFY => 'L',
    FN => sub { $_[0]{LEVEL} },
  },
  AP => {
  	NAME => 'AP',
    DESCRIPTION => "Average Precision",
    HEADER => 'AP',
    FORMAT => '%6.4f',
    JUSTIFY => 'L',
    FN => sub { $_[0]->get('AP') },
  },
);

# Score variants reported by the AP printer. Per entry:
#   ORDER       - position of the variant in the output (ascending)
#   NAME        - label prefixed to the EC column in the summary section
#   DESCRIPTION - heading printed above the variant's table
#   AGGREGATES  - aggregate rows to add; prepare_lines adds the macro average
#                 when an element matches /MACRO/
our %metrices = (
  SF => {
  	ORDER => 1,
  	NAME => "SF",
  	DESCRIPTION => "SF: Slot-filling score variant considering all entrypoints as a separate query",
  	AGGREGATES => [qw(MACRO)],
  },
  LDCMEAN => {
  	ORDER => 2,
  	NAME => "LDC-MEAN",
  	DESCRIPTION => "LDC-MEAN: LDC level score variant considering averaging scores for all coressponding entrypoints",
  	AGGREGATES => [qw(MACRO)],
  },
);

# Translates a colon-separated field specification into a reference to the
# list of matching %printable_fields entries, in the order given. An unknown
# field name is reported through $logger->NIST_die.
sub get_fields_to_print {
  my ($spec, $logger) = @_;
  my @fields;
  foreach my $name (split(/:/, $spec)) {
    push(@fields, $printable_fields{$name} || $logger->NIST_die("Unknown field: $name"));
  }
  return \@fields;
}

# Constructor.
#   $separator        - column separator; when undefined, columns are padded
#                       to a common width instead
#   $queries          - query set object
#   $runid            - run id
#   $index            - hash ref consulted to map an SF query id to an LDC
#                       query id
#   $queries_to_score - hash ref: query id => deepest hop level to score
#   $spec             - colon-separated list of fields to print
#   $logger           - logger used to report an unknown field
sub new {
  my ($class, $separator, $queries, $runid, $index, $queries_to_score, $spec, $logger) = @_;
  my $fields_to_print = get_fields_to_print($spec, $logger);

  # Column widths start out as the widths of the headers
  my (%widths, @headers);
  foreach my $field (@{$fields_to_print}) {
    $widths{$field->{NAME}} = length($field->{HEADER});
    push(@headers, $field->{HEADER});
  }

  my $self = bless({}, $class);
  $self->{RUNID} = $runid;
  $self->{INDEX} = $index;
  $self->{QUERIES} = $queries;
  $self->{QUERIES_TO_SCORE} = $queries_to_score;
  $self->{FIELDS_TO_PRINT} = $fields_to_print;
  $self->{WIDTHS} = \%widths;
  $self->{HEADERS} = \@headers;
  $self->{LINES} = [];
  $self->{SEPARATOR} = $separator if defined $separator;
  return $self;
}

# Adds $scores to the aggregate for ($runid, $level) held in the hash ref
# $aggregates, creating that aggregate (a ScoreSet labelled 'ALL-Micro') the
# first time the pair is seen.
sub aggregate_score {
  my ($aggregates, $runid, $level, $scores) = @_;
  if (!defined $aggregates->{$runid}{$level}) {
    # First score for this run and level: set up the aggregate
    my $fresh_set = ScoreSet->new();
    my @labels = (['RUNID', $runid], ['EC', 'ALL-Micro'], ['LEVEL', $level]);
    foreach my $label (@labels) {
      $fresh_set->put(@{$label});
    }
    $aggregates->{$runid}{$level} = $fresh_set;
  }
  $aggregates->{$runid}{$level}->add($scores);
}

# Stores the given scores for later printing. A score for a numbered hop
# level is dropped when that level is deeper than the level recorded in
# QUERIES_TO_SCORE for the score's query; scores at level "ALL" are always kept.
sub add_scores {
  my ($self, @scores) = @_;
  foreach my $candidate (@scores) {
    my $too_deep = $candidate->{LEVEL} ne "ALL"
                   && $self->{QUERIES_TO_SCORE}{$candidate->{QUERY_ID_BASE}} < $candidate->{LEVEL};
    push(@{$self->{SCORES}}, $candidate) unless $too_deep;
  }
}

# Sort comparator for score objects (compares $a->{EC} with $b->{EC}).
# An equivalence class name is a colon-separated list: the first component is
# compared as a string, all further components are compared numerically, and
# when one name is a prefix of the other the shorter name sorts first.
# The components are compared in a plain loop rather than through a string
# eval, which had to be compiled on every comparison and silently swallowed
# the syntax error produced when a comparison result was undefined.
sub compare_ec_names {
  my ($qa, @a) = split(/:/, $a->{EC});
  my ($qb, @b) = split(/:/, $b->{EC});
  my $order = $qa cmp $qb;
  return $order if $order;
  foreach my $position (0..&main::min($#a, $#b)) {
    $order = $a[$position] <=> $b[$position];
    return $order if $order;
  }
  return scalar @a <=> scalar @b;
}

# Builds the printable form of one score: a hash from field NAME to formatted
# text, covering every field in FIELDS_TO_PRINT. As a side effect each
# column's recorded width grows to fit the text.
sub get_line {
  my ($self, $score) = @_;
  my %line;
  foreach my $field (@{$self->{FIELDS_TO_PRINT}}) {
    my $name = $field->{NAME};
    my $value = $field->{FN}->($score);
    # FIXME: Is this always the appropriate default value?
    my $text = sprintf($field->{FORMAT}, defined $value ? $value : 0);
    $line{$name} = $text;
    if (length($text) > $self->{WIDTHS}{$name}) {
      $self->{WIDTHS}{$name} = length($text);
    }
  }
  return %line;
}

# Prints one row to $program_output.
#   $line        - hash ref from field NAME to text; when undefined the
#                  column headers are printed instead
#   $fields      - fields to print (defaults to FIELDS_TO_PRINT)
#   $metric_name - when true, prefixed (with "-") to the EC column
# With a SEPARATOR configured the columns are joined by it without padding;
# otherwise columns are joined by one space and padded to the recorded width
# on the side selected by the field's JUSTIFY setting.
sub print_line {
  my ($self, $line, $fields, $metric_name, $program_output) = @_;
  $fields = $self->{FIELDS_TO_PRINT} unless $fields;
  my $is_delimited = defined $self->{SEPARATOR};
  my $delimiter = $is_delimited ? $self->{SEPARATOR} : ' ';
  my $is_first_column = 1;
  foreach my $field (@{$fields}) {
    my $name = $field->{NAME};
    my $cell = defined $line ? $line->{$name} : $field->{HEADER};
    $cell = "$metric_name-$cell" if $name eq "EC" && $metric_name;
    my $text = $is_first_column ? "" : $delimiter;
    $is_first_column = 0;
    if ($is_delimited) {
      $text .= $cell;
    }
    else {
      my $padding = ' ' x ($self->{WIDTHS}{$name} - length($cell));
      $text .= $padding if $field->{JUSTIFY} eq 'R';
      $text .= $cell;
      $text .= $padding if $field->{JUSTIFY} eq 'L';
    }
    print $program_output $text;
  }
  print $program_output "\n";
}

# Appends one 'ALL-Macro' row per hop level to LINES and to SUMMARY{$metric}.
# The given scores are grouped by run and level; the row for a level of this
# printer's run shows the identifying fields of the group and, for AP, the
# group's adjusted mean. Any other field is left blank.
sub add_macro_average {
  my ($self, $metric, @scores) = @_;
  my $aggregates = {};
  foreach my $score (sort compare_ec_names @scores) {
    &aggregate_score($aggregates, $score->{RUNID}, $score->{LEVEL}, $score);
  }
  # Fields copied verbatim from the aggregate
  my %is_identifying = map {$_ => 1} qw(QUERY_ID EC RUNID LEVEL);
  foreach my $level (sort keys %{$aggregates->{$self->{RUNID}}}) {
    my $scoreset = $aggregates->{$self->{RUNID}}{$level};
    # Print the macro-averaged scores
    my %line;
    foreach my $field (@{$self->{FIELDS_TO_PRINT}}) {
      my $name = $field->{NAME};
      my $value = "";
      if ($is_identifying{$name}) {
        $value = $scoreset->get($name);
      }
      elsif ($name eq 'AP') {
        $value = $scoreset->getadjustedmean($name);
      }
      # The aggregate is labelled as a micro average; relabel it for this row
      $value = 'ALL-Macro' if $value eq 'ALL-Micro' && $name eq 'EC';
      my $format = $field->{FORMAT};
      if ($value eq "") {
        # A blank cell cannot be printed with a numeric format
        $format =~ s/[df]/s/;
        $format =~ s/\.\d//;
      }
      my $text = sprintf($format, $value);
      $line{$name} = $text;
      if (length($text) > $self->{WIDTHS}{$name}) {
        $self->{WIDTHS}{$name} = length($text);
      }
    }
    push(@{$self->{LINES}}, \%line);
    push(@{$self->{SUMMARY}{$metric}}, \%line);
  }
}

# Projects the stored per-entrypoint (SF) scores onto LDC queries.
# For every hop level and LDC query, the scores of the SF queries that INDEX
# maps to that LDC query are combined into a single Score whose AP is the mean
# of the member APs and whose NUM_GROUND_TRUTH is the largest member value.
# QUERY_ID_BASE, RUNID and LEVEL are taken from the first member. Members are
# visited in sorted query id order so that this choice, and the order in which
# the AP values are summed, do not depend on hash ordering.
# When QUERIES_TO_SCORE is non-empty only the SF queries listed there are used.
# Returns the list of combined scores, ordered by level and LDC query id.
sub projectLDCMEAN {
  my ($self) = @_;
  my $index = $self->{INDEX};
  my $queries_to_score = $self->{QUERIES_TO_SCORE};
  my $is_restricted = scalar(keys %{$queries_to_score}) > 0;

  # level => full LDC query id => SF query id => score
  my %new_scores;
  foreach my $scores (@{$self->{SCORES}}) {
    my (undef, $cssf_queryid) = &Query::parse_queryid($scores->{EC});
    my $full_csldc_queryid = $self->{QUERIES}->get_full_queryid($index->{$cssf_queryid});
    next if $is_restricted && !exists $queries_to_score->{$cssf_queryid};
    $new_scores{$scores->{LEVEL}}{$full_csldc_queryid}{$cssf_queryid} = $scores;
  }

  my @combined_scores;
  foreach my $level (sort keys %new_scores) {
    foreach my $csldc_queryid (sort keys %{$new_scores{$level}}) {
      my $members = $new_scores{$level}{$csldc_queryid};
      my $combined_scores = Score->new;
      my $num_members = 0;
      foreach my $cssf_queryid (sort keys %{$members}) {
        my $scores = $members->{$cssf_queryid};
        if ($num_members == 0) {
          # The first member seeds the combined score
          $combined_scores->put('QUERY_ID_BASE', $scores->get('QUERY_ID_BASE'));
          $combined_scores->put('EC', $csldc_queryid);
          $combined_scores->put('RUNID', $scores->get('RUNID'));
          $combined_scores->put('LEVEL', $scores->get('LEVEL'));
          $combined_scores->put('NUM_GROUND_TRUTH', $scores->get('NUM_GROUND_TRUTH'));
          $combined_scores->put('AP', $scores->get('AP'));
        }
        else {
          $combined_scores->put('AP', $combined_scores->get('AP') + $scores->get('AP'));
        }
        $combined_scores->put('NUM_GROUND_TRUTH', $scores->get('NUM_GROUND_TRUTH'))
          if($scores->get('NUM_GROUND_TRUTH') > $combined_scores->get('NUM_GROUND_TRUTH'));
        $num_members++;
      }
      # $num_members is at least 1: an LDC query only appears in %new_scores
      # together with one of its SF queries.
      $combined_scores->put('AP', $combined_scores->get('AP')/$num_members);
      push(@combined_scores, $combined_scores);
    }
  }
  @combined_scores;
}

# Prepares the output rows for score variant $metric ("SF" or "LDCMEAN").
# SUMMARY{$metric} is reset; one row per score whose query is listed in
# QUERIES_TO_SCORE is appended to LINES; and the macro-average rows are added
# when %metrices requests a MACRO aggregate for the variant. Along the way each
# score is linked to the score of its parent equivalence class (PARENT_SCORE).
sub prepare_lines {
  my ($self, $metric) = @_;
  @{$self->{SUMMARY}{$metric}} = ();
  my @scores = @{$self->{SCORES}};
  if ($metric eq "LDCMEAN") {
    @scores = $self->projectLDCMEAN();
  }
  # Prepare lookup for associating parent scores
  my %score_for_ec = map {$_->{EC} => $_} @scores;
  # Prepare lines
  foreach my $score (sort compare_ec_names @scores) {
    next unless exists $self->{QUERIES_TO_SCORE}{$score->{QUERY_ID_BASE}};
    my $parent_ec = get_parent_ec($score);
    $score->{PARENT_SCORE} = $score_for_ec{$parent_ec} if $parent_ec;
    my %line = $self->get_line($score);
    push(@{$self->{LINES}}, \%line);
  }
  # Add aggregates
  $self->add_macro_average($metric, @scores)
    if(grep {$_ =~ /MACRO/} @{$metrices{$metric}{AGGREGATES}});
}
  
# Prints the column headers: print_line is called without a line, followed by
# the arguments given (fields, metric name, output handle).
sub print_headers {
  my $self = shift;
  $self->print_line(undef, @_);
}

# Writes the complete AP report to $program_output{AP}: for every score
# variant, in ORDER, its description, the column headers and its rows;
# then the summary section and a closing note. The debug details are written
# (to the DEBUG output) while the SF variant is processed.
sub print_lines {
  my ($self) = @_;
  my $fields_to_print = $self->{FIELDS_TO_PRINT};
  my @ordered_metrics = sort {$metrices{$a}{ORDER}<=>$metrices{$b}{ORDER}} keys %metrices;
  foreach my $metric (@ordered_metrics) {
    # Skip over if the sf-queries file passed as argument
    # This is determined by looking up keys in %{$self->{INDEX}}
    # which stores a mapping between LDC and SF query ids
    my $has_ldc_mapping = scalar keys %{$self->{INDEX}};
    next if $metric eq "LDCMEAN" && !$has_ldc_mapping;
    $self->prepare_lines($metric);
    $self->print_details() if $metric eq "SF";
    print {$program_output{AP}} "$metrices{$metric}{DESCRIPTION}\n\n";
    if (@{$self->{LINES}}) {
      $self->print_headers($fields_to_print, undef, $program_output{AP});
    }
    foreach my $line (@{$self->{LINES}}) {
      $self->print_line($line, $fields_to_print, undef, $program_output{AP});
    }
    print {$program_output{AP}} "\n";
    # The rows of this variant must not show up under the next one
    @{$self->{LINES}} = ();
  }
  $self->print_summary($program_output{AP});
  print {$program_output{"AP"}} "\n*ALL-Macro AP refer to mean of corresponding AP values.\n";
}

# Writes, to $program_output{DEBUG}, the data behind every AP value: for each
# stored score (ordered by EC, then level) the query id, level, AP and number
# of ground truth values, the ground truth equivalence classes, and the
# ranking of the nodes by decreasing confidence (ties are broken by
# increasing line number).
sub print_details {
  my ($self) = @_;
  print {$program_output{DEBUG}} "AP COMPUTATION DEBUG INFO BEGINS:\n";
  my @ordered_scores = sort {$a->{EC} cmp $b->{EC} || $a->{LEVEL} cmp $b->{LEVEL}} @{$self->{SCORES}};
  foreach my $score (@ordered_scores) {
    my $query_id = $score->{EC};
    my $level = $score->{LEVEL};
    my $ap = sprintf("%0.4f", $score->{AP});
    my $num_ground_truth = $score->{NUM_GROUND_TRUTH};
    print {$program_output{DEBUG}}
      "=" x 80, "\n",
      "QUERY_ID:         $query_id\n",
      "LEVEL:            $level\n",
      "AP:               $ap\n",
      "NUM_GROUND_TRUTH: $num_ground_truth\n",
      "GROUND TRUTH:\n",
      join("\n", map {"  $_"} sort @{$score->{DEBUG}{ECS} || []}), "\n",
      "RANKING:\n........\nRANK NODEID CONFIDENCE MAPPED_EC V\n";
    my @node_ids = keys %{$score->{DEBUG}{NODES}};
    my $nodes = $score->{DEBUG}{NODES};
    my @ranked_ids = sort {$nodes->{$b}{CONFIDENCE} <=> $nodes->{$a}{CONFIDENCE} ||
                           $nodes->{$a}{LINENUM} <=> $nodes->{$b}{LINENUM}} @node_ids;
    foreach my $position (0..$#ranked_ids) {
      my $nodeid = $ranked_ids[$position];
      my $rank = $position + 1;
      my $confidence = sprintf("%0.4f", $nodes->{$nodeid}{CONFIDENCE});
      my $ec = $nodes->{$nodeid}{EC};
      $ec = "-" unless $ec;
      my $v = sprintf("%0.4f", $nodes->{$nodeid}{V});
      print {$program_output{DEBUG}} "$rank $nodeid $confidence $ec $v\n";
    }
  }
  print {$program_output{DEBUG}} "AP COMPUTATION DEBUG INFO ENDS\n";
}

# Prints the summary section to $output_handle: a title, the column headers
# and, for every score variant in ORDER, the rows collected in
# SUMMARY{variant}. The EC column of each row is prefixed with the variant's
# NAME.
sub print_summary {
  my ($self, $output_handle) = @_;
  my $fields_to_print = $self->{FIELDS_TO_PRINT};
  print {$output_handle} "SUMMARY: This section provides summary of AP scores\n\n";
  $self->print_headers($fields_to_print, undef, $output_handle);
  my @ordered_metrics = sort {$metrices{$a}{ORDER}<=>$metrices{$b}{ORDER}} keys %metrices;
  foreach my $metric (@ordered_metrics) {
    foreach my $line (@{$self->{SUMMARY}{$metric}}) {
      $self->print_line($line, $fields_to_print, $metrices{$metric}{NAME}, $output_handle);
    }
  }
}

# Returns the name of the parent equivalence class of $score, i.e. the score's
# EC with its last colon-separated component removed. Returns nothing (undef
# in scalar context) when the EC contains no colon.
sub get_parent_ec {
  my ($score) = @_;
  return unless $score->{EC} =~ /:/;
  my @components = split(":", $score->{EC});
  return join(":", @components[0 .. $#components - 1]);
}

# Returns the summary statistics as a hash:
#   variant (key of %metrices) => EC of the summary row => level => {AP => text}
# The summary rows are (re)computed for every score variant first.
# prepare_lines also appends rows to LINES, which only print_lines consumes.
# The previous contents of LINES are therefore restored afterwards, so the
# rows prepared here are not printed later under the first variant's table.
sub get_summary_stats {
  my ($self) = @_;
  my @pending_lines = @{$self->{LINES} || []};
  foreach my $metric(sort {$metrices{$a}{ORDER}<=>$metrices{$b}{ORDER}} keys %metrices) {
    @{$self->{SUMMARY}{$metric}} = ();
    $self->prepare_lines($metric);
  }
  # Refill in place so that LINES keeps referring to the same array
  @{$self->{LINES}} = @pending_lines;

  my %summary = %{$self->{SUMMARY}};
  my @fields = qw(AP);
  my %stats;
  foreach my $metric(keys %summary) {
    foreach my $line( @{$summary{$metric}} ){
      my $ec = $line->{EC};
      my $level = $line->{LEVEL};
      $stats{$metric}{$ec}{$level} = {map {$_=>$line->{$_}} @fields};
    }
  }

  %stats;
}

# Determine which queries should be scored.
#   $logger  - logger used for warnings and fatal errors
#   $spec    - undefined (score all top-level queries), the name of an
#              existing file, or a colon-separated list of query IDs
#   $queries - query set object
# A file holds one query per line: the LDC query ID, the SF query ID and,
# optionally, the deepest hop level to score for that query. Blank lines are
# ignored. All lines for one LDC query ID must agree on the hop level.
# Returns a hash from query ID to the deepest hop level to score. A query that
# has expanded queries is replaced by those expanded queries.
sub get_queries_to_score {
  my ($logger, $spec, $queries) = @_;
  my %query_slots;
  # Spec can be empty (meaning score all queries), a colon-separated
  # list of IDs, or a filename
  if (!defined $spec) {
    my @query_ids = $queries->get_all_top_level_query_ids();
    %query_slots = map {$_=>scalar @{$queries->get($_)->{SLOTS}}-1} @query_ids;
  }
  elsif (-f $spec) {
    open(my $infile, "<:utf8", $spec) or $logger->NIST_die("Could not open $spec: $!");
    my %index;
    while(my $line = <$infile>) {
      chomp $line;
      # A blank line carries no query
      next unless $line =~ /\S/;
      # split(' ') also tolerates leading whitespace, which split(/\s+/)
      # would turn into an empty first field
      my ($csldc_query_id, $cssf_query_id_full, $num_slots) = split(' ', $line);
      my $declared_slots = defined $num_slots ? $num_slots : -1;
      if (not exists $index{$csldc_query_id}) {
        $index{$csldc_query_id} = $declared_slots;
      }
      else {
        $logger->NIST_die("$csldc_query_id has multiple/conflicting num_slots in $spec")
          if($declared_slots != $index{$csldc_query_id});
      }
      my ($base, $cssf_query_id) = &Query::parse_queryid($cssf_query_id_full);
      unless ($queries->get($cssf_query_id)) {
        $logger->record_problem('UNKNOWN_QUERY_ID_WARNING', $cssf_query_id, 'NO_SOURCE');
        next;
      }
      my $max_num_slot = scalar @{$queries->get($cssf_query_id)->{SLOTS}}-1;
      $num_slots = $max_num_slot unless defined $num_slots;

      $logger->NIST_die("Unexpected num_slots value $num_slots for $csldc_query_id in $spec")
        if $num_slots > $max_num_slot || $num_slots < 0;

      $query_slots{$cssf_query_id} = $num_slots;
    }
    close $infile;
  }
  else {
    my @query_ids = split(/:/, $spec);
    foreach my $full_query_id(@query_ids) {
      my ($base, $query_id) = &Query::parse_queryid($full_query_id);
      unless ($queries->get($query_id)) {
        $logger->record_problem('UNKNOWN_QUERY_ID_WARNING', $query_id, 'NO_SOURCE');
        next;
      }
      my $num_slots = scalar @{$queries->get($query_id)->{SLOTS}}-1;
      $query_slots{$query_id} = $num_slots;
    }
  }
  my %query_ids_to_score;
  # Sorted so that the result does not depend on hash ordering
  foreach my $query_id (sort keys %query_slots) {
    my $root = $queries->get_ancestor($query_id);
    my $num_slots = $query_slots{$query_id};
    my @expanded_query_ids = @{$root->get("EXPANDED_QUERY_IDS")};
    $query_ids_to_score{$root->get("QUERY_ID")} = $num_slots unless @expanded_query_ids;
    # If we've requested an unexpanded query ID, we need to add each of the expanded queries
    foreach my $expanded_query_id (@expanded_query_ids) {
      # An expanded query that was not requested by name has no entry of its
      # own; it is scored to the same depth as the query that brought it in
      # rather than being stored with an undefined depth.
      $query_ids_to_score{$expanded_query_id} = exists $query_slots{$expanded_query_id}
        ? $query_slots{$expanded_query_id}
        : $num_slots;
    }
  }
  %query_ids_to_score;
}

package ScoresPrinter;

# This package converts scoring output to printable form.

### DO NOT INCLUDE
# Shahzad: the FNs in the following need to be kept in sync with the output of
# EvaluationQueryOutput::score_query(). Either the FIXMEs need to be replaced
# with the appropriate field name, or if we can calculate the value from that
# output, FN needs to do the calculation and return the appropriate string.
### DO INCLUDE
# Columns that the scores printer can output, keyed by the name used in a
# colon-separated field specification (see get_fields_to_print). Per entry:
#   NAME        - key under which get_line stores the formatted text and
#                 under which column widths are tracked
#   DESCRIPTION - human-readable explanation of the column
#   HEADER      - column heading (printed by print_line when no line is given)
#   FORMAT      - sprintf format applied to the value
#   JUSTIFY     - 'L' or 'R': the side on which print_line pads the column
#   MEAN_FORMAT - present on the count columns only; not used in the part of
#                 the file shown here (presumably the format for averaged
#                 counts -- TODO confirm)
#   FN          - code ref that extracts the raw value from a score object
# Note that NAME is not always the key that FN reads (e.g. CORRECT is stored
# as NUM_CORRECT_PRE_POLICY but read from NUM_CORRECT).
our %printable_fields = (
  EC => {
  	NAME => 'EC',
    DESCRIPTION => "Query or equivalence class name",
    HEADER => 'QID/EC',
    FORMAT => '%s',
    JUSTIFY => 'L',
    FN => sub { $_[0]{EC} },
  },
  RUNID => {
  	NAME => 'RUNID',
    DESCRIPTION => "Run ID",
    HEADER => 'RunID',
    FORMAT => '%s',
    JUSTIFY => 'L',
    FN => sub { $_[0]{RUNID} },
  },
  LEVEL => {
  	NAME => 'LEVEL',
    DESCRIPTION => "Hop level",
    HEADER => 'Hop',
    FORMAT => '%s',
    JUSTIFY => 'L',
    FN => sub { $_[0]{LEVEL} },
  },
  GT => {
  	NAME => 'NUM_GROUND_TRUTH',
    DESCRIPTION => "Number of ground truth values",
    HEADER => 'GT',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    FN => sub { $_[0]{NUM_GROUND_TRUTH} },
  },
  CORRECT => {
  	NAME => 'NUM_CORRECT_PRE_POLICY',
    DESCRIPTION => "Number of assessed correct responses (pre-policy)",
    HEADER => 'Correct',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    FN => sub { $_[0]{NUM_CORRECT} },
  },
  INCORRECT => {
  	NAME => 'NUM_INCORRECT_PRE_POLICY',
    DESCRIPTION => "Number of assessed incorrect responses (pre-policy)",
    HEADER => 'Incorrect',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    FN => sub { $_[0]{NUM_INCORRECT} },
  },
  INEXACT => {
  	NAME => 'NUM_INEXACT_PRE_POLICY',
    DESCRIPTION => "Number of assessed inexact responses (pre-policy)",
    HEADER => 'Inexact',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    FN => sub { $_[0]{NUM_INEXACT} },
  },
  REDUNDANT => {
  	NAME => 'NUM_REDUNDANT_POST_POLICY',
    DESCRIPTION => "Number of duplicate submitted values in equivalence clase (post-policy)",
    HEADER => 'Dup',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    FN => sub { $_[0]{NUM_REDUNDANT} },
  },
  RIGHT => {
  	NAME => 'NUM_CORRECT_POST_POLICY',
    DESCRIPTION => "Number of submitted values counted as right (post-policy)",
    HEADER => 'Right',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    FN => sub { $_[0]{NUM_RIGHT} },
  },
  WRONG => {
  	NAME => 'NUM_INCORRECT_POST_POLICY',
    DESCRIPTION => "Number of submitted values counted as wrong (post-policy)",
    HEADER => 'Wrong',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    FN => sub { $_[0]{NUM_WRONG} },
  },
  IGNORED => {
  	NAME => 'NUM_IGNORED_POST_POLICY',
    HEADER => 'Ignored',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',
    DESCRIPTION => "Number of responses that were ignored (post-policy)",
    FN => sub { $_[0]{NUM_IGNORED} },
  },
  SUBMITTED => {
  	NAME => 'NUM_SUBMITTED',
    DESCRIPTION => "Total number of submitted entries",
    HEADER => 'Submitted',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',   
    FN => sub { $_[0]{NUM_SUBMITTED} },
  },
  UNASSESSED => {
  	NAME => 'NUM_UNASSESSED',
    DESCRIPTION => "Total number of unassessed submitted entries",
    HEADER => 'Unassessed',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',   
    FN => sub { $_[0]{NUM_UNASSESSED} },
  },
  INCORRECT_PARENT => {
  	NAME => 'INCORRECT_PARENT',
    DESCRIPTION => "Total number of submitted entries with parents incorrect",
    HEADER => 'PIncorrect',
    FORMAT => '%4d',
    JUSTIFY => 'R',
    MEAN_FORMAT => '%4.2f',   
    FN => sub { $_[0]{NUM_INCORRECT_PARENT} },
  },
  P => {
  	NAME => 'PRECISION',
    DESCRIPTION => "Precision",
    HEADER => 'Prec',
    FORMAT => '%6.4f',
    JUSTIFY => 'L',
    FN => sub { $_[0]->get('PRECISION') },
  },
  R => {
  	NAME => 'RECALL',
    DESCRIPTION => "Recall",
    HEADER => 'Recall',
    FORMAT => '%6.4f',
    JUSTIFY => 'L',
    FN => sub { $_[0]->get('RECALL') },
  },
  F => {
  	NAME => 'F1',
    DESCRIPTION => "F1 = 2PR/(P+R)",
    HEADER => 'F1',
    FORMAT => '%6.4f',
    JUSTIFY => 'L',
    FN => sub { $_[0]->get('F1') },
  },
);

# Assessment categories that can be assigned to the post-policy groups
# right, wrong and ignored. Per entry:
#   NAME        - name of the category (same as the key)
#   DESCRIPTION - explanation, including the switches that accept the category
#   VALUE_MAP   - name of a score field; presumably the counter that holds the
#                 number of responses in this category -- TODO confirm, the
#                 code using it is outside the part of the file shown here
#   CHOICES     - the groups (RIGHT, WRONG, IGNORE) this category may go into
# NOTE(review): DUPLICATE maps to NUM_IGNORED, whereas the duplicate count is
# read from NUM_REDUNDANT in %printable_fields -- confirm this is intended.
my %policy_options = (
  CORRECT => {
  	NAME => 'CORRECT',
    DESCRIPTION => "Number of assessed correct responses. Legal choice for -right.",
    VALUE_MAP => 'NUM_CORRECT',
    CHOICES => [qw(RIGHT)],
  },
  DUPLICATE=> {
  	NAME => 'DUPLICATE',
    DESCRIPTION => "Number of duplicate responses. Legal choice for -right, -wrong and -ignore.",
    VALUE_MAP => 'NUM_IGNORED',
    CHOICES => [qw(RIGHT WRONG IGNORE)],
  },
  INCORRECT => {
  	NAME => 'INCORRECT',
    DESCRIPTION => "Number of assessed incorrect responses. Legal choice for -wrong.",
    VALUE_MAP => 'NUM_INCORRECT',
    CHOICES => [qw(WRONG)],
  },
  INCORRECT_PARENT => {
  	NAME => 'INCORRECT_PARENT',
    DESCRIPTION => "Number of responses that had incrorrect (grand-)parent. Legal choice for -wrong and -ignore.",
    VALUE_MAP => 'NUM_INCORRECT_PARENT',
    CHOICES => [qw(WRONG IGNORE)],
  },
  INEXACT => {
  	NAME => 'INEXACT',
    DESCRIPTION => "Number of assessed inexact responses. Legal choice for -right, -wrong and -ignore.",
    VALUE_MAP => 'NUM_INEXACT',
    CHOICES => [qw(RIGHT WRONG IGNORE)],
  },
  UNASSESSED=> {
  	NAME => 'UNASSESSED',
    DESCRIPTION => "Number of unassessed responses. Legal choice for -wrong and -ignore.",
    VALUE_MAP => 'NUM_UNASSESSED',
    CHOICES => [qw(WRONG IGNORE)],
  },
);

# Score variants reported by the scores printer. Per entry:
#   ORDER       - position of the variant relative to the others
#   NAME        - display name of the variant
#   DESCRIPTION - one-line explanation of the variant
#   AGGREGATES  - aggregate rows (MICRO and/or MACRO) defined for the variant
# NOTE(review): the code that consumes this table lies outside the part of the
# file shown here; the field meanings above follow the parallel table in
# APScoresPrinter.
our %metrices = (
  SF => {
  	ORDER => 1,
  	NAME => "SF",
  	DESCRIPTION => "SF: Slot-filling score variant considering all entrypoints as a separate query",
  	AGGREGATES => [qw(MICRO MACRO)],
  },
  LDCMAX => {
  	ORDER => 2,
  	NAME => "LDC-MAX",
  	DESCRIPTION => "LDC-MAX: LDC level score variant considering the run's best entrypoint per LDC query",
  	AGGREGATES => [qw(MICRO MACRO)],
  },
  LDCMEAN => {
  	ORDER => 3,
  	NAME => "LDC-MEAN",
  	DESCRIPTION => "LDC-MEAN: LDC level score variant considering averaging scores for all coressponding entrypoints",
  	AGGREGATES => [qw(MACRO)],
  },
);

# Resolves a colon-separated field specification against %printable_fields.
# Returns a reference to the list of field descriptions in the order in which
# they were named; an unknown name is reported through $logger->NIST_die.
sub get_fields_to_print {
  my ($spec, $logger) = @_;
  my @requested_names = split(/:/, $spec);
  my @fields;
  foreach my $name (@requested_names) {
    push(@fields, $printable_fields{$name} || $logger->NIST_die("Unknown field: $name"));
  }
  return [@fields];
}

# Constructor.
#   $separator        - column separator; when undefined, columns are padded
#                       to a common width instead
#   $queries          - query set object
#   $runid            - run id
#   $index            - index object or hash (stored as INDEX)
#   $queries_to_score - hash ref of the queries to be scored
#   $spec             - colon-separated list of fields to print
#   $logger           - logger used to report an unknown field
# A second, fixed field list (EC:RUNID:LEVEL:P:R:F) is kept for the LDC-MEAN
# variant.
sub new {
  my ($class, $separator, $queries, $runid, $index, $queries_to_score, $spec, $logger) = @_;
  my $fields_to_print = get_fields_to_print($spec, $logger);
  my $ldc_mean_fields_to_print = get_fields_to_print("EC:RUNID:LEVEL:P:R:F", $logger);

  # Column widths start out as the widths of the headers
  my %widths;
  my @headers;
  foreach my $field (@{$fields_to_print}) {
    $widths{$field->{NAME}} = length($field->{HEADER});
    push(@headers, $field->{HEADER});
  }

  my $self = bless({}, $class);
  $self->{RUNID} = $runid;
  $self->{INDEX} = $index;
  $self->{QUERIES} = $queries;
  $self->{QUERIES_TO_SCORE} = $queries_to_score;
  $self->{FIELDS_TO_PRINT} = $fields_to_print;
  $self->{LDC_MEAN_FIELDS_TO_PRINT} = $ldc_mean_fields_to_print;
  $self->{WIDTHS} = \%widths;
  $self->{HEADERS} = \@headers;
  $self->{LINES} = [];
  $self->{SEPARATOR} = $separator if defined $separator;
  return $self;
}

# Folds $scores into the aggregate kept for ($runid, $level) in the hash ref
# $aggregates. The aggregate, a ScoreSet labelled 'ALL-Micro', is created on
# first use.
sub aggregate_score {
  my ($aggregates, $runid, $level, $scores) = @_;
  # Make sure the necessary aggregate structures are present
  if (not defined $aggregates->{$runid}{$level}) {
    my $new_aggregate = ScoreSet->new();
    $new_aggregate->put('RUNID', $runid);
    $new_aggregate->put('EC', 'ALL-Micro');
    $new_aggregate->put('LEVEL', $level);
    $aggregates->{$runid}{$level} = $new_aggregate;
  }
  # Aggregate this set of scores for regular slots
  my $aggregate = $aggregates->{$runid}{$level};
  $aggregate->add($scores);
}

# Appends the given scores to the printer's SCORES list.
sub add_scores {
  my $self = shift;
  push(@{$self->{SCORES}}, @_);
}

# Compare two equivalence class names; comparison is alphabetic for
# the first component, and numerical for all subsequent
# components. This is broken out as a separate function to ensure that
# queries with more than two hops are supported in some fantasized
# future.
# This is a sort comparator: it compares $a->{EC} with $b->{EC}. When one
# name is a prefix of the other, the shorter name sorts first. The components
# are compared in a plain loop rather than through a string eval, which had to
# be compiled on every comparison and silently swallowed the syntax error
# produced when a comparison result was undefined.
sub compare_ec_names {
  my ($qa, @a) = split(/:/, $a->{EC});
  my ($qb, @b) = split(/:/, $b->{EC});
  my $order = $qa cmp $qb;
  return $order if $order;
  foreach my $position (0..&main::min($#a, $#b)) {
    $order = $a[$position] <=> $b[$position];
    return $order if $order;
  }
  return scalar @a <=> scalar @b;
}

# Render one score as a hash mapping field name to formatted text, for every
# field in FIELDS_TO_PRINT. As side effects, the recorded column width of a
# field grows when the rendered text is longer than anything seen so far, and
# the score's categorized submissions (if any) are remembered under its EC.
sub get_line {
  my ($self, $score) = @_;
  my %cells;
  for my $column (@{$self->{FIELDS_TO_PRINT}}) {
    my $name = $column->{NAME};
    my $raw = $column->{FN}->($score);
    # FIXME: Is this always the appropriate default value?
    $raw = 0 if !defined $raw;
    my $rendered = sprintf($column->{FORMAT}, $raw);
    $cells{$name} = $rendered;
    if (length($rendered) > $self->{WIDTHS}{$name}) {
      $self->{WIDTHS}{$name} = length($rendered);
    }
  }
  if ($score->{CATEGORIZED_SUBMISSIONS}) {
    $self->{CATEGORIZED_SUBMISSIONS}{$score->{EC}} = $score->{CATEGORIZED_SUBMISSIONS};
  }
  %cells;
}

# Write one output row to $program_output.
#   $line        - hash of field name => text; when undefined the field
#                  headers are written instead
#   $fields      - fields to write (defaults to FIELDS_TO_PRINT)
#   $metric_name - when true, prefixed (with a dash) to the EC column
# With a SEPARATOR configured the fields are joined by it without padding;
# otherwise they are padded to the recorded widths according to each field's
# JUSTIFY setting and joined by a single space.
sub print_line {
  my ($self, $line, $fields, $metric_name, $program_output) = @_;
  $fields = $self->{FIELDS_TO_PRINT} unless $fields;
  my $delimited = defined $self->{SEPARATOR};
  my $glue = $delimited ? $self->{SEPARATOR} : ' ';
  my @cells;
  for my $field (@{$fields}) {
    my $name = $field->{NAME};
    my $text = defined $line ? $line->{$name} : $field->{HEADER};
    $text = "$metric_name-$text" if $name eq "EC" && $metric_name;
    unless ($delimited) {
      # A non-positive repeat count yields no padding at all
      my $padding = ' ' x ($self->{WIDTHS}{$name} - length($text));
      if ($field->{JUSTIFY} eq 'R') {
        $text = $padding . $text;
      }
      elsif ($field->{JUSTIFY} eq 'L') {
        $text = $text . $padding;
      }
    }
    push(@cells, $text);
  }
  print $program_output join($glue, @cells) . "\n";
}

# Aggregate the given scores per run and level (plus the pseudo-level 'ALL')
# and append one rendered line per level of this printer's run to both LINES
# and the SUMMARY list of $metric.
sub add_micro_average {
  my ($self, $metric, @scores) = @_;
  my %totals;
  for my $score (sort compare_ec_names @scores) {
    for my $level ($score->{LEVEL}, 'ALL') {
      aggregate_score(\%totals, $score->{RUNID}, $level, $score);
    }
  }
  for my $level (sort keys %{$totals{$self->{RUNID}}}) {
    my $row = +{ $self->get_line($totals{$self->{RUNID}}{$level}) };
    push(@{$self->{LINES}}, $row);
    push(@{$self->{SUMMARY}{$metric}}, $row);
  }
}

# Aggregate the given scores per run and level (plus the pseudo-level 'ALL')
# and append one 'ALL-Macro' line per level of this printer's run to both
# LINES and the SUMMARY list of $metric. Identification fields are copied
# from the aggregate, F1/PRECISION/RECALL are taken from its adjusted means,
# and every other field is left blank.
sub add_macro_average {
  my ($self, $metric, @scores) = @_;
  my %copied = map {$_ => 1} qw(QUERY_ID EC RUNID LEVEL);
  my %averaged = map {$_ => 1} qw(F1 PRECISION RECALL);
  my %totals;
  for my $score (sort compare_ec_names @scores) {
    for my $level ($score->{LEVEL}, 'ALL') {
      aggregate_score(\%totals, $score->{RUNID}, $level, $score);
    }
  }
  for my $level (sort keys %{$totals{$self->{RUNID}}}) {
    my $aggregate = $totals{$self->{RUNID}}{$level};
    # Build the macro-averaged line
    my %row;
    for my $field (@{$self->{FIELDS_TO_PRINT}}) {
      my $name = $field->{NAME};
      my $value = $copied{$name}   ? $aggregate->get($name)
                : $averaged{$name} ? $aggregate->getadjustedmean($name)
                :                    "";
      # The aggregate container is labelled for micro averaging; relabel it
      $value = 'ALL-Macro' if $value eq 'ALL-Micro' && $name eq 'EC';
      my $format = $field->{FORMAT};
      if ($value eq "") {
        # Blank cells cannot go through a numeric conversion: turn the
        # format into a string format and drop any precision
        $format =~ s/[df]/s/;
        $format =~ s/\.\d//;
      }
      my $text = sprintf($format, $value);
      $row{$name} = $text;
      if (length($text) > $self->{WIDTHS}{$name}) {
        $self->{WIDTHS}{$name} = length($text);
      }
    }
    push(@{$self->{LINES}}, \%row);
    push(@{$self->{SUMMARY}{$metric}}, \%row);
  }
}

# Project the stored SF-level scores onto LDC-level equivalence classes and
# average them: every score whose SF query ID passes the QUERIES_TO_SCORE
# filter is filed under the LDC equivalence class obtained through INDEX, and
# the F1, PRECISION and RECALL of all SF entries filed under the same LDC
# equivalence class are averaged into one combined Score.
# Returns the list of combined scores.
sub projectLDCMEAN {
	my ($self) = @_;
	my %index = %{$self->{INDEX}};
	my @scores = @{$self->{SCORES}};
	my %evaluation_queries = map {$_=>1} keys %{$self->{QUERIES_TO_SCORE}};
	# LDC equivalence class => SF equivalence class => score
	my %new_scores;
	# LDC equivalence class => number of accepted scores filed under it
	my %duplicate_queries;
	foreach my $scores(@scores){
	  my $cssf_query_ec = $scores->{EC};
	  my ($full_cssf_queryid, $cssf_ec) = split(":", $cssf_query_ec);
	  my ($query_id_base, $cssf_queryid, $level, $expanded) 
  		= &Query::parse_queryid($full_cssf_queryid);  
	  # NOTE(review): $csldc_queryid is not used below in this function
	  my $csldc_queryid = $index{$cssf_queryid};
	  my $full_csldc_queryid = $self->{QUERIES}->get_full_queryid($index{$cssf_queryid});
	  my $csldc_query_ec = "$full_csldc_queryid";
	  $csldc_query_ec .= ":$cssf_ec" if(defined $cssf_ec);

      # Accept the score if no filter is in place or its SF query is selected
      if( (scalar keys %evaluation_queries > 0 && exists $evaluation_queries{$cssf_queryid})
	      || scalar keys %evaluation_queries == 0) {
	          $duplicate_queries{$csldc_query_ec}++;
	          $new_scores{$csldc_query_ec}{$cssf_query_ec} = $scores;
	  }
	}

	# Turn the raw count into (accepted scores / distinct SF equivalence
	# classes) for each LDC equivalence class
	# NOTE(review): presumably this is how often the LDC query was repeated in
	# a bootstrap sample - confirm against the caller
	foreach my $key(keys %duplicate_queries) {
	  $duplicate_queries{$key} /= scalar keys %{$new_scores{$key}};
	}

	my @combined_scores;
	foreach my $csldc_query_ec(sort keys %new_scores) {
	  my $combined_scores = Score->new;
	  # Number of SF entries combined so far
	  my $i = 0;
	  foreach my $cssf_query_ec(keys %{$new_scores{$csldc_query_ec}}) {
	  	my $scores = $new_scores{$csldc_query_ec}{$cssf_query_ec};
   	    if(not exists $combined_scores->{EC}) {
          # First entry: copy identification and seed the running sums
          $combined_scores->put('QUERY_ID_BASE', $scores->get('QUERY_ID_BASE'));
          $combined_scores->put('EC', $csldc_query_ec);
          $combined_scores->put('RUNID', $scores->get('RUNID'));
          $combined_scores->put('LEVEL', $scores->get('LEVEL'));
          $combined_scores->put('NUM_GROUND_TRUTH', $scores->get('NUM_GROUND_TRUTH'));
          $combined_scores->put('F1', $scores->get('F1'));
          $combined_scores->put('PRECISION', $scores->get('PRECISION'));
          $combined_scores->put('RECALL', $scores->get('RECALL'));
  	    }
  	    else{
          # Later entries: add to the running sums
          my $f1 = $combined_scores->get('F1');
          my $precision = $combined_scores->get('PRECISION');
          my $recall = $combined_scores->get('RECALL');
          $combined_scores->put('F1', $f1 + $scores->get('F1'));
          $combined_scores->put('PRECISION', $precision + $scores->get('PRECISION'));
          $combined_scores->put('RECALL', $recall + $scores->get('RECALL'));
  	    }
  	    $i++;
	  }
	  # Replace the sums by their means
	  my $f1 = $combined_scores->get('F1');
	  my $precision = $combined_scores->get('PRECISION');
	  my $recall = $combined_scores->get('RECALL');
	  $combined_scores->put('F1', $f1/$i);
	  $combined_scores->put('PRECISION', $precision/$i);
	  $combined_scores->put('RECALL', $recall/$i);
	  # Emit the same combined score object once per counted repetition
	  for(my $dup_count = 0; $dup_count < $duplicate_queries{$csldc_query_ec}; $dup_count++){
	    push(@combined_scores, $combined_scores);
	  }
	}
	@combined_scores;
}

# Project the stored SF-level scores onto LDC-level queries by keeping, for
# each LDC query, only the scores of the SF query with the highest F1
# (computed over all of that SF query's scores combined). The kept scores are
# copies whose EC has been rewritten to the LDC equivalence class.
# Returns the list of kept scores, in the order of the stored scores.
sub projectLDCMAX {
	my ($self) = @_;
	my %index = %{$self->{INDEX}};
	my @scores = @{$self->{SCORES}};
	my %evaluation_queries = map {$_=>1} keys %{$self->{QUERIES_TO_SCORE}};
	# Get the max as the new score for the main query
	# Pass 1: LDC query ID => SF query ID => list of accepted scores
	my %new_scores;
	foreach my $scores(@scores){
	  my $cssf_query_ec = $scores->{EC};
	  my ($full_cssf_queryid, $cssf_ec) = split(":", $cssf_query_ec);
	  my ($query_id_base, $cssf_queryid, $level, $expanded) 
  		= &Query::parse_queryid($full_cssf_queryid);  
	  my $csldc_queryid = $index{$cssf_queryid};
	  	  
	  # NOTE(review): $csldc_query_ec is built here but not used in this loop
	  my $csldc_query_ec = "$csldc_queryid";
	  $csldc_query_ec .= ":$cssf_ec" if(defined $cssf_ec);
	  
	  # Accept the score if no filter is in place or its SF query is selected
	  push(@{$new_scores{$csldc_queryid}{$cssf_queryid}}, $scores) 
	  	if( (scalar keys %evaluation_queries > 0 && exists $evaluation_queries{$cssf_queryid})
	  		|| scalar keys %evaluation_queries == 0);
	}
	
	# Pass 2: LDC query ID => {QUERYID => best SF query ID, F1 => its F1}
	my %F1;
	foreach my $csldc_queryid(sort keys %new_scores) {
	  foreach my $cssf_queryid(keys %{$new_scores{$csldc_queryid}}) {
	  	# Sum every NUM_* entry over all scores of this SF query
	  	my $combined_scores = Score->new;
	  	foreach my $scores(@{$new_scores{$csldc_queryid}{$cssf_queryid}}){
	  	  if(not exists $combined_scores->{EC}) {
	  	  	my $name = $scores->get('EC');
	  	  	$name =~ s/:.*?$//;
	  	  	$combined_scores->put('EC', $name);
	  	  	$combined_scores->put('RUNID', $scores->get('RUNID'));
	  	  	$combined_scores->put('LEVEL', 'ALL');
	  	  	foreach my $key( grep {$_ =~ /^NUM_/} keys %{$scores} ) { 
	  	  	  $combined_scores->put($key, $scores->get($key));
	  	  	}
	  	  }
	  	  else{
	  	  	foreach my $key( grep {$_ =~ /^NUM_/} keys %{$scores} ) { 
	  	  	  $combined_scores->put($key, $combined_scores->get($key) + $scores->get($key));
	  	  	}
	  	  }
	  	}
	  	# Keep the SF query with the strictly highest F1; on a tie the one
	  	# seen first stays (the SF query IDs are visited in unsorted key order)
	  	# NOTE(review): F1 is never put() here, so get('F1') presumably
	  	# derives it from the NUM_* entries - confirm in Score
	  	if(not exists $F1{$csldc_queryid}) {
	  	  $F1{$csldc_queryid} = {QUERYID=>$cssf_queryid, F1=>$combined_scores->get('F1')};
	  	}
	  	else {
	  	  if($F1{$csldc_queryid}{F1} < $combined_scores->get('F1')) {
	  	  	$F1{$csldc_queryid} = {QUERYID=>$cssf_queryid, F1=>$combined_scores->get('F1')};
	  	  }
	  	}	
	  }
	}
	
	# Pass 3: keep copies of the scores that belong to the winning SF queries
	my @filtered_scores;
	foreach my $original_scores(@scores){
	  # Work on a copy so the stored score keeps its original EC
	  # NOTE(review): meaning of the "CATEGORIZED_SUBMISSIONS" argument to
	  # duplicate() is not visible here - confirm in Score
	  my $scores = $original_scores->duplicate("CATEGORIZED_SUBMISSIONS");
	  my $cssf_query_ec = $scores->{EC};
	  my ($full_cssf_queryid, $cssf_ec) = split(":", $cssf_query_ec);
	  my ($query_id_base, $cssf_queryid, $level, $expanded) 
  		= &Query::parse_queryid($full_cssf_queryid);  
  	  my $csldc_queryid = $index{$cssf_queryid};
	  my $full_csldc_queryid = $self->{QUERIES}->get_full_queryid($index{$cssf_queryid});
	  my $csldc_query_ec = "$full_csldc_queryid";
	  $csldc_query_ec .= ":$cssf_ec" if(defined $cssf_ec);
	  # Same acceptance filter as in pass 1, written as a skip condition
	  next if( not( (scalar keys %evaluation_queries > 0  && exists $evaluation_queries{$cssf_queryid})
	  		|| not scalar keys %evaluation_queries > 0 ) );
	  next if $F1{$csldc_queryid}{QUERYID} ne $cssf_queryid;
	  $scores->{EC} = $csldc_query_ec;
	  push(@filtered_scores, $scores);
	}
	
	@filtered_scores;
}


# Return the stored scores projected according to $metric: "LDCMAX" selects
# projectLDCMAX and "LDCMEAN" selects projectLDCMEAN. Any other metric yields
# an empty list (undef in scalar context) rather than the implicit value of
# the last comparison.
sub get_projected_scores {
  my ($self, $metric) = @_;
  return $self->projectLDCMAX() if($metric eq "LDCMAX");
  return $self->projectLDCMEAN() if($metric eq "LDCMEAN");
  # Unknown metric: there is nothing to project
  return;
}

# Rebuild the output lines for $metric: reset the metric's SUMMARY list,
# select the scores (projected for LDCMAX/LDCMEAN, stored scores otherwise),
# render one line per score whose QUERY_ID_BASE is among QUERIES_TO_SCORE,
# and finally append whichever aggregate lines the metric asks for.
sub prepare_lines {
  my ($self, $metric) = @_;
  @{$self->{SUMMARY}{$metric}} = ();
  my $projected = $metric eq "LDCMAX" || $metric eq "LDCMEAN";
  my @scores = $projected ? $self->get_projected_scores($metric)
                          : @{$self->{SCORES} || []};
  # Lookup used to attach each score to the score of its parent EC
  my %score_by_ec = map {$_->{EC} => $_} @scores;
  # Prepare lines
  for my $score (sort compare_ec_names @scores) {
    next unless exists $self->{QUERIES_TO_SCORE}{$score->{QUERY_ID_BASE}};
    my $parent_ec = get_parent_ec($score);
    $score->{PARENT_SCORE} = $score_by_ec{$parent_ec} if $parent_ec;
    push(@{$self->{LINES}}, +{ $self->get_line($score) });
  }
  # Add aggregates
  if (grep {$_ =~ /MICRO/} @{$metrices{$metric}{AGGREGATES}}) {
    $self->add_micro_average($metric, @scores);
  }
  if (grep {$_ =~ /MACRO/} @{$metrices{$metric}{AGGREGATES}}) {
    $self->add_macro_average($metric, @scores);
  }
}
  
# Print the header row: delegates to print_line with an undefined line,
# forwarding all remaining arguments unchanged.
sub print_headers {
  my $self = shift;
  return $self->print_line(undef, @_);
}

# Print the score tables of every metric (in the order given by ORDER in
# %metrices) to the metric's output handle, followed by the summary table on
# the SUMMARY handle. Each table ends with the ALL-Macro footnote.
sub print_lines {
  my ($self) = @_;
  my $footnote = "\n*ALL-Macro Prec, Recall and F1 refer to mean-precision, mean-recall and mean-F1.\n";
  for my $metric (sort {$metrices{$a}{ORDER}<=>$metrices{$b}{ORDER}} keys %metrices) {
    # The LDC-level metrics need the mapping between LDC and SF query ids
    # held in INDEX; it is empty when the sf-queries file was passed as
    # argument, in which case these metrics are skipped
    if ($metric eq "LDCMAX" || $metric eq "LDCMEAN") {
      next unless keys %{$self->{INDEX}};
    }
    # LDCMEAN uses its own reduced column set; undef selects the default one
    my $fields_to_print = $metric eq "LDCMEAN" ? $self->{LDC_MEAN_FIELDS_TO_PRINT} : undef;
    $self->prepare_lines($metric);
    $self->print_details() if $metric eq "SF";
    if (@{$self->{LINES}}) {
      $self->print_headers($fields_to_print, undef, $program_output{$metric});
    }
    for my $line (@{$self->{LINES}}) {
      $self->print_line($line, $fields_to_print, undef, $program_output{$metric});
    }
    @{$self->{LINES}} = ();
    print {$program_output{$metric}} $footnote;
  }
  $self->print_summary($program_output{SUMMARY});

  print {$program_output{"SUMMARY"}} $footnote;
}

# Write, to the DEBUG output, every submission whose category differs from
# the assessment it originally received. Submissions are grouped by
# equivalence class and listed by submission line number, with all
# categories that a submission ended up in.
sub print_details {
  my ($self) = @_;
  my $debug = $program_output{DEBUG};
  for my $ec (sort keys %{$self->{CATEGORIZED_SUBMISSIONS}}) {
    my $categorized = $self->{CATEGORIZED_SUBMISSIONS}{$ec};
    # Submission line number => details of the changed submission
    my %changed;
    my @labels = grep {$_ ne "SUBMITTED" && $_ ne "ASSESSMENTS"} keys %{$categorized};
    for my $label (@labels) {
      for my $submission (@{$categorized->{$label}}) {
        my $is_assessed = $submission->{ASSESSMENT} && keys %{$submission->{ASSESSMENT}};
        my $prepolicy = $is_assessed ? $submission->{ASSESSMENT}{ASSESSMENT} : "UNASSESSED";
        next if $prepolicy eq $label;
        my $linenum = $submission->{LINENUM};
        if ($changed{$linenum}) {
          # Already recorded: just note the additional category
          push(@{$changed{$linenum}{POSTPOLICY_ASSESSMENT}}, $label);
          next;
        }
        $changed{$linenum} = {
          LINE => $submission->{LINE},
          FQNODEID => $submission->{FQNODEID} ? $submission->{FQNODEID} : "-",
          TARGET_QUERY_ID => $submission->{TARGET_QUERY}->get("FULL_QUERY_ID"),
          ASSESSMENT_LINE => $is_assessed ? $submission->{ASSESSMENT}{LINE} : "-",
          PREPOLICY_ASSESSMENT => $prepolicy,
          POSTPOLICY_ASSESSMENT => [$label],
        };
      }
    }

    print {$debug} "="x80, "\n";
    print {$debug} "$ec\n";

    for my $linenum (sort {$a<=>$b} keys %changed) {
      my $entry = $changed{$linenum};
      print {$debug} "\tFQNODEID:\t", $entry->{FQNODEID}, "\n";
      print {$debug} "\tSUBMISSION:\t", $entry->{LINE}, "\n";
      print {$debug} "\tTARGET_QID:\t", $entry->{TARGET_QUERY_ID}, "\n";
      print {$debug} "\tASSESSMENT:\t", $entry->{ASSESSMENT_LINE}, "\n\n";
      print {$debug} "\tPREPOLICY ASSESSMENT:\t", $entry->{PREPOLICY_ASSESSMENT}, "\n";
      print {$debug} "\tPOSTPOLICY ASSESSMENT:\t", join(",", sort @{$entry->{POSTPOLICY_ASSESSMENT}}), "\n";
      print {$debug} "."x80, "\n";
    }
  }
  print {$debug} "\n";
}

# Print the summary table to $output_handle: a header row followed by the
# SUMMARY lines of every metric (in the order given by ORDER in %metrices),
# using the LDC_MEAN_FIELDS_TO_PRINT columns and prefixing each EC with the
# metric's NAME.
sub print_summary {
  my ($self, $output_handle) = @_;
  my $columns = $self->{LDC_MEAN_FIELDS_TO_PRINT};
  $self->print_headers($columns, undef, $output_handle);
  my @ordered_metrics = sort {$metrices{$a}{ORDER}<=>$metrices{$b}{ORDER}} keys %metrices;
  for my $metric (@ordered_metrics) {
    my $label = $metrices{$metric}{NAME};
    for my $row (@{$self->{SUMMARY}{$metric}}) {
      $self->print_line($row, $columns, $label, $output_handle);
    }
  }
}

# Return the equivalence class name of the parent of $score, i.e. its EC with
# the last colon-separated component removed. Returns nothing (undef in
# scalar context) when the EC contains no colon.
sub get_parent_ec {
  my ($score) = @_;
  return unless $score->{EC} =~ /:/;
  my @components = split(":", $score->{EC});
  pop @components;
  return join(":", @components);
}

# Recompute the summary lines of every metric and return them as a hash of
# the form metric => EC => LEVEL => {PRECISION, RECALL, F1}, holding the
# rendered text of those three fields.
sub get_summary_stats {
  my ($self) = @_;
  my @ordered_metrics = sort {$metrices{$a}{ORDER}<=>$metrices{$b}{ORDER}} keys %metrices;
  for my $metric (@ordered_metrics) {
    @{$self->{SUMMARY}{$metric}} = ();
    $self->prepare_lines($metric);
  }

  my @wanted = qw(PRECISION RECALL F1);
  my %lines_by_metric = %{$self->{SUMMARY}};
  my %stats;
  for my $metric (keys %lines_by_metric) {
    for my $line (@{$lines_by_metric{$metric}}) {
      my %picked;
      @picked{@wanted} = @{$line}{@wanted};
      $stats{$metric}{$line->{EC}}{$line->{LEVEL}} = \%picked;
    }
  }

  %stats;
}

# Determine which queries should be scored.
#
# Arguments:
#   $logger  - used to report unknown query IDs and fatal problems
#   $spec    - undef (score all top-level queries), the name of an existing
#              file, or a colon-separated list of query IDs
#   $queries - the query set
#
# The file form has one entry per line: an LDC query ID, an SF query ID and
# an optional number (the hop up to which evaluation is to be performed),
# separated by whitespace. Blank lines are ignored.
#
# Returns a hash mapping each query ID to be scored to its slot limit.
sub get_queries_to_score {
  my ($logger, $spec, $queries) = @_;
  my %query_slots;
  # Spec can be empty (meaning score all queries), a colon-separated
  # list of IDs, or a filename
  if (!defined $spec) {
    my @query_ids = $queries->get_all_top_level_query_ids();
    %query_slots = map {$_=>scalar @{$queries->get($_)->{SLOTS}}-1} @query_ids;
  }
  elsif (-f $spec) {
    open(my $infile, "<:utf8", $spec) or $logger->NIST_die("Could not open $spec: $!");
    # LDC query ID => slot limit given for it (-1 when none was given); used
    # to detect conflicting limits for the same LDC query
    my %index;
    while (my $line = <$infile>) {
      chomp $line;
      # Blank lines carry no entry; without this they would be parsed as an
      # entry with undefined IDs
      next unless $line =~ /\S/;
      # Splitting on ' ' ignores leading whitespace, so an indented line does
      # not shift the columns by one
      my ($csldc_query_id, $cssf_query_id_full, $num_slots) = split(' ', $line);
      if (not exists $index{$csldc_query_id}) {
        $index{$csldc_query_id} = defined $num_slots ? $num_slots : -1;
      }
      else {
        my $target_value = defined $num_slots ? $num_slots : -1;
        $logger->NIST_die("$csldc_query_id has multiple/conflicting num_slots in $spec")
          if($target_value != $index{$csldc_query_id});
      }
      my ($base, $cssf_query_id) = &Query::parse_queryid($cssf_query_id_full);
      unless ($queries->get($cssf_query_id)) {
        $logger->record_problem('UNKNOWN_QUERY_ID_WARNING', $cssf_query_id, 'NO_SOURCE');
        next;
      }
      # Without an explicit limit, every slot of the query is evaluated
      my $max_num_slot = scalar @{$queries->get($cssf_query_id)->{SLOTS}}-1;
      $num_slots = $max_num_slot unless defined $num_slots;

      $logger->NIST_die("Unexpected num_slots value $num_slots for $csldc_query_id in $spec")
        if $num_slots > $max_num_slot || $num_slots < 0;

      $query_slots{$cssf_query_id} = $num_slots;
    }
    close $infile;
  }
  else {
    my @query_ids = split(/:/, $spec);
    foreach my $full_query_id(@query_ids) {
      my ($base, $query_id) = &Query::parse_queryid($full_query_id);
      unless ($queries->get($query_id)) {
        $logger->record_problem('UNKNOWN_QUERY_ID_WARNING', $query_id, 'NO_SOURCE');
        next;
      }
      my $num_slots = scalar @{$queries->get($query_id)->{SLOTS}}-1;
      $query_slots{$query_id} = $num_slots;
    }
  }
  my %query_ids_to_score;
  foreach my $query_id (keys %query_slots) {
    my $root = $queries->get_ancestor($query_id);
    my $num_slots = $query_slots{$query_id};
    $query_ids_to_score{$root->get("QUERY_ID")} = $num_slots unless @{$root->get("EXPANDED_QUERY_IDS")};
    # If we've requested an unexpanded query ID, we need to add each of the expanded queries
    # NOTE(review): the limit is looked up under the expanded ID, so it is
    # undefined when only the unexpanded ID was requested - confirm whether
    # the requested query's own limit should be used in that case
    foreach my $expanded_query_id (@{$root->get("EXPANDED_QUERY_IDS")}) {
      $num_slots = $query_slots{$expanded_query_id};
      $query_ids_to_score{$expanded_query_id} = $num_slots;
    }
  }
  %query_ids_to_score;
}

# Handle run-time switches
# The trailing documentation strings list the legal values of -discipline,
# -fields and the policy switches, as built from the corresponding tables
my $switches = SwitchProcessor->new($0,
   "Score one or more TAC Cold Start runs",
   "-discipline is one of the following:\n" . EvaluationQueryOutput::get_all_disciplines() .
   "-fields is a colon-separated list drawn from the following:\n" . &main::build_documentation(\%printable_fields) .
   "policy options are a colon-separated list drawn from the following:\n" . &main::build_documentation(\%policy_options) .
   "");
$switches->addHelpSwitch("help", "Show help");
$switches->addHelpSwitch("h", undef);

# Output destinations; each put() following an addVarSwitch sets its default
$switches->addVarSwitch('output_file', "Where should program output be sent? (prefix of filename, stdout or stderr)");
$switches->put('output_file', 'stdout');
$switches->addVarSwitch("error_file", "Where should error output be sent? (filename, stdout or stderr)");
$switches->put("error_file", "stderr");
$switches->addConstantSwitch("tabs", "true", "Use tabs to separate output fields instead of spaces (useful for export to spreadsheet)");
$switches->addVarSwitch("discipline", "Discipline for identifying ground truth (see below for options)");
$switches->put("discipline", 'ASSESSED');
$switches->addVarSwitch("samples", "Specify the Bootstrap resamples file.");
$switches->addVarSwitch("expand", "Expand multi-entrypoint queries, using string provided as base for expanded query names");

# Selection of what is scored and how assessments are counted
$switches->addVarSwitch("queries", "file (one LDC query ID, SF query ID pair, separated by space, per line with an optional number separated " .
					 	"by space representing the hop upto which evaluation is to be performed) " .
					 	"or colon-separated list of SF query IDs to be scored " .
			           "(if omitted, all query files in 'files' parameter will be scored)");
$switches->addVarSwitch("runids", "Colon-separated list of run IDs to be scored (if omitted, all runids will be scored)");
$switches->addVarSwitch("right", "Colon-separated list of assessment codes, submitted value corresponding to which to be counted as right (post-policy) (see policy options below for legal choices)");
$switches->put("right", $default_right);
$switches->addVarSwitch("wrong", "Colon-separated list of assessment codes, submitted value corresponding to which to be counted as wrong (post-policy) (see policy options below for legal choices)");
$switches->put("wrong", $default_wrong);
$switches->addVarSwitch("ignore", "Colon-separated list of assessment codes, submitted value corresponding to which to be ignored (post-policy) (see policy options below for legal choices)");
$switches->put("ignore", $default_ignore);
$switches->addVarSwitch("fields", "Colon-separated list of output fields to print (see below for options)");
$switches->put("fields", $default_fields);
$switches->addVarSwitch('justifications', "Are multiple justifications allowed? " .
			"Legal values are of the form A:B where A represents justifications per document and B represents total justifications. " .
			"Use \'M\' to allow any number of justifications, for e.g., \'M:10\' to allow multiple justifications per document ".
			"but overall not more than 10 (best or top) justifications.");
$switches->put('justifications', "1:3");
$switches->addImmediateSwitch('version', sub { print "$0 version $version\n"; exit 0; }, "Print version number and exit");
### DO NOT INCLUDE
# Shahzad: Which of these switches do we want to keep?
#$switches->addConstantSwitch('showmissing', 'true', "Show missing assessments");
# $switches->addConstantSwitch('components', 'true', "Show component scores for each query");
### DO INCLUDE
$switches->addParam("files", "required", "all others", "Query file, submission file and judgment file");

# Keep the raw command line; it is written to the PARAMS output further down
my $argsin = join(" ", @ARGV);

$switches->process(@ARGV);

my $logger = Logger->new();
$logger->ignore_warning('MULTIPLE_RUNIDS');

# Allow redirection of stdout and stderr
my $output_filename_prefix = $switches->get("output_file");

# Set up one output handle per kind of output. With 'stdout' or 'stderr' as
# the prefix all kinds share that stream; otherwise each kind goes to its own
# file named <prefix>.<lowercased kind>
foreach my $output_postfix(@output_postfix) {
  if (lc $output_filename_prefix eq 'stdout') {
    $program_output{$output_postfix} = *STDOUT{IO};
  }
  elsif (lc $output_filename_prefix eq 'stderr') {
    $program_output{$output_postfix} = *STDERR{IO};
  }
  else {
    # Suppress producing empty files
    next if ($output_postfix =~ /^LDC/ && not defined $switches->get('expand'));
    next if ($output_postfix =~ /^SAMPLE/ && not defined $switches->get('samples'));
    next if ($output_postfix =~ "CONFIDENCE" && not defined $switches->get('samples'));

    # Build the name once so that the error message reports the file that
    # actually failed to open
    my $output_filename = $output_filename_prefix . "." . lc($output_postfix);
    open($program_output{$output_postfix}, ">:utf8", $output_filename)
      or $logger->NIST_die("Could not open $output_filename: $!");
  }
}

# Route error output as requested and keep the resulting handle
my $error_filename = $switches->get("error_file");
$logger->set_error_output($error_filename);
$error_output = $logger->get_error_output();

# Scoring configuration taken from the command line
my $discipline = $switches->get('discipline');
my $use_tabs = $switches->get("tabs");
my $query_base = $switches->get('expand');
my %policy_selected = (
  RIGHT => $switches->get('right'),
  WRONG => $switches->get('wrong'),
  IGNORE => $switches->get('ignore'),
);

# Validate selected policy options: every assessment code listed for an
# option must name that option among its CHOICES in %policy_options
for my $option (sort keys %policy_selected) {
  for my $choice (split(":", $policy_selected{$option})) {
    my $permitted = grep {$_ eq $option} @{$policy_options{$choice}{CHOICES}};
    $logger->NIST_die("Unexpected choice $choice for $option") unless $permitted;
  }
}

my $samples_file = $switches->get("samples");

# How should multiple justifications be handled?
# The value has the form A:B, where each of A and B is either a number or
# the character 'M'. Numbers may have several digits, so that the documented
# example 'M:10' is accepted.
my $justifications_allowed = $switches->get("justifications");
$logger->NIST_die("Argument to -justifications switch must be of the form A:B where A and B are " .
                  "either positive numbers or character \'M\' representing infinity.")
  unless $justifications_allowed =~ /^(?:\d+|M):(?:\d+|M)$/;

# Split the positional file arguments: names ending in .xml are handed to
# QuerySet as query files, all others to EvaluationQueryOutput
my @filenames = @{$switches->get("files")};
my @queryfilenames = grep {/\.xml$/} @filenames;
my @runfilenames = grep {!/\.xml$/} @filenames;
my $queries = QuerySet->new($logger, @queryfilenames);
# Queries are only expanded when -expand supplied a (true) base name
$queries->expand($query_base) if $query_base;

# Index obtained from the query set; handed to the score printers as INDEX
my %index = $queries->get_index();

# Queries selected through -queries (all top-level queries when omitted)
my %queries_to_score = &get_queries_to_score($logger, $switches->get("queries"), $queries);

# Load the remaining files under the selected discipline and justification limits
my $submissions_and_assessments = EvaluationQueryOutput->new($logger, $discipline, $queries,
                    {JUSTIFICATIONS_ALLOWED=>$justifications_allowed},
                    @runfilenames);

package main;

use Cwd;

# Compute the AP scores of one run: returns an APScoresPrinter (printing the
# fields EC:RUNID:LEVEL:AP) loaded with the scores of every query in
# $queries_to_score. Reads the file-level %index, $discipline and $query_base.
sub score_ap {
  my ($runid, $submissions_and_assessments, $queries, $queries_to_score, $use_tabs, $spec, $policy_options, $policy_selected, $logger) = @_;
  my $separator = $use_tabs ? "\t" : undef;
  my $ap_printer = APScoresPrinter->new($separator, $queries, $runid, \%index, $queries_to_score, 'EC:RUNID:LEVEL:AP', $logger);
  # Named options passed along with every scoring call
  my @scoring_options = (DISCIPLINE => $discipline,
                         RUNID => $runid,
                         QUERY_BASE => $query_base);
  # Score each query and collect the query-by-query scores
  for my $query_id (sort keys %{$queries_to_score}) {
    my $query = $queries->get($query_id);
    # Get the scores just for this query in this run
    my @scores = $submissions_and_assessments->score_query_aps($query, $policy_options, $policy_selected, @scoring_options);
    $ap_printer->add_scores(@scores);
  }
  return $ap_printer;
}

# Compute the scores of one run: returns a ScoresPrinter (printing the fields
# given by $spec) loaded with the scores of every query in $queries_to_score.
# A score is kept only when its LEVEL does not exceed the limit recorded in
# $queries_to_score for the query named in the score's EC. Reads the
# file-level %index, $discipline and $query_base.
sub score_runid {
  my ($runid, $submissions_and_assessments, $queries, $queries_to_score, $use_tabs, $spec, $policy_options, $policy_selected, $logger) = @_;
  my $separator = $use_tabs ? "\t" : undef;
  my $scores_printer = ScoresPrinter->new($separator, $queries, $runid, \%index, $queries_to_score, $spec, $logger);
  # Named options passed along with every scoring call
  my @scoring_options = (DISCIPLINE => $discipline,
                         RUNID => $runid,
                         QUERY_BASE => $query_base);
  # Score each query and collect the query-by-query scores
  for my $query_id (sort keys %{$queries_to_score}) {
    my $query = $queries->get($query_id);
    # Get the scores just for this query in this run
    my @scores = $submissions_and_assessments->score_query($query, $policy_options, $policy_selected, @scoring_options);
    for my $score (@scores) {
      # The full query ID is the part of the EC before its first colon, or
      # the whole EC when it contains none
      my ($before_colon) = $score->{EC} =~ /^(.*?):/;
      my $full_query_id = defined $before_colon ? $before_colon : $score->{EC};
      my ($base, $scored_query_id) = &Query::parse_queryid($full_query_id);
      next unless $score->{LEVEL} <= $queries_to_score->{$scored_query_id};
      $scores_printer->add_scores($score);
    }
  }
  return $scores_printer;
}

# Runs to score (all runs of the loaded submissions unless -runids is given)
# and the output fields requested
my $runids = $switches->get("runids");
my @runids = $runids ? split(/:/, $runids) : $submissions_and_assessments->get_all_runids();
my $spec = $switches->get("fields");

# Record how the scorer was invoked on the PARAMS output
my $current_directory = Cwd::cwd();
my $now_string = localtime;
my $params_report = "#At: $now_string\n\n"
                  . "#Invoked as:\n$current_directory\$ perl $0 " . $argsin . "\n\n"
                  . "#Policy Selected:\n";
for my $option (sort keys %policy_selected) {
  $params_report .= "  $option => $policy_selected{$option}\n";
}
$params_report .= "\nSAMPLE => BOOTSTRAP RESAMPLE" if defined $samples_file;
print {$program_output{PARAMS}} $params_report;

# Score the runs: for each run print the regular score tables, then the AP
# tables, and - when a resamples file was given - the bootstrap sample scores
for my $runid (@runids) {
  my @scoring_arguments = ($runid, $submissions_and_assessments, $queries, \%queries_to_score,
                           $use_tabs, $spec, \%policy_options, \%policy_selected, $logger);
  my $scores_printer = score_runid(@scoring_arguments);
  $scores_printer->print_lines();
  my $ap_printer = score_ap(@scoring_arguments);
  $ap_printer->print_lines();
  next unless $samples_file;
  my $samples = Bootstrap->new($logger, $samples_file);
  my $samples_scores_printer = SamplesScoresPrinter->new($logger, $samples, $scores_printer);
  $samples_scores_printer->print_lines();
}

# Close program output
# The skip conditions mirror the ones used when the outputs were opened, so
# that only handles that were actually set up are closed
foreach my $output_postfix(@output_postfix) {
  next if ($output_postfix =~ /^LDC/ && not defined $switches->get('expand'));
  next if ($output_postfix =~ /^SAMPLE/ && not defined $switches->get('samples'));
  next if ($output_postfix =~ "CONFIDENCE" && not defined $switches->get('samples'));
  close $program_output{$output_postfix};
}

# NOTE(review): report_all_problems is called here and again just below to
# obtain the counts; if each call prints the problems they are reported
# twice - confirm in Logger
$logger->report_all_problems();

# The NIST submission system wants an exit code of 255 if errors are encountered
my ($num_errors, $num_warnings) = $logger->report_all_problems();
if ($num_errors) {
  $logger->NIST_die("$num_errors error" . ($num_errors == 1 ? '' : 's') . " encountered");
}
else {
  # No errors: just state how many warnings there were
  print $error_output ($num_warnings || 'No'), " warning", ($num_warnings == 1 ? '' : 's'), " encountered\n";
}

# Close error output
$logger->close_error_output();

################################################################################
# Revision History
################################################################################

# 2017.2.0 - Code state at the release of scores
# 2017.1.6 - EvaluationQueryOutput->new() takes a hash named options as one of the args
# 2017.1.5 - Node mapping function changed to traverse the nodetree in breadth 
#            first order rather than depth first.
# 2017.1.4 - Node confidence computation function changed to have the denominator
#            same irrespective of how many justifications were provided.
#            Also support added to have the confidence vary depending on allowed
#            justifications passed through parameter -justifications
# 2017.1.3 - Minor changes and formatting correction. Numbers have been verified using
#            an initial set of test cases
# 2017.1.2 - New implementation of AP computation added
#          - Results are being printed to a single AP file, to be split later, upon
#            verification of correctness
# 2017.1.1 - AP computation from the last version removed; to be corrected in the next
#            version
# 2017.1.0 - Initial version of 2017; AP is being produced in addition to last year
#            stats
# 3.0 - Modified file extensions and suppressed empty file creation
#     - Some clarification in the usage messages
# 2.9 - Added the .arguments output file listing the arguments and policy selected
#       when the scorer was invoked.
#     - Changed 'Run ID' to 'RunID' in the header of output file(s)
# 2.8 - Added actual score `scr.` to .confidence output file
# 2.7 - Removed bug in LDCMEAN computation when duplicate LDC queries appear in
#       the sample.
# 2.6 - First version of the scorer for 2016
#     - Output is split across files
#     - Bootstrap sampling applied over the scores
# 2.5 - Adding mean-precision and mean-recall for ALL-Macro scores.
#     - Added precision and recall columns to LDC-MEAN scores and SUMMARY scores.
# 2.4.4 - -queries file format changed. Additional mandatory first column added 
#		  containing CSLDC queryid corresponding to the CSSF queryid mentioned on 
#		  that line, required for sanity checking. 
# 2.4.3 - -queries file format changed. Allows one to add an additional column 
#         per query id specifying the hop number up to which evaluation is performed
# 2.4.2 - LDC-MEAN Macro-averaging over only NON-NIL queries
# 2.4.1 - Reporting LDC level scores
# 2.4 - Added support for specifying policy (-right, -wrong, and -ignore)
#     - Removed -combo because this is not needed and all variant should be 
#       reported as part of the output, presently only CSSF-Micro being reported
#     - queryid and full_queryid have been separated
#     - Verbose output can be seen using -verbose
#     - cleanup 
# 2.3.1 - Fixed a bug that gave a warning when hop-1 answers were not assessed 
#         because the parent was incorrect. The scores remain unchanged.
# 2.3 - small modifications to implement SPEEDUP
# 2.2 - Added -queries switch
# 2.1j - Added -combo
# 2.0 - Rewrite to operate off of ground truth tree
# 1.1 - Merged with Shahzad's pseudoslot scoring; added fuzzy match hooks
# 1.0 - Initial version

1;