You are viewing a plain text version of this content. The canonical link for it is here.
Posted to dev@spamassassin.apache.org by Justin Mason <jm...@jmason.org> on 2006/10/11 11:24:07 UTC
Re: svn commit: r462695 - in /spamassassin/branches/check_plugin: lib/Mail/SpamAssassin.pm lib/Mail/SpamAssassin/PerMsgStatus.pm lib/Mail/SpamAssassin/Plugin/Check.pm rules/v320.pre

hey, couple of unsolicited comments ;)

1. regarding "why not do the plugin call directly" for
have_shortcircuited() -- it's simply shorter (fewer bytes) to write 'return
if $self->have_shortcircuited()' than to spell out the call_plugins method
call each time.  Basically, in my opinion, we should be trying to
collapse as much of the common code in those do_XXX_tests()
methods into shared functions as possible.

2. '+      # XXX - why isn't it _body_uri_test??'
Good question.  An accidental/legacy thing, I think.

--j.

parker@apache.org writes:
> Author: parker
> Date: Tue Oct 10 21:28:24 2006
> New Revision: 462695
> 
> URL: http://svn.apache.org/viewvc?view=rev&rev=462695
> Log:
> first crack at the check plugin functionality
> 
> Added:
>     spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/Plugin/Check.pm
> Modified:
>     spamassassin/branches/check_plugin/lib/Mail/SpamAssassin.pm
>     spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/PerMsgStatus.pm
>     spamassassin/branches/check_plugin/rules/v320.pre
> 
> Modified: spamassassin/branches/check_plugin/lib/Mail/SpamAssassin.pm
> URL: http://svn.apache.org/viewvc/spamassassin/branches/check_plugin/lib/Mail/SpamAssassin.pm?view=diff&rev=462695&r1=462694&r2=462695
> ==============================================================================
> --- spamassassin/branches/check_plugin/lib/Mail/SpamAssassin.pm (original)
> +++ spamassassin/branches/check_plugin/lib/Mail/SpamAssassin.pm Tue Oct 10 21:28:24 2006
> @@ -1332,7 +1332,9 @@
>  sub finish {
>    my ($self) = @_;
>  
> -  Mail::SpamAssassin::PerMsgStatus::finish_tests($self->{conf});
> +  $self->call_plugins("finish_tests", { conf => $self->{conf},
> +                                        main => $self });
> +
>    $self->{conf}->finish(); delete $self->{conf};
>    $self->{plugins}->finish(); delete $self->{plugins};
>  
> 
> Modified: spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/PerMsgStatus.pm
> URL: http://svn.apache.org/viewvc/spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/PerMsgStatus.pm?view=diff&rev=462695&r1=462694&r2=462695
> ==============================================================================
> --- spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/PerMsgStatus.pm (original)
> +++ spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/PerMsgStatus.pm Tue Oct 10 21:28:24 2006
> @@ -152,95 +152,9 @@
>      $self->{conf}->set_score_set ($set|2);
>    }
>  
> -  {
> -    # bug 4353:
> -    # Do this before the RBL tests are kicked off.  The metadata parsing
> -    # will figure out the (un)trusted relays and such, which are used in the
> -    # rbl calls.
> -    $self->extract_message_metadata();
> -
> -    # Here, we launch all the DNS RBL queries and let them run while we
> -    # inspect the message
> -    $self->run_rbl_eval_tests ($self->{conf}->{rbl_evals});
> -    my $needs_dnsbl_harvest_p = 1; # harvest needs to be run
> -
> -    my $decoded = $self->get_decoded_stripped_body_text_array();
> -    my $bodytext = $self->get_decoded_body_text_array();
> -    my $fulltext = $self->{msg}->get_pristine();
> -
> -    my @uris = $self->get_uri_list();
> -
> -    foreach my $priority (sort { $a <=> $b } keys %{$self->{conf}->{priorities}}) {
> -      # no need to run if there are no priorities at this level.  This can
> -      # happen in Conf.pm when we switch a rules from one priority to another
> -      next unless ($self->{conf}->{priorities}->{$priority} > 0);
> -
> -      # if shortcircuiting is hit, we skip all other priorities...
> -      last if $self->have_shortcircuited();
> -
> -      dbg("check: running tests for priority: $priority");
> -
> -      # only harvest the dnsbl queries once priority HARVEST_DNSBL_PRIORITY
> -      # has been reached and then only run once
> -      if ($priority >= HARVEST_DNSBL_PRIORITY && $needs_dnsbl_harvest_p
> -            && !$self->have_shortcircuited())
> -      {
> -	# harvest the DNS results
> -	$self->harvest_dnsbl_queries();
> -	$needs_dnsbl_harvest_p = 0;
> -
> -	# finish the DNS results
> -	$self->rbl_finish();
> -	$self->{main}->call_plugins ("check_post_dnsbl", { permsgstatus => $self });
> -       $self->{resolver}->finish_socket() if $self->{resolver};
> -      }
> -
> -      # do head tests
> -      $self->do_head_tests($priority);
> -      $self->do_head_eval_tests($priority);
> -
> -      $self->do_body_tests($priority, $decoded);
> -      $self->do_body_uri_tests($priority, @uris);
> -      $self->do_body_eval_tests($priority, $decoded);
> -  
> -      $self->do_rawbody_tests($priority, $bodytext);
> -      $self->do_rawbody_eval_tests($priority, $bodytext);
> -  
> -      $self->do_full_tests($priority, \$fulltext);
> -      $self->do_full_eval_tests($priority, \$fulltext);
> -
> -      $self->do_meta_tests($priority);
> -
> -      # we may need to call this more often than once through the loop, but
> -      # it needs to be done at least once, either at the beginning or the end.
> -      $self->{main}->call_plugins ("check_tick", { permsgstatus => $self });
> -    }
> -
> -    # sanity check, it is possible that no rules >= HARVEST_DNSBL_PRIORITY ran so the harvest
> -    # may not have run yet.  Check, and if so, go ahead and harvest here.
> -    if ($needs_dnsbl_harvest_p) {
> -      if (!$self->have_shortcircuited()) {
> -        # harvest the DNS results
> -        $self->harvest_dnsbl_queries();
> -      }
> -
> -      # finish the DNS results
> -      # TODO: this should be consolidated with the identical code above
> -      $self->rbl_finish();
> -      $self->{main}->call_plugins ("check_post_dnsbl", { permsgstatus => $self });
> -      $self->{resolver}->finish_socket() if $self->{resolver};
> -    }
> -
> -    # finished running rules
> -    delete $self->{current_rule_name};
> -    undef $decoded;
> -    undef $bodytext;
> -    undef $fulltext;
> -
> -    # auto-learning
> -    $self->learn();
> -    $self->{main}->call_plugins ("check_post_learn", { permsgstatus => $self });
> -  }
> +  # The primary check functionality occurs via a plugin call.  For more information please
> +  # see: Mail::SpamAssassin::Plugin::Check
> +  $self->{main}->call_plugins ("check_main", { permsgstatus => $self });
>  
>    # delete temporary storage and memory allocation used during checking
>    $self->delete_fulltext_tmpfile();
> @@ -1659,369 +1573,6 @@
>  
>  ###########################################################################
>  
> -sub start_rules_plugin_code {
> -  my ($self, $ruletype) = @_;
> -
> -  my $evalstr = '
> -
> -      # start_rules_plugin_code '.$ruletype.'
> -      my $scoresptr = $self->{conf}->{scores};
> -
> -  ';
> -
> -  if ($self->{main}->have_plugin("start_rules")) {
> -    $evalstr .= '
> -
> -      $self->{main}->call_plugins ("start_rules", { permsgstatus => $self, ruletype
> -=> \''.$ruletype.'\' });
> -
> -    ';
> -  }
> -
> -  return $evalstr;
> -}
> -
> -sub hit_rule_plugin_code {
> -  my ($self, $rulename, $ruletype, $loop_break_directive) = @_;
> -
> -  # note: keep this in 'single quotes' to avoid the $ & performance hit,
> -  # unless specifically requested by the caller.   Also split the
> -  # two chars, just to be paranoid and ensure that a buggy perl interp
> -  # doesn't impose that hit anyway (just in case)
> -  my $match = '($' . '&' . '|| "negative match")';
> -
> -  my $debug_code = '';
> -  if (exists($self->{should_log_rule_hits})) {
> -    $debug_code = '
> -        dbg("rules: ran '.$ruletype.' rule '.$rulename.' ======> got hit: \"" . '.
> -            $match.' . "\"");
> -    ';
> -  }
> -
> -  my $save_hits_code = '';
> -  if ($self->{save_pattern_hits}) {
> -    $save_hits_code = '
> -        $self->{pattern_hits}->{q{'.$rulename.'}} = '.$match.';
> -    ';
> -  }
> -
> -  # if we're not running "tflags multiple", break out of the matching
> -  # loop this way
> -  my $multiple_code = '';
> -  if ($self->{conf}->{tflags}->{$rulename} !~ /\bmultiple\b/) {
> -    $multiple_code = $loop_break_directive.';';
> -  }
> -
> -  return $debug_code.$save_hits_code.$multiple_code;
> -}
> -
> -sub ran_rule_plugin_code {
> -  my ($self, $rulename, $ruletype) = @_;
> -
> -  return '' unless $self->{main}->have_plugin("ran_rule");
> -
> -  return '
> -    $self->{main}->call_plugins ("ran_rule", { permsgstatus => $self, rulename => \''.$rulename.'\', ruletype => \''.$ruletype.'\' });
> -  ';
> -}
> -
> -sub hash_line_for_rule {
> -  my ($self, $rulename) = @_;
> -  return "\n".'#line 1 "'.
> -        $self->{conf}->{source_file}->{$rulename}.
> -        ', rule '.$rulename.',"';
> -}
> -
> -###########################################################################
> -
> -sub do_head_tests {
> -  my ($self, $priority) = @_;
> -  local ($_);
> -
> -  return if $self->have_shortcircuited();
> -
> -  # note: we do this only once for all head pattern tests.  Only
> -  # eval tests need to use stuff in here.
> -  $self->{test_log_msgs} = ();        # clear test state
> -
> -  dbg("rules: running header regexp tests; score so far=".$self->{score});
> -
> -  my $doing_user_rules = 
> -    $self->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_HEAD_TESTS};
> -
> -  # clean up priority value so it can be used in a subroutine name
> -  my $clean_priority;
> -  ($clean_priority = $priority) =~ s/-/neg/;
> -
> -  # speedup code provided by Matt Sergeant
> -  if (defined &{'Mail::SpamAssassin::PerMsgStatus::_head_tests_'.$clean_priority}
> -      && !$doing_user_rules) {
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::_head_tests_'.$clean_priority}($self);
> -    use strict "refs";
> -    return;
> -  }
> -
> -  my $use_rule_subs = $self->{main}->{use_rule_subs};
> -
> -  my $evalstr = $self->start_rules_plugin_code("header");
> -  my $evalstr2 = '';
> -
> -  # hash to hold the rules, "header\tdefault value" => rulename
> -  my %ordered = ();
> -  my %testcode = ();
> -
> -  while (my($rulename, $rule) = each %{$self->{conf}{head_tests}->{$priority}}) {
> -    my $def = '';
> -    my ($hdrname, $testtype, $pat) =
> -        $rule =~ /^\s*(\S+)\s*(\=|\!)\~\s*(\S.*?\S)\s*$/;
> -
> -    if (!defined $pat) {
> -      warn "rules: invalid rule: $rulename\n";
> -      $self->{rule_errors}++;
> -      next;
> -    }
> -
> -    if ($pat =~ s/\s+\[if-unset:\s+(.+)\]\s*$//) { $def = $1; }
> -
> -    $hdrname =~ s/#/[HASH]/g;                # avoid probs with eval below
> -    $def =~ s/#/[HASH]/g;
> -
> -    push(@{$ordered{"$hdrname\t$def"}}, $rulename);
> -
> -    if ($doing_user_rules) {
> -      next if (!$self->is_user_rule_sub ($rulename.'_head_test'));
> -    }
> -
> -    if ($use_rule_subs) {
> -      $evalstr2 .= '
> -	sub '.$rulename.'_head_test {
> -	  my($self,$text) = @_;
> -	  '.$self->hash_line_for_rule($rulename).'
> -	  while ($text '.$testtype.'~ '.$pat.'g) {
> -	    $self->got_hit(q#'.$rulename.'#, "", ruletype => "header");
> -	    '. $self->hit_rule_plugin_code($rulename, "header", "last") . '
> -	  }
> -	}
> -      ';
> -      push (@TEMPORARY_METHODS, $rulename.'_head_test');
> -    }
> -    else {
> -      # store for use below
> -      $testcode{$rulename} = $testtype.'~ '.$pat.'g';
> -    }
> -  }
> -
> -  # setup the function to run the rules
> -  while(my($k,$v) = each %ordered) {
> -    my($hdrname, $def) = split(/\t/, $k, 2);
> -    $evalstr .= ' $hval = $self->get(q#'.$hdrname.'#, q#'.$def.'#);';
> -    foreach my $rulename (@{$v}) {
> -      if ($use_rule_subs) {
> -	$evalstr .= '
> -	  if ($scoresptr->{q#'.$rulename.'#}) {
> -	     '.$rulename.'_head_test($self, $hval);
> -	     '.$self->ran_rule_plugin_code($rulename, "header").'
> -	  }
> -	';
> -      }
> -      else {
> -        my $testcode = $testcode{$rulename};
> -
> -	$evalstr .= '
> -	  if ($scoresptr->{q#'.$rulename.'#}) {
> -	    pos $hval = 0;
> -	    '.$self->hash_line_for_rule($rulename).'
> -	    while ($hval '.$testcode.') {
> -	      $self->got_hit(q#'.$rulename.'#, "", ruletype => "header");
> -	      '.$self->hit_rule_plugin_code($rulename, "header", "last").'
> -	    }
> -	    '.$self->ran_rule_plugin_code($rulename, "header").'
> -	  }
> -	';
> -      }
> -    }
> -  }
> -
> -  # clear out a previous version of this fn, if already defined
> -  if (defined &{'_head_tests_'.$clean_priority}) {
> -    undef &{'_head_tests_'.$clean_priority};
> -  }
> -
> -  return unless ($evalstr);
> -
> -  $evalstr = <<"EOT";
> -{
> -    package Mail::SpamAssassin::PerMsgStatus;
> -
> -    $evalstr2
> -
> -    sub _head_tests_$clean_priority {
> -        my (\$self) = \@_;
> -        my \$hval;
> -
> -        $evalstr;
> -    }
> -
> -    1;
> -}
> -EOT
> -
> -  eval $evalstr;
> -
> -  if ($@) {
> -    warn "rules: failed to run header tests, skipping some: $@\n";
> -    $self->{rule_errors}++;
> -  }
> -  else {
> -    my $method = '_head_tests_'.$clean_priority;
> -    push @TEMPORARY_METHODS, $method;
> -    no strict "refs";
> -    &{$method}($self);
> -    use strict "refs";
> -  }
> -}
> -
> -sub do_body_tests {
> -  my ($self, $priority, $textary) = @_;
> -  local ($_);
> -    
> -  return if $self->have_shortcircuited();
> -
> -  dbg("rules: running body-text per-line regexp tests; score so far=".$self->{score});
> -
> -  my $doing_user_rules = 
> -    $self->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_BODY_TESTS};
> -
> -  # clean up priority value so it can be used in a subroutine name
> -  my $clean_priority;
> -  ($clean_priority = $priority) =~ s/-/neg/;
> -
> -  $self->{test_log_msgs} = ();        # clear test state
> -  if (defined &{'Mail::SpamAssassin::PerMsgStatus::_body_tests_'.$clean_priority}
> -       && !$doing_user_rules) {
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::_body_tests_'.$clean_priority}($self, @$textary);
> -    use strict "refs";
> -    return;
> -  }
> -
> -  # caller can set this member of the Mail::SpamAssassin object to
> -  # override this; useful for profiling rule runtimes, although I think
> -  # the HitFreqsRuleTiming.pm plugin is probably better nowadays anyway
> -  my $use_rule_subs = $self->{main}->{use_rule_subs};
> -
> -  # build up the eval string...
> -  my $evalstr = $self->start_rules_plugin_code("body");
> -  my $evalstr2 = '';
> -  my $loopid = 0;
> -
> -  while (my($rulename, $pat) = each %{$self->{conf}{body_tests}->{$priority}})
> -  {
> -    my $sub;
> -    if ($self->{conf}->{tflags}->{$rulename} =~ /\bmultiple\b/)
> -    {
> -      # support multiple matches
> -      $loopid++;
> -      $sub = '
> -      body_'.$loopid.': foreach my $l (@_) {
> -	pos $l = 0;
> -	'.$self->hash_line_for_rule($rulename).'
> -	while ($l =~ '.$pat.'g) { 
> -	  $self->got_hit(q{'.$rulename.'}, "BODY: ", ruletype => "body"); 
> -	  '. $self->hit_rule_plugin_code($rulename, "body",
> -				    "last body_".$loopid) . '
> -	}
> -      }
> -      ';
> -    }
> -    else {
> -      # omitting the "pos" call, "body_loopid" label, use of while()
> -      # instead of if() etc., shaves off 8 perl OPs.
> -      $sub = '
> -      foreach my $l (@_) {
> -	'.$self->hash_line_for_rule($rulename).'
> -	if ($l =~ '.$pat.') { 
> -	  $self->got_hit(q{'.$rulename.'}, "BODY: ", ruletype => "body"); 
> -	  '. $self->hit_rule_plugin_code($rulename, "body", "last") .'
> -	}
> -      }
> -      ';
> -    }
> -
> -    if ($use_rule_subs) {
> -      $evalstr .= '
> -	if ($scoresptr->{q{'.$rulename.'}}) {
> -	  '.$rulename.'_body_test($self,@_); 
> -	  '.$self->ran_rule_plugin_code($rulename, "body").'
> -	}
> -      ';
> -    }
> -    else {
> -      $evalstr .= '
> -	if ($scoresptr->{q{'.$rulename.'}}) {
> -	  '.$sub.'
> -	  '.$self->ran_rule_plugin_code($rulename, "body").'
> -	}
> -      ';
> -    }
> -
> -    if ($doing_user_rules) {
> -      next if (!$self->is_user_rule_sub ($rulename.'_body_test'));
> -    }
> -
> -    if ($use_rule_subs) {
> -      $evalstr2 .= '
> -	sub '.$rulename.'_body_test { my $self = shift; '.$sub.' }
> -      ';
> -      push (@TEMPORARY_METHODS, $rulename.'_body_test');
> -    }
> -  }
> -
> -  # clear out a previous version of this fn, if already defined
> -  if (defined &{'_body_tests_'.$clean_priority}) {
> -    undef &{'_body_tests_'.$clean_priority};
> -  }
> -
> -  return unless ($evalstr);
> -
> -  # generate the loop that goes through each line...
> -  $evalstr = <<"EOT";
> -{
> -  package Mail::SpamAssassin::PerMsgStatus;
> -
> -  $evalstr2
> -
> -  sub _body_tests_$clean_priority {
> -    my \$self = shift;
> -    $evalstr;
> -  }
> -
> -  1;
> -}
> -EOT
> -
> -  # and run it.
> -  eval $evalstr;
> -  if ($@) {
> -    warn("rules: failed to compile body tests, skipping:\n" . "\t($@)\n");
> -    $self->{rule_errors}++;
> -  }
> -  else {
> -    my $method = '_body_tests_'.$clean_priority;
> -    push @TEMPORARY_METHODS, $method;
> -    no strict "refs";
> -    &{$method}($self,@$textary);
> -    use strict "refs";
> -  }
> -}
> -
> -sub is_user_rule_sub {
> -  my ($self, $subname) = @_;
> -  return 0 if (eval 'defined &Mail::SpamAssassin::PerMsgStatus::'.$subname);
> -  1;
> -}
> -
>  # Taken from URI and URI::Find
>  my $reserved   = q(;/?:@&=+$,[]\#|);
>  my $mark       = q(-_.!~*'());                                    #'; emacs
> @@ -2338,553 +1889,9 @@
>    return @{$self->{parsed_uri_list}};
>  }
>  
> -sub do_body_uri_tests {
> -  my ($self, $priority, @uris) = @_;
> -  local ($_);
> -
> -  return if $self->have_shortcircuited();
> -  
> -  dbg("uri: running uri tests; score so far=".$self->{score});
> -
> -  my $doing_user_rules = 
> -    $self->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_URI_TESTS};
> -
> -  # clean up priority value so it can be used in a subroutine name
> -  my $clean_priority;
> -  ($clean_priority = $priority) =~ s/-/neg/;
> -
> -  $self->{test_log_msgs} = ();        # clear test state
> -  if (defined &{'Mail::SpamAssassin::PerMsgStatus::_body_uri_tests_'.$clean_priority}
> -      && !$doing_user_rules) {
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::_body_uri_tests_'.$clean_priority}($self, @uris);
> -    use strict "refs";
> -    return;
> -  }
> -
> -  my $use_rule_subs = $self->{main}->{use_rule_subs};
> -
> -  # otherwise build up the eval string...
> -  my $evalstr = $self->start_rules_plugin_code("uri");
> -  my $evalstr2 = '';
> -  my $loopid = 0;
> -
> -  while (my($rulename, $pat) = each %{$self->{conf}{uri_tests}->{$priority}}) {
> -    my $sub;
> -    if ($self->{conf}->{tflags}->{$rulename} =~ /\bmultiple\b/)
> -    {
> -      $loopid++;
> -      $sub = '
> -      uri_'.$loopid.': foreach my $l (@_) {
> -	pos $l = 0;
> -	'.$self->hash_line_for_rule($rulename).'
> -	while ($l =~ '.$pat.'g) { 
> -	   $self->got_hit(q{'.$rulename.'}, "URI: ", ruletype => "uri");
> -	   '. $self->hit_rule_plugin_code($rulename, "uri",
> -				    "last uri_".$loopid) . '
> -	}
> -      }
> -      ';
> -    } else {
> -      $sub = '
> -      foreach my $l (@_) {
> -	'.$self->hash_line_for_rule($rulename).'
> -	if ($l =~ '.$pat.') { 
> -	   $self->got_hit(q{'.$rulename.'}, "URI: ", ruletype => "uri");
> -	   '. $self->hit_rule_plugin_code($rulename, "uri", "last") .'
> -	}
> -      }
> -      ';
> -    }
> -
> -    if ($use_rule_subs) {
> -      $evalstr .= '
> -	if ($scoresptr->{q{'.$rulename.'}}) {
> -	  '.$rulename.'_uri_test($self, @_);
> -	  '.$self->ran_rule_plugin_code($rulename, "uri").'
> -	}
> -      ';
> -    }
> -    else {
> -      $evalstr .= '
> -	if ($scoresptr->{q{'.$rulename.'}}) {
> -	  '.$sub.'
> -	  '.$self->ran_rule_plugin_code($rulename, "uri").'
> -	}
> -      ';
> -    }
> -
> -    if ($doing_user_rules) {
> -      next if (!$self->is_user_rule_sub ($rulename.'_uri_test'));
> -    }
> -
> -    if ($use_rule_subs) {
> -      $evalstr2 .= '
> -        sub '.$rulename.'_uri_test { my $self = shift; '.$sub.' }
> -      ';
> -      push (@TEMPORARY_METHODS, $rulename.'_uri_test');
> -    }
> -  }
> -
> -  # clear out a previous version of this fn, if already defined
> -  if (defined &{'_body_uri_tests_'.$clean_priority}) {
> -    undef &{'_body_uri_tests_'.$clean_priority};
> -  }
> -
> -  return unless ($evalstr);
> -
> -  # generate the loop that goes through each line...
> -  $evalstr = <<"EOT";
> -{
> -  package Mail::SpamAssassin::PerMsgStatus;
> -
> -  $evalstr2
> -
> -  sub _body_uri_tests_$clean_priority {
> -    my \$self = shift;
> -    $evalstr;
> -  }
> -
> -  1;
> -}
> -EOT
> -
> -  # and run it.
> -  eval $evalstr;
> -  if ($@) {
> -    warn("rules: failed to compile URI tests, skipping:\n" . "\t($@)\n");
> -    $self->{rule_errors}++;
> -  }
> -  else {
> -    my $method = '_body_uri_tests_'.$clean_priority;
> -    push @TEMPORARY_METHODS, $method;
> -    no strict "refs";
> -    &{$method}($self, @uris);
> -    use strict "refs";
> -  }
> -}
> -
> -sub do_rawbody_tests {
> -  my ($self, $priority, $textary) = @_;
> -  local ($_);
> -
> -  return if $self->have_shortcircuited();
> -
> -  dbg("rules: running raw-body-text per-line regexp tests; score so far=".$self->{score});
> -
> -  my $doing_user_rules = 
> -    $self->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_RAWBODY_TESTS};
> -
> -  # clean up priority value so it can be used in a subroutine name
> -  my $clean_priority;
> -  ($clean_priority = $priority) =~ s/-/neg/;
> -
> -  $self->{test_log_msgs} = ();        # clear test state
> -  if (defined &{'Mail::SpamAssassin::PerMsgStatus::_rawbody_tests_'.$clean_priority}
> -      && !$doing_user_rules) {
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::_rawbody_tests_'.$clean_priority}($self, @$textary);
> -    use strict "refs";
> -    return;
> -  }
> -
> -  my $use_rule_subs = $self->{main}->{use_rule_subs};
> -
> -  # build up the eval string...
> -  my $evalstr = $self->start_rules_plugin_code("rawbody");
> -  my $evalstr2 = '';
> -  my $loopid = 0;
> -
> -  while (my($rulename, $pat) = each %{$self->{conf}{rawbody_tests}->{$priority}}) {
> -    my $sub;
> -    if ($self->{conf}->{tflags}->{$rulename} =~ /\bmultiple\b/)
> -    {
> -      # support multiple matches
> -      $loopid++;
> -      $sub = '
> -      rawbody_'.$loopid.': foreach my $l (@_) {
> -	pos $l = 0;
> -	'.$self->hash_line_for_rule($rulename).'
> -	while ($l =~ '.$pat.'g) { 
> -	   $self->got_hit(q{'.$rulename.'}, "RAW: ", ruletype => "rawbody");
> -	   '. $self->hit_rule_plugin_code($rulename, "rawbody",
> -				    "last rawbody_".$loopid) . '
> -	}
> -      }
> -      ';
> -    }
> -    else {
> -      $sub = '
> -      foreach my $l (@_) {
> -	'.$self->hash_line_for_rule($rulename).'
> -	if ($l =~ '.$pat.') { 
> -	   $self->got_hit(q{'.$rulename.'}, "RAW: ", ruletype => "rawbody");
> -	   '. $self->hit_rule_plugin_code($rulename, "rawbody", "last") . '
> -	}
> -      }
> -      ';
> -    }
> -
> -    if ($use_rule_subs) {
> -      $evalstr .= '
> -	if ($scoresptr->{q{'.$rulename.'}}) {
> -	   '.$rulename.'_rawbody_test($self, @_);
> -	   '.$self->ran_rule_plugin_code($rulename, "rawbody").'
> -	}
> -      ';
> -    }
> -    else {
> -      $evalstr .= '
> -	if ($scoresptr->{q{'.$rulename.'}}) {
> -	  '.$sub.'
> -	  '.$self->ran_rule_plugin_code($rulename, "rawbody").'
> -	}
> -      ';
> -    }
> -
> -    if ($doing_user_rules) {
> -      next if (!$self->is_user_rule_sub ($rulename.'_rawbody_test'));
> -    }
> -
> -    if ($use_rule_subs) {
> -      $evalstr2 .= '
> -	sub '.$rulename.'_rawbody_test { my $self = shift; '.$sub.' }
> -      ';
> -      push (@TEMPORARY_METHODS, $rulename.'_rawbody_test');
> -    }
> -  }
> -
> -  # clear out a previous version of this fn, if already defined
> -  if (defined &{'_rawbody_tests_'.$clean_priority}) {
> -    undef &{'_rawbody_tests_'.$clean_priority};
> -  }
> -
> -  return unless ($evalstr);
> -
> -  # generate the loop that goes through each line...
> -  $evalstr = <<"EOT";
> -{
> -  package Mail::SpamAssassin::PerMsgStatus;
> -
> -  $evalstr2
> -
> -  sub _rawbody_tests_$clean_priority {
> -    my \$self = shift;
> -    $evalstr;
> -  }
> -
> -  1;
> -}
> -EOT
> -
> -  # and run it.
> -  eval $evalstr;
> -  if ($@) {
> -    warn("rules: failed to compile body tests, skipping:\n" . "\t($@)\n");
> -    $self->{rule_errors}++;
> -  }
> -  else {
> -    my $method = '_rawbody_tests_'.$clean_priority;
> -    push @TEMPORARY_METHODS, $method;
> -    no strict "refs";
> -    &{$method}($self, @$textary);
> -    use strict "refs";
> -  }
> -}
> -
> -sub do_full_tests {
> -  my ($self, $priority, $fullmsgref) = @_;
> -  local ($_);
> -    
> -  return if $self->have_shortcircuited();
> -  
> -  dbg("rules: running full-text regexp tests; score so far=".$self->{score});
> -
> -  my $doing_user_rules = 
> -    $self->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_FULL_TESTS};
> -
> -  # clean up priority value so it can be used in a subroutine name
> -  my $clean_priority;
> -  ($clean_priority = $priority) =~ s/-/neg/;
> -
> -  $self->{test_log_msgs} = ();        # clear test state
> -
> -  if (defined &{'Mail::SpamAssassin::PerMsgStatus::_full_tests_'.$clean_priority}
> -      && !$doing_user_rules) {
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::_full_tests_'.$clean_priority}($self, $fullmsgref);
> -    use strict "refs";
> -    return;
> -  }
> -
> -  # build up the eval string...
> -  my $evalstr = $self->start_rules_plugin_code("full");
> -
> -  while (my($rulename, $pat) = each %{$self->{conf}{full_tests}->{$priority}}) {
> -    $evalstr .= '
> -      if ($scoresptr->{q{'.$rulename.'}}) {
> -        pos $$fullmsgref = 0;
> -        '.$self->hash_line_for_rule($rulename).'
> -        while ($$fullmsgref =~ '.$pat.'g) {
> -          $self->got_hit(q{'.$rulename.'}, "FULL: ", ruletype => "full");
> -          '. $self->hit_rule_plugin_code($rulename, "full", "last") . '
> -        }
> -        '.$self->ran_rule_plugin_code($rulename, "full").'
> -      }
> -    ';
> -  }
> -
> -  if (defined &{'_full_tests_'.$clean_priority}) {
> -    undef &{'_full_tests_'.$clean_priority};
> -  }
> -
> -  return unless ($evalstr);
> -
> -  # and compile it.
> -  $evalstr = <<"EOT";
> -  {
> -    package Mail::SpamAssassin::PerMsgStatus;
> -
> -    sub _full_tests_$clean_priority {
> -        my (\$self, \$fullmsgref) = \@_;
> -        study \$\$fullmsgref;
> -        $evalstr
> -    }
> -
> -    1;
> -  }
> -EOT
> -  eval $evalstr;
> -
> -  if ($@) {
> -    warn "rules: failed to compile full tests, skipping:\n" . "\t($@)\n";
> -    $self->{rule_errors}++;
> -  } else {
> -    my $method = '_full_tests_'.$clean_priority;
> -    push @TEMPORARY_METHODS, $method;
> -    no strict "refs";
> -    &{$method}($self, $fullmsgref);
> -    use strict "refs";
> -  }
> -}
>  
>  ###########################################################################
>  
> -sub do_head_eval_tests {
> -  my ($self, $priority) = @_;
> -  return unless (defined($self->{conf}->{head_evals}->{$priority}));
> -  $self->run_eval_tests ($Mail::SpamAssassin::Conf::TYPE_HEAD_EVALS,
> -                         $self->{conf}->{head_evals}->{$priority}, '', $priority);
> -}
> -
> -sub do_body_eval_tests {
> -  my ($self, $priority, $bodystring) = @_;
> -  return unless (defined($self->{conf}->{body_evals}->{$priority}));
> -  $self->run_eval_tests ($Mail::SpamAssassin::Conf::TYPE_BODY_EVALS,
> -                         $self->{conf}->{body_evals}->{$priority}, 'BODY: ',
> -                         $priority, $bodystring);
> -}
> -
> -sub do_rawbody_eval_tests {
> -  my ($self, $priority, $bodystring) = @_;
> -  return unless (defined($self->{conf}->{rawbody_evals}->{$priority}));
> -  $self->run_eval_tests ($Mail::SpamAssassin::Conf::TYPE_RAWBODY_EVALS,
> -                         $self->{conf}->{rawbody_evals}->{$priority}, 'RAW: ',
> -                         $priority, $bodystring);
> -}
> -
> -sub do_full_eval_tests {
> -  my ($self, $priority, $fullmsgref) = @_;
> -  return unless (defined($self->{conf}->{full_evals}->{$priority}));
> -  $self->run_eval_tests ($Mail::SpamAssassin::Conf::TYPE_FULL_EVALS,
> -                         $self->{conf}->{full_evals}->{$priority}, '',
> -                         $priority, $fullmsgref);
> -}
> -
> -###########################################################################
> -
> -sub do_meta_tests {
> -  my ($self, $priority) = @_;
> -  local ($_);
> -    
> -  return if $self->have_shortcircuited();
> -
> -  dbg("rules: running meta tests; score so far=" . $self->{score} );
> -  my $conf = $self->{conf};
> -
> -  my $doing_user_rules = 
> -    $conf->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_META_TESTS};
> -
> -  # clean up priority value so it can be used in a subroutine name
> -  my $clean_priority;
> -  ($clean_priority = $priority) =~ s/-/neg/;
> -
> -  # speedup code provided by Matt Sergeant
> -  if (defined &{'Mail::SpamAssassin::PerMsgStatus::_meta_tests_'.$clean_priority}
> -       && !$doing_user_rules) {
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::_meta_tests_'.$clean_priority}($self);
> -    use strict "refs";
> -    return;
> -  }
> -
> -  my (%rule_deps, %setup_rules, %meta, $rulename);
> -  my $evalstr = q{
> -
> -    my $h = $self->{tests_already_hit};
> -
> -  };
> -
> -  # Get the list of meta tests
> -  my @metas = keys %{ $conf->{meta_tests}->{$priority} };
> -
> -  # Go through each rule and figure out what we need to do
> -  foreach $rulename (@metas) {
> -    my $rule   = $conf->{meta_tests}->{$priority}->{$rulename};
> -    my $token;
> -
> -    # Lex the rule into tokens using a rather simple RE method ...
> -    my $lexer = ARITH_EXPRESSION_LEXER;
> -    my @tokens = ($rule =~ m/$lexer/g);
> -
> -    # Set the rule blank to start
> -    $meta{$rulename} = "";
> -
> -    # List dependencies that are meta tests in the same priority band
> -    $rule_deps{$rulename} = [ ];
> -
> -    # Go through each token in the meta rule
> -    foreach $token (@tokens) {
> -
> -      # Numbers can't be rule names
> -      if ($token =~ /^(?:\W+|\d+)$/) {
> -        $meta{$rulename} .= "$token ";
> -      }
> -      else {
> -        $meta{$rulename} .= "\$h->{'$token'} ";
> -        $setup_rules{$token}=1;
> -
> -        if (!exists $conf->{scores}->{$token}) {
> -          info("rules: meta test $rulename has undefined dependency '$token'");
> -        }
> -        elsif ($conf->{scores}->{$token} == 0) {
> -          my $dowarn = 1;
> -
> -          # there are some cases where this is expected; don't warn
> -          # in those cases.
> -          if ((($self->{conf}->get_score_set()) & 1) == 0 &&
> -              $conf->{tflags}->{$token} && 
> -              $conf->{tflags}->{$token} =~ /\bnet\b/)
> -          {
> -            $dowarn = 0;    # bug 5040: net rules in a non-net scoreset
> -          }
> -
> -          $dowarn and info("rules: meta test $rulename has dependency '$token' with a zero score");
> -        }
> -
> -        # If the token is another meta rule, add it as a dependency
> -        push (@{ $rule_deps{$rulename} }, $token)
> -          if (exists $conf->{meta_tests}->{$priority}->{$token});
> -      }
> -    }
> -  }
> -
> -  # avoid "undefined" warnings by providing a default value for needed rules
> -  $evalstr .= join("\n", (map { "\$h->{'$_'} ||= 0;" } keys %setup_rules), "");
> -
> -  # Sort by length of dependencies list.  It's more likely we'll get
> -  # the dependencies worked out this way.
> -  @metas = sort { @{ $rule_deps{$a} } <=> @{ $rule_deps{$b} } } @metas;
> -
> -  my $count;
> -  my $tflags = $conf->{tflags};
> -
> -  # Now go ahead and setup the eval string
> -  do {
> -    $count = $#metas;
> -    my %metas = map { $_ => 1 } @metas; # keep a small cache for fast lookups
> -
> -    # Go through each meta rule we haven't done yet
> -    for (my $i = 0 ; $i <= $#metas ; $i++) {
> -
> -      # If we depend on meta rules that haven't run yet, skip it
> -      next if (grep( $metas{$_}, @{ $rule_deps{ $metas[$i] } }));
> -
> -      # If we depend on network tests, call ensure_rules_are_complete()
> -      # to block until they are
> -      my $alldeps = join ' ', grep {
> -              $tflags->{$_} =~ /\bnet\b/
> -            } @{ $conf->{meta_dependencies}->{ $metas[$i] } };
> -
> -      if ($alldeps ne '') {
> -        $evalstr .= '  $self->ensure_rules_are_complete(q{'.$metas[$i].'}, qw{'.$alldeps.'});';
> -      }
> -
> -      # Add this meta rule to the eval line
> -      $evalstr .= '
> -        $r = '.$meta{$metas[$i]}.';
> -        if ($r) { $self->got_hit(q#'.$metas[$i].'#, "", ruletype => "meta", value => $r); }
> -      ';
> -
> -      splice @metas, $i--, 1;    # remove this rule from our list
> -    }
> -  } while ($#metas != $count && $#metas > -1); # run until we can't go anymore
> -
> -  # If there are any rules left, we can't solve the dependencies so complain
> -  my %metas = map { $_ => 1 } @metas; # keep a small cache for fast lookups
> -  foreach $rulename (@metas) {
> -    $self->{rule_errors}++; # flag to --lint that there was an error ...
> -    my $msg =
> -	"rules: excluding meta test $rulename, unsolved meta dependencies: " .
> -	    join(", ", grep($metas{$_}, @{ $rule_deps{$rulename} }));
> -    if ($self->{main}->{lint_rules}) {
> -      warn $msg."\n";
> -    }
> -    else {
> -      info($msg);
> -    }
> -  }
> -
> -  if (defined &{'_meta_tests_'.$clean_priority}) {
> -    undef &{'_meta_tests_'.$clean_priority};
> -  }
> -
> -  return unless ($evalstr);
> -
> -  # setup the environment for meta tests
> -  $evalstr = <<"EOT";
> -{
> -    package Mail::SpamAssassin::PerMsgStatus;
> -
> -    sub _meta_tests_$clean_priority {
> -        # note: cannot set \$^W here on perl 5.6.1 at least, it
> -        # crashes meta tests.
> -
> -        my (\$self) = \@_;
> -	my \$r;
> -
> -        $evalstr;
> -    }
> -
> -    1;
> -}
> -EOT
> -
> -  eval $evalstr;
> -
> -  if ($@) {
> -    warn "rules: failed to run meta tests, skipping some: $@\n";
> -    $self->{rule_errors}++;
> -  }
> -  else {
> -    my $method = '_meta_tests_'.$clean_priority;
> -    push @TEMPORARY_METHODS, $method;
> -    no strict "refs";
> -    &{$method}($self);
> -    use strict "refs";
> -  }
> -}    # do_meta_tests()
> -
>  sub ensure_rules_are_complete {
>    my $self = shift;
>    my $metarule = shift;
> @@ -2910,163 +1917,8 @@
>  
>  ###########################################################################
>  
> -sub run_eval_tests {
> -  my ($self, $testtype, $evalhash, $prepend2desc, $priority, @extraevalargs) = @_;
> -  local ($_);
> -
> -  return if $self->have_shortcircuited();
> -
> -  my $doing_user_rules = $self->{conf}->{user_rules_to_compile}->{$testtype};
> -
> -  # clean up priority value so it can be used in a subroutine name
> -  my $clean_priority;
> -  ($clean_priority = $priority) =~ s/-/neg/;
> -
> -  my $scoreset = $self->{conf}->get_score_set();
> -
> -  my $methodname = '_eval_tests'.
> -                        '_type'.$testtype .
> -                        '_pri'.$clean_priority .
> -                        '_set'.$scoreset;
> -
> -  # Some of the rules are scoreset specific, so we need additional 
> -  # subroutines to handle those
> -  if (defined &{'Mail::SpamAssassin::PerMsgStatus::'.$methodname}
> -        && !$doing_user_rules)
> -  {
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::'.$methodname}($self,@extraevalargs);
> -    use strict "refs";
> -    return;
> -  }
> -
> -  # look these up once in advance to save repeated lookups in loop below
> -  my $tflagsref = $self->{conf}->{tflags};
> -  my $have_start_rules = $self->{main}->have_plugin("start_rules");
> -  my $have_ran_rule = $self->{main}->have_plugin("ran_rule");
> -
> -  # the buffer for the evaluated code
> -  my $evalstr = q{ };
> -$evalstr .= q{ my $function; };
> -
> -  # conditionally include the dbg in the eval str
> -  my $dbgstr = q{ };
> -  if (would_log('dbg')) {
> -    $dbgstr = q{ 
> -      dbg("rules: ran eval rule $rulename ======> got hit ($result)");
> -    };
> -  }
> -
> -  while (my ($rulename, $test) = each %{$evalhash})
> -  {
> -    if ($tflagsref->{$rulename}) {
> -      # If the rule is a net rule, and we are in a non-net scoreset, skip it.
> -      if ($tflagsref->{$rulename} =~ /\bnet\b/) {
> -        next if (($scoreset & 1) == 0);
> -      }
> -      # If the rule is a bayes rule, and we are in a non-bayes scoreset, skip it.
> -      if ($tflagsref->{$rulename} =~ /\bbayes\b/) {
> -        next if (($scoreset & 2) == 0);
> -      }
> -    }
> -
> -    my ($function, @args) = @{$test};
> -    if (!$function) {
> -      warn "rules: error: no function defined for $rulename";
> -      next;
> -    }
> -
> -    $evalstr .= '
> -      $rulename = q#'.$rulename.'#;
> -      $self->{test_log_msgs} = ();
> -    ';
> -
> -    # only need to set current_rule_name for plugin evals
> -    if ($self->{conf}->{eval_plugins}->{$function}) {
> -      # let plugins get the name of the rule that is currently being run,
> -      # and ensure their eval functions exist
> -      $evalstr .= '
> -        $self->{current_rule_name} = $rulename;
> -        $self->register_plugin_eval_glue(q#'.$function.'#);
> -      ';
> -    }
> -
> -    # this stuff is quite slow, and totally superfluous if
> -    # no plugin is loaded for those hooks
> -    if ($have_start_rules) {
> -      $evalstr .= '
> -        $self->{main}->call_plugins("start_rules", {
> -                permsgstatus => $self, ruletype => "eval"
> -              });
> -      ';
> -    }
> -
> -    my $argstr = '';
> -    if (scalar @args > 0) {
> -      $argstr = ',' . join (', ', map { "q#".$_."#" } @args);
> -    }
> -
> -    $evalstr .= '
> -      eval {
> -        $result = $self->' . $function . ' (@extraevalargs '. $argstr .' );
> -      };
> -      if ($@) { $self->handle_eval_rule_errors($rulename); }
> -    ';
> -
> -    if ($have_ran_rule) {
> -      $evalstr .= '
> -        $self->{main}->call_plugins("ran_rule", {
> -            permsgstatus => $self, ruletype => "eval", rulename => $rulename
> -          });
> -      ';
> -    }
> -
> -    $evalstr .= '
> -      if ($result) {
> -        $self->got_hit($rulename, $prepend2desc, ruletype => "eval", value => $result);
> -        '.$dbgstr.'
> -      }
> -    ';
> -  }
> -
> -  # nothing done in the loop, that means no rules
> -  return unless ($evalstr);
> -
> -  $evalstr = <<"EOT";
> -{
> -  package Mail::SpamAssassin::PerMsgStatus;
> -
> -    sub ${methodname} {
> -      my (\$self, \@extraevalargs) = \@_;
> -
> -      my \$prepend2desc = q#$prepend2desc#;
> -      my \$rulename;
> -      my \$result;
> -
> -      $evalstr
> -    }
> -
> -  1;
> -}
> -EOT
> -
> -  eval $evalstr;
> -
> -  push (@TEMPORARY_METHODS, $methodname);
> -
> -  if ($@) {
> -    warn "rules: failed to compile eval tests, skipping some: $@\n";
> -    $self->{rule_errors}++;
> -  }
> -  else {
> -    push (@TEMPORARY_METHODS, $methodname);
> -    no strict "refs";
> -    &{'Mail::SpamAssassin::PerMsgStatus::'.$methodname}($self,@extraevalargs);
> -    use strict "refs";
> -  }
> -}
> -
>  # use a separate sub here, for brevity
> +# called out of generated eval
>  sub handle_eval_rule_errors {
>    my ($self, $rulename) = @_;
>    warn "rules: failed to run $rulename test, skipping:\n\t($@)\n";
> @@ -3110,38 +1962,6 @@
>  
>    # ensure this method is deleted if finish_tests() is called
>    push (@TEMPORARY_METHODS, $function);
> -}
> -
> -###########################################################################
> -
> -sub run_rbl_eval_tests {
> -  my ($self, $evalhash) = @_;
> -  local ($_);
> -
> -  if ($self->{main}->{local_tests_only}) {
> -    dbg("rules: local tests only, ignoring RBL eval");
> -    return 0;
> -  }
> -  
> -  while (my ($rulename, $test) = each %{$evalhash}) {
> -    my $score = $self->{conf}->{scores}->{$rulename};
> -    next unless $score;
> -
> -    $self->{test_log_msgs} = ();        # clear test state
> -
> -    my ($function, @args) = @{$test};
> -
> -    my $result;
> -    eval {
> -       $result = $self->$function($rulename, @args);
> -    };
> -
> -    if ($@) {
> -      warn "rules: failed to run $rulename RBL test, skipping:\n" . "\t($@)\n";
> -      $self->{rule_errors}++;
> -      next;
> -    }
> -  }
>  }
>  
>  ###########################################################################
> 
> Added: spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/Plugin/Check.pm
> URL: http://svn.apache.org/viewvc/spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/Plugin/Check.pm?view=auto&rev=462695
> ==============================================================================
> --- spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/Plugin/Check.pm (added)
> +++ spamassassin/branches/check_plugin/lib/Mail/SpamAssassin/Plugin/Check.pm Tue Oct 10 21:28:24 2006
> @@ -0,0 +1,1267 @@
> +=head1 NAME
> +
> +Mail::SpamAssassin::Plugin::Check
> +
> +=head1 SYNOPSIS
> +
> +loadplugin Mail::SpamAssassin::Plugin::Check
> +
> +=head1 DESCRIPTION
> +
> +This plugin provides the primary message check functionality.
> +
> +=cut
> +
> +package Mail::SpamAssassin::Plugin::Check;
> +
> +use Mail::SpamAssassin::Plugin;
> +use Mail::SpamAssassin::Logger;
> +use Mail::SpamAssassin::Util;
> +use Mail::SpamAssassin::Constants qw(:sa);
> +
> +use strict;
> +use warnings;
> +use bytes;
> +
> +use vars qw(@ISA @TEMPORARY_METHODS);
> +@ISA = qw(Mail::SpamAssassin::Plugin);
> +
> +# methods defined by the compiled ruleset; deleted in finish_tests() 
> +@TEMPORARY_METHODS = (); 
> +
> +# constructor
> +sub new {
> +  my $class = shift;
> +  my $mailsaobject = shift;
> +
> +  $class = ref($class) || $class;
> +  my $self = $class->SUPER::new($mailsaobject);
> +  bless ($self, $class);
> +
> +  return $self;
> +}
> +
> +sub check_main {
> +  my ($self, $args) = @_;
> +
> +  my $pms = $args->{permsgstatus};
> +
> +  # bug 4353:
> +  # Do this before the RBL tests are kicked off.  The metadata parsing
> +  # will figure out the (un)trusted relays and such, which are used in the
> +  # rbl calls.
> +  $pms->extract_message_metadata();
> +
> +  # Here, we launch all the DNS RBL queries and let them run while we
> +  # inspect the message
> +  $self->run_rbl_eval_tests($pms);
> +  my $needs_dnsbl_harvest_p = 1; # harvest needs to be run
> +
> +  my $decoded = $pms->get_decoded_stripped_body_text_array();
> +  my $bodytext = $pms->get_decoded_body_text_array();
> +  my $fulltext = $pms->{msg}->get_pristine();
> +
> +  my @uris = $pms->get_uri_list();
> +
> +  foreach my $priority (sort { $a <=> $b } keys %{$pms->{conf}->{priorities}}) {
> +    # no need to run if there are no priorities at this level.  This can
> +    # happen in Conf.pm when we switch a rule from one priority to another
> +    next unless ($pms->{conf}->{priorities}->{$priority} > 0);
> +
> +    # if shortcircuiting is hit, we skip all other priorities...
> +    last if $pms->have_shortcircuited();
> +
> +    dbg("check: running tests for priority: $priority");
> +
> +    # only harvest the dnsbl queries once priority HARVEST_DNSBL_PRIORITY
> +    # has been reached and then only run once
> +    if ($priority >= HARVEST_DNSBL_PRIORITY && $needs_dnsbl_harvest_p
> +	&& !$pms->have_shortcircuited()) {
> +      # harvest the DNS results
> +      $pms->harvest_dnsbl_queries();
> +      $needs_dnsbl_harvest_p = 0;
> +
> +      # finish the DNS results
> +      $pms->rbl_finish();
> +      $self->{main}->call_plugins("check_post_dnsbl", { permsgstatus => $pms });
> +      $pms->{resolver}->finish_socket() if $pms->{resolver};
> +    }
> +
> +    # do head tests
> +    $self->do_head_tests($pms, $priority);
> +    $self->do_head_eval_tests($pms, $priority);
> +
> +    $self->do_body_tests($pms, $priority, $decoded);
> +    $self->do_body_uri_tests($pms, $priority, @uris);
> +    $self->do_body_eval_tests($pms, $priority, $decoded);
> +  
> +    $self->do_rawbody_tests($pms, $priority, $bodytext);
> +    $self->do_rawbody_eval_tests($pms, $priority, $bodytext);
> +  
> +    $self->do_full_tests($pms, $priority, \$fulltext);
> +    $self->do_full_eval_tests($pms, $priority, \$fulltext);
> +
> +    $self->do_meta_tests($pms, $priority);
> +
> +    # we may need to call this more often than once through the loop, but
> +    # it needs to be done at least once, either at the beginning or the end.
> +    $self->{main}->call_plugins ("check_tick", { permsgstatus => $pms });
> +  }
> +
> +  # sanity check, it is possible that no rules >= HARVEST_DNSBL_PRIORITY ran so the harvest
> +  # may not have run yet.  Check, and if so, go ahead and harvest here.
> +  if ($needs_dnsbl_harvest_p) {
> +    if (!$pms->have_shortcircuited()) {
> +      # harvest the DNS results
> +      $pms->harvest_dnsbl_queries();
> +    }
> +
> +    # finish the DNS results
> +    $pms->rbl_finish();
> +    $self->{main}->call_plugins ("check_post_dnsbl", { permsgstatus => $pms });
> +    $pms->{resolver}->finish_socket() if $pms->{resolver};
> +  }
> +
> +  # finished running rules
> +  delete $pms->{current_rule_name};
> +  undef $decoded;
> +  undef $bodytext;
> +  undef $fulltext;
> +
> +  # auto-learning
> +  $pms->learn();
> +  $self->{main}->call_plugins ("check_post_learn", { permsgstatus => $pms });
> +
> +  return;
> +}
> +
> +sub finish_tests {
> +  my ($self, $params) = @_;
> +
> +  foreach my $method (@TEMPORARY_METHODS) {
> +    undef &{$method};
> +  }
> +  @TEMPORARY_METHODS = ();      # clear for next time
> +}
> +
> +sub run_rbl_eval_tests {
> +  my ($self, $pms) = @_;
> +  my ($rulename, $pat, @args);
> +  local ($_);
> +
> +  # XXX - possible speed up, moving this check out of the subroutine into Check->new()
> +  if ($self->{main}->{local_tests_only}) {
> +    dbg("rules: local tests only, ignoring RBL eval");
> +    return 0;
> +  }
> +
> +  while (my ($rulename, $test) = each %{$pms->{conf}->{rbl_evals}}) {
> +    my $score = $pms->{conf}->{scores}->{$rulename};
> +    next unless $score;
> +
> +    $pms->{test_log_msgs} = ();        # clear test state
> +
> +    my ($function, @args) = @{$test};
> +
> +    my $result;
> +    eval {
> +       $result = $pms->$function($rulename, @args);
> +    };
> +
> +    if ($@) {
> +      warn "rules: failed to run $rulename RBL test, skipping:\n" . "\t($@)\n";
> +      $pms->{rule_errors}++;
> +      next;
> +    }
> +  }
> +}
> +
> +sub do_meta_tests {
> +  my ($self, $pms, $priority) = @_;
> +  local ($_);
> +  
> +  # XXX - why not just make the plugin call?
> +  return if $pms->have_shortcircuited();
> +
> +  dbg("rules: running meta tests; score so far=" . $pms->{score} );
> +  my $conf = $pms->{conf};
> +
> +  my $doing_user_rules = 
> +    $conf->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_META_TESTS};
> +
> +  # clean up priority value so it can be used in a subroutine name
> +  my $clean_priority;
> +  ($clean_priority = $priority) =~ s/-/neg/;
> +
> +  my $package_name = __PACKAGE__;
> +
> +  # speedup code provided by Matt Sergeant
> +  if (defined &{"${package_name}::_meta_tests_${clean_priority}"}
> +       && !$doing_user_rules) {
> +    no strict "refs";
> +    &{"${package_name}::_meta_tests_${clean_priority}"}($pms);
> +    use strict "refs";
> +    return;
> +  }
> +
> +  my (%rule_deps, %setup_rules, %meta, $rulename);
> +  my $evalstr = '';
> +
> +  # Get the list of meta tests
> +  my @metas = keys %{$conf->{meta_tests}->{$priority}};
> +
> +  # Go through each rule and figure out what we need to do
> +  foreach $rulename (@metas) {
> +    my $rule = $conf->{meta_tests}->{$priority}->{$rulename};
> +    my $token;
> +
> +    # Lex the rule into tokens using a rather simple RE method ...
> +    my $lexer = ARITH_EXPRESSION_LEXER;
> +    my @tokens = ($rule =~ m/$lexer/g);
> +
> +    # Set the rule blank to start
> +    $meta{$rulename} = "";
> +
> +    # List dependencies that are meta tests in the same priority band
> +    $rule_deps{$rulename} = [ ];
> +
> +    # Go through each token in the meta rule
> +    foreach $token (@tokens) {
> +
> +      # Numbers can't be rule names
> +      if ($token =~ /^(?:\W+|\d+)$/) {
> +        $meta{$rulename} .= "$token ";
> +      }
> +      else {
> +        $meta{$rulename} .= "\$h->{'$token'} ";
> +        $setup_rules{$token}=1;
> +      
> +        if (!exists $conf->{scores}->{$token}) {
> +          info("rules: meta test $rulename has undefined dependency '$token'");
> +        }
> +        elsif ($conf->{scores}->{$token} == 0) {
> +          my $dowarn = 1;
> +
> +          # there are some cases where this is expected; don't warn
> +          # in those cases.
> +          if ((($conf->get_score_set()) & 1) == 0 &&
> +              $conf->{tflags}->{$token} && 
> +              $conf->{tflags}->{$token} =~ /\bnet\b/) {
> +            $dowarn = 0;    # bug 5040: net rules in a non-net scoreset
> +          }
> +
> +          $dowarn and info("rules: meta test $rulename has dependency '$token' with a zero score");
> +        }
> +
> +        # If the token is another meta rule, add it as a dependency
> +        push (@{ $rule_deps{$rulename} }, $token)
> +          if (exists $conf->{meta_tests}->{$priority}->{$token});
> +      }
> +    }
> +  }
> +
> +  # avoid "undefined" warnings by providing a default value for needed rules
> +  $evalstr .= join("\n", (map { "\$h->{'$_'} ||= 0;" } keys %setup_rules), "");
> +
> +  # Sort by length of dependencies list.  It's more likely we'll get
> +  # the dependencies worked out this way.
> +  @metas = sort { @{ $rule_deps{$a} } <=> @{ $rule_deps{$b} } } @metas;
> +
> +  my $count;
> +  my $tflags = $conf->{tflags};
> +
> +  # Now go ahead and setup the eval string
> +  do {
> +    $count = $#metas;
> +    my %metas = map { $_ => 1 } @metas; # keep a small cache for fast lookups
> +
> +    # Go through each meta rule we haven't done yet
> +    for (my $i = 0 ; $i <= $#metas ; $i++) {
> +
> +      # If we depend on meta rules that haven't run yet, skip it
> +      next if (grep( $metas{$_}, @{ $rule_deps{ $metas[$i] } }));
> +
> +      # If we depend on network tests, call ensure_rules_are_complete()
> +      # to block until they are
> +      my $alldeps = join ' ', grep {
> +              $tflags->{$_} =~ /\bnet\b/
> +            } @{ $conf->{meta_dependencies}->{ $metas[$i] } };
> +
> +      if ($alldeps ne '') {
> +        $evalstr .= '  $pms->ensure_rules_are_complete(q{'.$metas[$i].'}, qw{'.$alldeps.'});';
> +      }
> +
> +      # Add this meta rule to the eval line
> +      $evalstr .= '
> +        $r = '.$meta{$metas[$i]}.';
> +        if ($r) { $pms->got_hit(q#'.$metas[$i].'#, "", ruletype => "meta", value => $r); }
> +      ';
> +
> +      splice @metas, $i--, 1;    # remove this rule from our list
> +    }
> +  } while ($#metas != $count && $#metas > -1); # run until we can't go anymore
> +
> +  # If there are any rules left, we can't solve the dependencies so complain
> +  my %metas = map { $_ => 1 } @metas; # keep a small cache for fast lookups
> +  foreach $rulename (@metas) {
> +    $pms->{rule_errors}++; # flag to --lint that there was an error ...
> +    my $msg =
> +	"rules: excluding meta test $rulename, unsolved meta dependencies: " .
> +	    join(", ", grep($metas{$_}, @{ $rule_deps{$rulename} }));
> +    if ($self->{main}->{lint_rules}) {
> +      warn $msg."\n";
> +    }
> +    else {
> +      info($msg);
> +    }
> +  }
> +
> +  no strict "subs";
> +  undef &{"${package_name}::_meta_tests_${clean_priority}"};
> +  use strict "subs";
> +
> +  return unless ($evalstr);
> +
> +  # setup the environment for meta tests
> +  $evalstr = <<"EOT";
> +{
> +    package $package_name;
> +
> +    sub _meta_tests_$clean_priority {
> +        # note: cannot set \$^W here on perl 5.6.1 at least, it
> +        # crashes meta tests.
> +
> +        my (\$pms) = \@_;
> +	my \$r;
> +
> +        my \$h = \$pms->{tests_already_hit};
> +
> +        $evalstr;
> +    }
> +
> +    1;
> +}
> +EOT
> +
> +  eval $evalstr;
> +
> +  if ($@) {
> +    warn "rules: failed to run meta tests, skipping some: $@\n";
> +    $pms->{rule_errors}++;
> +  }
> +  else {
> +    my $method = "${package_name}::_meta_tests_${clean_priority}";
> +    push @TEMPORARY_METHODS, $method;
> +    no strict "refs";
> +    &{$method}($pms);
> +    use strict "refs";
> +  }
> +}    # do_meta_tests()
> +
> +sub do_head_tests {
> +  my ($self, $pms, $priority) = @_;
> +  local ($_);
> +
> +  # XXX - why not just do the plugin call?
> +  return if $pms->have_shortcircuited();
> +
> +  # note: we do this only once for all head pattern tests.  Only
> +  # eval tests need to use stuff in here.
> +  $pms->{test_log_msgs} = ();        # clear test state
> +
> +  dbg("rules: running header regexp tests; score so far=".$pms->{score});
> +
> +  my $doing_user_rules = 
> +    $pms->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_HEAD_TESTS};
> +
> +  # clean up priority value so it can be used in a subroutine name
> +  my $clean_priority;
> +  ($clean_priority = $priority) =~ s/-/neg/;
> +
> +  my $package_name = __PACKAGE__;
> +
> +  # speedup code provided by Matt Sergeant
> +  if (defined &{"${package_name}::_head_tests_${clean_priority}"}
> +      && !$doing_user_rules) {
> +    no strict "refs";
> +    &{"${package_name}::_head_tests_${clean_priority}"}($pms);
> +    use strict "refs";
> +    return;
> +  }
> +
> +  my $use_rule_subs = $self->{main}->{use_rule_subs};
> +
> +  my $evalstr = $self->start_rules_plugin_code("header");
> +  my $evalstr2 = '';
> +
> +  # hash to hold the rules, "header\tdefault value" => rulename
> +  my %ordered = ();
> +  my %testcode = ();
> +
> +  while (my($rulename, $rule) = each %{$pms->{conf}{head_tests}->{$priority}}) {
> +    my $def = '';
> +    my ($hdrname, $testtype, $pat) =
> +        $rule =~ /^\s*(\S+)\s*(\=|\!)\~\s*(\S.*?\S)\s*$/;
> +
> +    if (!defined $pat) {
> +      warn "rules: invalid rule: $rulename\n";
> +      $pms->{rule_errors}++;
> +      next;
> +    }
> +
> +    if ($pat =~ s/\s+\[if-unset:\s+(.+)\]\s*$//) { $def = $1; }
> +
> +    $hdrname =~ s/#/[HASH]/g;                # avoid probs with eval below
> +    $def =~ s/#/[HASH]/g;
> +
> +    push(@{$ordered{"$hdrname\t$def"}}, $rulename);
> +
> +    if ($doing_user_rules) {
> +      next if (!$self->is_user_rule_sub ($rulename.'_head_test'));
> +    }
> +
> +    if ($use_rule_subs) {
> +      $evalstr2 .= '
> +        sub '.$rulename.'_head_test {
> +          my($self,$text) = @_;
> +          '.$self->hash_line_for_rule($pms, $rulename).'
> +	    while ($text '.$testtype.'~ '.$pat.'g) {
> +            $self->got_hit(q#'.$rulename.'#, "", ruletype => "header");
> +            '. $self->hit_rule_plugin_code($pms, $rulename, "header", "last") . '
> +			 }
> +        }
> +      ';
> +      push (@TEMPORARY_METHODS, $rulename.'_head_test');
> +    }
> +    else {
> +      # store for use below
> +      $testcode{$rulename} = $testtype.'~ '.$pat.'g';
> +    }
> +  }
> +
> +  # setup the function to run the rules
> +  while(my($k,$v) = each %ordered) {
> +    my($hdrname, $def) = split(/\t/, $k, 2);
> +    $evalstr .= ' $hval = $self->get(q#'.$hdrname.'#, q#'.$def.'#);';
> +    foreach my $rulename (@{$v}) {
> +      if ($use_rule_subs) {
> +        $evalstr .= '
> +          if ($scoresptr->{q#'.$rulename.'#}) {
> +             '.$rulename.'_head_test($self, $hval);
> +             '.$self->ran_rule_plugin_code($rulename, "header").'
> +          }
> +        ';
> +      }
> +      else {
> +        my $testcode = $testcode{$rulename};
> +
> +        $evalstr .= '
> +          if ($scoresptr->{q#'.$rulename.'#}) {
> +            pos $hval = 0;
> +            '.$self->hash_line_for_rule($pms, $rulename).'
> +            while ($hval '.$testcode.') {
> +              $self->got_hit(q#'.$rulename.'#, "", ruletype => "header");
> +              '.$self->hit_rule_plugin_code($pms, $rulename, "header", "last").'
> +            }
> +            '.$self->ran_rule_plugin_code($pms, $rulename, "header").'
> +          }
> +        ';
> +      }
> +    }
> +  }
> +
> +  # clear out a previous version of this fn, if already defined
> +  no strict "subs";
> +  undef &{"${package_name}::_head_tests_${clean_priority}"};
> +  use strict "subs";
> +
> +  return unless ($evalstr);
> +
> +  $evalstr = <<"EOT";
> +{
> +    package $package_name;
> +
> +    $evalstr2
> +
> +    sub _head_tests_$clean_priority {
> +        my (\$self) = \@_;
> +        my \$hval;
> +
> +        $evalstr;
> +    }
> +
> +    1;
> +}
> +EOT
> +
> +  eval $evalstr;
> +
> +  if ($@) {
> +    warn "rules: failed to run header tests, skipping some: $@\n";
> +    $pms->{rule_errors}++;
> +  }
> +  else {
> +    my $method = "${package_name}::_head_tests_${clean_priority}";
> +    push @TEMPORARY_METHODS, $method;
> +    no strict "refs";
> +    &{$method}($pms);
> +    use strict "refs";
> +  }
> +}
> +
> +sub do_body_tests {
> +  my ($self, $pms, $priority, $textary) = @_;
> +  local ($_);
> +
> +  # XXX - why not just make the plugin call directly?
> +  return if $pms->have_shortcircuited();
> +
> +  dbg("rules: running body-text per-line regexp tests; score so far=".$pms->{score});
> +
> +  my $doing_user_rules = 
> +    $pms->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_BODY_TESTS};
> +
> +  # clean up priority value so it can be used in a subroutine name
> +  my $clean_priority;
> +  ($clean_priority = $priority) =~ s/-/neg/;
> +
> +  my $package_name = __PACKAGE__;
> +
> +  $pms->{test_log_msgs} = ();        # clear test state
> +
> +  if (defined &{"${package_name}::_body_tests_${clean_priority}"}
> +       && !$doing_user_rules) {
> +    no strict "refs";
> +    &{"${package_name}::_body_tests_${clean_priority}"}($pms, @$textary);
> +    use strict "refs";
> +    return;
> +  }
> +
> +  # caller can set this member of the Mail::SpamAssassin object to
> +  # override this; useful for profiling rule runtimes, although I think
> +  # the HitFreqsRuleTiming.pm plugin is probably better nowadays anyway
> +  my $use_rule_subs = $self->{main}->{use_rule_subs};
> +
> +  # build up the eval string...
> +  my $evalstr = $self->start_rules_plugin_code("body");
> +  my $evalstr2 = '';
> +  my $loopid = 0;
> +
> +  while (my($rulename, $pat) = each %{$pms->{conf}{body_tests}->{$priority}}) {
> +    my $sub;
> +    if ($pms->{conf}->{tflags}->{$rulename} =~ /\bmultiple\b/)
> +      {
> +      # support multiple matches
> +      $loopid++;
> +      $sub = '
> +      body_'.$loopid.': foreach my $l (@_) {
> +        pos $l = 0;
> +        '.$self->hash_line_for_rule($pms, $rulename).'
> +        while ($l =~ '.$pat.'g) { 
> +          $self->got_hit(q{'.$rulename.'}, "BODY: ", ruletype => "body"); 
> +          '. $self->hit_rule_plugin_code($pms, $rulename, "body",
> +					 "last body_".$loopid) . '
> +        }
> +      }
> +      ';
> +    }
> +    else {
> +      # omitting the "pos" call, "body_loopid" label, use of while()
> +      # instead of if() etc., shaves off 8 perl OPs.
> +      $sub = '
> +      foreach my $l (@_) {
> +        '.$self->hash_line_for_rule($pms, $rulename).'
> +        if ($l =~ '.$pat.') { 
> +          $self->got_hit(q{'.$rulename.'}, "BODY: ", ruletype => "body"); 
> +          '. $self->hit_rule_plugin_code($pms, $rulename, "body", "last") .'
> +        }
> +      }
> +      ';
> +    }
> +
> +    if ($use_rule_subs) {
> +      $evalstr .= '
> +        if ($scoresptr->{q{'.$rulename.'}}) {
> +          '.$rulename.'_body_test($self,@_); 
> +          '.$self->ran_rule_plugin_code($rulename, "body").'
> +        }
> +      ';
> +    }
> +    else {
> +      $evalstr .= '
> +        if ($scoresptr->{q{'.$rulename.'}}) {
> +          '.$sub.'
> +          '.$self->ran_rule_plugin_code($rulename, "body").'
> +        }
> +      ';
> +    }
> +
> +    if ($doing_user_rules) {
> +      next if (!$self->is_user_rule_sub ($rulename.'_body_test'));
> +    }
> +
> +    if ($use_rule_subs) {
> +      $evalstr2 .= '
> +        sub '.$rulename.'_body_test { my $self = shift; '.$sub.' }
> +      ';
> +      push (@TEMPORARY_METHODS, $rulename.'_body_test');
> +    }
> +  }
> +
> +  # clear out a previous version of this fn
> +  undef &{"${package_name}::_body_tests_${clean_priority}"};
> +
> +  return unless ($evalstr);
> +
> +  # generate the loop that goes through each line...
> +  $evalstr = <<"EOT";
> +{
> +  package $package_name;
> +
> +  $evalstr2
> +
> +  sub _body_tests_$clean_priority {
> +    my \$self = shift;
> +
> +    $evalstr;
> +  }
> +
> +  1;
> +}
> +EOT
> +
> +  eval $evalstr;
> +
> +  if ($@) {
> +    warn("rules: failed to compile body tests, skipping:\n" . "\t($@)\n");
> +    $pms->{rule_errors}++;
> +  }
> +  else {
> +    my $method = "${package_name}::_body_tests_${clean_priority}";
> +    no strict "refs";
> +    &{$method}($pms, @$textary);
> +    use strict "refs";
> +  }
> +}
> +
> +sub do_body_uri_tests {
> +  my ($self, $pms, $priority, @uris) = @_;
> +  local ($_);
> +
> +  # XXX - why not just do the direct plugin call?
> +  return if $pms->have_shortcircuited();
> +
> +  dbg("uri: running uri tests; score so far=".$pms->{score});
> +
> +  my $doing_user_rules = 
> +    $pms->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_URI_TESTS};
> +
> +  # clean up priority value so it can be used in a subroutine name
> +  my $clean_priority;
> +  ($clean_priority = $priority) =~ s/-/neg/;
> +
> +  my $package_name = __PACKAGE__;
> +
> +  $pms->{test_log_msgs} = ();        # clear test state
> +
> +  if (defined &{"${package_name}::_body_uri_tests_${clean_priority}"}
> +      && !$doing_user_rules) {
> +    no strict "refs";
> +    &{"${package_name}::_body_uri_tests_${clean_priority}"}($pms, @uris);
> +    use strict "refs";
> +    return;
> +  }
> +
> +  my $use_rule_subs = $self->{main}->{use_rule_subs};
> +
> +  # otherwise build up the eval string...
> +  my $evalstr = $self->start_rules_plugin_code("uri");
> +  my $evalstr2 = '';
> +  my $loopid = 0;
> +
> +  while (my($rulename, $pat) = each %{$pms->{conf}{uri_tests}->{$priority}}) {
> +    my $sub;
> +    if ($pms->{conf}->{tflags}->{$rulename} =~ /\bmultiple\b/) {
> +      $loopid++;
> +      $sub = '
> +      uri_'.$loopid.': foreach my $l (@_) {
> +        pos $l = 0;
> +        '.$self->hash_line_for_rule($pms, $rulename).'
> +        while ($l =~ '.$pat.'g) { 
> +           $self->got_hit(q{'.$rulename.'}, "URI: ", ruletype => "uri");
> +           '. $self->hit_rule_plugin_code($pms, $rulename, "uri",
> +					  "last uri_".$loopid) . '
> +        }
> +      }
> +      ';
> +    } else {
> +      $sub = '
> +      foreach my $l (@_) {
> +        '.$self->hash_line_for_rule($pms, $rulename).'
> +        if ($l =~ '.$pat.') { 
> +           $self->got_hit(q{'.$rulename.'}, "URI: ", ruletype => "uri");
> +           '. $self->hit_rule_plugin_code($pms, $rulename, "uri", "last") .'
> +        }
> +      }
> +      ';
> +    }
> +
> +    if ($use_rule_subs) {
> +      # XXX - why isn't it _body_uri_test??
> +      $evalstr .= '
> +        if ($scoresptr->{q{'.$rulename.'}}) {
> +          '.$rulename.'_uri_test($self, @_);
> +          '.$self->ran_rule_plugin_code($rulename, "uri").'
> +        }
> +      ';
> +    }
> +    else {
> +      $evalstr .= '
> +        if ($scoresptr->{q{'.$rulename.'}}) {
> +          '.$sub.'
> +          '.$self->ran_rule_plugin_code($rulename, "uri").'
> +        }
> +      ';
> +    }
> +
> +    if ($doing_user_rules) {
> +      next if (!$self->is_user_rule_sub($rulename.'_uri_test'));
> +    }
> +
> +    if ($use_rule_subs) {
> +      # XXX - why isn't it _body_uri_test??
> +      $evalstr2 .= '
> +        sub '.$rulename.'_uri_test { my $self = shift; '.$sub.' }
> +      ';
> +      push (@TEMPORARY_METHODS, $rulename.'_uri_test');
> +    }
> +  }
> +
> +  # clear out a previous version of this fn
> +  undef &{"${package_name}::_body_uri_tests_${clean_priority}"};
> +
> +  return unless ($evalstr);
> +
> +  # generate the loop that goes through each line...
> +  $evalstr = <<"EOT";
> +{
> +  package $package_name;
> +
> +  $evalstr2
> +
> +  sub _body_uri_tests_$clean_priority {
> +    my \$self = shift;
> +    $evalstr;
> +  }
> +
> +  1;
> +}
> +EOT
> +
> +  eval $evalstr;
> +
> +  if ($@) {
> +    warn("rules: failed to compile URI tests, skipping:\n" . "\t($@)\n");
> +    $pms->{rule_errors}++;
> +  }
> +  else {
> +    my $method = "${package_name}::_body_uri_tests_${clean_priority}";
> +    push @TEMPORARY_METHODS, $method;
> +    no strict "refs";
> +    &{$method}($pms, @uris);
> +    use strict "refs";
> +  }
> +}
> +
> +sub do_rawbody_tests {
> +  my ($self, $pms, $priority, $textary) = @_;
> +  local ($_);
> +
> +  # XXX - why not just do the plugin call here??
> +  return if $pms->have_shortcircuited();
> +
> +  dbg("rules: running raw-body-text per-line regexp tests; score so far=".$pms->{score});
> +
> +  my $doing_user_rules = 
> +    $pms->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_RAWBODY_TESTS};
> +
> +  # clean up priority value so it can be used in a subroutine name
> +  my $clean_priority;
> +  ($clean_priority = $priority) =~ s/-/neg/;
> +
> +  my $package_name = __PACKAGE__;
> +
> +  $pms->{test_log_msgs} = ();        # clear test state
> +  dbg("rules: in middle of raw-body-text");
> +  if (defined &{"${package_name}::_rawbody_tests_${clean_priority}"}
> +      && !$doing_user_rules) {
> +    no strict "refs";
> +    &{"${package_name}::_rawbody_tests_${clean_priority}"}($pms, @$textary);
> +    use strict "refs";
> +    return;
> +  }
> +
> +  my $use_rule_subs = $self->{main}->{use_rule_subs};
> +
> +  # build up the eval string...
> +  my $evalstr = $self->start_rules_plugin_code("rawbody");
> +  my $evalstr2 = '';
> +  my $loopid = 0;
> +
> +  while (my($rulename, $pat) = each %{$pms->{conf}{rawbody_tests}->{$priority}}) {
> +    my $sub;
> +    if ($pms->{conf}->{tflags}->{$rulename} =~ /\bmultiple\b/)
> +      {
> +      # support multiple matches
> +      $loopid++;
> +      $sub = '
> +      rawbody_'.$loopid.': foreach my $l (@_) {
> +        pos $l = 0;
> +        '.$self->hash_line_for_rule($pms, $rulename).'
> +        while ($l =~ '.$pat.'g) { 
> +           $self->got_hit(q{'.$rulename.'}, "RAW: ", ruletype => "rawbody");
> +           '. $self->hit_rule_plugin_code($pms, $rulename, "rawbody",
> +					  "last rawbody_".$loopid) . '
> +        }
> +      }
> +      ';
> +    }
> +    else {
> +      $sub = '
> +      foreach my $l (@_) {
> +        '.$self->hash_line_for_rule($pms, $rulename).'
> +        if ($l =~ '.$pat.') { 
> +           $self->got_hit(q{'.$rulename.'}, "RAW: ", ruletype => "rawbody");
> +           '. $self->hit_rule_plugin_code($pms, $rulename, "rawbody", "last") . '
> +        }
> +      }
> +      ';
> +    }
> +
> +    if ($use_rule_subs) {
> +      $evalstr .= '
> +        if ($scoresptr->{q{'.$rulename.'}}) {
> +           '.$rulename.'_rawbody_test($self, @_);
> +           '.$self->ran_rule_plugin_code($rulename, "rawbody").'
> +        }
> +      ';
> +    }
> +    else {
> +      $evalstr .= '
> +        if ($scoresptr->{q{'.$rulename.'}}) {
> +          '.$sub.'
> +          '.$self->ran_rule_plugin_code($rulename, "rawbody").'
> +        }
> +      ';
> +    }
> +
> +    if ($doing_user_rules) {
> +      next if (!$self->is_user_rule_sub($rulename.'_rawbody_test'));
> +    }
> +
> +    if ($use_rule_subs) {
> +      $evalstr2 .= '
> +        sub '.$rulename.'_rawbody_test { my $self = shift; '.$sub.' }
> +      ';
> +      push (@TEMPORARY_METHODS, $rulename.'_rawbody_test');
> +    }
> +  }
> +
> +  # clear out a previous version of this fn
> +  undef &{"${package_name}::_rawbody_tests_${clean_priority}"};
> +
> +  return unless ($evalstr);
> +
> +  # generate the loop that goes through each line...
> +  $evalstr = <<"EOT";
> +{
> +  package $package_name;
> +
> +  $evalstr2
> +
> +  sub _rawbody_tests_$clean_priority {
> +    my \$self = shift;
> +    $evalstr;
> +  }
> +
> +  1;
> +}
> +EOT
> +
> +  eval $evalstr;
> +
> +  if ($@) {
> +    warn("rules: failed to compile body tests, skipping:\n" . "\t($@)\n");
> +    $pms->{rule_errors}++;
> +  }
> +  else {
> +    my $method = "${package_name}::_rawbody_tests_${clean_priority}";
> +    push @TEMPORARY_METHODS, $method;
> +    no strict "refs";
> +    &{$method}($pms, @$textary);
> +    use strict "refs";
> +  }
> +}
> +
> +sub do_full_tests {
> +  my ($self, $pms, $priority, $fullmsgref) = @_;
> +  local ($_);
> +  
> +  # XXX - why not just do the plugin call directly?
> +  return if $pms->have_shortcircuited();
> +
> +  dbg("rules: running full-text regexp tests; score so far=".$pms->{score});
> +
> +  my $doing_user_rules = 
> +    $pms->{conf}->{user_rules_to_compile}->{$Mail::SpamAssassin::Conf::TYPE_FULL_TESTS};
> +
> +  # clean up priority value so it can be used in a subroutine name
> +  my $clean_priority;
> +  ($clean_priority = $priority) =~ s/-/neg/;
> +
> +  my $package_name = __PACKAGE__;
> +
> +  $pms->{test_log_msgs} = ();        # clear test state
> +
> +  if (defined &{"${package_name}::_full_tests_${clean_priority}"}
> +      && !$doing_user_rules) {
> +    no strict "refs";
> +    &{"${package_name}::_full_tests_${clean_priority}"}($pms, $fullmsgref);
> +    use strict "refs";
> +    return;
> +  }
> +
> +  # build up the eval string...
> +  my $evalstr = $self->start_rules_plugin_code("full");
> +
> +  while (my($rulename, $pat) = each %{$pms->{conf}{full_tests}->{$priority}}) {
> +    $evalstr .= '
> +      if ($scoresptr->{q{'.$rulename.'}}) {
> +        pos $$fullmsgref = 0;
> +        '.$self->hash_line_for_rule($pms, $rulename).'
> +        while ($$fullmsgref =~ '.$pat.'g) {
> +          $self->got_hit(q{'.$rulename.'}, "FULL: ", ruletype => "full");
> +          '. $self->hit_rule_plugin_code($pms, $rulename, "full", "last") . '
> +        }
> +        '.$self->ran_rule_plugin_code($rulename, "full").'
> +      }
> +    ';
> +  }
> +
> +  undef &{"${package_name}::_full_tests_${clean_priority}"};
> +
> +  return unless ($evalstr);
> +
> +  # and compile it.
> +  $evalstr = <<"EOT";
> +  {
> +    package $package_name;
> +
> +    sub _full_tests_$clean_priority {
> +        my (\$self, \$fullmsgref) = \@_;
> +        study \$\$fullmsgref;
> +        $evalstr
> +    }
> +
> +    1;
> +  }
> +EOT
> +
> +  eval $evalstr;
> +
> +  if ($@) {
> +    warn "rules: failed to compile full tests, skipping:\n" . "\t($@)\n";
> +    $pms->{rule_errors}++;
> +  } else {
> +    my $method = "${package_name}::_full_tests_${clean_priority}";
> +    push @TEMPORARY_METHODS, $method;
> +    no strict "refs";
> +    &{$method}($pms, $fullmsgref);
> +    use strict "refs";
> +  }
> +}
> +
> +sub do_head_eval_tests {
> +  my ($self, $pms, $priority) = @_;
> +  return unless (defined($pms->{conf}->{head_evals}->{$priority}));
> +  $self->run_eval_tests ($pms, $Mail::SpamAssassin::Conf::TYPE_HEAD_EVALS,
> +			 $pms->{conf}->{head_evals}->{$priority}, '', $priority);
> +}
> +
> +sub do_body_eval_tests {
> +  my ($self, $pms, $priority, $bodystring) = @_;
> +  return unless (defined($pms->{conf}->{body_evals}->{$priority}));
> +  $self->run_eval_tests ($pms, $Mail::SpamAssassin::Conf::TYPE_BODY_EVALS,
> +			 $pms->{conf}->{body_evals}->{$priority}, 'BODY: ',
> +			 $priority, $bodystring);
> +}
> +
> +sub do_rawbody_eval_tests {
> +  my ($self, $pms, $priority, $bodystring) = @_;
> +  return unless (defined($pms->{conf}->{rawbody_evals}->{$priority}));
> +  $self->run_eval_tests ($pms, $Mail::SpamAssassin::Conf::TYPE_RAWBODY_EVALS,
> +			 $pms->{conf}->{rawbody_evals}->{$priority}, 'RAW: ',
> +			 $priority, $bodystring);
> +}
> +
> +sub do_full_eval_tests {
> +  my ($self, $pms, $priority, $fullmsgref) = @_;
> +  return unless (defined($pms->{conf}->{full_evals}->{$priority}));
> +  $self->run_eval_tests($pms, $Mail::SpamAssassin::Conf::TYPE_FULL_EVALS,
> +			$pms->{conf}->{full_evals}->{$priority}, '',
> +			$priority, $fullmsgref);
> +}
> +
> +sub run_eval_tests {
> +  my ($self, $pms, $testtype, $evalhash, $prepend2desc, $priority, @extraevalargs) = @_;
> +  local ($_);
> +  
> +  # XXX - why not just call the plugin directly?
> +  return if $pms->have_shortcircuited();
> +
> +  my $doing_user_rules = $self->{conf}->{user_rules_to_compile}->{$testtype};
> +
> +  # clean up priority value so it can be used in a subroutine name 
> +  my $clean_priority;
> +  ($clean_priority = $priority) =~ s/-/neg/;
> +
> +  my $scoreset = $pms->{conf}->get_score_set();
> +
> +  my $package_name = __PACKAGE__;
> +
> +  my $methodname = '_eval_tests'.
> +    '_type'.$testtype .
> +      '_pri'.$clean_priority .
> +	'_set'.$scoreset;
> +
> +  # Some of the rules are scoreset specific, so we need additional
> +  # subroutines to handle those
> +  if (defined &{"${package_name}::${methodname}"}
> +      && !$doing_user_rules) {
> +    no strict "refs";
> +    &{"${package_name}::${methodname}"}($pms,@extraevalargs);
> +    use strict "refs";
> +    return;
> +  }
> +
> +  # look these up once in advance to save repeated lookups in loop below
> +  my $tflagsref = $pms->{conf}->{tflags};
> +  my $have_start_rules = $self->{main}->have_plugin("start_rules");
> +  my $have_ran_rule = $self->{main}->have_plugin("ran_rule");
> +
> +  # the buffer for the evaluated code 
> +  my $evalstr = q{ };
> +  $evalstr .= q{ my $function; };
> + 
> +  # conditionally include the dbg in the eval str
> +  my $dbgstr = q{ };
> +  if (would_log('dbg')) {
> +    $dbgstr = q{
> +      dbg("rules: ran eval rule $rulename ======> got hit ($result)");
> +    };
> +  }
> +
> +  while (my ($rulename, $test) = each %{$evalhash})  { 
> +    if ($tflagsref->{$rulename}) {
> +      # If the rule is a net rule, and we are in a non-net scoreset, skip it.
> +      if ($tflagsref->{$rulename} =~ /\bnet\b/) {
> +        next if (($scoreset & 1) == 0);
> +      }
> +      # If the rule is a bayes rule, and we are in a non-bayes scoreset, skip it.
> +      if ($tflagsref->{$rulename} =~ /\bbayes\b/) {
> +        next if (($scoreset & 2) == 0);
> +      }
> +    }
> + 
> +    my ($function, @args) = @{$test};
> +    if (!$function) {
> +      warn "rules: error: no function defined for $rulename";
> +      next;
> +    }
> + 
> +    $evalstr .= '
> +      $rulename = q#'.$rulename.'#;
> +      $self->{test_log_msgs} = ();
> +    ';
> + 
> +    # only need to set current_rule_name for plugin evals
> +    if ($pms->{conf}->{eval_plugins}->{$function}) {
> +      # let plugins get the name of the rule that is currently being run,
> +      # and ensure their eval functions exist
> +      $evalstr .= '
> +
> +        $self->{current_rule_name} = $rulename;
> +        $self->register_plugin_eval_glue(q#'.$function.'#);
> +
> +      ';
> +    }
> +
> +    # this stuff is quite slow, and totally superfluous if
> +    # no plugin is loaded for those hooks
> +    if ($have_start_rules) {
> +      # XXX - should we use helper function here?
> +      $evalstr .= '
> +
> +        $self->{main}->call_plugins("start_rules", {
> +                permsgstatus => $self, ruletype => "eval"
> +              });
> +
> +      ';
> +    }
> + 
> +    my $argstr = '';
> +    if (scalar @args > 0) {
> +      $argstr = ',' . join (', ', map { "q#".$_."#" } @args);
> +    }
> +
> +    $evalstr .= '
> +
> +      eval {
> +        $result = $self->' . $function . ' (@extraevalargs '. $argstr .' );
> +      };
> +      if ($@) { $self->handle_eval_rule_errors($rulename); }
> +
> +    ';
> +
> +    if ($have_ran_rule) {
> +      # XXX - should we use helper function here?
> +      $evalstr .= '
> +
> +        $self->{main}->call_plugins("ran_rule", {
> +            permsgstatus => $self, ruletype => "eval", rulename => $rulename
> +          });
> +
> +      ';
> +    }
> +
> +    $evalstr .= '
> +
> +      if ($result) {
> +        $self->got_hit($rulename, $prepend2desc, ruletype => "eval", value => $result);
> +        '.$dbgstr.'
> +      }
> +
> +    ';
> +  }
> +
> +  # nothing done in the loop, that means no rules 
> +  return unless ($evalstr);
> + 
> +  $evalstr = <<"EOT";
> +{
> +  package $package_name;
> +
> +    sub ${methodname} {
> +      my (\$self, \@extraevalargs) = \@_;
> +
> +      my \$prepend2desc = q#$prepend2desc#;
> +      my \$rulename;
> +      my \$result;
> +
> +      $evalstr
> +    }
> +
> +  1;
> +}
> +EOT
> +
> +  eval $evalstr;
> +
> +  if ($@) {
> +    warn "rules: failed to compile eval tests, skipping some: $@\n";
> +    $self->{rule_errors}++;
> +  }
> +  else {
> +    my $method = "${package_name}::${methodname}";
> +    push (@TEMPORARY_METHODS, $methodname);
> +    no strict "refs";
> +    &{$method}($pms,@extraevalargs);
> +    use strict "refs";
> +  }
> +}
> +
> +# Helper Functions
> +
> +sub hash_line_for_rule {
> +  my ($self, $pms, $rulename) = @_;
> +  return "\n".'#line 1 "'.
> +        $pms->{conf}->{source_file}->{$rulename}.
> +        ', rule '.$rulename.',"';
> +}
> +
> +sub is_user_rule_sub {
> +  my ($self, $subname) = @_;
> +  my $package_name = __PACKAGE__;
> +  return 0 if (eval 'defined &'.$package_name.'::'.$subname);
> +  1;
> +}
> +
> +sub start_rules_plugin_code {
> +  my ($self, $ruletype) = @_;
> +
> +  my $evalstr = '
> +
> +      # start_rules_plugin_code '.$ruletype.'
> +      my $scoresptr = $self->{conf}->{scores};
> +
> +  ';
> +
> +  if ($self->{main}->have_plugin("start_rules")) {
> +    $evalstr .= '
> +
> +      $self->{main}->call_plugins ("start_rules", { permsgstatus => $self,
> +                                                    ruletype => \''.$ruletype.'\' });
> +
> +    ';
> +  }
> +
> +  return $evalstr;
> +}
> +
> +sub hit_rule_plugin_code {
> +  my ($self, $pms, $rulename, $ruletype, $loop_break_directive) = @_;
> +
> +  # note: keep this in 'single quotes' to avoid the $ & performance hit,
> +  # unless specifically requested by the caller.   Also split the
> +  # two chars, just to be paranoid and ensure that a buggy perl interp
> +  # doesn't impose that hit anyway (just in case)
> +  my $match = '($' . '&' . '|| "negative match")';
> +
> +  my $debug_code = '';
> +  if (exists($pms->{should_log_rule_hits})) {
> +    $debug_code = '
> +        dbg("rules: ran '.$ruletype.' rule '.$rulename.' ======> got hit: \"" . '.
> +            $match.' . "\"");
> +    ';
> +  }
> +
> +  my $save_hits_code = '';
> +  if ($pms->{save_pattern_hits}) {
> +    $save_hits_code = '
> +        $self->{pattern_hits}->{q{'.$rulename.'}} = '.$match.';
> +    ';
> +  }
> +
> +  # if we're not running "tflags multiple", break out of the matching
> +  # loop this way
> +  my $multiple_code = '';
> +  if ($pms->{conf}->{tflags}->{$rulename} !~ /\bmultiple\b/) {
> +    $multiple_code = $loop_break_directive.';';
> +  }
> +
> +  return $debug_code.$save_hits_code.$multiple_code;
> +}
> +
> +sub ran_rule_plugin_code {
> +  my ($self, $rulename, $ruletype) = @_;
> +
> +  return '' unless $self->{main}->have_plugin("ran_rule");
> +
> +  # The $self here looks odd, but since we are inserting this into eval'd code it
> +  # needs to be $self which in that case is actually the PerMsgStatus object
> +  return '
> +    $self->{main}->call_plugins ("ran_rule", { permsgstatus => $self, rulename => \''.$rulename.'\', ruletype => \''.$ruletype.'\' });
> +  ';
> +}
> +
> +1;
> 
> Modified: spamassassin/branches/check_plugin/rules/v320.pre
> URL: http://svn.apache.org/viewvc/spamassassin/branches/check_plugin/rules/v320.pre?view=diff&rev=462695&r1=462694&r2=462695
> ==============================================================================
> --- spamassassin/branches/check_plugin/rules/v320.pre (original)
> +++ spamassassin/branches/check_plugin/rules/v320.pre Tue Oct 10 21:28:24 2006
> @@ -11,6 +11,9 @@
>  #
>  ###########################################################################
>  
> +# Check - Provides main check functionality
> +loadplugin Mail::SpamAssassin::Plugin::Check
> +
>  # HTTPSMismatch - find URI mismatches between href and anchor text
>  #
>  loadplugin Mail::SpamAssassin::Plugin::HTTPSMismatch