#!/usr/bin/perl -w -T ############################################################# # The code in this file is copyright 2001 by Craig Hughes # # It is licensed for use with the SpamAssassin distribution # # under the terms of the Perl Artistic License, the text of # # which is included as the file named "License" # ############################################################# my $PREFIX = '@@PREFIX@@'; # substituted at 'make' time my $DEF_RULES_DIR = '@@DEF_RULES_DIR@@'; # substituted at 'make' time my $LOCAL_RULES_DIR = '@@LOCAL_RULES_DIR@@'; # substituted at 'make' time use lib '@@INSTALLSITELIB@@'; # substituted at 'make' time use lib '../lib'; # added by jm for use inside the distro use strict; use IO::Socket; use IO::Handle; use IO::Pipe; use Config; use Mail::SpamAssassin; use Mail::SpamAssassin::NoMailAudit; use Getopt::Long; use Pod::Usage; use Sys::Syslog qw(:DEFAULT setlogsock); use POSIX qw(:sys_wait_h); use POSIX qw(setsid); use Errno; use File::Spec; use File::Path; # Load Time::HiRes if it's available BEGIN { eval { require Time::HiRes }; Time::HiRes->import( qw(time) ) unless $@; } sub spawn; # forward declaration sub logmsg; # forward declaration my %resphash = ( EX_OK => 0, # no problems EX_USAGE => 64, # command line usage error EX_DATAERR => 65, # data format error EX_NOINPUT => 66, # cannot open input EX_NOUSER => 67, # addressee unknown EX_NOHOST => 68, # host name unknown EX_UNAVAILABLE => 69, # service unavailable EX_SOFTWARE => 70, # internal software error EX_OSERR => 71, # system error (e.g., can't fork) EX_OSFILE => 72, # critical OS file missing EX_CANTCREAT => 73, # can't create (user) output file EX_IOERR => 74, # input/output error EX_TEMPFAIL => 75, # temp failure; user is invited to retry EX_PROTOCOL => 76, # remote error in protocol EX_NOPERM => 77, # permission denied EX_CONFIG => 78, # configuration error ); # defaults my %opt = ( 'user-config' => 1, 'ident-timeout' => 5.0, ); my @OLD_ARGV = @ARGV; # Getopt::Long tends to clear @ARGV Getopt::Long::Configure ("bundling"); GetOptions( 'auto-whitelist|whitelist|a' => \$opt{'auto-whitelist'}, 'create-prefs!' => \$opt{'create-prefs'}, 'c' => \$opt{'create-prefs'}, 'daemonize!' => \$opt{'daemonize'}, 'd' => \$opt{'daemonize'}, 'help|h' => \$opt{'help'}, 'listen-ip|ip-address|i=s' => \$opt{'listen-ip'}, 'max-children|m=i' => \$opt{'max-children'}, 'port|p=i' => \$opt{'port'}, 'sql-config!' => \$opt{'sql-config'}, 'q' => \$opt{'sql-config'}, 'setuid-with-sql' => \$opt{'setuid-with-sql'}, 'Q' => \$opt{'setuid-with-sql'}, 'virtual-config|V=s' => \$opt{'virtual-config'}, 'pidfile|r=s' => \$opt{'pidfile'}, 'syslog|s=s' => \$opt{'syslog'}, 'syslog-socket=s' => \$opt{'syslog-socket'}, 'username|u=s' => \$opt{'username'}, 'vpopmail!' => \$opt{'vpopmail'}, 'v' => \$opt{'vpopmail'}, 'configpath|C=s' => \$opt{'configpath'}, 'user-config' => \$opt{'user-config'}, 'nouser-config|x' => sub{ $opt{'user-config'} = 0 }, 'allowed-ips|A=s' => \@{$opt{'allowed-ip'}}, 'debug!' => \$opt{'debug'}, 'D' => \$opt{'debug'}, 'local!' => \$opt{'local'}, 'L' => \$opt{'local'}, 'paranoid!' => \$opt{'paranoid'}, 'P' => \$opt{'paranoid'}, 'helper-home-dir|H:s' => \$opt{'home_dir_for_helpers'}, 'auth-ident' => \$opt{'auth-ident'}, 'ident-timeout=f' => \$opt{'ident-timeout'}, 'ssl' => \$opt{'ssl'}, 'server-key=s' => \$opt{'server-key'}, 'server-cert=s' => \$opt{'server-cert'}, # will be stripped in future release 'add-from!' => sub { warn "The --add-from option has been removed\n" }, 'F=i' => sub { warn "The -F option has been removed\n" }, ) or pod2usage(-exitval => $resphash{'EX_USAGE'}, -verbose => 0); @ARGV = @OLD_ARGV; $opt{'help'} and pod2usage(-exitval => $resphash{'EX_USAGE'}, -verbose => 0, -message => 'For more details, use "man spamd"'); # These can be changed on command line with -A flag if(@{$opt{'allowed-ip'}}) { set_allowed_ip(split /,/, join(',', @{$opt{'allowed-ip'}})); } else { set_allowed_ip('127.0.0.1'); } # ident-based spamc user authentication if ($opt{'auth-ident'}) { eval { require Net::Ident }; die "fatal: ident-based authentication requested, but Net::Ident is unavailable\n" if ($@); $opt{'ident-timeout'} = undef if $opt{'ident-timeout'} <= 0.0; import Net::Ident qw(ident_lookup); } # Check for server certs $opt{'server-key'} ||= "$LOCAL_RULES_DIR/certs/server-key.pem"; $opt{'server-cert'} ||= "$LOCAL_RULES_DIR/certs/server-cert.pem"; if ($opt{'ssl'}) { eval { require IO::Socket::SSL }; die "fatal: SSL encryption requested, but IO::Socket::SSL is unavailable\n" if ($@); if (!-e $opt{'server-key'}) { die "The server key file $opt{'server-key'} does not exist\n"; } if (!-e $opt{'server-cert'}) { die "The server certificate file $opt{'server-cert'} does not exist\n"; } } # This can be changed on the command line with the -s flag my $log_facility = $opt{'syslog'} || 'mail'; my $dontcopy = 1; if ($opt{'create-prefs'}) { $dontcopy = 0; } my $extrapid = 5000; undef($opt{'max-children'}) unless defined($opt{'max-children'}) && $opt{'max-children'} > 0; $extrapid = $opt{'max-children'} if defined($opt{'max-children'}); my $orighome; if (defined $ENV{'HOME'}) { $orighome = $ENV{'HOME'}; # keep a copy for use by Razor, Pyzor etc. delete $ENV{'HOME'}; # we do not want to use this when running spamd } my $spamtest = Mail::SpamAssassin->new({ dont_copy_prefs => $dontcopy, rules_filename => ($opt{'configpath'} || 0), local_tests_only => ($opt{'local'} || 0), debug => ($opt{'debug'} || 0), paranoid => ($opt{'paranoid'} || 0), home_dir_for_helpers => (defined $opt{'home_dir_for_helpers'} ? $opt{'home_dir_for_helpers'} : $orighome), PREFIX => $PREFIX, DEF_RULES_DIR => $DEF_RULES_DIR, LOCAL_RULES_DIR => $LOCAL_RULES_DIR }); # Do whitelist later in tmp dir. Side effect: this will be done as -u user. if ($log_facility ne 'stderr') { eval { setlogsock('unix'); syslog('debug', 'spamd starting'); # required to actually open the socket }; # Solaris sometimes doesn't support UNIX-domain syslog sockets apparently; # same is true for perl 5.6.0 build on an early version of Red Hat 7! if ($@) { eval { setlogsock('inet'); syslog('debug', 'spamd starting'); }; } # fall back to stderr if all else fails if ($@) { warn "failed to setlogsock() on this platform; reporting logs to stderr\n"; $log_facility = 'stderr'; } } my $port = $opt{'port'} || 783; my $addr = (gethostbyname($opt{'listen-ip'} || '127.0.0.1'))[0]; my $proto = getprotobyname('tcp'); ($port) = $port =~ /^(\d+)$/ or die "invalid port\n"; # Be a well-behaved daemon my $server; if ($opt{'ssl'}) { $server = new IO::Socket::SSL(LocalAddr => $addr, LocalPort => $port, Proto => $proto, Type => SOCK_STREAM, ReuseAddr => 1, Listen => SOMAXCONN, SSL_verify_mode => 0x00, SSL_key_file => $opt{'server-key'}, SSL_cert_file => $opt{'server-cert'} ) || die "Could not create SSL socket: $! $@\n"; } else { $server = new IO::Socket::INET(LocalAddr => $addr, LocalPort => $port, Proto => $proto, Type => SOCK_STREAM, ReuseAddr => 1, Listen => SOMAXCONN ) || die "Could not create INET socket: $! $@\n"; } $opt{'daemonize'} and daemonize(); # support non-root use (after we bind to the port) my $setuid_to_user = 0; if ($opt{'username'}) { my $uuid = getpwnam($opt{'username'}); if (!defined $uuid || $uuid == 0) { die "fatal: cannot run as nonexistent user or root with -u option\n"; } # make sure we can unlink it later if (defined $opt{'pidfile'}) { chown $uuid, -1, $opt{'pidfile'} || die "fatal: could not chown '$opt{'pidfile'}' to uid $uuid\n"; } $> = $uuid; # effective uid $< = $uuid; # real uid. we now cannot setuid anymore if ($> != $uuid and $> != ($uuid-2**32)) { die "fatal: setuid to uid $uuid failed\n"; } } elsif ($> == 0) { if ( !$opt{'vpopmail'} ) { $setuid_to_user = 1; } } $opt{'auto-whitelist'} and eval { require Mail::SpamAssassin::DBBasedAddrList; # create a factory for the persistent address list my $addrlistfactory = Mail::SpamAssassin::DBBasedAddrList->new(); $spamtest->set_persistent_address_list_factory ($addrlistfactory); }; Mail::SpamAssassin::Util::clean_path_in_taint_mode(); preload_modules_with_tmp_homedir(); # Note: we now use a set of fds to track children, as using SIGCHLD # is unreliable on many versions of perl (sadly). Thanks to # anomie /at/ users sourceforge net for the patch! $SIG{CHLD} = 'IGNORE'; $SIG{INT} = \&kill_handler; $SIG{TERM} = \&kill_handler; # now allow waiting processes to connect, if they're watching the log. # The test suite does this! if ($opt{'debug'}) { warn "server started on port $port (running version ". Mail::SpamAssassin::Version().")\n"; warn "server pid: $$\n"; } logmsg("server started on port $port (running version ". Mail::SpamAssassin::Version().")\n"); my $current_user; my $client; # qmail vpopmail support my $assign = "/var/qmail/users/assign"; # where to find domain to user mappings my (%qmailu, $qu_load); my $readvec = ""; my %pipes = (); vec($readvec, $server->fileno, 1) = 1; while (1) { if (defined $client) { $client->close; } # paranoia vs fd leaks cleanupchildren(); # some platforms leave zombies otherwise my $n = select(my $rd=$readvec, undef, undef, undef); next if ($n == -1 && $! == &Errno::EINTR); die "select failed: $!" if ($n <= 0); if ($opt{'max-children'}) { while (my ($kid, $pipe) = each %pipes) { # Since the pipe is never written, it will only become readable when # the other end closes it (on exit) so we could read the EOF. Thus, if # the pipe is readable the kid has exited. # # This kludge is necessary due to bugs in perl's signal handling and # reentrancy which mean we can't just catch SIGCHLD in the normal way. # next unless vec($rd, $pipe->fileno(), 1); vec($readvec, $pipe->fileno(), 1) = 0; delete ($pipes{$kid}); $extrapid++; Mail::SpamAssassin::dbg("cleaned up kid $kid, pool=$extrapid"); # We reaped a kid, so listen for connects again vec($readvec, $server->fileno, 1) = 1; } } if (vec($rd, $server->fileno, 1)) { if ($opt{'max-children'} && $extrapid <= 0) { # Since we can't accept any connects until we reap a kid, don't bother # selecting on Server until we do so. We have to do this test here # instead of in &spawn because we need the select loop to watch for # kids. vec($readvec, $server->fileno, 1) = 0; logmsg "hit max-children limit (".$opt{'max-children'}."): waiting for some to exit"; next; } $client = $server->accept; if (!$client) { # this can happen when interrupted by SIGCHLD on Solaris, # perl 5.8.0, and some other platforms with -m. if ($! == &Errno::EINTR) { next; } else { die "accept failed: $!"; } } my $start = time; my($port,$iaddr) = sockaddr_in($client->peername); my $name = gethostbyaddr($iaddr,AF_INET); if (ip_is_allowed(inet_ntoa($iaddr))) { logmsg "connection from $name [", inet_ntoa($iaddr),"] at port $port"; } else { logmsg "unauthorized connection from $name [", inet_ntoa($iaddr),"] at port $port"; $client->close; next; } spawn sub { $client->autoflush(1); local ($_) = $client->getline; if (!defined $_) { protocol_error ("(closed before headers)"); return 1; } chomp; # It may be a SKIP message, meaning that the client (spamc) # thinks it is too big to check. So we don't do any real work # in that case. if (/SKIP SPAMC\/(.*)/) { logmsg "skipped large message in ". sprintf("%3d", time - $start) ." seconds."; return 0; } # It might be a CHECK message, meaning that we should just check # if it's spam or not, then return the appropriate response. # If we get the PROCESS command, the client is going to send a # message that we need to filter. elsif (/(PROCESS|CHECK|SYMBOLS|REPORT|REPORT_IFSPAM) SPAMC\/(.*)/) { check ($1, $2, $start); } # If it was none of the above, then we don't know what it was. else { protocol_error ($_); } }; } } sub check { my ($method, $version, $start) = @_; local ($_); my $expected_length; # Protocol version 1.0 and greater may have "User:" and # "Content-length:" headers. But they're not required. if($version > 1.0) { while(1) { $_ = $client->getline; if(!defined $_) { protocol_error ("(EOF during headers)"); return 1; } if (/^\r\n/s) { last; } # We'll run handle user unless we've been told not # to process per-user config files. Otherwise # we'll check and see if we need to try SQL # lookups. If $opt{'user-config'} is true, we need to try # their config file and then do the SQL lookup. # If $opt{'user-config'} IS NOT true, we skip the conf file and # only need to do the SQL lookup if $opt{'sql-config'} IS # true. (I got that wrong the first time.) if (/^User: (.*)\r\n/) { $current_user = $1; auth_ident($current_user) if $opt{'auth-ident'}; if (!$opt{'user-config'}) { if ($opt{'sql-config'}) { handle_user_sql($current_user); } elsif ($opt{'virtual-config'}) { handle_virtual_user($current_user); } elsif ($opt{'setuid-with-sql'}) { handle_user_setuid_with_sql($current_user); $setuid_to_user = 1; #to benefit from any paranoia. } } else { handle_user($current_user); } } if (/^Content-length: ([0-9]*)\r\n/i) { $expected_length = $1; } } } if ( $setuid_to_user && $> == 0 ) { if ($spamtest->{paranoid}) { logmsg "PARANOID: still running as root, closing connection."; die; } logmsg "Still running as root: user not specified with -u, ". "not found, or set to root. Fall back to nobody."; my $uid = getpwnam('nobody'); $> = $uid; if ( !defined($uid) || ($> != $uid and $> != ($uid-2**32))) { logmsg "fatal: setuid to nobody failed"; die; } } if ($opt{'sql-config'} && !defined($current_user)) { handle_user_sql('nobody'); } my $resp = "EX_OK"; # Now read in message my @msglines; my $actual_length; my $in_header = 1; my $msgid; while ($_ = $client->getline()) { if ($in_header) { if (/^$/) { $in_header = 0; $msgid = '(unknown)' unless($msgid); } elsif (/^Message-Id:\s+(.*)$/i) { $msgid = $1; while($msgid =~ s/\([^\(\)]*\)//) {}; # remove comments and $msgid =~ s/^\s+|\s+$//g; # leading and trailing spaces $msgid =~ s/\s.*$/(...)/; # keep only the first token } } push(@msglines, $_); $actual_length += length; last if ($actual_length == $expected_length); } $current_user ||= '(unknown)'; logmsg (($method eq 'PROCESS') ? 'processing' : 'checking') . " message $msgid for $current_user:$>" . ($expected_length ? ", expecting $expected_length bytes" : "") . "."; my $mail = Mail::SpamAssassin::NoMailAudit->new ( data => \@msglines ); # Check length if we're supposed to if($expected_length) { if($actual_length != $expected_length) { protocol_error ("(Content-length mismatch: $expected_length vs. $actual_length)"); return 1; } } # Now use copy-on-writed (hopefully) SA object my $status = $spamtest->check($mail); my $msg_score = sprintf("%.1f",$status->get_hits); my $msg_threshold = sprintf("%.1f",$status->get_required_hits); my $response_spam_status = ""; my $was_it_spam; if ($status->is_spam) { $response_spam_status = $method eq "REPORT_IFSPAM" ? "Yes" : "True"; $was_it_spam = 'identified spam'; } else { $response_spam_status = $method eq "REPORT_IFSPAM" ? "No" : "False"; $was_it_spam = 'clean message'; } if ($method eq 'PROCESS') { $status->rewrite_mail; #if $status->is_spam; # Build the message to send back and measure it my $msg_resp = join '',$mail->header,"\n",@{$mail->body}; my $msg_resp_length = length($msg_resp); if($version >= 1.2) # Spamc protocol 1.2 means it accepts content-length { print $client "SPAMD/1.1 $resphash{$resp} $resp\r\n", "Content-length: $msg_resp_length\r\n\r\n", $msg_resp; } else # Earlier than 1.2 didn't accept content-length { print $client "SPAMD/1.0 $resphash{$resp} $resp\r\n", $msg_resp; } } else # $method eq 'CHECK' et al { my $response_header = "SPAMD/1.1 $resphash{$resp} $resp\r\n"; if ($method eq "REPORT_IFSPAM") { $response_header .= "X-Spam-Status: $response_spam_status, hits=$msg_score required=$msg_threshold tests=" . $status->get_names_of_tests_hit() . " version=" . Mail::SpamAssassin::Version(); } else { $response_header .= "Spam: $response_spam_status ; $msg_score / $msg_threshold"; } print $client $response_header, "\r\n\r\n"; print $client $status->get_names_of_tests_hit,"\r\n" if ($method eq "SYMBOLS"); print $client $status->get_report,"\r\n" if ($method eq "REPORT" or ($method eq "REPORT_IFSPAM" and $status->is_spam)); } logmsg "$was_it_spam ($msg_score/$msg_threshold) for $current_user:$> in ". sprintf("%.1f", time - $start) ." seconds, $actual_length bytes."; $status->finish(); # added by jm to allow GC'ing } sub protocol_error { local $_ = shift; my $resp = "EX_PROTOCOL"; print $client "SPAMD/1.0 $resphash{$resp} Bad header line: $_\r\n"; logmsg "bad protocol: header error: $_"; } sub spawn { my $coderef = shift; unless (@_ == 0 && $coderef && ref($coderef) eq 'CODE') { warn "usage: spawn CODEREF"; } my $pid; my $pipe; if ($opt{'max-children'}) { $pipe=IO::Pipe->new(); if (!defined($pipe)) { logmsg "pipe failed: $!"; return; } } $extrapid--; if (!defined($pid = fork)) { logmsg "cannot fork: $!"; $extrapid++; return; } elsif ($pid) { if ($opt{'max-children'}) { $pipe->reader(); $pipes{$pid} = $pipe; vec($readvec, $pipe->fileno(), 1) = 1; } return; # I'm the parent } # else I'm the child -- go spawn if ($opt{'max-children'}) { $pipe->writer(); %pipes = (); # No point in keeping the other kid pipes, close them all } $server->close; # redirect default output to STDERR (/dev/null), so that noise from # Razor etc. will not be output as headers and # thereby cause protocol failures. select STDERR; exit &$coderef(); } sub auth_ident { my $username = shift; my $ident_username = ident_lookup($client, $opt{'ident-timeout'}); my $dn = $ident_username || 'NONE'; # display name warn "ident_username = $dn, spamc_username = $username\n" if $opt{'debug'}; if ($username ne $ident_username) { logmsg "fatal: ident username ($dn) does not match " . "spamc username ($username)"; exit 1; } } sub handle_user { my $username = shift; # # If vpopmail config enabled then look up userinfo for vpopmail uid # as defined by $opt{'username'} or as passed via $username # my $userid = ''; if ($opt{'vpopmail'} && $opt{'username'}) { $userid = $opt{'username'}; } elsif ( $opt{'vpopmail'} ) { $userid = "vpopmail"; } else { $userid = $username; } my ($name,$pwd,$uid,$gid,$quota,$comment,$gcos,$dir,$etc) = getpwnam($userid); if ( !$spamtest->{'paranoid'} && !defined($uid) ) { #if we are given a username, but can't look it up, #Maybe NIS is down? lets break out here to allow #them to get 'defaults' when we are not running paranoid. logmsg "handle_user() -> unable to find user [$userid]!"; return 0; } if ($setuid_to_user) { $> = $uid; if ( !defined($uid) || ($> != $uid and $> != ($uid-2**32))) { logmsg "fatal: setuid to $username failed"; die; # make it fatal to avoid security breaches } else { logmsg "info: setuid to $username succeeded"; } } # # If vpopmail config enabled then set $dir to virtual homedir # if ($opt{'vpopmail'}) { $dir = `$dir/bin/vuserinfo -d $username`; chomp ($dir); } my $cf_file = $dir."/.spamassassin/user_prefs"; # # If vpopmail config enabled then pass virtual homedir onto create_default_cf_needed # if ($opt{'vpopmail'}) { if ($opt{'username'}) { create_default_cf_if_needed ($cf_file, $username, $dir); $spamtest->read_scoreonly_config ($cf_file); $spamtest->signal_user_changed ({ username => $username, user_dir => "$dir/.spamassassin" }); } else { my $sysnam = get_user_from_address ($username); $spamtest->read_scoreonly_config ($cf_file); $spamtest->signal_user_changed ({ username => $sysnam, user_dir => "$dir/.spamassassin" }) } } else { create_default_cf_if_needed ($cf_file, $username); $spamtest->read_scoreonly_config ($cf_file); $spamtest->signal_user_changed ({ username => $username }); } return 1; } # Handle user configs without the necessity of having individual users or a # SQL database. sub handle_virtual_user { my $username = shift; # the virtual-config contains the path to a directory which will # contain per-user preferences. my $dir=$opt{'virtual-config'}; my $file="$dir/$username.prefs"; # If the user file is not there, look for a default.prefs if(! -f $file) { $file="$dir/default.prefs"; # And if that isn't there, log that it's misconfigured. if(! -f $file) { logmsg("Couldn't find a virtual directory or defaults " . "for $username in $dir"); return(0); } else { # Log that the default configuration is being used for a user. logmsg("Using default config for $username"); } } # Found a config, load it. $spamtest->read_scoreonly_config($file); # TODO: assume that $dir/$username will be a writable directory we can # use for AWL, Bayes dbs etc. $spamtest->signal_user_changed ({ username => $username, user_dir => "$dir/$username" }); return(1); } sub handle_user_sql { my $username = shift; $spamtest->load_scoreonly_sql ($username); return 1; } sub handle_user_setuid_with_sql { my $username = shift; my ($name,$pwd,$uid,$gid,$quota,$comment,$gcos,$dir,$etc) = getpwnam($username); if ( !$spamtest->{'paranoid'} && !defined($uid) ) { #if we are given a username, but can't look it up, #Maybe NIS is down? lets break out here to allow #them to get 'defaults' when we are not running paranoid. logmsg "handle_user() -> unable to find user [$username]!\n"; return 0; } if ($setuid_to_user) { $> = $uid; if ( !defined($uid) || ($> != $uid and $> != ($uid-2**32))) { logmsg "fatal: setuid to $username failed"; die; # make it fatal to avoid security breaches } else { logmsg "info: setuid to $username succeeded, reading scores from SQL."; } } $spamtest->load_scoreonly_sql ($username); $spamtest->signal_user_changed ({ username => $username }); return 1; } sub create_default_cf_if_needed { my ($cf_file, $username, $userdir) = @_; # Parse user scores, creating default .cf if needed: if( ! -r $cf_file && ! $spamtest->{'dont_copy_prefs'}) { logmsg "Creating default_prefs [$cf_file]"; # If vpopmail config enabled then pass virtual homedir onto # create_default_prefs via $userdir $spamtest->create_default_prefs ($cf_file,$username,$userdir); if ( ! -r $cf_file ) { logmsg "Couldn't create readable default_prefs for [$cf_file]"; } } } sub get_user_from_address { my ($user, $domain) = split(/@/, $_[0]); my $dom = lc($domain); if ( $qmailu{$dom} ne "" ) { warn "returning result from cache.\n" if ($opt{'debug'}); my $nam = getpwuid($qmailu{$dom}); return $nam; } else { warn "cache miss\n" if ($opt{'debug'}); &fill_qmailu_cache($assign); if ( $qmailu{$dom} ne "" ) { my $nam = getpwuid($qmailu{$dom}); return $nam; } else { return 0; } } } sub fill_qmailu_cache { # rather than parsing the qmail users/assign file every time a message # arrives, we run this once when spamd is loaded and check the files # modified time each query to know when to reload it. my ($READ, $WRITE) = (stat($_[0]))[8,9]; if ( $WRITE > $qu_load ) { undef %qmailu; $qu_load = time; open(ASSIGN, $_[0]) || die "couldn't open $_[0]: $!\n"; warn "loading $_[0] into cache...." if ($opt{'debug'}); while() { my @data = split(/:/, $_); $qmailu{$data[1]} = $data[2]; }; warn "done.\n" if ($opt{'debug'}); close(ASSIGN); } else { warn "$_[0] already cached.\n" if ($opt{'debug'}); } } sub logmsg { my $old = $SIG{'PIPE'}; $SIG{'PIPE'} = sub { $main::SIGPIPE_RECEIVED++; }; # bug 605: http://bugzilla.spamassassin.org/show_bug.cgi?id=605 # more efficient for daemontools if --syslog=stderr is used if($log_facility eq 'stderr') { print STDERR join("",@_) . "\n"; return; } openlog('spamd','cons,pid',$log_facility); my $str = join ('', @_); if ($opt{'debug'}) { warn "logmsg: $str\n"; } eval { syslog('info', '%s', $str); }; if ($@) { warn "syslog() failed, try using --syslog-socket switch ($@)\n"; } if ($main::SIGPIPE_RECEIVED) { # SIGPIPE recieved when writing to syslog - this has been # found to occur with syslog-ng after syslog-ng restarts. # Close and reopen the log handle, then try again. closelog(); openlog('spamd','cons,pid',$log_facility); syslog('info', '%s', $str); # now report what happend my $msg = "SIGPIPE received - reopening log socket"; if ($opt{'debug'}) { warn "logmsg: $msg\n"; } syslog('warning', '%s', $msg); # if we've received multiple sigpipes, logging is probably # still broken. if ($main::SIGPIPE_RECEIVED > 1) { warn "logging failure: multiple SIGPIPEs received\n"; } $main::SIGPIPE_RECEIVED = 0; } $SIG{'PIPE'} = $old if defined($old); } sub kill_handler { my ($sig) = @_; logmsg "server killed by SIG$sig, shutting down"; $server->close; defined($opt{'pidfile'}) and unlink($opt{'pidfile'}); exit 0; } use POSIX 'setsid'; sub daemonize { $0 = join(' ', $0, @ARGV) unless($opt{'debug'});; # pretty command line in ps chdir '/' or die "Can't chdir to '/': $!"; $SIG{__WARN__} = sub { logmsg($_[0]); }; open STDIN,'/dev/null' or die "Can't read '/dev/null': $!"; open STDOUT,'>/dev/null' or die "Can't write '/dev/null': $!"; defined(my $pid=fork) or die "Can't fork: $!"; exit if $pid; setsid or die "Can't start new session: $!"; open STDERR,'>&STDOUT' or die "Can't duplicate stdout: $!"; Mail::SpamAssassin::dbg('daemonized.'); if(defined($opt{'pidfile'})) { open PIDF,">$opt{'pidfile'}" or warn "Can't open PID file: $!"; print PIDF $$."\n"; close PIDF; } } my @allowed_nets; sub set_allowed_ip { foreach (@_) { my ($ip, $bits) = m#^\s*(\d+\.\d+\.\d+\.\d+)(?:/(\d+))?\s*$# or die "illegal network address given: '$_'. Aborting.\n"; defined $bits or $bits = 32; my $mask = 0xFFffFFff ^ ((2 ** (32-$bits)) - 1); push @allowed_nets, { mask => $mask, ip => my_inet_aton($ip) & $mask, }; } } sub ip_is_allowed { my $ip = my_inet_aton($_[0]); foreach my $net (@allowed_nets){ return 1 if ($ip & $net->{mask}) == $net->{ip}; } 0; } sub my_inet_aton { unpack("N", pack("C4", split(/\./, $_[0]))) } sub preload_modules_with_tmp_homedir { # set $ENV{HOME} in /tmp while we compile and preload everything. # File::Spec->tmpdir uses TMPDIR, TMP, TEMP, C:/temp, /tmp etc. my $tmpdir = File::Spec->tmpdir(); if (!$tmpdir) { die "cannot find writable tmp dir! set TMP or TMPDIR in env"; } my $tmphome = File::Spec->catdir ($tmpdir, "spamassassin-$$"); $tmphome = Mail::SpamAssassin::Util::untaint_file_path ($tmphome); my $tmpsadir = File::Spec->catdir ($tmphome, ".spamassassin"); mkdir($tmphome, 0700) or die "fatal: Can't create $tmphome"; mkdir($tmpsadir, 0700) or die "fatal: Can't create $tmpsadir"; $ENV{HOME} = $tmphome; $spamtest->compile_now(0); # ensure all modules etc. are loaded $/ = "\n"; # argh, Razor resets this! Bad Razor! # now clean up the stuff we just created, and make us taint-safe delete $ENV{HOME}; # try to use File::Path. However, it's NOT taint-safe (!!) so will # fail sometimes, it seems. eval { rmtree $tmphome; }; # if the dir still exists, use system(). We've already called # Mail::SpamAssassin::Util::untaint_file_path(), which cleans metachars, # so this is safe (if a little absurd). if (-d $tmphome) { system ("rm -rf '".$tmphome."'"); } } sub cleanupchildren { # may be required on some platforms even though we use SIG{CHLD} = 'IGNORE'. # cf. mail from Stefan Seiz , Fri, 27 Dec 2002 17:32:54 # noting it on MacOS X Server 10.1.5. my $kid; do { $kid = waitpid(-1,&WNOHANG); } while ($kid > 0); } __DATA__ =head1 NAME spamd - daemonized version of spamassassin =head1 SYNOPSIS spamd [options] Options: -a, --auto-whitelist, --whitelist Use auto-whitelists -c, --create-prefs Create user preferences files -C path, --configpath=path Path for default config files -d, --daemonize Daemonize -h, --help Print usage message. -i ipaddr, --listen-ip=ipaddr,... Listen on the IP ipaddr (default: 127.0.0.1) -m num, --max-children num Allow maximum num children -p port, --port Listen on specified port (default: 783) -q, --sql-config Enable SQL config (only useful with -x) -Q, --setuid-with-sql Enable SQL config (only useful with -x, enables use of -a and -H) -V, --virtual-config=dir Enable Virtual configs (needs -x) -r pidfile, --pidfile Write the process id to pidfile -s facility, --syslog=facility Specify the syslog facility (default: mail) --syslog-socket=type How to connect to syslogd (default: unix) -u username, --username=username Run as username -v, --vpopmail Enable vpopmail config -x, --nouser-config Disable user config files --auth-ident Use ident to authenticate spamc user --ident-timeout=timeout Timeout for ident connections -A host,..., --allowed-ips=..,.. Limit ip addresses which can connect -D, --debug Print debugging messages -L, --local Use local tests only (no DNS) -P, --paranoid Die upon user errors -H dir Specify a different HOME directory, path optional --ssl Run an SSL server --server-key keyfile Specify an SSL keyfile --server-cert certfile Specify an SSL certificate =head1 DESCRIPTION The purpose of this program is to provide a daemonized version of the spamassassin executable. The goal is improving throughput performance for automated mail checking. This is intended to be used alongside C, a fast, low-overhead C client program. See the README file in the C directory of the SpamAssassin distribution for more details. Note: Although spamd will check per-user config files for every message, any changes to the system-wide config files will require restarting spamd for the changes to take effect. =head1 OPTIONS Options of the long form can be shortened as long as they remain unambiguous. (i.e. B<--dae> can be used instead of B<--daemonize>) Also, boolean options (like B<--auto-whitelist>) can be negated by adding I<--no> (B<--noauto-whitelist>), however, this is usually unnecessary. =over =item B<-a>, B<--auto-whitelist>, B<--whitelist> Use auto-whitelists. Auto-whitelists track the long-term average score for each sender and then shift the score of new messages toward that long-term average. This can increase or decrease the score for messages, depending on the long-term behavior of the particular correspondent. See the README file for more details. =item B<-c>, B<--create-prefs> Create user preferences files if they don't exist (default: don't). =item B<-C> I, B<--configpath>=I Use the specified path for locating configuration files. Ignore the default directories. =item B<-d>, B<--daemonize> Detach from starting process and run in background (daemonize). =item B<-h>, B<--help> Print a brief help message, then exit without further action. =item B<-i> I, B<--listen-ip>=I, B<--ip-address>=I Tells spamd to listen on the specified IP address [defaults to 127.0.0.1]. Use 0.0.0.0 to listen on all interfaces. =item B<-p> I, B<--port>=I Optionally specifies the port number for the server to listen on. =item B<-q>, B<--sql-config> Turn on SQL lookups even when per-user config files have been disabled with B<-x>. this is useful for spamd hosts which don't have user's home directories but do want to load user preferences from an SQL database. If your spamc client does not support sending the C header, like C, then the SQL username used will always be B. =item B<-Q>, B<--setuid-with-sql> Turn on SQL lookups even when per-user config files have been disabled with B<-x> and also setuid to the user. This is useful for spamd hosts which want to load user preferences from an SQL database but also wish to support the use of B<-a> (AWL) and B<-H> (Helper home directories.) =item B<-V>, B<--virtual-config>=I This option specifies a directory which will contain per-user preference files. The files are in the format of B.prefs>. A B file will be used if an individual user config is not found. Note that this B that B<-x> is used, and cannot be combined with SQL-based configuration. If a subdirectory is found in that directory, called B>, and it is writable, it will be used to score auto-whitelist and/or Bayes databases for that user. =item B<-r> I, B<--pidfile>=I Write the process ID of the spamd parent to the file specified by I. The file will be unlinked when the parent exits. Note that when running with the B<-u> option, the file must be writable by that user. =item B<-v>, B<--vpopmail> Enable vpopmail config. If specified with with B<-u> set to the vpopmail user, this allows spamd to lookup/create user_prefs in the vpopmail user's own maildir. This option is useful for vpopmail virtual users who do not have an entry in the system /etc/passwd file. If specified without B<-u>, then it allows every mail account on a vpopmail virtual domain setup to have their own user-customizable spamassassin preferences, assuming they have their own home directory set. =item B<-s> I, B<--syslog>=I Specify the syslog facility to use (default: mail). If C is specified, output will be written to stderr. This is useful if you're running C under the C package. =item B<--syslog-socket>=I Specify how spamd should send messages to syslogd. The options are C, C or C. The default is to try C first, falling back to C if perl detects errors in its C support. Some platforms, or versions of perl, are shipped with dysfunctional versions of the B package which do not support some socket types, so you may need to set this. If you get error messages regarding B<__PATH_LOG> or similar from spamd, try changing this setting. =item B<-u> I, B<--username>=I Run as the named user. The alternative, default behaviour is to setuid() to the user running C, if C is running as root. =item B<-x>, B<--nouser-config>, B<--user-config> Turn off(on) per-user config files. All users will just get the default configuration. =item B<--auth-ident> Verify the username provided by spamc using ident. This is only useful if connections are only allowed from trusted hosts (because an identd that lies is trivial to create) and if spamc REALLY SHOULD be running as the user it represents. Connections are terminated immediately if authentication fails. In this case, spamc will pass the mail through unchecked. Failure to connect to an ident server, and response timeouts are considered authentication failures. This requires that Net::Ident be installed. =item B<--ident-timeout>=I Wait at most I seconds for a response to ident queries. Authentication that takes long that I seconds will fail, and mail will not be processed. Setting this to 0.0 or less results in no timeout, which is STRONGLY discouraged. The default is 5 seconds. =item B<-A> I, B<--allowed-ips>=I Specify a list of authorized hosts or networks which can connect to this spamd instance. Single IP addresses can be given, or ranges of ip addresses in address/masklength format. This option can be specified multiple times or can take a list of addresses separated by commas. Examples: B<-A 10.11.12.13,10.11.12.14> -- only allow connections from 10.11.12.13 and 10.11.12.14 -B -- allow connections from any machine in the range 10.200.300.* By default, connections are only accepted from localhost [127.0.0.1]. =item B<-D>, B<--debug> Print debugging messages =item B<-L>, B<--local> Perform only local tests on all mail. In other words, skip DNS and other network tests. Works the same as the C<-L> flag to C. =item B<-P>, B<--paranoid> Die on user errors (for the user passed from spamc) instead of falling back to user I and using the default configuration. =item B<-m> I, B<--max-children>=I Specify a maximum number of children to spawn. Spamd will wait until another child finishes before forking again. Meanwhile, incoming connections will be queued. Please note that there is a OS specific maximum of connections that can be queued (Try C to find this maximum). Also, this option causes spamd to create an extra pipe for each child. =item B<-H> I, B<--helper-home-dir>=I Specify that external programs such as Razor, DCC, and Pyzor should have a HOME environment variable set to a specific directory. The default is to use the HOME environment variable setting from the shell running spamd. By specifying no argument, spamd will use the spamc caller's home directory instead. =item B<--ssl> Accept only SSL connections. The B perl module must be installed. =item B<--server-key> I Specify the SSL key file to use for SSL connections. =item B<--server-cert> I Specify the SSL certificate file to use for SSL connections. =back =head1 BUGS Perl 5.005_03 seems to have a bug, which spamd triggers, causing messages to pass through unscanned. Upgrading to Perl 5.6 seems to fix the problem, so that's the current workaround. More information can be found at http://www.hughes-family.org/bugzilla/show_bug.cgi?id=497 The C<-m> switch seems to trigger signal-handling bugs in many versions of Perl. =head1 SEE ALSO spamc(1) spamassassin(1) Mail::SpamAssassin(3) Mail::SpamAssassin::Conf(3) =head1 AUTHOR Craig R Hughes Ecraig@hughes-family.orgE =head1 PREREQUISITES C =cut