Current File : //sbin/rbld |
#!/usr/bin/perl
##########################################################################
# rbld - Daemon that reads and serves IP based blacklists and whitelists
# Copyright 2006, Bluehost, Inc.
#
# Authors and Contributors:
#
# Spencer Candland <spencer@bluehost.com>
# Ryan Chaudhry <rchaudhry@bluehost.com>
# Erick Cantwell <erick@bluehost.com>
#
# http://www.bluehost.com
# https://github.com/bluehost/rbld
#
##########################################################################
#
# This file is part of rbld
#
# Rbld is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307, USA.
#
##########################################################################
use strict;
use warnings;
use IO::File;
use IO::Socket;
use Fcntl qw(F_SETFD);
use Proc::Daemon;
use Proc::PID::File;
use Data::Dumper;
use Getopt::Long;
use YAML::Syck qw(LoadFile);
use Time::HiRes qw(gettimeofday tv_interval);
use POSIX;
# Effective configuration. GetOptions fills it from the command line below;
# main() then fills any still-unset key from the settings file and finally
# from $defaults.
my $config = {};
# Settings read from the YAML configuration file (populated in main()).
my $settings = {};
# Built-in fallback values, used for keys that neither the command line nor
# the settings file provide.
my $defaults = {
rbld_conf => '/etc/rbld.conf',
log => '/var/log/rbld.log',
infile => '/etc/inrbld',
listconf => '/etc/rbld.d/rbldlists.conf',
run_path => '/usr/sbin/rbld',
sock_path => '/var/tmp/rbld.sock',
sock_owner => 'mailnull',
sock_group => 'nobody',
debug => 0,
};
# Get cli options
# Each option writes straight into %$config; -h (or a parse failure) calls
# help(), which prints the usage text and exits.
GetOptions (
'c|config=s' => \$config->{rbld_conf},
'o|log=s' => \$config->{log},
'i|infile=s' => \$config->{infile},
'l|listconf=s' => \$config->{listconf},
'r|runpath=s' => \$config->{run_path},
's|socketpath=s' => \$config->{sock_path},
'u|socketowner=s' => \$config->{sock_owner},
'g|socketgroup=s' => \$config->{sock_group},
'd|debug' => \$config->{debug},
'h|help' => \&help,
) || &help;
# Start
# Timestamp used by main() to report how long startup took.
my @start = gettimeofday();
# Debug flag checked by debug(); set from the configuration in main() and
# switchable at runtime through the DEBUG command.
my $DEBUG = 0;
# $dfh is closed in the END block if it was ever defined; $in_pid is not used
# by any code visible in this file.
my ($dfh, $in_pid);
# List definitions from the list configuration file. load_conf() stores each
# definition under both its file path and its list name.
my %lists;
# Names of lists loaded by load_cidr/load_ip/load_trie; iterated by check_all().
my %all;
# Runtime state: loaded list data (per type, per list name), the registry of
# files already written to the infile, statistics counters and the start time.
# main() additionally keeps a total request counter under the key "requests".
my %info = (
blacklist => {},
infile => {},
metastats => {},
starttime => time(),
stats => {},
whitelist => {},
);
# Command dispatch table: the first word of a request selects the handler,
# the rest of the request line is passed as its argument. load_conf() adds
# one entry per configured list name. The format names (CIDR, IP, TRIE, META)
# are also looked up here by the check_* routines.
my %run = (
DEBUG => sub { $DEBUG = shift; return; },
# Dumper receives the flattened key/value contents of both hashes.
DUMP => sub { return Dumper (%info, %lists); },
LOAD_CONF => \&load_conf,
LOAD_LIST => \&load_list,
CIDR => \&check_cidr,
IP => \&check_ip,
TRIE => \&check_trie,
META => \&check_meta,
ALL => \&check_all,
WHITELIST => \&check_whitelist,
STAT => \&give_stats,
STATS => \&give_stats,
);
# Loader dispatch table: list file format => routine that loads it.
my %load = (
CIDR => \&load_cidr,
IP => \&load_ip,
TRIE => \&load_trie,
META => \&load_meta,
);
# Emit a timestamped, pid-tagged message through warn, but only while the
# global $DEBUG flag is set. All arguments are joined into the message.
sub debug {
    $DEBUG or return;
    my $stamp = localtime;
    warn "${stamp}: [$$] @_";
}
# Daemon entry point.
#
# Loads the settings file, merges command line, settings and defaults into
# $config, daemonizes (unless a listening socket was inherited through
# $ENV{BIND_FD}), opens the log, installs signal handlers, loads the list
# configuration and then serves requests on the UNIX socket forever.
#
# Protocol as implemented below: a client sends one line "COMMAND [ARGS]";
# the handler found in %run is called with ARGS and any true return value is
# written back before the connection is shut down. A false result sends
# nothing.
sub main {
    # Load default or cli specified configuration file
    if ($config->{rbld_conf}) {
        $settings = LoadFile($config->{rbld_conf});
    } else {
        $settings = LoadFile($defaults->{rbld_conf});
    }
    # Merge to config hash: a value given on the command line wins, then the
    # settings file, then the built-in default.
    # These/this should be moved to a subroutine
    my @vals = ('log', 'infile', 'listconf', 'run_path', 'sock_path', 'sock_owner', 'sock_group', 'debug');
    foreach my $val (@vals) {
        foreach my $source ($settings, $defaults) {
            last if ($config->{$val});
            $config->{$val} = $source->{$val} if ($source->{$val});
        }
    }
    $DEBUG = 1 if $config->{debug};
    $0 = "rbld";
    Proc::Daemon::Init() unless $ENV{BIND_FD};
    umask 0117;
    exit 1 if Proc::PID::File->running();
    open_log();
    $SIG{TERM} = $SIG{INT} = sub { exit 0 };
    $SIG{PIPE} = sub { die "PIPE" };
    # SIGUSR2 reopens the log, SIGHUP re-executes the daemon.
    my $sigset = POSIX::SigSet->new();
    POSIX::sigaction(&POSIX::SIGUSR2, POSIX::SigAction->new('open_log',
        $sigset, &POSIX::SA_NODEFER));
    POSIX::sigaction(&POSIX::SIGHUP, POSIX::SigAction->new('reload',
        $sigset, &POSIX::SA_NODEFER));
    reset_infile();
    my @rblstart = gettimeofday();
    warn scalar(localtime).": [$$] Loading Conf and Lists...\n";
    load_conf($config->{listconf});
    link_meta();
    warn scalar(localtime).": [$$] load completed in (".tv_interval (\@rblstart).").\n";
    my $listen;
    if (exists $ENV{BIND_FD} and $ENV{BIND_FD} =~ /^(\d+)$/) {
        my $bind_fd = $1;
        debug "Reusing fd($bind_fd)\n";
        $listen = IO::Socket::UNIX->new();
        $listen->fdopen($bind_fd, "r") or die "Socket: $!";
    }
    else {
        unlink $config->{sock_path};
        $listen = IO::Socket::UNIX->new(
            Local => $config->{sock_path},
            Listen => SOMAXCONN,
        ) or die "Socket: $!";
        chown ( ((getpwnam("$config->{sock_owner}"))[2]), ((getgrnam("$config->{sock_group}"))[2]), $config->{sock_path}) || warn "Could not chown socket: $!";
    }
    warn scalar(localtime).": [$$] $0 startup completed in (".tv_interval (\@start)."). Now Listening.\n";
    my ($conn, $req, $bvec, $rw, $timeleft, $nfound, $buffer, $msg);
    while (1) {
        # Read one request line, giving the client 0.2 seconds in total.
        eval {
            $conn = $listen->accept() or die "Accept error: $!\n";
            $req = $bvec = '';
            vec($bvec, $conn->fileno, 1) = 1;
            $timeleft = 0.2;
            while ($timeleft > 0) {
                ($nfound, $timeleft) = select($rw=$bvec, undef, undef, $timeleft);
                $buffer = '';
                if ($nfound != 0) {
                    sysread($conn, $buffer, 8192) or die "EOF on connection\n";
                }
                $req .= $buffer;
                # A newline anywhere in the chunk (including its first
                # byte) terminates the request.
                last if index($buffer, "\n") >= 0;
            }
            # Without a newline the read loop ran out of time.
            die "Timed out on request\n" if index($req, "\n") < 0;
            # Keep only the first line; /s lets "." cross later newlines.
            $req =~ s/\n.*//s;
        };
        if ($@) {
            debug $@;
            $conn->shutdown(2) if $conn;
            next;
        }
        $info{requests}++;
        my ($cmd, $args) = split (/\s+/, $req, 2);
        $msg = '';
        if (defined $cmd and $run{$cmd}) {
            debug "Running command [$req]\n";
            # A failing handler must not take the whole daemon down.
            $msg = eval { $run{$cmd}->($args) };
            if ($@) {
                warn scalar(localtime).": [$$] Command [$req] failed: $@";
                $msg = '';
            }
        } else {
            debug "Unknown command [$req]\n";
        }
        # Send the reply, allowing 0.5 seconds in total.
        eval {
            $timeleft = 0.5;
            $buffer = 0;    # number of bytes already written
            if ($msg) {
                do {
                    ($nfound, $timeleft) = select(undef, $rw=$bvec, undef, $timeleft);
                    if ($nfound != 0) {
                        # Continue after a partial write instead of
                        # resending the message from its start.
                        my $written = syswrite($conn, $msg, length($msg) - $buffer, $buffer);
                        die "Write error: $!\n" unless (defined $written);
                        $buffer += $written;
                    }
                } until ($timeleft <= 0 or $buffer == length($msg));
            }
            $conn->shutdown(2);
        };
        if ($@) {
            debug $@;
            $conn->shutdown(2) if $conn;
        }
    }
}
# NAME TYPE [whitelist|blacklist] FILE FILE_FORMAT[IP|CIDR|TRIE|META]:[EXPIRE|TRIE_SPLIT|LIST] [STAT_ONLY]
#
# Read the list configuration file $cfile (one list per line in the format
# above), load every new or changed list, register a command named after
# each list in %run, and drop lists that were removed from this file.
# The configuration file itself is always added to the infile watch list,
# even when it does not exist yet.
#
# Lines that are empty, start with "#", have fewer than four fields, or name
# an unknown type or format are ignored. If the file exists but cannot be
# opened, a warning is logged and the already loaded lists are left alone.
sub load_conf {
    my $cfile = shift;
    debug "Loading config file $cfile\n";
    my %nlists;
    if (-e $cfile) {
        # read the config
        my $cf;
        unless (open ($cf, '<', $cfile)) {
            warn scalar(localtime).": [$$] Could not open conf $cfile: $!\n";
            add_to_infile ($cfile, "LOAD_CONF");
            return;
        }
        flock ($cf, 2);
        while (my $line = <$cf>) {
            chomp($line);
            next unless ($line);
            next if (substr($line, 0, 1) eq "#");
            my @tmp = split (/\s+/, $line);
            # NAME, TYPE, FILE and FORMAT are mandatory
            next if (@tmp < 4);
            my $file = $tmp[2];
            # Make sure we have a valid type
            my $type = $tmp[1];
            next unless (($type eq "whitelist") or ($type eq "blacklist"));
            # Make sure we have a valid format
            my @split = split (/:/, $tmp[3]);
            my $format = $split[0];
            next unless (defined $format and exists ($load{$format}));
            $nlists{$file}{"file"} = $file;
            $nlists{$file}{"name"} = $tmp[0];
            $nlists{$file}{"type"} = $type;
            $nlists{$file}{"format"} = $format;
            $nlists{$file}{"split"} = $split[1] || 0;
            $nlists{$file}{"stat_only"} = $tmp[4] || 0;
            $nlists{$file}{"cfile"} = $cfile;
            # So we can get at data through name as well, which
            # is how queries to the list actually come through
            $nlists{$tmp[0]} = \%{$nlists{$file}};
        }
        flock ($cf, 8);
        close ($cf);
        foreach my $file (keys %nlists) {
            # See if conf changed
            if (exists $lists{$file}) {
                my $diff = 0;
                foreach my $key (keys %{$nlists{$file}}) {
                    if ($nlists{$file}{$key} ne $lists{$file}{$key}) {
                        $diff = 1;
                        last;
                    }
                }
                next unless ($diff == 1);
            }
            my $name = $nlists{$file}{"name"};
            $lists{$file} = $nlists{$file};
            load_list ($file);
            # Create our inwatch watches
            my $realfile = $lists{$file}{"file"};
            add_to_infile ($realfile, "LOAD_LIST") unless (exists $nlists{$name}{"meta"});
            # Create a run command for the list
            $run{$name} = sub { return check_list($name, shift); };
        }
        # Find and delete options that were removed
        foreach my $file (keys %lists) {
            next unless ($lists{$file}{"cfile"} eq $cfile);
            unless (exists $nlists{$file}) {
                debug "$file was removed from conf $cfile, removing\n";
                my $type = $lists{$file}{"type"};
                my $name = $lists{$file}{"name"};
                delete ($info{$type}{$name});
                delete ($info{"stats"}{$name});
                delete ($lists{$file});
                delete ($run{$name});
            }
        }
    }
    # Even if it doesn't exist we want to add it, that way
    # we can create it and then watch it. Mainly useful
    # for things like our local whitelists, which may not
    # exist yet on new servers
    add_to_infile ($cfile, "LOAD_CONF");
}
# Load a single list: look up the format configured for $file in %lists and
# hand the file to the matching loader from %load. Returns whatever that
# loader returns.
sub load_list {
    my ($file) = @_;
    debug "Caught load_list on $file\n";
    my $format = $lists{$file}{"format"};
    my $loader = $load{$format};
    if ($loader) {
        my $name = $lists{$file}{"name"};
        my $type = $lists{$file}{"type"};
        warn scalar(localtime).": [$$] Loading $name $file ($type $format)\n";
        return $loader->($file);
    }
}
# Load a CIDR formatted list file into $info{TYPE}{NAME}.
#
# Each entry is "A.B.C.D/MASK"; when the list is configured with a split
# value every entry is prefixed by an expiry timestamp ("EXPIRE A.B.C.D/MASK").
# Entries are indexed by first and second octet. Below that level the hash
# holds the smallest and largest shift seen ("min"/"max") plus, per shift,
# the shifted network numbers. Masks shorter than /8 are refused and masks
# shorter than /16 are expanded over all second octets they cover.
#
# If expired entries are found the file is rewritten without them; all other
# lines (comments included) are kept as they were. Returns 1 when the file
# was loaded, 0 when it does not exist or cannot be opened.
sub load_cidr {
    my $file = shift;
    return 0 unless (-e $file);
    my $type = $lists{$file}{"type"};
    my $name = $lists{$file}{"name"};
    my $split = $lists{$file}{"split"};
    # Only expiring lists are ever rewritten, so only they need write
    # access; fall back to read-only when the file is not writable.
    my $lst;
    my $writable = 0;
    if ($split and open ($lst, '+<', $file)) {
        $writable = 1;
    }
    elsif (!open ($lst, '<', $file)) {
        warn scalar(localtime).": [$$] Could not open list $file: $!\n";
        return 0;
    }
    flock ($lst, 2);
    my $expire = 0;
    my @keep;    # raw lines that survive an expiry rewrite
    delete ($info{$type}{$name});
    while (my $line = <$lst>) {
        chomp($line);
        unless ($line and substr($line, 0, 1) ne "#") {
            push (@keep, $line);
            next;
        }
        my $cidr = $line;
        if ($split) {
            my @tmp = split (/\s+/, $line);
            if (time >= $tmp[0]) {
                $expire = 1;
                next;
            }
            $cidr = $tmp[1];
        }
        push (@keep, $line);
        my ($ip, $mask);
        if (defined $cidr and $cidr =~ m{^\s*(\d+\.\d+\.\d+\.\d+)/(\d+)}) {
            ($ip, $mask) = ($1, $2);
        }
        my @base = defined $ip ? split (/\./, $ip) : ();
        if (!defined $ip or $mask > 32 or grep { $_ > 255 } @base) {
            warn scalar(localtime).": [$$] Invalid CIDR entry ($line), skipping.\n";
            next;
        }
        if ($mask < 8) {
            warn scalar(localtime).": [$$] CIDR range is too large ($ip/$mask), skipping.\n";
            next;
        }
        # Handle ranges bigger then 16
        my $range = 0;
        if ($mask < 16) {
            $range = ((2 ** (16 - $mask)) - 1);
        }
        my $adjm = (32 - $mask);
        # Align the second octet to the start of the network so the
        # expansion below never runs past the range the mask covers.
        $base[1] -= $base[1] % ($range + 1);
        foreach my $step (0 .. $range) {
            my @oct = @base;
            $oct[1] += $step;
            my $bucket = ($info{$type}{$name}{$oct[0]}{$oct[1]} ||= {});
            # Track the smallest and largest shift stored in this bucket
            $bucket->{min} = $adjm if (!exists $bucket->{min} or $adjm < $bucket->{min});
            $bucket->{max} = $adjm if (!exists $bucket->{max} or $adjm > $bucket->{max});
            my $pack = unpack("N", pack("C4", @oct)) >> $adjm;
            $bucket->{$adjm}{$pack} = 1;
        }
    }
    if ($expire == 1 and $writable) {
        seek ($lst, 0, 0);
        foreach my $line (@keep) {
            print {$lst} "$line\n";
        }
        # Cut off whatever is left of the old, longer content
        truncate ($lst, tell($lst));
    }
    flock ($lst, 8);
    close ($lst);
    $all{$name} = 1;
    return 1;
}
# Load a plain IP list file into $info{TYPE}{NAME}.
#
# Without a split value every line is one address, stored with the value 1.
# With a split value every line is "EXPIRE ADDRESS": expired entries are
# skipped and the remaining ones are stored with their expiry time.
# When expired entries were found and the file is writable, it is rewritten
# from the entries that were kept (as "EXPIRE ADDRESS" lines).
# Returns 1 when the file was loaded, 0 when it does not exist or cannot be
# opened.
sub load_ip {
    my $file = shift;
    return 0 unless (-e $file);
    my $type = $lists{$file}{"type"};
    my $name = $lists{$file}{"name"};
    my $split = $lists{$file}{"split"};
    # Prefer read/write so expired entries can be removed from the file,
    # but still load a list we are only allowed to read.
    my $lst;
    my $writable = 1;
    unless (open ($lst, '+<', $file)) {
        $writable = 0;
        unless (open ($lst, '<', $file)) {
            warn scalar(localtime).": [$$] Could not open list $file: $!\n";
            return 0;
        }
    }
    flock ($lst, 2);
    my $expire = 0;
    delete ($info{$type}{$name});
    while (my $line = <$lst>) {
        chomp($line);
        next unless ($line);
        next if (substr($line, 0, 1) eq "#");
        if ($split) {
            my @tmp = split (/\s+/, $line);
            if (time >= $tmp[0]) {
                $expire = 1;
                next;
            }
            # An expiry time without an address is not an entry
            next unless (defined $tmp[1]);
            $info{$type}{$name}{$tmp[1]} = $tmp[0];
        } else {
            $info{$type}{$name}{$line} = 1;
        }
    }
    if ($expire == 1 and $writable) {
        seek ($lst, 0, 0);
        foreach my $ip (keys %{$info{$type}{$name}}) {
            print {$lst} "$info{$type}{$name}{$ip} $ip\n";
        }
        # Cut off whatever is left of the old, longer content
        truncate ($lst, tell($lst));
    }
    flock ($lst, 8);
    close ($lst);
    $all{$name} = 1;
    return 1;
}
# "Load" a META list: there is no data file to read, the member list names
# come from the comma separated split field of the configuration entry and
# are stored under the entry's "meta" key.
sub load_meta {
    my ($file) = @_;
    my $members = $lists{$file}{"split"};
    @{ $lists{$file}{"meta"} } = split (/,/, $members);
}
# Load a TRIE formatted list file into $info{TYPE}{NAME}.
#
# Every line is "KEY VALUE"; the value is stored as-is under its key (see
# check_trie for how it is searched). Empty lines, comment lines and lines
# without a value are ignored.
# Returns 1 when the file was loaded, 0 when it does not exist or cannot be
# opened.
sub load_trie {
    my $file = shift;
    return 0 unless (-e $file);
    my $lst;
    unless (open ($lst, '<', $file)) {
        warn scalar(localtime).": [$$] Could not open list $file: $!\n";
        return 0;
    }
    flock ($lst, 2);
    my $type = $lists{$file}{"type"};
    my $name = $lists{$file}{"name"};
    delete ($info{$type}{$name});
    while (my $line = <$lst>) {
        chomp($line);
        next unless ($line);
        next if (substr($line, 0, 1) eq "#");
        my ($key, $value) = split (/\s+/, $line);
        # A key without a value has nothing that could ever match
        next unless (defined $value);
        $info{$type}{$name}{$key} = $value;
    }
    flock ($lst, 8);
    close ($lst);
    $all{$name} = 1;
    return 1;
}
# Make the members of a meta list masquerade as real lists, primarily for
# stats: for every META entry, "<meta name>_<member name>" becomes an alias
# in %lists for the member's own entry.
sub link_meta {
    for my $key (keys %lists) {
        next unless ($lists{$key}{"format"} eq "META");
        my $meta_name = $lists{$key}{"name"};
        for my $list_name (@{ $lists{$meta_name}{"meta"} }) {
            my $alias = $meta_name."_".$list_name;
            $lists{$alias} = \%{ $lists{$list_name} };
        }
    }
}
# Whitelists are global: test $ip against every loaded whitelist.
# Each whitelist consulted gets its request counter bumped; the first one
# that matches also gets its "rejections" counter bumped and ends the search.
# Returns 1 on a match, 0 otherwise.
sub check_whitelist {
    my ($ip) = @_;
    for my $name (keys %{ $info{whitelist} }) {
        $info{"stats"}{$name}{"requests"}++;
        my $format = $lists{$name}{"format"};
        my $checker = $run{$format};
        next unless ($checker->($name, $ip));
        $info{"stats"}{$name}{"rejections"}++;
        return 1;
    }
    return 0;
}
# Check $ip against the list $name, dispatching on the list's format, and
# keep the per-list statistics up to date.
#
# A hit on a blacklist is only counted (and reported) when no whitelist
# matches the address; the whitelist is consulted after the list itself so
# that the whitelist statistics stay meaningful. A hit whose result is not
# plain 1 carries the name of the matching sub-list (see check_meta), which
# is counted as well. Lists flagged stat_only are counted but never reported.
# Returns 1 when the address should be reported as listed, 0 otherwise.
sub check_list {
    my ($name, $ip) = @_;
    my $format = $lists{$name}{"format"};
    # Increment requests
    $info{"stats"}{$name}{"requests"}++;
    my $ret = $run{$format}->($name, $ip);
    return 0 unless ($ret);
    my $type = $lists{$name}{"type"};
    if ($type eq "blacklist") {
        # On a blacklist, so give the whitelists a chance to save it
        return 0 if (check_whitelist($ip));
        $info{"stats"}{$name}{"rejections"}++;
        if ($ret ne 1) {
            $info{"stats"}{$ret}{"rejections"}++;
            return 0 if ($lists{$ret}{"stat_only"});
        }
    }
    else {
        # Anything else does not need the whitelist check
        $info{"stats"}{$name}{"rejections"}++;
    }
    # Don't block if we are setup as stats only
    return $lists{$name}{"stat_only"} ? 0 : 1;
}
# Check $ip against every list registered in %all.
# Returns 0 when a whitelist matches the address, otherwise a string with the
# names of all matching lists, each followed by a single space (empty when
# nothing matched).
sub check_all {
    # TODO, gather stats, requests and rejections, on
    # the exact lists inside the "all" list.
    # TODO, make it so you can specify a "all" list
    # in the conf
    my ($ip) = @_;
    my @matched;
    for my $list_name (keys %all) {
        my $format = $lists{$list_name}{"format"};
        push (@matched, $list_name) if ($run{$format}->($list_name, $ip));
    }
    my $hits = join ("", map { "$_ " } @matched);
    return 0 if (check_whitelist($ip));
    return $hits;
}
# Look $ip up in the CIDR list $name.
# The list data is indexed by first and second octet; within that bucket the
# address is shifted by every width from the bucket's "min" to its "max" and
# compared with the network numbers stored for that width.
# Returns 1 on a match, 0 otherwise.
sub check_cidr {
    my ($name, $ip) = @_;
    my $type = $lists{$name}{"type"};
    my @oct = split (/\./, $ip);
    return 0 unless (exists $info{$type}{$name}{$oct[0]});
    return 0 unless (exists $info{$type}{$name}{$oct[0]}{$oct[1]});
    my $bucket = $info{$type}{$name}{$oct[0]}{$oct[1]};
    my $addr = unpack("N", pack("C4", @oct));
    # bitshift from my min mask to max to do the check
    for my $bits ($bucket->{min} .. $bucket->{max}) {
        my $pack = $addr >> $bits;
        return 1 if ($bucket->{$bits}{$pack});
    }
    return 0;
}
# Look $ip up in the plain IP list $name.
# Returns 1 when the address has a true value stored in the list, else 0.
sub check_ip {
    my ($name, $ip) = @_;
    my $type = $lists{$name}{"type"};
    return $info{$type}{$name}{$ip} ? 1 : 0;
}
# Check $ip against the member lists of the meta list $name, in the order
# they were configured. Members that are not known lists are skipped.
# Every member consulted has its "<meta>_<member>" request counter bumped.
# Returns "<meta>_<member>" for the first member that matches, 0 otherwise.
sub check_meta {
    my ($name, $ip) = @_;
    for my $list_name (@{ $lists{$name}{"meta"} }) {
        # Make sure list actually exists
        next unless (exists $lists{$list_name});
        my $format = $lists{$list_name}{"format"};
        my $stat_key = $name."_".$list_name;
        $info{"stats"}{$stat_key}{"requests"}++;
        return $stat_key if ($run{$format}->($list_name, $ip));
    }
    return 0;
}
# Look $ip up in the TRIE list $name.
# The address is converted to its 32 bit number; the first "split" characters
# of that number's decimal text are the key and the remaining characters the
# value. The address matches when ":VALUE:" occurs in the string stored under
# the key. Returns 1 on a match, 0 otherwise.
sub check_trie {
    my ($name, $ip) = @_;
    my $type = $lists{$name}{"type"};
    my $split = $lists{$name}{"split"};
    my $data = unpack("N", pack("C4", split (/\./, $ip)));
    my $key = substr($data, 0, $split);
    my $value = substr($data, $split);
    return 0 unless (exists $info{$type}{$name}{$key});
    my $found = index($info{$type}{$name}{$key}, ":$value:");
    return ($found >= 0) ? 1 : 0;
}
# Build the plain text statistics report served by the STAT/STATS commands:
# uptime, total requests, requests per second and, for every list with
# statistics, its requests, its rejections (called "Saves" for whitelists)
# and its requests per second.
# Returns the report as a string, or nothing during the first second of
# uptime (there is no meaningful per-second rate yet).
sub give_stats {
    my $running = time - $info{"starttime"};
    return unless ($running);
    my $total = $info{"requests"} || 0;
    my (@time) = gmtime($running);
    # Count whole days directly; the day-of-year field of gmtime would
    # start over once the daemon has been up for a year.
    my $days = int($running / 86400);
    my $stats = sprintf ("\n%30s:\t%d Days %d Hours %d Min %d Sec\n",
        "Uptime", $days, $time[2], $time[1], $time[0]);
    $stats .= sprintf ("%30s:\t%d\n", "Total Requests", $total);
    $stats .= sprintf ("%30s:\t%.2f\n", "Requests Per Second", ($total / $running));
    foreach my $name (sort keys %{$info{"stats"}}) {
        my $wording = "Rejections";
        my $requests = $info{"stats"}{$name}{"requests"} || 0;
        $stats .= sprintf ("\n%30s:\t%d (%.2f%%)", "$name Requests",
            $requests,
            ($total ? (($requests / $total) * 100) : 0));
        # It is kind of awkward to call a whitelist save a "rejection"
        # so we update the wording as appropriate. Look the list up
        # without creating an entry for names %lists does not know.
        my $type = exists $lists{$name} ? $lists{$name}{"type"} : undef;
        $wording = "Saves" if (defined $type and $type eq "whitelist");
        # Avoid uninitialized errors
        if (exists $info{"stats"}{$name}{"rejections"}) {
            my $rejections = $info{"stats"}{$name}{"rejections"};
            $stats .= sprintf ("\n%30s:\t%d (%.2f%%)\n", "$name $wording",
                $rejections,
                ($requests ? (($rejections / $requests) * 100) : 0));
        } else {
            $stats .= sprintf ("\n%30s:\t%d\n", "$name $wording", 0);
        }
        $stats .= sprintf ("%30s:\t%.2f\n", "$name RPS", ($requests / $running));
    }
    return $stats;
}
# Add a watch on a file via inwatch: append a line to the infile that asks
# for command $cmd to be sent for $file, unless this process already wrote
# one for that file.
# A file is only remembered as watched once its line was actually written,
# so a failed attempt is retried on the next call. Always returns nothing.
sub add_to_infile {
    my $file = shift;
    return if ($info{"infile"}{$file});
    my $cmd = shift;
    my $inf;
    unless (open ($inf, '>>', $config->{infile})) {
        warn scalar(localtime).": [$$] Could not open infile $config->{infile}: $!\n";
        return;
    }
    print {$inf} "$file IN_MODIFY|IN_CREATE_SELF SOCK RBLD $cmd $file\n";
    # Buffered write errors only show up when the handle is closed
    unless (close ($inf)) {
        warn scalar(localtime).": [$$] Could not write infile $config->{infile}: $!\n";
        return;
    }
    $info{"infile"}{$file} = 1;
    return;
}
# Forget every watch written so far and empty the infile on disk.
# A failure to truncate the file is logged instead of being ignored.
sub reset_infile {
    delete $info{"infile"};
    my $inf;
    unless (open ($inf, '>', $config->{infile})) {
        warn scalar(localtime).": [$$] Could not reset infile $config->{infile}: $!\n";
        return;
    }
    close ($inf);
    return;
}
# (Re)open the log file on STDERR and reload every list that has expiring
# entries. Called once at startup and again as the SIGUSR2 handler.
# If the log file cannot be opened, the previous STDERR is restored so that
# later messages are not lost.
sub open_log {
    warn scalar(localtime).": [$$] $0 Reseting log file...\n";
    # Keep a duplicate of the current STDERR to fall back on
    my $saved;
    open ($saved, '>&', \*STDERR) or undef $saved;
    close (STDERR);
    unless (open (STDERR, '>>', $config->{log})) {
        my $err = $!;
        if ($saved and open (STDERR, '>&', $saved)) {
            warn scalar(localtime).": [$$] $0 Could not open log $config->{log}: $err\n";
        }
    }
    close ($saved) if ($saved);
    chmod 0600, $config->{log};
    warn scalar(localtime).": [$$] $0 Log file open.\n";
    # TODO, Make this reload on the next request after
    # something expires instead of once a day.
    # Reload lists with entries that expire.
    foreach my $file (keys %lists) {
        next unless ($lists{$file}{"split"});
        # For TRIE lists the split field is not an expiry setting
        next if ($lists{$file}{"format"} eq "TRIE");
        load_list ($file);
    }
}
# SIGHUP handler: restart the daemon. The current process forks and exits;
# the child waits two seconds and then replaces itself with a fresh copy of
# the program found at the configured run path.
sub reload {
    warn scalar(localtime).": [$$] $0 reloading...\n";
    my $child = fork;
    exit if ($child);
    sleep 2;
    my $program = "$config->{run_path}";
    exec $program or die "exec: $!";
}
# Print the command line usage summary and exit successfully.
# Used for -h/--help and when the command line cannot be parsed.
sub help {
    my $usage = <<EOF;
-c|--config Path to rbld daemon configuration file
-o|--log=s Path to rbld log
-i|--infile Path to rbld infile
-l|--listconf Path to rbld list configuration file
-r|--runpath Path to run path of script (/usr/sbin/rbld)
-s|--socketpath Path to rbld socket
-u|--socketowner Who the rbld socket owner will be set to
-g|--socketgroup Which group the rbld socket will be set to
-d|--debug Debug output
-h|--help This lovely help message
EOF
    print $usage;
    exit 0;
}
# Runs whenever the process exits: note the exit in the debug log, close
# $dfh if it was ever opened, and exit with status 0.
END {
    debug "Exiting...\n";
    if (defined $dfh) {
        $dfh->close;
    }
    exit 0;
}
# Everything above only defines state and subroutines; start the daemon.
main();