1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
|
# perl
# Logs URLs to a p5-DBI-MySQL database.
# This script is BSD licensed.
# Hacked together by Karlis "Hagabard" Loen in Feb 2007
# hagabard AT gmail DOT com
# Table format: (ircurls is default table name in script)
#+-----------+---------------+------+-----+---------+-------+
#| Field | Type | Null | Key | Default | Extra |
#+-----------+---------------+------+-----+---------+-------+
#| timestamp | timestamp(14) | YES | | NULL | |
#| hostmask | text(255) | YES | | NULL | |
#| target | text(255) | YES | | NULL | |
#| url | text(255) | YES | | NULL | |
#+-----------+---------------+------+-----+---------+-------+
# In the future I hope to get around to adding stuff like:
#+-----------+---------------+------+-----+---------+-------+
#| httptitle | text(255) | YES | | NULL | |
#| httpdinfo | text(255) | YES | | NULL | |
#| tinyurl | text(255) | YES | | NULL | |
#+-----------+---------------+------+-----+---------+-------+
# Test other DBI types, maybe /setp perl.logurlsql.dbtype="Pg" works?
# Tested with p5-DBI-Mysql, others untested
use DBI;
weechat::register("logurlsql", "0.2", "", "WeeChat p5-DBI script to log URLs to a SQL Database.");
weechat::add_message_handler("*", "cmd_logurl");
# Setup Database connection, now with /setp for your configuration pleasure
weechat::set_plugin_config("dbtype", "mysql") if (weechat::get_plugin_config("dbtype") eq "");
weechat::set_plugin_config("dbhost", "localhost") if (weechat::get_plugin_config("dbhost") eq "");
weechat::set_plugin_config("dbname", "weechat") if (weechat::get_plugin_config("dbname") eq "");
weechat::set_plugin_config("dbtable", "ircurls") if (weechat::get_plugin_config("dbtable") eq "");
weechat::set_plugin_config("dbuser", "irc") if (weechat::get_plugin_config("dbuser") eq "");
weechat::set_plugin_config("dbpass", "forever") if (weechat::get_plugin_config("dbpass") eq "");
# Regexps
sub URL_SCHEME_REGEX() { '(http|ftp|https|news|irc)' }
sub URL_GUESS_REGEX() { '(www|ftp)' }
sub URL_BASE_REGEX() { '[a-z0-9_\-+\\/:?%.&!~;,=\#<]' }
# This sub borrowed from the BSD licensed urlplot.pl irssi script by bwolf.
sub scan_url {
my $rawtext = shift;
return $1 if $rawtext =~ m|(@{[ URL_SCHEME_REGEX ]}://@{[ URL_BASE_REGEX ]}+)|io;
# The URL misses a scheme, try to be smart
if ($rawtext =~ m|@{[ URL_GUESS_REGEX ]}\.@{[ URL_BASE_REGEX ]}+|io) {
my $preserve = $&;
return "http://$preserve" if $1 =~ /^www/;
return "ftp://$preserve" if $1 =~ /^ftp/;
}
return undef;
}
sub cmd_logurl {
($null, $target, $data) = split ":",$_[1],3;
($hostmask, $null, $target) = split " ", $target;
if (defined($url = scan_url($data))) {
#weechat::print("hostmask=$hostmask, target=$target, url=$url");
db_insert($hostmask, $target, $url);
}
return weechat::PLUGIN_RC_OK;
}
sub db_insert {
my ($hostmask, $target, $url)=@_;
my $dbh = DBI->connect( "DBI:". weechat::get_plugin_config(dbtype) .":". weechat::get_plugin_config(dbname) .":". weechat::get_plugin_config(dbhost), weechat::get_plugin_config(dbuser), weechat::get_plugin_config(dbpass));
my $sql="insert into ". weechat::get_plugin_config(dbtable) ." (timestamp, hostmask, target, url) values (NOW()".",". $dbh->quote($hostmask) ."," . $dbh->quote($target) ."," . $dbh->quote($url) .")";
my $sth = $dbh->do($sql);
$dbh->disconnect();
}
|