cloudflare-tor/tool/irssi_cf_alturl.pl

236 lines
8.1 KiB
Perl
Raw Normal View History

2019-05-03 05:38:02 +02:00
#!/usr/bin/perl -w
# This Irssi script automatically checks incoming http/https links
# and replaces each one with a web.archive.org link if the site is MITMed.
2019-05-04 16:03:22 +02:00
#
# Irssi /set Options
# You can view your current settings by running "/set cflarealt" in Irssi.
#
# /set cflarealt_debug <on|off> -- (off) if you have a problem try turning this on to debug
# /set cflarealt_send2channel <on|off> -- (off) send the converted URL publicly to everyone in your channels
# /set cflarealt_channels <"#channel1, #channel2, etc"> -- Channels to automatically convert. Empty Defaults to all
# /set cflarealt_shorturl_activate <on|off> -- (off) set it 'on' to use the URL shortener
# /set cflarealt_shorturl_min <40> -- (40) How long a url has to be to trigger automatic url shortening
2019-05-05 03:14:26 +02:00
#
# /set cflarealt_localdbpath <"string to path"> -- () '/path/database/split/'
# /set cflarealt_uselocaldb <on|off> -- (off) if 'on', please set path to local database (or the script will die)
2019-05-03 05:38:02 +02:00
#---------------------------------------------------------------------
2019-05-04 16:12:21 +02:00
2019-05-04 16:03:22 +02:00
use strict;

# Script metadata, kept in the $VERSION / %IRSSI package variables.
# Declared with "our" (the modern replacement for "use vars") so the
# script compiles under "use strict".
our ( $VERSION, %IRSSI );

$VERSION = "20190506";
%IRSSI   = (
    # Special thanks to: "eo, tsaavik"
    authors     => "Anonymous",
    contact     => 'anonymous@cloudflare-tor.nab',
    name        => "irssi_cf_alturl.pl",
    description => "Cloudflare URL replacer",
    license     => "WTFPL",
    changed     => $VERSION,
);
use Irssi;
use Irssi::Irc;
use LWP::Simple;
use LWP::UserAgent;
2019-05-05 03:14:26 +02:00
# Cached copies of the "/set cflarealt_*" values; setuphandler() refreshes them.
# They start with defined values so that the numeric comparisons made elsewhere
# in this file never operate on undef.
my $cfg_minurllen   = 0;     # cflarealt_shorturl_min
my $cfg_send2chan   = 0;     # cflarealt_send2channel
my $cfg_useshort    = 0;     # cflarealt_shorturl_activate
my $cfg_isdebug     = 0;     # cflarealt_debug
my $cfg_uselocaldb  = 0;     # cflarealt_uselocaldb
my $cfg_localdbpath = '';    # cflarealt_localdbpath
my $cfg_chanlist    = '';    # cflarealt_channels

# Host names that GotUrl() has already confirmed and rewritten once.
my @cached = ();
2019-05-03 05:38:02 +02:00
# setuphandler()
#
# Registers the "cflarealt" settings and copies their current values into the
# file-level $cfg_* variables.  It is called once at load time and again on
# every "setup changed" signal.
#
# Every flag is assigned from the setting on each call, so switching an option
# off with /set takes effect (previously a flag could only ever become 1).
# Status messages are printed only when a value actually changes.
sub setuphandler {
    Irssi::settings_add_bool( "cflarealt", "cflarealt_send2channel",      0 );
    Irssi::settings_add_bool( "cflarealt", "cflarealt_shorturl_activate", 0 );
    Irssi::settings_add_str( "cflarealt", "cflarealt_channels", "" );
    Irssi::settings_add_int( "cflarealt", "cflarealt_shorturl_min", 40 );
    Irssi::settings_add_bool( "cflarealt", "cflarealt_debug",      0 );
    Irssi::settings_add_bool( "cflarealt", "cflarealt_uselocaldb", 0 );
    Irssi::settings_add_str( "cflarealt", "cflarealt_localdbpath", "" );

    # Public echo of the converted URL.
    my $send2chan = Irssi::settings_get_bool("cflarealt_send2channel") ? 1 : 0;
    if ( $send2chan && !$cfg_send2chan ) {
        print "cflarealt: sending of shorturl's to public channels enabled";
    }
    $cfg_send2chan = $send2chan;

    # URL shortener.
    my $useshort = Irssi::settings_get_bool("cflarealt_shorturl_activate") ? 1 : 0;
    if ( $useshort && !$cfg_useshort ) {
        print "cflarealt: URL shortner enabled";
    }
    $cfg_useshort = $useshort;

    # Channel filter (empty means every channel, see goodchan()).
    my $old_chanlist = defined $cfg_chanlist ? $cfg_chanlist : '';
    $cfg_chanlist = Irssi::settings_get_str("cflarealt_channels");
    $cfg_chanlist = '' unless defined $cfg_chanlist;
    if ( $cfg_chanlist && $cfg_chanlist ne $old_chanlist ) {
        print "cflarealt: Following channels are now parsed $cfg_chanlist";
    }

    # Minimum URL length that triggers shortening.
    my $old_min_url_length = $cfg_minurllen;
    $cfg_minurllen = Irssi::settings_get_int("cflarealt_shorturl_min");
    if ( !defined $old_min_url_length || $cfg_minurllen != $old_min_url_length ) {
        print "cflarealt: min_url_length sucessfully set to $cfg_minurllen";
    }

    # Debug output.
    my $old_debug = $cfg_isdebug ? 1 : 0;
    $cfg_isdebug = Irssi::settings_get_bool("cflarealt_debug") ? 1 : 0;
    if ( $cfg_isdebug != $old_debug ) {
        print $cfg_isdebug
          ? "cflarealt: Debug Mode Enabled"
          : "cflarealt: Debug Mode Disabled";
    }

    # Local database lookup instead of the web API.
    my $uselocaldb = Irssi::settings_get_bool("cflarealt_uselocaldb") ? 1 : 0;
    if ( $uselocaldb && !$cfg_uselocaldb ) {
        print "cflarealt: Lookup Local DB enabled";
    }
    $cfg_uselocaldb = $uselocaldb;

    my $old_dbpath = defined $cfg_localdbpath ? $cfg_localdbpath : '';
    $cfg_localdbpath = Irssi::settings_get_str("cflarealt_localdbpath");
    $cfg_localdbpath = '' unless defined $cfg_localdbpath;
    if ( $cfg_localdbpath && $cfg_localdbpath ne $old_dbpath ) {
        print "cflarealt: DB path set to $cfg_localdbpath";
    }
    return;
}
# Percent-encode every byte outside the RFC 3986 "unreserved" set so that
# $text can be embedded safely as a query-string value.
sub _cf_uri_escape {
    my ($text) = @_;
    return '' unless defined $text;
    utf8::encode($text) if utf8::is_utf8($text);    # escape bytes, not code points
    $text =~ s/([^A-Za-z0-9\-._~])/sprintf( '%%%02X', ord($1) )/ge;
    return $text;
}

# Extract the host part of an http/https URL (userinfo and port removed).
# Returns nothing when the URL has no "//host" part.
sub _cf_host_of {
    my ($link) = @_;
    return unless defined $link;
    return $1 if $link =~ m{\Ahttps?://(?:[^/?#\@]*\@)?([^/?#:\@]+)};
    return;
}

# GET $url and return the response body with surrounding whitespace trimmed,
# or '' when the request fails.  A timeout is set because the request blocks
# the caller until it completes.
sub _cf_http_get {
    my ($url) = @_;
    my $browser = LWP::UserAgent->new( timeout => 30 );
    $browser->agent("Mozilla/5.0 (Windows NT 6.1; rv:60.0) Gecko/20100101 Firefox/60.0");
    my $response = $browser->get($url);
    return '' unless $response->is_success;
    my $body = $response->content;
    $body = '' unless defined $body;
    $body =~ s/\A\s+//;
    $body =~ s/\s+\z//;
    return $body;
}

# Return 1 when $fqdn appears as a full line in the local database file
# "<cflarealt_localdbpath>cloudflare_<first char of fqdn>.txt", else 0.
# Dies when that file cannot be opened.
sub _cf_in_local_db {
    my ($fqdn) = @_;
    my $db_file = $cfg_localdbpath . "cloudflare_" . substr( $fqdn, 0, 1 ) . ".txt";

    # Three-argument open with a lexical handle: the path is partly built from
    # text received over IRC and must never be parsed as an open mode.
    open( my $db, '<', $db_file ) or die "file not found for $fqdn";
    my $found = 0;
    while ( my $line = <$db> ) {
        $line =~ s/\R//g;
        if ( $line eq $fqdn ) {
            $found = 1;
            last;
        }
    }
    close $db;
    return $found;
}

# GotUrl($server, $data, $nick, $addr, $target)
#
# Signal handler for "message public" and "ctcp action".  For every distinct
# http/https URL found in $data:
#   ACT1  prefix it with https://web.archive.org/web/ when its host is in the
#         cache, the local database, or reported as '[true,true]' by the API;
#   ACT2  shorten it through tinyurl when shortening is enabled and the URL is
#         longer than the configured minimum;
#   ACT3  send the result to $target (cflarealt_send2channel on) or print it
#         locally in that window.
# URLs whose host is missing or shorter than 4 characters are skipped.
# Returns nothing.
sub GotUrl {
    my ( $server, $data, $nick, $addr, $target ) = @_;
    if ( !$server || !$server->{connected} ) {
        Irssi::print("Not connected to server");
        return;
    }
    return unless ( goodchan($target) );
    return unless defined $data;

    $data =~ s/^\s+//;
    $data =~ s/\s+$//;
    return unless ( $data =~ /\bhttps?\:/ );
    deb("$target triggered GotUrl() with url: $data");

    # Split on whitespace and keep each URL once, in order of appearance.
    # (The old duplicate flag was never reset, so every URL following a
    # repeated one was silently dropped.)
    my %seen;
    my @urls = grep { /^https?\:/ && !$seen{$_}++ } split( /\s/, $data );

    foreach my $link (@urls) {
        my $myurl = $link;
        my $fqdn  = _cf_host_of($link);

        if ( defined $fqdn && length($fqdn) >= 4 ) {
            ## Start of Act
            ## ACT1: Update URL if Cloudflared
            # Plain string comparison: the host comes from IRC and must not be
            # interpolated into a regex.
            if ( grep { $_ eq $fqdn } @cached ) {
                deb("$target Found in Cache $fqdn");
                $myurl = 'https://web.archive.org/web/' . $myurl;
            }
            else {
                my $is_mitm = 0;
                if ($cfg_uselocaldb) {
                    deb("$target Lookup local DB about $fqdn");
                    $is_mitm = _cf_in_local_db($fqdn);
                }
                else {
                    deb("$target Asking API about $fqdn");
                    my $answer = _cf_http_get(
                        'https://searxes.danwin1210.me/collab/open/ismitm.php?f='
                          . _cf_uri_escape($fqdn) );
                    $is_mitm = 1 if $answer eq '[true,true]';
                }
                if ($is_mitm) {
                    push( @cached, $fqdn );
                    $myurl = 'https://web.archive.org/web/' . $myurl;
                }
            }

            ## ACT2: Short URL __if__ enabled and long
            if ( $cfg_useshort && length($myurl) > $cfg_minurllen ) {
                deb("$target Creating Short URL for $myurl");

                # Shorten $myurl itself (the old code sent a never-assigned
                # variable) and escape it so '&', '#' etc. survive.
                my $answer = _cf_http_get(
                    'https://tinyurl.com/api-create.php?url='
                      . _cf_uri_escape($myurl) );

                # Accept the reply with either scheme.
                if ( $answer =~ m{\Ahttps?://tinyurl\.com/} ) {
                    $myurl = $answer;
                }
            }

            ##ACT3: Shout Result
            if ($cfg_send2chan) {
                $server->command("msg $target $myurl");
            }
            else {
                # Irssi's print expands %-format codes, so escape literal '%'
                # (common in URLs) before displaying.
                ( my $shown = $myurl ) =~ s/%/%%/g;
                $server->print( "$target", $shown, MSGLEVEL_CLIENTCRAP );
            }
            ## End of Act
        }
        deb("$target process done for input $myurl");
    }

    ## Cleanup cache
    if ( $#cached > 500 ) {
        @cached = ();
    }
    return;
}
# deb($message)
#
# Print $message through Irssi::print when debug mode (cflarealt_debug) is on.
# The former ($) prototype is removed: it was declared after the callers, so
# it was never applied and only caused "called too early to check prototype"
# warnings.
sub deb {
    my ($message) = @_;
    return unless $cfg_isdebug;
    $message = '' unless defined $message;

    # Irssi::print expands %-format codes; escape literal '%' (common in URLs).
    $message =~ s/%/%%/g;
    Irssi::print($message);
    return;
}
# goodchan($chan)
#
# Decide whether URLs seen in channel $chan should be processed.
# Returns "OK" when no channel list is configured (all channels allowed),
# the matching list entry when $chan is listed in cflarealt_channels, and
# nothing (false) otherwise.
#
# Entries are comma separated and may be surrounded by whitespace.  They are
# compared case-insensitively as plain strings: interpolating the channel name
# into a regex made names such as "#c++" die and let "#a" match "#abc".
sub goodchan {
    my $chan = shift;
    return ("OK") if ( !$cfg_chanlist );
    return unless defined $chan;

    my $wanted = lc $chan;
    foreach my $entry ( split( /\,/, $cfg_chanlist ) ) {
        $entry =~ s/^\s+//;
        $entry =~ s/\s+$//;
        next if $entry eq '';
        return $entry if lc($entry) eq $wanted;
    }
    return;
}
# Load the current settings once, then keep them in sync with /set changes.
setuphandler();
Irssi::signal_add( "setup changed", "setuphandler" );

# Inspect public messages and CTCP ACTIONs for URLs, after other handlers.
foreach my $signal_name ( "message public", "ctcp action" ) {
    Irssi::signal_add_last( $signal_name, "GotUrl" );
}