diff options
Diffstat (limited to 'plugin/url_title.pm')
| -rw-r--r-- | plugin/url_title.pm | 62 | 
1 files changed, 62 insertions, 0 deletions
| diff --git a/plugin/url_title.pm b/plugin/url_title.pm new file mode 100644 index 0000000..2a2258b --- /dev/null +++ b/plugin/url_title.pm @@ -0,0 +1,62 @@ +#!/usr/bin/env perl + +package plugin::url_title; + +use strict; +use warnings; +use HTTP::Tiny; +use HTML::HeadParser; + +my %config; + +sub configure { +	my $self = $_[0]; +	my $cref = $_[1]; +	%config = %$cref; +	return $self; +} + +sub message +{ +	my ($self, $me, $who, $where, $what) = @_; +	my $url; + +	if ($what =~ /(https?:\/\/[^ ]+)/i) { +		$url = $1; +	} +	return unless $url; + +	my $http = HTTP::Tiny->new((default_headers => {accept => 'text/html'}, timeout => 5)); + +	my $response = $http->get($url); + +	if (!$response->{success}) { +		print "Something broke: $response->{reason}\n"; +		return; +	} + +	if (!($response->{headers}->{"content-type"} =~ m,text/html ?,)) { +		print("Not html, giving up now\n"); +		return; +	} + +	my $html = $response->{content}; + +	my $parser = HTML::HeadParser->new; +	$parser->parse($html); + +	# get title and unpack from utf8 (assumption) +	my $title = $parser->header("title"); +	return unless $title; + +	my $shorturl = $url; +	$shorturl = (substr $url, 0, $config{url_len}) . "β¦" if length ($url) > $config{url_len}; + +	# remove http(s):// to avoid triggering other poorly configured bots +	$shorturl =~ s,^https?://,,g; +	$shorturl =~ s,/$,,g; + +	my $composed_title = "$title ($shorturl)"; +	return $composed_title; +} +1; | 
