aboutsummaryrefslogtreecommitdiff
path: root/idalius.pl
diff options
context:
space:
mode:
authorDavid Phillips <david@sighup.nz>2017-05-09 10:14:09 +1200
committerDavid Phillips <david@sighup.nz>2017-05-09 10:15:57 +1200
commit5390f36c84b0876b9c94dc49fa8e043a5d0d51a4 (patch)
treeee8c3b7c844a7169869ef27188c65fcc9619db31 /idalius.pl
parente8247d272afbc57601dfa542caa2d7fcd60173ff (diff)
downloadidalius-5390f36c84b0876b9c94dc49fa8e043a5d0d51a4.tar.xz
URL Titles: Don't use a HEAD request first
This upset some websites like reddit which are prissy about >1 request every two seconds.
Diffstat (limited to 'idalius.pl')
-rwxr-xr-xidalius.pl21
1 files changed, 10 insertions, 11 deletions
diff --git a/idalius.pl b/idalius.pl
index c0782ff..a885ca5 100755
--- a/idalius.pl
+++ b/idalius.pl
@@ -67,20 +67,17 @@ sub drop_priv {
sub url_get_title
{
my $url = $_[0];
- my $response = HTTP::Tiny->new((timeout => 5))->head($url);
+ my $http = HTTP::Tiny->new((default_headers => {accept => 'text/html'}, timeout => 5, agent => "Mozilla/5.0 (X11; Linux x86_64; rv:52.0) Gecko/20100101 Firefox/52.0"));
+
+ my $response = $http->get($url);
+
if (!$response->{success}) {
print "Something broke: $response->{content}\n";
return;
}
- if (!$response->{headers}->{"content-type"} =~ m,text/html ?,) {
- print("Not html, giving up now");
- return;
- }
-
- $response = HTTP::Tiny->new((timeout => 5))->get($url);
- if (!$response->{success}) {
- print "Something broke: $response->{content}\n";
+ if (!($response->{headers}->{"content-type"} =~ m,text/html ?,)) {
+ print("Not html, giving up now\n");
return;
}
@@ -158,8 +155,10 @@ sub irc_public {
if ($config{url_on} and $what =~ /(https?:\/\/[^ ]+)/i)
{
my $title = url_get_title($1);
- print "Title: $title\n";
- $irc->yield(privmsg => $channel => $title);
+ if ($title) {
+ print "Title: $title\n";
+ $irc->yield(privmsg => $channel => $title);
+ }
}
my $gathered = "";