#!/usr/bin/env perl

# extract_urls.pl - print every HTTP/HTTPS URL found in the given text files.
#
# Usage: extract_urls.pl FILE [FILE ...]
#
# Each file named on the command line is read in full, and every URL matched
# in it is written to standard output, one per line, in order of appearance.
#
# Provenance: introduced by commit 637b4df401a85bfb478d59859f3a04b653e3c184
# (Emmanuel Di Pretoro, Fri, 24 Aug 2018 13:41:51 +0200),
# "First draft of a tool to extract URLs from a text file".

use strict;
use warnings;

use Regexp::Common 'URI';
use IO::All;

# Out of the box $RE{URI}{HTTP} only accepts the "http" scheme, which would
# silently drop every https:// link. Ask for both schemes explicitly.
my $http_url = $RE{URI}{HTTP}{ -scheme => 'https?' };

# Compile once, outside the file loop; the single capture group holds the
# whole matched URL.
my $url_re = qr/($http_url)/;

foreach my $filename (@ARGV) {

    # Assigned to a scalar, so the whole file lands in one string.
    my $content = io->file($filename)->slurp;

    # Scalar-context /g match: each iteration resumes where the previous
    # match ended, yielding the URLs in document order.
    while ( $content =~ m/$url_re/g ) {
        print $1, "\n";
    }
}