# The Perl Toolchain Summit needs more sponsors. If your company depends on Perl, please support this very important event.
#!/usr/bin/perl -w
use strict;
use warnings;

# HTML-flavoured fixture text that the finder scans and rewrites in place.
# It contains a bare URI in double quotes, URIs inside href attributes (some
# surrounded by other attributes), a tag that is not a URI (<foo bar>), and
# a URI whose query string carries HTML entities.
my $Example = <<"END";

Yes, Jim, I found it under "http://www.w3.org/Addressing/",
but you can probably pick it up from <a href="ftp://foo.example.com/rfc/">the RFC</a>. 
Note the <a class="warning" href="http://www.ics.uci.edu/pub/ietf/uri/historical.html#WARNING" target="_blank">warning</a>.
Also <foo bar>.
<a class="junk" href="http://google.com/search?q=&lt;html&gt;">Search for some entities</a>.
END

# The URIs the callback is expected to collect from the fixture, listed in
# the order they occur in the text (the comparison below is order-sensitive).
# The last entry is expected with its &lt; / &gt; entities left undecoded.
my @Uris = (
      "http://www.w3.org/Addressing/",
      "ftp://foo.example.com/rfc/",
      "http://www.ics.uci.edu/pub/ietf/uri/historical.html#WARNING",
      "http://google.com/search?q=&lt;html&gt;",
);

use Test::More tests => 5;
use URI::Find;

# Record every URI handed to the callback and substitute a numbered
# placeholder ("Link 1", "Link 2", ...) for it in the scanned text.
my @found;
my $finder = URI::Find->new(
    sub {
        my $uri = shift;

        # push returns the new element count, which doubles as the
        # 1-based number of the link just recorded.
        my $link_number = push @found, $uri;
        return "Link " . $link_number;
    }
);

# Scan the fixture through a reference so the replacements land in $Example.
$finder->find(\$Example);

# The callback must have received exactly the expected URIs, in order.
is_deeply(\@found, \@Uris, "found links in HTML");

# Each URI in the text must now be its placeholder, with the surrounding
# quotes and attributes left as they were.
my @replacement_checks = (
    [ qr/"Link 1"/,                         'link 1 replaced' ],
    [ qr/<a href="Link 2"/,                 'link 2 replaced' ],
    [ qr/<a class="warning" href="Link 3"/, 'link 3 replaced' ],
    [ qr/<a class="junk" href="Link 4"/,    'link 4 replaced' ],
);

for my $check (@replacement_checks) {
    my ($pattern, $description) = @{$check};
    like($Example, $pattern, $description);
}