#!/usr/bin/perl
# Extract tags from web pages that use the rel-tag microformat
use strict;
use warnings;
use URI;
use URI::Escape;
use Web::Scraper;
use YAML;
# The page to scrape is the single required command-line argument.
my $uri = shift or die "Usage: rel-tag.pl URL\n";

# Build a scraper that collects one label per <a> element whose rel
# attribute contains the token "tag". The label is taken from the last
# non-empty path segment of the link's href; the query string and fragment
# are not part of URI's path and are therefore ignored.
my $scraper = scraper {
    process 'a[rel~="tag"]', 'tags[]' => sub {
        # $_ is the matched element; a rel="tag" anchor may lack an href.
        my $href = $_->attr('href');
        return unless defined $href && length $href;

        # Dropping empty segments makes a trailing slash ("/tags/perl/")
        # resolve to "perl" rather than to an empty string.
        my @segments = grep { length } split m{/}, URI->new($href)->path;

        # Links such as "/" or "http://example.com" carry no tag segment.
        # Return nothing instead of processing undef, which would trigger
        # "uninitialized value" warnings further down.
        return unless @segments;

        my $label = $segments[-1];

        # Treat "+" as an encoded space. This must happen before
        # unescaping so that an escaped "%2B" still decodes to a literal "+".
        $label =~ tr/+/ /;

        return uri_unescape($label);
    };
};

# Scrape the given URL and dump the collected structure as YAML. The dump is
# emitted with warn, so it goes to STDERR.
warn Dump $scraper->scrape(URI->new($uri));