eg/search-cpan.pl - metacpan.org

#!/usr/bin/perl
# search modules on search.cpan.org and extract name, URL, description, date and author

use strict;
use warnings;
use URI;
use Web::Scraper;
use YAML;

# Search term: the first command-line argument, falling back to "Foo" when it
# is missing or empty. A defined/length test is used instead of `||` so that a
# literal "0" is still accepted as a query rather than replaced by the default.
my $query = shift;
$query = "Foo" unless defined $query && length $query;

# Build the search URL with the `query` and `mode=all` form parameters.
my $uri = URI->new("http://search.cpan.org/search");
$uri->query_form(query => $query, mode => 'all');

# Each element matched by "body#cpansearch>p" is passed to the nested scraper;
# the per-element results are collected under the 'modules' key.
my $scraper = scraper {
    process "body#cpansearch>p", 'modules[]' => scraper {
        # First link: its text becomes `name`, its href attribute becomes `url`.
        process "//a[1]", name => 'TEXT', url => '@href';
        process "small", description => 'TEXT';
        process "span.date", date => 'TEXT';
        # Links whose href starts with "/~"; the second such match supplies `author`.
        process q{//a[starts-with(@href, '/~')][2]}, author => 'TEXT';
    };
};

# Fetch and scrape the page, then emit the result as YAML through warn (STDERR).
warn Dump $scraper->scrape($uri);

	Global
`s`	Focus search bar
`?`	Bring up this help dialog

	GitHub
`g` `p`	Go to pull requests
`g` `i`	Go to GitHub issues (only if GitHub is the preferred repository)

	POD
`g` `a`	Go to author
`g` `c`	Go to changes
`g` `i`	Go to issues
`g` `d`	Go to dist
`g` `r`	Go to repository/SCM
`g` `s`	Go to source
`g` `b`	Go to file browser

	Search terms
module: (e.g. module:Plugin)
distribution: (e.g. distribution:Dancer auth)
author: (e.g. author:SONGMU Redis)
version: (e.g. version:1.00)