package CPAN::Testers::WWW::Statistics;
use warnings;
use strict;
use vars qw($VERSION);
$VERSION = '1.21';
#----------------------------------------------------------------------------
=head1 NAME
CPAN::Testers::WWW::Statistics - CPAN Testers Statistics website.
=head1 DESCRIPTION
CPAN Testers Statistics comprises the actual website pages, a CGI tool to find
testers, and some backend code to help map tester address to a real identity.
=cut
# -------------------------------------
# Library Modules
use base qw(Class::Accessor::Fast);
use Config::IniFiles;
use CPAN::Testers::Common::DBUtils;
use File::Basename;
use File::Path;
use HTML::Entities;
use IO::File;
use Regexp::Assemble;
use CPAN::Testers::WWW::Statistics::Leaderboard;
use CPAN::Testers::WWW::Statistics::Pages;
use CPAN::Testers::WWW::Statistics::Graphs;
# -------------------------------------
# Public Methods
=head1 INTERFACE
=head2 The Constructor
=over 4
=item * new
Statistics creation object. Provides all the configuration and logging
functionality, as well the interface to the lower level functionality for Page
and Graph creation.
new() takes an option hash as an argument, which may contain the following
keys.
config => path to configuration file [required]
directory => path to output directory
mainstore => path/format to data storage files
templates => path to templates directory
address => path to address file
mailrc => path to 01mailrc.txt file
builder => path to output file from builder log parser
logfile => path to logfile
logclean => will overwrite any existing logfile if set
Note that while 'directory', 'templates' and 'address' are optional as
parameters, if they are not provided as parameters, then they MUST be
specified within the 'MASTER' section of the configuration file.
=back
=cut
sub _alarm_handler { return; }
sub new {
my $class = shift;
my %hash = @_;
my $self = {};
bless $self, $class;
# ensure we have a configuration file
die "Must specify the configuration file\n" unless( $hash{config});
die "Configuration file [$hash{config}] not found\n" unless(-f $hash{config});
# load configuration file
my $cfg;
local $SIG{'__WARN__'} = \&_alarm_handler;
eval { $cfg = Config::IniFiles->new( -file => $hash{config} ); };
die "Cannot load configuration file [$hash{config}]\n" unless($cfg && !$@);
$self->{cfg} = $cfg;
# configure databases
for my $db (qw(CPANSTATS TESTERS)) {
die "No configuration for $db database\n" unless($cfg->SectionExists($db));
my %opts = map {my $v = $cfg->val($db,$_); defined($v) ? ($_ => $v) : () }
qw(driver database dbfile dbhost dbport dbuser dbpass);
$self->{$db} = CPAN::Testers::Common::DBUtils->new(%opts);
die "Cannot configure $db database\n" unless($self->{$db});
}
my %OSNAMES;
my @rows = $self->{CPANSTATS}->get_query('array',q{SELECT osname,ostitle FROM osname ORDER BY id});
for my $row (@rows) {
$OSNAMES{lc $row->[0]} ||= $row->[1];
}
$self->osnames( \%OSNAMES );
my $ra = Regexp::Assemble->new();
my @NOREPORTS = split("\n", $cfg->val('NOREPORTS','list'));
for(@NOREPORTS) {
s/\s+\#.*$//; #remove comments
$ra->add($_);
}
$self->noreports($ra->re);
my @TOCOPY = split("\n", $cfg->val('TOCOPY','LIST'));
$self->tocopy(\@TOCOPY);
my %TOLINK;
for my $link ($cfg->Parameters('TOLINK')) {
my $file = $cfg->val('TOLINK',$link);
$TOLINK{$link} = $file;
}
$self->tolink(\%TOLINK);
$self->known_t( 0 );
$self->known_s( 0 );
$self->mainstore( _defined_or( $hash{mainstore}, $cfg->val('MASTER','mainstore' ), 'cpanstats-%s.json' ));
$self->templates( _defined_or( $hash{templates}, $cfg->val('MASTER','templates' ) ));
$self->address( _defined_or( $hash{address}, $cfg->val('MASTER','address' ) ));
$self->missing( _defined_or( $hash{missing}, $cfg->val('MASTER','missing' ) ));
$self->mailrc( _defined_or( $hash{mailrc}, $cfg->val('MASTER','mailrc' ) ));
$self->logfile( _defined_or( $hash{logfile}, $cfg->val('MASTER','logfile' ) ));
$self->logclean( _defined_or( $hash{logclean}, $cfg->val('MASTER','logclean' ), 0 ));
$self->directory( _defined_or( $hash{directory}, $cfg->val('MASTER','directory' ) ));
$self->copyright( $cfg->val('MASTER','copyright' ) );
$self->builder( _defined_or( $hash{builder}, $cfg->val('MASTER','builder' ) ));
for my $dir (qw(dir_cpan dir_backpan dir_reports)) {
$self->$dir( _defined_or( $hash{$dir}, $cfg->val('MASTER',$dir ) ));
}
$self->_log(sprintf "%-12s=%s", $_, ($self->$_() || ''))
for(qw(mainstore templates address missing mailrc logfile logclean directory builder dir_cpan dir_backpan dir_reports));
die "Must specify the output directory\n" unless($self->directory);
die "Must specify the template directory\n" unless($self->templates);
die "Must specify a valid mailrc path\n" unless($self->mailrc && -f $self->mailrc);
return $self;
}
=head2 Public Methods
=over 4
=item * leaderboard
Maintain the leaderboard table as requested.
=item * make_pages
Method to manage the data update and creation of all the statistics web pages.
Note that this method incorporate all of the method functionality of update,
make_basics, make_matrix and make_stats.
=item * update
Method to manage the data update only.
=item * make_basics
Method to manage the creation of the basic statistics web pages.
=item * make_matrix
Method to manage the creation of the matrix style statistics web pages.
=item * make_stats
Method to manage the creation of the tabular style statistics web pages.
=item * make_cpan
Method to manage the creation of the CPAN specific statistics files and web pages.
=item * make_leaders
Method to manage the creation of the OS leaderboard web pages.
=item * make_noreports
Method to manage the creation of the no reports pages.
=item * make_performance
Method to manage the creation/update of the builder performance data file.
=item * make_graphs
Method to manage the creation of all the statistics graphs.
=item * storage
Method to return specific JSON data currently stored.
=cut
__PACKAGE__->mk_accessors(
qw( directory mainstore templates address builder missing mailrc
logfile logclean copyright noreports tocopy tolink osnames
address profile known_t known_s dir_cpan dir_backpan dir_reports));
sub leaderboard {
my ($self,%options) = @_;
my $lb = CPAN::Testers::WWW::Statistics::Leaderboard->new(parent => $self);
return $lb->results( $options{results} ) if($options{results});
return $lb->check() if($options{check});
return $lb->renew() if($options{renew});
$lb->update() if($options{update});
$lb->postdate( $options{postdate} ) if($options{postdate});
}
sub make_pages {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->update_full();
}
sub update {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->update_data();
}
sub make_basics {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->build_basics();
}
sub make_matrix {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->build_matrices();
}
sub make_stats {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->build_stats();
}
sub make_cpan {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->build_cpan();
}
sub make_leaders {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->build_leaders();
}
sub make_noreports {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->build_noreports();
}
sub make_performance {
my $self = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->build_performance();
}
sub make_graphs {
my $self = shift;
my $stats = CPAN::Testers::WWW::Statistics::Graphs->new(parent => $self);
$stats->create();
}
sub storage {
my $self = shift;
my $type = shift;
$self->_check_files();
my $stats = CPAN::Testers::WWW::Statistics::Pages->new(parent => $self);
$stats->storage_read($type);
}
=item * ranges
Returns the specific date range array reference, as held in the configuration
file.
=item * osname
Returns the print form of a recorded OS name.
=item * tester
Returns either the known name of the tester for the given email address, or
returns a doctored version of the address for displaying in HTML.
=item * tester_lookup
Returns the name or email address, if found, of the stored profile or address
for the given addressid and testerid.
=item * tester_loader
Look up the number of know addresses and testers in the database.
=back
=cut
sub ranges {
my ($self,$section) = @_;
return unless($section);
my @now = localtime(time);
if($now[4]==0) { $now[5]--; $now[4]=12; }
my $now = sprintf "%04d%02d", $now[5]+1900, $now[4];
my @RANGES;
if($section eq 'NONE') {
@RANGES = ('00000000-99999999');
} else {
my @ranges = split("\n", $self->{cfg}->val($section,'LIST'));
for my $range (@ranges) {
my ($fdate,$tdate) = split('-',$range,2);
next if($fdate > $now);
$tdate = $now if($tdate > $now);
push @RANGES, "$fdate-$tdate";
}
}
return \@RANGES;
}
sub osname {
my ($self,$name) = @_;
my $osnames = $self->osnames();
return $osnames->{lc $name} || $name;
}
sub tester {
my ($self,$name) = @_;
return @{$self->{addresses}{$name}} if($self->{addresses}{$name});
my @rows = $self->{TESTERS}->get_query('hash',q{
SELECT a.email,p.name,p.pause,a.addressid,a.testerid
FROM address a
LEFT JOIN profile p ON p.testerid=a.testerid
WHERE a.address=? OR a.email=?
},$name,$name);
my @addr = ( $name, 0, 0 );
if(@rows) {
if($rows[0]->{name}) {
$addr[0] = $rows[0]->{name} . ($rows[0]->{pause} ? " ($rows[0]->{pause})" : '');
} else {
$addr[0] = $rows[0]->{email};
}
$addr[1] = $rows[0]->{addressid};
$addr[2] = $rows[0]->{testerid};
}
$addr[0] = _html_name($addr[0]);
$self->{addresses}{$name} = \@addr;
return @addr;
}
sub tester_lookup {
my ($self,$addressid,$testerid) = @_;
$self->tester_loader() unless($self->known_t);
my $address = $self->address;
my $profile = $self->profile;
return $profile->{$testerid}{html} if($testerid && $profile->{$testerid});
return $address->{$addressid}{html} if($addressid && $address->{$addressid});
return;
}
sub tester_loader {
my $self = shift;
my (%address,%profile);
my @rows = $self->{TESTERS}->get_query('hash',q{SELECT * FROM address});
for my $row (@rows) {
$row->{html} = _html_name($row->{email});
$address{$row->{addressid}} = $row;
}
$self->address( \%address );
@rows = $self->{TESTERS}->get_query('hash',q{SELECT * FROM profile});
for my $row (@rows) {
my $name = $row->{name} . ($row->{pause} ? " ($row->{pause})" : '');
$row->{html} = _html_name($name);
$profile{$row->{testerid}} = $row;
}
$self->profile( \%profile );
@rows = $self->{TESTERS}->get_query('array',q{
SELECT count(addressid),count(distinct testerid) FROM address WHERE testerid > 0
});
$self->known_s( $rows[0]->[0] );
$self->known_t( $rows[0]->[1] );
}
# -------------------------------------
# Private Methods
sub _html_name {
my $name = shift || return '';
$name = $name =~ /\&(\#x?\d+|\w+)\;/
? $name
: encode_entities( $name );
$name =~ s/\./ /g if($name =~ /\@/);
$name =~ s/\@/ \+ /g;
$name =~ s/</</g;
$name =~ s/>/>/g;
return $name;
}
sub _check_files {
my $self = shift;
die "Template directory not found\n" unless(-d $self->templates);
die "Must specify the path of the address file\n" unless( $self->address);
die "Address file not found\n" unless(-f $self->address);
}
sub _log {
my $self = shift;
my $log = $self->logfile or return;
mkpath(dirname($log)) unless(-f $log);
my $mode = $self->logclean ? 'w+' : 'a+';
$self->logclean(0);
my @dt = localtime(time);
my $dt = sprintf "%04d/%02d/%02d %02d:%02d:%02d", $dt[5]+1900,$dt[4]+1,$dt[3],$dt[2],$dt[1],$dt[0];
my $fh = IO::File->new($log,$mode) or die "Cannot write to log file [$log]: $!\n";
print $fh "$dt ", @_, "\n";
$fh->close;
}
sub _defined_or {
while(@_) {
my $value = shift;
return $value if(defined $value);
}
return;
}
q("I am NOT a number!");
__END__
=head1 CPAN TESTERS FUND
CPAN Testers wouldn't exist without the help and support of the Perl
community. However, since 2008 CPAN Testers has grown far beyond the
expectations of it's original creators. As a consequence it now requires
considerable funding to help support the infrastructure.
In early 2012 the Enlightened Perl Organisation very kindly set-up a
CPAN Testers Fund within their donatation structure, to help the project
cover the costs of servers and services.
If you would like to donate to the CPAN Testers Fund, please follow the link
below to the Enlightened Perl Organisation's donation site.
F<https://members.enlightenedperl.org/drupal/donate-cpan-testers>
If your company would like to support us, you can donate financially via the
fund link above, or if you have servers or services that we might use, please
send an email to admin@cpantesters.org with details.
Our full list of current sponsors can be found at our I <3 CPAN Testers site.
F<http://iheart.cpantesters.org>
=head1 BUGS, PATCHES & FIXES
There are no known bugs at the time of this release. However, if you spot a
bug or are experiencing difficulties, that is not explained within the POD
documentation, please send bug reports and patches to the RT Queue (see below).
Fixes are dependent upon their severity and my availability. Should a fix not
be forthcoming, please feel free to (politely) remind me.
RT Queue -
http://rt.cpan.org/Public/Dist/Display.html?Name=CPAN-Testers-WWW-Statistics
=head1 SEE ALSO
L<CPAN::Testers::Data::Generator>,
L<CPAN::Testers::WWW::Reports>
F<http://www.cpantesters.org/>,
F<http://stats.cpantesters.org/>,
F<http://wiki.cpantesters.org/>
=head1 AUTHOR
Barbie, <barbie@cpan.org>
for Miss Barbell Productions <http://www.missbarbell.co.uk>.
=head1 COPYRIGHT AND LICENSE
Copyright (C) 2005-2015 Barbie for Miss Barbell Productions.
This distribution is free software; you can redistribute it and/or
modify it under the Artistic Licence v2.
=cut