version 1.38, 2003/08/21 00:19:05
|
version 1.55, 2004/04/08 15:57:32
|
Line 56 This script also does general database m
|
Line 56 This script also does general database m
|
the C<loncapa:metadata> table if it is deprecated. |
the C<loncapa:metadata> table if it is deprecated. |
|
|
This script evaluates dynamic metadata from the authors' |
This script evaluates dynamic metadata from the authors' |
F<nohist_resevaldata.db> database file in order to store it in MySQL, as |
F<nohist_resevaldata.db> database file in order to store it in MySQL. |
well as to compress the filesize (add up all "count"-type metadata). |
|
|
|
This script is playing an increasingly important role for a loncapa |
This script is playing an increasingly important role for a loncapa |
library server. The proper operation of this script is critical for a smooth |
library server. The proper operation of this script is critical for a smooth |
Line 65 and correct user experience.
|
Line 64 and correct user experience.
|
|
|
=cut |
=cut |
|
|
|
use strict; |
|
|
|
use DBI; |
use lib '/home/httpd/lib/perl/'; |
use lib '/home/httpd/lib/perl/'; |
use LONCAPA::Configuration; |
use LONCAPA::Configuration; |
|
use LONCAPA::lonmetadata; |
|
|
use IO::File; |
use IO::File; |
use HTML::TokeParser; |
use HTML::TokeParser; |
use DBI; |
|
use GDBM_File; |
use GDBM_File; |
use POSIX qw(strftime mktime); |
use POSIX qw(strftime mktime); |
|
use File::Find; |
|
|
my @metalist; |
## |
|
## Use variables for table names so we can test this routine a little easier |
$simplestatus=''; |
my $oldname = 'metadata'; |
my %countext=(); |
my $newname = 'newmetadata'; |
|
|
# Write the one-line status summary to the lon-status directory.
#
# Takes no arguments.  Emits the current contents of the file-level
# $simplestatus variable, followed by a newline, to mysql.txt.
#
# The write stays best-effort (the original never aborted on a failed open),
# but a failure is now reported with a warning instead of silently printing
# to a closed handle.
sub writesimple {
    my $statusfile = '/home/httpd/html/lon-status/mysql.txt';
    my $fh;
    unless (open($fh, '>', $statusfile)) {
        warn "Cannot write $statusfile: $!\n";
        return;
    }
    print {$fh} $simplestatus."\n";
    close($fh);
}
|
|
|
# Write the per-extension resource tally to the lon-status directory.
#
# Takes no arguments.  Each entry of the file-level %countext hash is written
# as "extension=count&", followed by a trailing "time=<epoch seconds>" field
# and a newline.
#
# The write stays best-effort, but a failed open is now reported with a
# warning instead of silently printing to a closed handle.
sub writecount {
    my $countfile = '/home/httpd/html/lon-status/rescount.txt';
    my $fh;
    unless (open($fh, '>', $countfile)) {
        warn "Cannot write $countfile: $!\n";
        return;
    }
    foreach my $ext (keys %countext) {
        print {$fh} $ext.'='.$countext{$ext}.'&';
    }
    print {$fh} 'time='.time."\n";
    close($fh);
}
|
|
|
# Tally one resource in the file-level %countext hash, keyed by its
# lower-cased filename extension.
#
# Parameter: $file - filename or URL of the resource.
#
# The extension is taken from the match result directly rather than from $1.
# $1 keeps the value of an earlier successful match when this one fails, so
# the original could credit an extension-less file to an unrelated extension.
# Files without an extension are tallied under the empty-string key.
sub count {
    my $file = shift;
    my ($ext) = ($file =~ /\.(\w+)$/);
    $ext = defined($ext) ? lc($ext) : '';
    $countext{$ext}++;
}
|
# ----------------------------------------------------- Un-Escape Special Chars |
|
|
|
# Decode %XX escapes: every percent sign followed by two hex digits is
# replaced by the single character with that code.  Anything else, including
# a lone '%', is passed through untouched.
#
# Parameter: the escaped string.
# Returns:   the decoded copy (the argument itself is not modified).
sub unescape {
    (my $decoded = shift) =~ s/%([a-fA-F0-9][a-fA-F0-9])/pack("C",hex($1))/eg;
    return $decoded;
}
|
|
|
# -------------------------------------------------------- Escape Special Chars |
|
|
|
# Encode a string for use as a database key: every non-word character
# (anything outside [A-Za-z0-9_]) becomes '%' followed by two lower-case hex
# digits.
#
# Parameter: the plain string.
# Returns:   the escaped copy (the argument itself is not modified).
sub escape {
    my ($plain) = @_;
    $plain =~ s/(\W)/"%".unpack('H2',$1)/eg;
    return $plain;
}
|
|
|
|
|
# ------------------------------------------- Code to evaluate dynamic metadata |
|
|
|
# Evaluate the dynamic metadata recorded for one resource and compact the
# author's evaluation database while doing so.
#
# Parameter: resource URL or .meta filename; it is passed through &declutter
#            and a trailing ".meta" is removed.
# Returns:   a hash (as a list) mapping each metadata category found for the
#            resource to its aggregate: the sum for 'add' categories, the
#            mean rounded to two decimals for 'avg', the number of entries
#            for 'cnt', and the values joined with '<hr>' for 'app'.
#            An empty list is returned if either database cannot be tied.
#
# Side effects: every matching entry except those of category 'count' is
# copied into nohist_new_resevaldata.db; the 'count' entries are replaced by
# one record holding their sum.
#
# Changes from the previous implementation: the tied hashes are lexical
# rather than undeclared package globals, and the source database is untied
# when the destination database cannot be opened (it used to stay tied).
sub dynamicmeta {
    my $url = &declutter(shift);
    $url =~ s/\.meta$//;
    my %returnhash = ();
    my ($adomain, $aauthor) = ($url =~ /^(\w+)\/(\w+)\//);
    my $prodir = &propath($adomain, $aauthor);

    my (%evaldata, %newevaldata);
    unless (tie(%evaldata, 'GDBM_File',
                $prodir.'/nohist_resevaldata.db', &GDBM_READER(), 0640)) {
        return %returnhash;
    }
    unless (tie(%newevaldata, 'GDBM_File',
                $prodir.'/nohist_new_resevaldata.db', &GDBM_WRCREAT(), 0640)) {
        untie(%evaldata);      # do not leak the source database
        return %returnhash;
    }

    my %sum = ();
    my %cnt = ();
    my %listitems = ('count'      => 'add',
                     'course'     => 'add',
                     'avetries'   => 'avg',
                     'stdno'      => 'add',
                     'difficulty' => 'avg',
                     'clear'      => 'avg',
                     'technical'  => 'avg',
                     'helpful'    => 'avg',
                     'correct'    => 'avg',
                     'depth'      => 'avg',
                     'comments'   => 'app',
                     'usage'      => 'cnt'
                     );

    # Unescaped keys end in ___<url>___<category>; build a pattern that
    # matches this resource literally and captures the category.
    my $regexp = $url;
    $regexp =~ s/(\W)/\\$1/g;
    $regexp = '___'.$regexp.'___([a-z]+)$';

    foreach my $esckey (keys %evaldata) {
        my $key = &unescape($esckey);
        if ($key =~ /$regexp/) {
            my $ctype = $1;
            $cnt{$ctype}++;
            unless ($listitems{$ctype} eq 'app') {
                # Numeric categories: keep a running total.
                if (defined($sum{$ctype})) {
                    $sum{$ctype} += $evaldata{$esckey};
                } else {
                    $sum{$ctype} = $evaldata{$esckey};
                }
            } else {
                # Text categories: concatenate the non-empty values.
                if (defined($sum{$ctype})) {
                    if ($evaldata{$esckey}) {
                        $sum{$ctype} .= '<hr>'.$evaldata{$esckey};
                    }
                } else {
                    $sum{$ctype} = ''.$evaldata{$esckey};
                }
            }
            # 'count' entries are collapsed into one record further down.
            if ($ctype ne 'count') {
                $newevaldata{$esckey} = $evaldata{$esckey};
            }
        }
    }

    foreach my $ctype (keys %cnt) {
        if ($listitems{$ctype} eq 'avg') {
            $returnhash{$ctype} =
                int(($sum{$ctype}/$cnt{$ctype})*100.0+0.5)/100.0;
        } elsif ($listitems{$ctype} eq 'cnt') {
            $returnhash{$ctype} = $cnt{$ctype};
        } else {
            $returnhash{$ctype} = $sum{$ctype};
        }
    }

    # Store the summed access count as a single new record.
    if ($returnhash{'count'}) {
        my $newkey = $$.'_'.time.'_searchcat___'.&escape($url).'___count';
        $newevaldata{$newkey} = $returnhash{'count'};
    }

    untie(%evaldata);
    untie(%newevaldata);
    return %returnhash;
}
|
|
|
# ----------------- Code to enable 'find' subroutine listing of the .meta files |
|
require "find.pl"; |
|
# Callback for find.pl's &find: appends "$dir/$_" to @metalist when the
# current entry ($_) is a plain file whose name ends in ".meta" and does not
# look like <name>.<digits>.<ext>.meta.
#
# The lstat result is stored in the same package variables as before and
# also primes the stat buffer that the "-f _" test reuses.
sub wanted {
    my $is_plain_file =
        (($dev,$ino,$mode,$nlink,$uid,$gid) = lstat($_)) && -f _;
    return $is_plain_file &&
           /^.*\.meta$/ &&
           !/^.+\.\d+\.[^\.]+\.meta$/ &&
           push(@metalist,"$dir/$_");
}
|
|
|
# --------------- Read loncapa_apache.conf and loncapa.conf and get variables |
|
my $perlvarref=LONCAPA::Configuration::read_conf('loncapa.conf'); |
my $perlvarref=LONCAPA::Configuration::read_conf('loncapa.conf'); |
my %perlvar=%{$perlvarref}; |
my %perlvar=%{$perlvarref}; |
undef $perlvarref; # remove since sensitive and not needed |
undef $perlvarref; |
delete $perlvar{'lonReceipt'}; # remove since sensitive and not needed |
delete $perlvar{'lonReceipt'}; # remove since sensitive (really?) & not needed |
|
# |
# ------------------------------------- Only run if machine is a library server |
# Only run if machine is a library server |
exit unless $perlvar{'lonRole'} eq 'library'; |
exit if ($perlvar{'lonRole'} ne 'library'); |
|
# |
# ----------------------------- Make sure this process is running from user=www |
# Make sure this process is running from user=www |
|
|
my $wwwid=getpwnam('www'); |
my $wwwid=getpwnam('www'); |
if ($wwwid!=$<) { |
if ($wwwid!=$<) { |
$emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}"; |
my $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}"; |
$subj="LON: $perlvar{'lonHostID'} User ID mismatch"; |
my $subj="LON: $perlvar{'lonHostID'} User ID mismatch"; |
system("echo 'User ID mismatch. searchcat.pl must be run as user www.' |\ |
system("echo 'User ID mismatch. searchcat.pl must be run as user www.' |\ |
mailto $emailto -s '$subj' > /dev/null"); |
mailto $emailto -s '$subj' > /dev/null"); |
exit 1; |
exit 1; |
} |
} |
|
# |
|
# Let people know we are running |
# ---------------------------------------------------------- We are in business |
|
|
|
open(LOG,'>'.$perlvar{'lonDaemons'}.'/logs/searchcat.log'); |
open(LOG,'>'.$perlvar{'lonDaemons'}.'/logs/searchcat.log'); |
print LOG '==== Searchcat Run '.localtime()."====\n\n"; |
print LOG '==== Searchcat Run '.localtime()."====\n"; |
$simplestatus='time='.time.'&'; |
# |
|
# Connect to database |
my $dbh; |
my $dbh; |
# ------------------------------------- Make sure that database can be accessed |
if (! ($dbh = DBI->connect("DBI:mysql:loncapa","www",$perlvar{'lonSqlAccess'}, |
{ |
{ RaiseError =>0,PrintError=>0}))) { |
unless ( |
print LOG "Cannot connect to database!\n"; |
$dbh = DBI->connect("DBI:mysql:loncapa","www",$perlvar{'lonSqlAccess'},{ RaiseError =>0,PrintError=>0}) |
die "MySQL Error: Cannot connect to database!\n"; |
) { |
} |
print LOG "Cannot connect to database!\n"; |
# This can return an error and still be okay, so we do not bother checking. |
$simplestatus.='mysql=defunct'; |
# (perhaps it should be more robust and check for specific errors) |
&writesimple(); |
$dbh->do('DROP TABLE IF EXISTS '.$newname); |
exit; |
# |
} |
# Create the new table |
|
my $request = &LONCAPA::lonmetadata::create_metadata_storage($newname); |
my $make_metadata_table = "CREATE TABLE IF NOT EXISTS metadata (". |
$dbh->do($request); |
"title TEXT, author TEXT, subject TEXT, url TEXT, keywords TEXT, ". |
if ($dbh->err) { |
"version TEXT, notes TEXT, abstract TEXT, mime TEXT, language TEXT, ". |
$dbh->disconnect(); |
"creationdate DATETIME, lastrevisiondate DATETIME, owner TEXT, ". |
print LOG "\nMySQL Error Create: ".$dbh->errstr."\n"; |
"copyright TEXT, FULLTEXT idx_title (title), ". |
die $dbh->errstr; |
"FULLTEXT idx_author (author), FULLTEXT idx_subject (subject), ". |
|
"FULLTEXT idx_url (url), FULLTEXT idx_keywords (keywords), ". |
|
"FULLTEXT idx_version (version), FULLTEXT idx_notes (notes), ". |
|
"FULLTEXT idx_abstract (abstract), FULLTEXT idx_mime (mime), ". |
|
"FULLTEXT idx_language (language), FULLTEXT idx_owner (owner), ". |
|
"FULLTEXT idx_copyright (copyright)) TYPE=MYISAM"; |
|
# It would sure be nice to have some logging mechanism. |
|
$dbh->do($make_metadata_table); |
|
} |
} |
|
# |
# ------------------------------------------------------------- get .meta files |
# find out which users we need to examine |
opendir(RESOURCES,"$perlvar{'lonDocRoot'}/res/$perlvar{'lonDefDomain'}"); |
opendir(RESOURCES,"$perlvar{'lonDocRoot'}/res/$perlvar{'lonDefDomain'}"); |
my @homeusers = grep { |
my @homeusers = |
&ishome("$perlvar{'lonDocRoot'}/res/$perlvar{'lonDefDomain'}/$_") |
grep { |
} grep {!/^\.\.?$/} readdir(RESOURCES); |
&ishome("$perlvar{'lonDocRoot'}/res/$perlvar{'lonDefDomain'}/$_"); |
|
} grep { |
|
!/^\.\.?$/; |
|
} readdir(RESOURCES); |
closedir RESOURCES; |
closedir RESOURCES; |
|
|
# |
# |
# Create the statement handlers we need |
# Loop through the users |
my $delete_sth = $dbh->prepare |
|
("DELETE FROM metadata WHERE url LIKE BINARY ?"); |
|
|
|
my $insert_sth = $dbh->prepare |
|
("INSERT INTO metadata VALUES (". |
|
"?,". # title |
|
"?,". # author |
|
"?,". # subject |
|
"?,". # m2??? |
|
"?,". # version |
|
"?,". # current |
|
"?,". # notes |
|
"?,". # abstract |
|
"?,". # mime |
|
"?,". # language |
|
"?,". # creationdate |
|
"?,". # revisiondate |
|
"?,". # owner |
|
"?)" # copyright |
|
); |
|
|
|
foreach my $user (@homeusers) { |
foreach my $user (@homeusers) { |
print LOG "\n=== User: ".$user."\n\n"; |
print LOG "=== User: ".$user."\n"; |
# Remove left-over db-files from potentially crashed searchcat run |
|
my $prodir=&propath($perlvar{'lonDefDomain'},$user); |
my $prodir=&propath($perlvar{'lonDefDomain'},$user); |
unlink($prodir.'/nohist_new_resevaldata.db'); |
# |
# Use find.pl |
# Use File::Find to get the files we need to read/modify |
undef @metalist; |
find( |
@metalist=(); |
{preprocess => \&only_meta_files, |
&find("$perlvar{'lonDocRoot'}/res/$perlvar{'lonDefDomain'}/$user"); |
# wanted => \&print_filename, |
# -- process each file to get metadata and put into search catalog SQL |
# wanted => \&log_metadata, |
# database. Also, check to see if already there. |
wanted => \&process_meta_file, |
# I could just delete (without searching first), but this works for now. |
}, |
foreach my $m (@metalist) { |
"$perlvar{'lonDocRoot'}/res/$perlvar{'lonDefDomain'}/$user"); |
print LOG "- ".$m."\n"; |
|
my $ref=&metadata($m); |
|
my $m2='/res/'.&declutter($m); |
|
$m2=~s/\.meta$//; |
|
&dynamicmeta($m2); |
|
&count($m2); |
|
$delete_sth->execute($m2); |
|
$insert_sth->execute($ref->{'title'}, |
|
$ref->{'author'}, |
|
$ref->{'subject'}, |
|
$m2, |
|
$ref->{'keywords'}, |
|
'current', |
|
$ref->{'notes'}, |
|
$ref->{'abstract'}, |
|
$ref->{'mime'}, |
|
$ref->{'language'}, |
|
sqltime($ref->{'creationdate'}), |
|
sqltime($ref->{'lastrevisiondate'}), |
|
$ref->{'owner'}, |
|
$ref->{'copyright'}); |
|
# if ($dbh->err()) { |
|
# print STDERR "Error:".$dbh->errstr()."\n"; |
|
# } |
|
$ref = undef; |
|
} |
|
|
|
# --------------------------------------------------- Clean up database |
|
# Need to, perhaps, remove stale SQL database records. |
|
# ... not yet implemented |
|
|
|
# ------------------------------------------- Copy over the new db-files |
|
# |
|
# Check the size of nohist_new_resevaldata.db compared to |
|
# nohist_resevaldata.db |
|
my @stat_result = stat($prodir.'/nohist_new_resevaldata.db'); |
|
my $new_size = $stat_result[7]; |
|
@stat_result = stat($prodir.'/nohist_resevaldata.db'); |
|
my $old_size = $stat_result[7]; |
|
if ($old_size) { |
|
if ($new_size/$old_size > 0.15 ) { |
|
system('mv '.$prodir.'/nohist_new_resevaldata.db '. |
|
$prodir.'/nohist_resevaldata.db'); |
|
} else { |
|
print LOG "Size of '$user' old nohist_reseval: $old_size ". |
|
"Size of new: $new_size. Not overwriting.\n"; |
|
my $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}"; |
|
my $subj="LON: $perlvar{'lonHostID'} searchcat.pl $user reseval ". |
|
"modification error."; |
|
system("echo ". |
|
"'See /home/httpd/perl/logs/searchcat.txt for information.' ". |
|
"| mailto $emailto -s '$subj' > /dev/null"); |
|
} |
|
} |
|
} |
} |
# --------------------------------------------------- Close database connection |
# |
$dbh->disconnect; |
# Rename the table |
print LOG "\n==== Searchcat completed ".localtime()." ====\n"; |
$dbh->do('DROP TABLE IF EXISTS '.$oldname); |
|
if (! $dbh->do('RENAME TABLE '.$newname.' TO '.$oldname)) { |
|
print LOG "MySQL Error Rename: ".$dbh->errstr."\n"; |
|
die $dbh->errstr; |
|
} |
|
if (! $dbh->disconnect) { |
|
print LOG "MySQL Error Disconnect: ".$dbh->errstr."\n"; |
|
die $dbh->errstr; |
|
} |
|
## |
|
## Finished! |
|
print LOG "==== Searchcat completed ".localtime()." ====\n"; |
close(LOG); |
close(LOG); |
&writesimple(); |
|
&writecount(); |
&write_type_count(); |
|
&write_copyright_count(); |
|
|
exit 0; |
exit 0; |
|
|
|
######################################################## |
|
######################################################## |
|
### ### |
|
### File::Find support routines ### |
|
### ### |
|
######################################################## |
|
######################################################## |
|
## |
|
## &only_meta_files |
|
## |
|
## Called by File::Find. |
|
## Takes a list of files/directories in and returns a list of files/directories |
|
## to search. |
|
# Filter a directory listing down to the entries worth visiting.
#
# Parameters: a list of file/directory names.
# Returns:    the entries, in their original order, that are either
#               - a name ending in ".meta" that does not match the
#                 <name>.<digits>.<ext>.meta pattern of a prior version, or
#               - a directory (tested with -d on the name as given).
sub only_meta_files {
    return grep {
        (/\.meta$/ && !/\.\d+\.[^\.]+\.meta$/) || (-d $_)
    } @_;
}
|
|
|
## |
|
## |
|
## Debugging routines, use these for 'wanted' in the File::Find call |
|
## |
|
# Debugging 'wanted' callback: logs the full path of the current entry to
# LOG, labelled as a directory or a file.  $_ is saved on entry and written
# back before returning.
sub print_filename {
    my $entry = $_;
    my $label = (-d $entry) ? " Got directory " : " Got file ";
    print LOG $label.$File::Find::name."\n";
    $_ = $entry;
}
|
|
|
# Debugging 'wanted' callback: logs every key/value pair that &metadata
# returns for the current file and feeds its copyright value to
# &count_copyright.
#
# Directories are skipped.  When &metadata returns undef, " No data" is
# logged and nothing else happens.  $_ is written back only on the normal
# path, exactly as before.
sub log_metadata {
    my $entry = $_;
    my $path  = $File::Find::name;
    if (-d $path) {
        return;     # No need to do anything here for directories
    }
    print LOG $path."\n";
    my $meta = &metadata($path);
    unless (defined($meta)) {
        print LOG " No data\n";
        return;
    }
    foreach my $field (keys %$meta) {
        print LOG " ".$field." => ".$meta->{$field}."\n";
    }
    &count_copyright($meta->{'copyright'});
    $_ = $entry;
}
|
|
# ============================================================================= |
|
|
|
# ---------------------------------------------------------------- Get metadata |
## |
# significantly altered from subroutine present in lonnet |
## process_meta_file |
|
## Called by File::Find. |
|
## Only input is the filename in $_. |
|
## Called by File::Find.
## Only input is the filename in $_ (full path in $File::Find::name).
##
## Reads the metadata of one .meta file and stores it in the $newname table
## through &LONCAPA::lonmetadata::store_metadata.  Resources marked obsolete
## or carrying the copyright 'private' are logged and skipped; every
## non-obsolete resource is still passed to &count_copyright.
##
## Dies if the store reports an error or inserts fewer than one row.
##
## A file whose metadata cannot be read (&metadata returns undef) is now
## logged and skipped, as log_metadata already does.  Previously the undef
## was dereferenced, which autovivified an empty hash and inserted a record
## containing nothing but the url and version.
sub process_meta_file {
    my ($file) = $_;
    my $filename = $File::Find::name;
    return if (-d $filename); # No need to do anything here for directories
    #
    print LOG $filename."\n";
    #
    my $ref = &metadata($filename);
    if (! defined($ref)) {
        print LOG " No data\n";
        return;
    }
    #
    # $url is the original file url, not the metadata file
    my $url = '/res/'.&declutter($filename);
    $url =~ s/\.meta$//;
    print LOG " ".$url."\n";
    #
    # Ignore some files based on their metadata
    if ($ref->{'obsolete'}) {
        print LOG "obsolete\n";
        return;
    }
    &count_copyright($ref->{'copyright'});
    if ($ref->{'copyright'} eq 'private') {
        print LOG "private\n";
        return;
    }
    #
    # Find the dynamic metadata
    my %dyn;
    if ($url =~ m:/default$:) {
        # A "default" entry is stored under its directory url instead.
        $url =~ s:/default$:/:;
    } else {
        # %dyn=&dynamicmeta($url);
        &count_type($url);
    }
    #
    $ref->{'creationdate'}     = &sqltime($ref->{'creationdate'});
    $ref->{'lastrevisiondate'} = &sqltime($ref->{'lastrevisiondate'});
    # Later entries win: url and version always override the file's values.
    my %Data = (
                %$ref,
                %dyn,
                'url'=>$url,
                'version'=>'current');
    my ($count,$err) = &LONCAPA::lonmetadata::store_metadata($dbh,$newname,
                                                             \%Data);
    if ($err) {
        print LOG "\nMySQL Error Insert: ".$err."\n";
        die $err;
    }
    if ($count < 1) {
        print LOG "Unable to insert record into MySQL database for $url\n";
        die "Unable to insert record into MySQl database for $url";
    } else {
        print LOG "Count = ".$count."\n";
    }
    #
    # Reset $_ before leaving
    $_ = $file;
}
|
|
|
######################################################## |
|
######################################################## |
|
### ### |
|
### &metadata($uri) ### |
|
### Retrieve metadata for the given file ### |
|
### ### |
|
######################################################## |
|
######################################################## |
sub metadata { |
sub metadata { |
my ($uri,$what)=@_; |
my ($uri)=@_; |
my %metacache; |
my %metacache=(); |
$uri=&declutter($uri); |
$uri=&declutter($uri); |
my $filename=$uri; |
my $filename=$uri; |
$uri=~s/\.meta$//; |
$uri=~s/\.meta$//; |
$uri=''; |
$uri=''; |
unless ($metacache{$uri.'keys'}) { |
if ($filename !~ /\.meta$/) { |
unless ($filename=~/\.meta$/) { $filename.='.meta'; } |
$filename.='.meta'; |
my $metastring=&getfile($perlvar{'lonDocRoot'}.'/res/'.$filename); |
} |
my $parser=HTML::TokeParser->new(\$metastring); |
my $metastring=&getfile($perlvar{'lonDocRoot'}.'/res/'.$filename); |
my $token; |
return undef if (! defined($metastring)); |
while ($token=$parser->get_token) { |
my $parser=HTML::TokeParser->new(\$metastring); |
if ($token->[0] eq 'S') { |
my $token; |
my $entry=$token->[1]; |
while ($token=$parser->get_token) { |
my $unikey=$entry; |
if ($token->[0] eq 'S') { |
if (defined($token->[2]->{'part'})) { |
my $entry=$token->[1]; |
$unikey.='_'.$token->[2]->{'part'}; |
my $unikey=$entry; |
} |
if (defined($token->[2]->{'part'})) { |
if (defined($token->[2]->{'name'})) { |
$unikey.='_'.$token->[2]->{'part'}; |
$unikey.='_'.$token->[2]->{'name'}; |
} |
} |
if (defined($token->[2]->{'name'})) { |
if ($metacache{$uri.'keys'}) { |
$unikey.='_'.$token->[2]->{'name'}; |
$metacache{$uri.'keys'}.=','.$unikey; |
} |
|
if ($metacache{$uri.'keys'}) { |
|
$metacache{$uri.'keys'}.=','.$unikey; |
|
} else { |
|
$metacache{$uri.'keys'}=$unikey; |
|
} |
|
foreach ( @{$token->[3]}) { |
|
$metacache{$uri.''.$unikey.'.'.$_}=$token->[2]->{$_}; |
|
} |
|
if (! ($metacache{$uri.''.$unikey}=$parser->get_text('/'.$entry))){ |
|
$metacache{$uri.''.$unikey} = |
|
$metacache{$uri.''.$unikey.'.default'}; |
|
} |
|
} # End of ($token->[0] eq 'S') |
|
} |
|
return \%metacache; |
|
} |
|
|
|
## |
|
## &getfile($filename) |
|
## Slurps up an entire file into a scalar. |
|
## Returns undef if the file does not exist |
|
## Slurps up an entire file into a scalar.
##
## Parameter: $file - path of the file to read.
## Returns:   the file contents ('' for an empty file), or undef if the file
##            does not exist or cannot be opened.
##
## The file is read in one piece with $/ localized rather than with
## "while (<$fh>)", which overwrote the caller's $_.  This routine is
## reached from File::Find callbacks, where $_ holds the current filename.
sub getfile {
    my $file = shift();
    if (! -e $file) {
        return undef;
    }
    # Explicit read mode: the name is opened literally, never parsed for
    # mode characters.
    my $fh = IO::File->new($file, 'r');
    if (! defined($fh)) {
        return undef;
    }
    local $/;                   # slurp mode, restored on return
    my $contents = <$fh>;
    $fh->close();
    return defined($contents) ? $contents : '';
}
|
|
|
######################################################## |
|
######################################################## |
|
### ### |
|
### Dynamic Metadata ### |
|
### ### |
|
######################################################## |
|
######################################################## |
|
sub dynamicmeta { |
|
my $url = &declutter(shift()); |
|
$url =~ s/\.meta$//; |
|
my %data = ('count' => 0, |
|
'course' => 0, |
|
'course_list' => '', |
|
'avetries' => 'NULL', |
|
'avetries_list' => '', |
|
'stdno' => 0, |
|
'stdno_list' => '', |
|
'usage' => 0, |
|
'usage_list' => '', |
|
'goto' => 0, |
|
'goto_list' => '', |
|
'comefrom' => 0, |
|
'comefrom_list' => '', |
|
'difficulty' => 'NULL', |
|
'difficulty_list' => '', |
|
'sequsage' => '0', |
|
'sequsage_list' => '', |
|
'clear' => 'NULL', |
|
'technical' => 'NULL', |
|
'correct' => 'NULL', |
|
'helpful' => 'NULL', |
|
'depth' => 'NULL', |
|
'comments' => '', |
|
); |
|
my ($dom,$auth)=($url=~/^(\w+)\/(\w+)\//); |
|
my $prodir=&propath($dom,$auth); |
|
# |
|
# Get metadata except counts |
|
my %evaldata; |
|
if (! tie(%evaldata,'GDBM_File', |
|
$prodir.'/nohist_resevaldata.db',&GDBM_READER(),0640)) { |
|
return (undef); |
|
} |
|
my %sum=(); |
|
my %count=(); |
|
my %concat=(); |
|
my %listitems=( |
|
'course' => 'add', |
|
'goto' => 'add', |
|
'comefrom' => 'add', |
|
'avetries' => 'average', |
|
'stdno' => 'add', |
|
'difficulty' => 'average', |
|
'clear' => 'average', |
|
'technical' => 'average', |
|
'helpful' => 'average', |
|
'correct' => 'average', |
|
'depth' => 'average', |
|
'comments' => 'append', |
|
'usage' => 'count' |
|
); |
|
# |
|
my $regexp=$url; |
|
$regexp=~s/(\W)/\\$1/g; |
|
$regexp='___'.$regexp.'___([a-z]+)$'; |
|
while (my ($esckey,$value)=each %evaldata) { |
|
my $key=&unescape($esckey); |
|
if ($key=~/$regexp/) { |
|
my ($item,$purl,$cat)=split(/___/,$key); |
|
$count{$cat}++; |
|
if ($listitems{$cat} ne 'append') { |
|
if (defined($sum{$cat})) { |
|
$sum{$cat}+=&unescape($value); |
|
$concat{$cat}.=','.$item; |
} else { |
} else { |
$metacache{$uri.'keys'}=$unikey; |
$sum{$cat}=&unescape($value); |
|
$concat{$cat}=$item; |
} |
} |
map { |
} else { |
$metacache{$uri.''.$unikey.'.'.$_}=$token->[2]->{$_}; |
if (defined($sum{$cat})) { |
} @{$token->[3]}; |
if ($evaldata{$esckey}=~/\w/) { |
unless ( |
$sum{$cat}.='<hr />'.&unescape($evaldata{$esckey}); |
$metacache{$uri.''.$unikey}=$parser->get_text('/'.$entry) |
} |
) { $metacache{$uri.''.$unikey}= |
} else { |
$metacache{$uri.''.$unikey.'.default'}; |
$sum{$cat}=''.&unescape($evaldata{$esckey}); |
} |
} |
} |
} |
} |
} |
} |
} |
return \%metacache; |
untie(%evaldata); |
|
# transfer gathered data to returnhash, calculate averages where applicable |
|
my %returnhash; |
|
while (my $cat=each(%count)) { |
|
if ($count{$cat} eq 'nan') { next; } |
|
if ($sum{$cat} eq 'nan') { next; } |
|
if ($listitems{$cat} eq 'average') { |
|
if ($count{$cat}) { |
|
$returnhash{$cat}=int(($sum{$cat}/$count{$cat})*100.0+0.5)/100.0; |
|
} else { |
|
$returnhash{$cat}='NULL'; |
|
} |
|
} elsif ($listitems{$cat} eq 'count') { |
|
$returnhash{$cat}=$count{$cat}; |
|
} else { |
|
$returnhash{$cat}=$sum{$cat}; |
|
} |
|
$returnhash{$cat.'_list'}=$concat{$cat}; |
|
} |
|
# |
|
# get count |
|
if (tie(my %evaldata,'GDBM_File', |
|
$prodir.'/nohist_accesscount.db',&GDBM_READER(),0640)) { |
|
my $escurl=&escape($url); |
|
if (! exists($evaldata{$escurl})) { |
|
$returnhash{'count'}=0; |
|
} else { |
|
$returnhash{'count'}=$evaldata{$escurl}; |
|
} |
|
untie %evaldata; |
|
} |
|
return %returnhash; |
} |
} |
|
|
# ------------------------------------------------------------ Serves up a file |
######################################################## |
# returns either the contents of the file or a -1 |
######################################################## |
sub getfile { |
### ### |
|
### Counts ### |
|
### ### |
|
######################################################## |
|
######################################################## |
|
{ |
|
|
|
my %countext; |
|
|
|
sub count_type { |
my $file=shift; |
my $file=shift; |
if (! -e $file ) { return -1; }; |
$file=~/\.(\w+)$/; |
my $fh=IO::File->new($file); |
my $ext=lc($1); |
my $a=''; |
$countext{$ext}++; |
while (<$fh>) { $a .=$_; } |
|
return $a; |
|
} |
} |
|
|
# ------------------------------------------------------------- Declutters URLs |
sub write_type_count { |
sub declutter { |
open(RESCOUNT,'>/home/httpd/html/lon-status/rescount.txt'); |
my $thisfn=shift; |
while (my ($extension,$count) = each(%countext)) { |
$thisfn=~s/^$perlvar{'lonDocRoot'}//; |
print RESCOUNT $extension.'='.$count.'&'; |
$thisfn=~s/^\///; |
} |
$thisfn=~s/^res\///; |
print RESCOUNT 'time='.time."\n"; |
return $thisfn; |
close(RESCOUNT); |
} |
} |
|
|
# --------------------------------------- Is this the home server of an author? |
} # end of scope for %countext |
# (copied from lond, modification of the return value) |
|
|
{

# Tally of resources per copyright value, private to the two subs below.
my %copyrights;

# Record one resource under its copyright value.
#
# Parameter: the copyright string.  An undefined value is tallied under the
# empty-string key, which is where it ended up before, but without the
# uninitialized-value warning.  The argument is read as the scalar $_[0]
# instead of the one-element slice @_[0].
sub count_copyright {
    my $copyright = defined($_[0]) ? $_[0] : '';
    $copyrights{$copyright}++;
}

# Write the tally to the lon-status directory as "copyright=count&" pairs,
# followed by "time=<epoch seconds>" and a newline.
#
# Best-effort: a failed open is reported with a warning instead of silently
# printing to a closed handle.
sub write_copyright_count {
    my $countfile = '/home/httpd/html/lon-status/copyrightcount.txt';
    my $fh;
    unless (open($fh, '>', $countfile)) {
        warn "Cannot write $countfile: $!\n";
        return;
    }
    while (my ($copyright,$count) = each(%copyrights)) {
        print {$fh} $copyright.'='.$count.'&';
    }
    print {$fh} 'time='.time."\n";
    close($fh);
}

} # end of scope for %copyrights
|
|
|
######################################################## |
|
######################################################## |
|
### ### |
|
### Miscellaneous Utility Routines ###
|
### ### |
|
######################################################## |
|
######################################################## |
|
## |
|
## &ishome($username) |
|
## Returns 1 if $username is a LON-CAPA author, 0 otherwise |
|
## (copied from lond, modification of the return value) |
sub ishome { |
sub ishome { |
my $author=shift; |
my $author=shift; |
$author=~s/\/home\/httpd\/html\/res\/([^\/]*)\/([^\/]*).*/$1\/$2/; |
$author=~s/\/home\/httpd\/html\/res\/([^\/]*)\/([^\/]*).*/$1\/$2/; |
Line 449 sub ishome {
|
Line 553 sub ishome {
|
} |
} |
} |
} |
|
|
# -------------------------------------------- Return path to profile directory |
## |
# (copied from lond) |
## &propath($udom,$uname) |
|
## Returns the path to the users LON-CAPA directory |
|
## (copied from lond) |
sub propath { |
sub propath { |
my ($udom,$uname)=@_; |
my ($udom,$uname)=@_; |
$udom=~s/\W//g; |
$udom=~s/\W//g; |
Line 461 sub propath {
|
Line 567 sub propath {
|
return $proname; |
return $proname; |
} |
} |
|
|
# ---------------------------- convert 'time' format into a datetime sql format |
## |
|
## &sqltime($timestamp) |
|
## |
|
## Convert perl $timestamp to MySQL time. MySQL expects YYYY-MM-DD HH:MM:SS |
|
## |
sub sqltime { |
sub sqltime { |
my ($sec,$min,$hour,$mday,$mon,$year,$wday,$yday,$isdst) = |
my ($time) = @_; |
localtime(&unsqltime(@_[0])); |
my $mysqltime; |
$mon++; $year+=1900; |
if ($time =~ |
return "$year-$mon-$mday $hour:$min:$sec"; |
/(\d+)-(\d+)-(\d+) # YYYY-MM-DD |
|
\s # a space |
|
(\d+):(\d+):(\d+) # HH:MM::SS |
|
/x ) { |
|
# Some of the .meta files have the time in mysql |
|
# format already, so just make sure they are 0 padded and |
|
# pass them back. |
|
$mysqltime = sprintf('%04d-%02d-%02d %02d:%02d:%02d', |
|
$1,$2,$3,$4,$5,$6); |
|
} elsif ($time =~ /^\d+$/) { |
|
my @TimeData = gmtime($time); |
|
# Alter the month to be 1-12 instead of 0-11 |
|
$TimeData[4]++; |
|
# Alter the year to be from 0 instead of from 1900 |
|
$TimeData[5]+=1900; |
|
$mysqltime = sprintf('%04d-%02d-%02d %02d:%02d:%02d', |
|
@TimeData[5,4,3,2,1,0]); |
|
} else { |
|
print LOG " Unable to decode time ".$time."\n"; |
|
$mysqltime = 0; |
|
} |
|
return $mysqltime; |
} |
} |
|
|
sub maketime { |
## |
my %th=@_; |
## &declutter($filename) |
return POSIX::mktime(($th{'seconds'},$th{'minutes'},$th{'hours'}, |
## Given a filename, returns a url for the filename. |
$th{'day'},$th{'month'}-1, |
sub declutter { |
$th{'year'}-1900,0,0,$th{'dlsav'})); |
my $thisfn=shift; |
|
$thisfn=~s/^$perlvar{'lonDocRoot'}//; |
|
$thisfn=~s/^\///; |
|
$thisfn=~s/^res\///; |
|
return $thisfn; |
} |
} |
|
|
|
## |
######################################### |
## Escape / Unescape special characters |
# |
sub unescape { |
# Retro-fixing of un-backward-compatible time format |
my $str=shift; |
|
$str =~ s/%([a-fA-F0-9][a-fA-F0-9])/pack("C",hex($1))/eg; |
sub unsqltime { |
return $str; |
my $timestamp=shift; |
|
if ($timestamp=~/^(\d+)\-(\d+)\-(\d+)\s+(\d+)\:(\d+)\:(\d+)$/) { |
|
$timestamp=&maketime('year'=>$1,'month'=>$2,'day'=>$3, |
|
'hours'=>$4,'minutes'=>$5,'seconds'=>$6); |
|
} |
|
return $timestamp; |
|
} |
} |
|
|
|
# Encode a string so it can be used as a database key: each non-word
# character (anything outside [A-Za-z0-9_]) is replaced by '%' plus two
# lower-case hex digits.
#
# Parameter: the plain string.
# Returns:   the escaped copy (the argument itself is not modified).
sub escape {
    (my $escaped = shift) =~ s/(\W)/"%".unpack('H2',$1)/eg;
    return $escaped;
}