';
- if($cache{'DisplayLegend'} eq 'Show Legend') {
- $Ptr .= &ProblemStatisticsLegend();
+###############################################
+###############################################
+# BuildProblemStatisticsPage($r,$c)
+#
+# Top-level driver for the problem statistics page.  In order, it:
+#   * saves and then restores the listed form parameters as course
+#     settings under the 'statistics' key,
+#   * prepares the class list and empties the package-level @StatsArray,
+#   * prints the interface returned by &CreateInterface(),
+#   * returns early with a prompt when 'form.statsfirstcall' is absent,
+#   * gathers student data when this is the first call or a cache
+#     update/clear was requested,
+#   * dispatches to Excel output, per-sequence HTML output, or the
+#     sorted HTML table (optionally preceded by a plot).
+#
+# Inputs: $r - request object used for all output.
+#         $c - NOTE(review): not referenced by any added or context line
+#              visible here (only by removed lines); confirm whether the
+#              parameter is still needed.
+# Returns: nothing.
+sub BuildProblemStatisticsPage {
+ my ($r,$c)=@_;
+ #
+ my %Saveable_Parameters = ('Status' => 'scalar',
+ 'statsoutputmode' => 'scalar',
+ 'Section' => 'array',
+ 'StudentData' => 'array',
+ 'Maps' => 'array');
+ &Apache::loncommon::store_course_settings('statistics',
+ \%Saveable_Parameters);
+ &Apache::loncommon::restore_course_settings('statistics',
+ \%Saveable_Parameters);
+ #
+ &Apache::lonstatistics::PrepareClasslist();
+ #
+ # Clear the package variables
+ undef(@StatsArray);
+ #
+ # Finally let the user know we are here
+ my $interface = &CreateInterface();
+ $r->print($interface);
+ $r->print('');
+ #
+ # No 'form.statsfirstcall' means the form has not been submitted yet:
+ # show the prompt and stop before doing any expensive work.
+ if (! exists($ENV{'form.statsfirstcall'})) {
+ $r->print('');
+ $r->print('
'.
+ &mt('Press "Generate Statistics" when you are ready.').
+ '
'.
+ &mt('It may take some time to update the student data '.
+ 'for the first analysis. Future analysis this session '.
+ ' will not have this delay.').
+ '
');
+ return;
+ } elsif ($ENV{'form.statsfirstcall'} eq 'yes' ||
+ exists($ENV{'form.UpdateCache'}) ||
+ exists($ENV{'form.ClearCache'}) ) {
+ # First real call, or an explicit cache update/clear request:
+ # (re)gather the student data.
+ $r->print('');
+ &Apache::lonstatistics::Gather_Student_Data($r);
+ } else {
+ $r->print('');
}
- $r->print($Ptr);
$r->rflush();
-
- my @Header = ("Homework Sets Order","#Stdnts","Tries","Mod",
- "Mean","#YES","#yes","%Wrng","DoDiff",
- "S.D.","Skew.","D.F.1st","D.F.2nd","Disc.");
- my $color=&setbgcolor(0);
-
-# my %Discuss=&Apache::loncoursedata::LoadDiscussion($courseID);
-# my ($upper, $lower) = &Discriminant(\%discriminant,$r);
- if(!defined($cache{'StatisticsCached'})) {
- untie(%cache);
- &Apache::loncoursedata::DownloadStudentCourseDataSeparate($students,
- 'true',
- $cacheDB,
- 'true',
- 'true',
- $courseID,
- $r, $c);
- if($c->aborted()) { return; }
-
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
- $r->print('Unable to tie database.');
- return;
- }
- my ($problemData) = &ExtractStudentData(\%cache, $students);
- &CalculateStatistics($problemData);
- untie(%cache);
-
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) {
- $r->print('Unable to tie database.');
- return;
- }
- foreach(keys(%$problemData)) {
- $cache{$_} = $problemData->{$_};
- }
- $cache{'StatisticsCached'} = 'true';
- untie(%cache);
-
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
- $r->print('Unable to tie database.');
- return;
- }
- }
- my $orderedProblems = &SortProblems(\%cache,
- $cache{'ProblemStatisticsSort'},
- $cache{'ProblemStatisticsAscend'});
- &BuildStatisticsTable(\%cache, $cache{'DisplayFormat'}, $orderedProblems,
- \@Header, $r, $color);
- untie(%cache);
-
+ #
+ # This probably does not need to be done each time we are called, but
+ # it does not slow things down noticeably.
+ &Apache::loncoursedata::populate_weight_table();
+ if (exists($ENV{'form.Excel'})) {
+ &Excel_output($r);
+ } else {
+ # An absent or blank sort key falls back to 'container' order.
+ my $sortby = $ENV{'form.sortby'};
+ $sortby = 'container' if (! defined($sortby) || $sortby =~ /^\s*$/);
+ my $plot = $ENV{'form.plot'};
+ # NOTE(review): $plot may be undefined at this point; this log line
+ # looks like leftover debugging output.
+ &Apache::lonnet::logthis('form.plot = '.$plot);
+ if ($sortby eq 'container' && ! defined($plot)) {
+ &output_html_by_sequence($r);
+ } else {
+ # A requested plot is printed first, then the statistics table.
+ if (defined($plot)) {
+ &Apache::lonnet::logthis('calling plot routine');
+ &make_plot($r,$plot);
+ }
+ &output_html_stats($r);
+ }
+ }
return;
}
+##########################################################
+##########################################################
+##
+## HTML output routines
+##
+##########################################################
+##########################################################
+sub output_html_by_sequence {
+ my ($r) = @_;
+ my $c = $r->connection();
+ $r->print(&html_preamble());
+ #
+ foreach my $seq (&Apache::lonstatistics::Sequences_with_Assess()) {
+ last if ($c->aborted);
+ next if ($seq->{'num_assess'} < 1);
+ $r->print("
".$seq->{'title'}."
".
+ '
'."\n".
+ '
'."\n".
+ '
'.
+ &statistics_table_header('no container')."
\n");
+ my @Data = &compute_statistics_on_sequence($seq);
+ foreach my $data (@Data) {
+ $r->print('
\n";
+ my ($starttime,$endtime) = &Apache::lonstathelpers::get_time_limits();
+ if (defined($starttime) || defined($endtime)) {
+ # Inform the user what the time limits on the data are.
+ $Str .= '
'.&mt('Statistics on submissions from [_1] to [_2]',
+ &Apache::lonlocal::locallocaltime($starttime),
+ &Apache::lonlocal::locallocaltime($endtime)
+ ).'
';
}
- $Str .= "\n".'
'."\n";
-
+ $Str .= "
".&mt('Compiled on [_1]',
+ &Apache::lonlocal::locallocaltime(time))."
";
return $Str;
}
-sub BuildStatisticsTable {
- my ($cache,$displayFormat,$orderedProblems,$headings,$r,$color)=@_;
-#6666666
-# my $file="/home/httpd/perl/tmp/183d.txt";
-# open(OUT, ">$file");
-#6666666
-## &Apache::lonstatistics::Create_PrgWin($r);
-##777777
-## my (%Activity) = &LoadActivityLog();
-## $r->print('');
-## my ($doDiffFile) = &LoadDoDiffFile();
-
-##777777
-## $Str .= &Classify($discriminantFactor, $students);
-
- if($displayFormat ne 'Display CSV Format') {
- $r->print('
'."\n");
- $r->print('
'."\n");
- $r->print(&CreateProblemStatisticsTableHeading($headings, $r));
- } else {
- $r->print(' ');
+###############################################
+###############################################
+##
+## Misc HTML output routines
+##
+###############################################
+###############################################
+sub statistics_html_table_data {
+ my ($data,$options) = @_;
+ my $row = '';
+ foreach my $field (@Fields) {
+ next if ($options =~ /no $field->{'name'}/);
+ $row .= '
';
+ #
+ my $discdata .= ''.join(',',@Labels).''.$/.
+ ''.join(',',@Disc).''.$/;
+ #
+ my $diffdata .= ''.join(',',@Labels).''.$/.
+ ''.join(',',@Diff).''.$/;
+ #
+ $plot=<<"END";
+
+
+ Degree of Discrmination and Degree of Difficulty
+
+ Problem Number
+
+ $discdata
+
+
+ $diffdata
+
+
+END
+ my $plotresult =
+ '
'.&Apache::lonxml::xmlparse($r,'web',$plot).'
'.$/;
+ $r->print($plotresult);
+ return;
+}
- return $Ptr;
+# plot_dropdown()
+#
+# Builds and returns the string for the plot selection control.
+# Takes no arguments; reads the current selection from $ENV{'form.plot'}.
+#
+# NOTE(review): in the text visible here neither $current nor
+# @Additional_Plots is used after being set, and $Str contains only
+# newlines and an empty string.  The markup that consumed them appears
+# to have been stripped from this copy -- verify against the real file.
+sub plot_dropdown {
+ my $current = '';
+ #
+ # Remember which plot (if any) was requested with the form.
+ if (defined($ENV{'form.plot'})) {
+ $current = $ENV{'form.plot'};
+ }
+ #
+ # Plots offered in addition to the per-field ones.
+ my @Additional_Plots = (
+ { graphable=>'yes',
+ name => 'degrees',
+ title => 'DoDisc and DoDiff' });
+ #
+ my $Str= "\n".''."\n";
+ return $Str;
}
-sub ProblemStatisticsLegend {
- my $Ptr = '';
- $Ptr = '
';
- $Ptr .= '
';
- $Ptr .= '#Stdnts
';
- $Ptr .= '
Total number of students attempted the problem.';
- $Ptr .= '
';
- $Ptr .= 'Tries
';
- $Ptr .= '
Total number of tries for solving the problem.';
- $Ptr .= '
';
- $Ptr .= 'Mod
';
- $Ptr .= '
Largest number of tries for solving the problem by a student.';
- $Ptr .= '
';
- $Ptr .= 'Mean
';
- $Ptr .= '
Average number of tries. [ Tries / #Stdnts ]';
- $Ptr .= '
';
- $Ptr .= '#YES
';
- $Ptr .= '
Number of students solved the problem correctly.';
- $Ptr .= '
';
- $Ptr .= '#yes
';
- $Ptr .= '
Number of students solved the problem by override.';
- $Ptr .= '
';
- $Ptr .= '%Wrong
';
- $Ptr .= '
Percentage of students who tried to solve the problem ';
- $Ptr .= 'but is still incorrect. [ 100*((#Stdnts-(#YES+#yes))/#Stdnts) ]';
- $Ptr .= '
';
- $Ptr .= 'DoDiff
';
- $Ptr .= '
Degree of Difficulty of the problem. ';
- $Ptr .= '[ 1 - ((#YES+#yes) / Tries) ]';
- $Ptr .= '
';
- $Ptr .= 'S.D.
';
- $Ptr .= '
Standard Deviation of the tries. ';
- $Ptr .= '[ sqrt(sum((Xi - Mean)^2)) / (#Stdnts-1) ';
- $Ptr .= 'where Xi denotes every student\'s tries ]';
- $Ptr .= '
';
- $Ptr .= 'Skew.
';
- $Ptr .= '
Skewness of the students tries.';
- $Ptr .= '[(sqrt( sum((Xi - Mean)^3) / #Stdnts)) / (S.D.^3)]';
- $Ptr .= '
';
- $Ptr .= 'Dis.F.
';
- $Ptr .= '
Discrimination Factor: A Standard for evaluating the ';
- $Ptr .= 'problem according to a Criterion ';
- $Ptr .= '[Applied Criterion in %27 Upper Students - ';
- $Ptr .= 'Applied the same Criterion in %27 Lower Students] ';
- $Ptr .= '1st Criterion for Sorting the Students: ';
- $Ptr .= 'Sum of Partial Credit Awarded / Total Number of Tries ';
- $Ptr .= '2nd Criterion for Sorting the Students: ';
- $Ptr .= 'Total number of Correct Answers / Total Number of Tries';
- $Ptr .= '
';
- $Ptr .= '
Disc.
';
- $Ptr .= '
Number of Students had at least one discussion.';
- $Ptr .= '
';
-
- return $Ptr;
-}
-
-#------- Processing upperlist and lowerlist according to each problem
-
-sub ExtractStudentData {
- my ($cache, $students)=@_;
-
-#$Apache::lonxml::debug=1;
-#&Apache::lonhomework::showhash(%$cache);
-#$Apache::lonxml::debug=0;
-
- my @problemList=();
- my %problemData;
- foreach my $sequence (split(':', $cache->{'orderedSequences'})) {
- foreach my $problemID (split(':', $cache->{$sequence.':problems'})) {
- foreach my $part (split(/\:/,$cache->{$sequence.':'.
- $problemID.
- ':parts'})) {
- my $id = $sequence.':'.$problemID.':'.$part;
- push(@problemList, $id);
- my $totalTries = 0;
- my $totalAwarded = 0;
- my $correct = 0;
- my $correctByOverride = 0;
- my $studentCount = 0;
- my $maxTries = 0;
- my $totalFirst = 0;
- my @studentTries=();
- foreach(@$students) {
- my $code = $cache->{"$_:$problemID:$part:code"};
-
- if(defined($cache->{$_.':error'}) || $code eq ' ' ||
- $cache->{"$_:$problemID:NoVersion"} eq 'true') {
- next;
- }
+###############################################
+###############################################
+##
+## Excel output routines
+##
+###############################################
+###############################################
+# Excel_output($r)
+#
+# Computes the statistics for every sequence (unless @StatsArray is
+# already populated) and writes them to a new Excel workbook under
+# /home/httpd/prtspool/, then prints a pointer to the file.
+#
+# Sheet layout:
+#   row 0: course description, description of the selected sections,
+#          the time limits on the data (only when limits are set) and
+#          the compilation date;
+#   row 1: long column titles (blank where a field has none);
+#   row 2: brief column titles;
+#   row 3 onwards: one row per entry of @StatsArray.
+# The 'problem_num' field is never written.
+#
+# Inputs:  $r - request object used for output and error logging.
+# Returns: 0 if the workbook could not be created, nothing otherwise
+#          (including when the connection was aborted).
+sub Excel_output {
+    my ($r) = @_;
+    $r->print('
'.&mt('Preparing Excel Spreadsheet').'
');
+    ##
+    ## Compute the statistics
+    &compute_all_statistics($r);
+    my $c = $r->connection;
+    return if ($c->aborted());
+    ##
+    ## Create the excel workbook
+    my $filename = '/prtspool/'.
+        $ENV{'user.name'}.'_'.$ENV{'user.domain'}.'_'.
+        time.'_'.rand(1000000000).'.xls';
+    my ($starttime,$endtime) = &Apache::lonstathelpers::get_time_limits();
+    #
+    # Create sheet
+    my $excel_workbook = Spreadsheet::WriteExcel->new('/home/httpd'.$filename);
+    #
+    # Check for errors
+    if (! defined($excel_workbook)) {
+        $r->log_error("Error creating excel spreadsheet $filename: $!");
+        $r->print(&mt("Problems creating new Excel file.  ".
+                      "This error has been logged.  ".
+                      "Please alert your LON-CAPA administrator."));
+        return 0;
+    }
+    #
+    # The excel spreadsheet stores temporary data in files, then puts them
+    # together.  If needed we should be able to disable this (memory only).
+    # The temporary directory must be specified before calling 'addworksheet'.
+    $excel_workbook->set_tempdir($Apache::lonnet::tmpdir);
+    #
+    # Add a worksheet.  The name is cut to 31 characters before cleaning.
+    my $sheetname = $ENV{'course.'.$ENV{'request.course.id'}.'.description'};
+    if (length($sheetname) > 31) {
+        $sheetname = substr($sheetname,0,31);
+    }
+    my $excel_sheet = $excel_workbook->addworksheet(
+        &Apache::loncommon::clean_excel_name($sheetname));
+    ##
+    ## Begin creating excel sheet
+    ##
+    my ($rows_output,$cols_output) = (0,0);
+    #
+    # Put the course description in the header
+    $excel_sheet->write($rows_output,$cols_output++,
+                   $ENV{'course.'.$ENV{'request.course.id'}.'.description'});
+    $cols_output += 3;
+    #
+    # Put a description of the sections listed
+    my $sectionstring = '';
+    my @Sections = @Apache::lonstatistics::SelectedSections;
+    if (scalar(@Sections) > 1) {
+        if (scalar(@Sections) > 2) {
+            my $last = pop(@Sections);
+            $sectionstring = "Sections ".join(', ',@Sections).', and '.$last;
+        } else {
+            $sectionstring = "Sections ".join(' and ',@Sections);
+        }
+    } else {
+        if ($Sections[0] eq 'all') {
+            $sectionstring = "All sections";
+        } else {
+            $sectionstring = "Section ".$Sections[0];
+        }
+    }
+    $excel_sheet->write($rows_output,$cols_output++,$sectionstring);
+    $cols_output += scalar(@Sections);
+    #
+    # Time restrictions
+    my $time_string;
+    if (defined($starttime)) {
+        # call localtime but not lonlocal:locallocaltime because excel probably
+        # cannot handle localized text.  Probably.
+        # (Fixed: this used to format $time_string itself, not $starttime.)
+        $time_string = 'Data collected from '.localtime($starttime);
+        if (defined($endtime)) {
+            $time_string .= ' to '.localtime($endtime);
+        }
+        $time_string .= '.';
+    } elsif (defined($endtime)) {
+        # See note above about lonlocal:locallocaltime
+        $time_string = 'Data collected before '.localtime($endtime).'.';
+    }
+    if (defined($time_string)) {
+        # Fixed: the description of the time limits used to be built and
+        # then discarded.  Leave some empty cells after it so the long
+        # text is not hidden by the date cell that follows.
+        $excel_sheet->write($rows_output,$cols_output++,$time_string);
+        $cols_output += 5;
+    }
+    #
+    # Put the date in there too
+    $excel_sheet->write($rows_output,$cols_output++,
+                        'Compiled on '.localtime(time));
+    #
+    $rows_output++;
+    $cols_output=0;
+    #
+    # Long Headers
+    foreach my $field (@Fields) {
+        next if ($field->{'name'} eq 'problem_num');
+        if (exists($field->{'long_title'})) {
+            $excel_sheet->write($rows_output,$cols_output++,
+                                $field->{'long_title'});
+        } else {
+            $excel_sheet->write($rows_output,$cols_output++,'');
+        }
+    }
+    $rows_output++;
+    $cols_output=0;
+    # Brief headers
+    foreach my $field (@Fields) {
+        next if ($field->{'name'} eq 'problem_num');
+        # Use english for excel as I am not sure how well excel handles
+        # other character sets....
+        $excel_sheet->write($rows_output,$cols_output++,$field->{'title'});
+    }
+    $rows_output++;
+    # One row per computed statistics record
+    foreach my $data (@StatsArray) {
+        $cols_output=0;
+        foreach my $field (@Fields) {
+            next if ($field->{'name'} eq 'problem_num');
+            $excel_sheet->write($rows_output,$cols_output++,
+                                $data->{$field->{'name'}});
+        }
+        $rows_output++;
+    }
+    #
+    $excel_workbook->close();
+    #
+    # Tell the user where to get their excel file
+    # NOTE(review): $filename is not referenced in the strings below; the
+    # link markup appears to have been stripped from this copy -- verify.
+    $r->print(' '.
+              ''.
+              &mt('Your Excel Spreadsheet').''."\n");
+    $r->rflush();
+    return;
+}
- $studentCount++;
- my $tries = $cache->{"$_:$problemID:$part:tries"};
- if($maxTries < $tries) {
- $maxTries = $tries;
- }
- $totalTries += $tries;
- push(@studentTries, $tries);
+##################################################
+##################################################
+##
+## Statistics Gathering and Manipulation Routines
+##
+##################################################
+##################################################
+# compute_statistics_on_sequence($seq)
+#
+# Runs &get_statistics on every part of every 'assessment' resource in
+# $seq->{'contents'}.  Each result is appended to the package-level
+# @StatsArray (its 1-based position there is passed on as the problem
+# number) and also collected for the caller.
+#
+# Returns: the list of statistics records computed for this sequence.
+sub compute_statistics_on_sequence {
+    my ($seq) = @_;
+    my @sequence_stats;
+    foreach my $resource (@{$seq->{'contents'}}) {
+        if ($resource->{'type'} ne 'assessment') {
+            next;
+        }
+        foreach my $part_id (@{$resource->{'parts'}}) {
+            # The next free slot in @StatsArray is the problem number.
+            my $problem_num = scalar(@StatsArray)+1;
+            my $stats = &get_statistics($seq,$resource,$part_id,
+                                        $problem_num);
+            push(@sequence_stats,$stats);
+            push(@StatsArray,$stats);
+        }
+    }
+    return @sequence_stats;
+}
- my $awarded = $cache->{"$_:$problemID:$part:awarded"};
- $totalAwarded += $awarded;
+# compute_all_statistics($r)
+#
+# Fills @StatsArray by running &compute_statistics_on_sequence on every
+# sequence that has at least one assessment.  Does nothing when
+# @StatsArray already holds data, and stops early once the client
+# connection is reported as aborted.
+sub compute_all_statistics {
+    my ($r) = @_;
+    # A non-empty @StatsArray is taken to mean the work is already done.
+    return if (@StatsArray > 0);
+    my $connection = $r->connection;
+    foreach my $sequence (&Apache::lonstatistics::Sequences_with_Assess()) {
+        if ($connection->aborted) {
+            last;
+        }
+        if ($sequence->{'num_assess'} < 1) {
+            next;
+        }
+        &compute_statistics_on_sequence($sequence);
+    }
+}
- if($code eq '*') {
- $correct++;
- if($tries == 1) {
- $totalFirst++;
- }
- } elsif($code eq '+') {
- $correctByOverride++;
+# sort_data($sortkey)
+#
+# Sorts the package-level @StatsArray in place and renumbers the
+# 'problem_num' entry of every record from 1.
+#
+# $sortkey must match the 'name' of an entry in @Fields; anything else,
+# as well as '' and 'problem_num', means 'container', in which case the
+# existing order is kept and only the renumbering takes place.
+#   * 'title' and 'part' sort alphabetically, ignoring case, ascending.
+#   * every other field sorts numerically, descending, with 'nan'
+#     values placed last.
+# Ties are broken by title and then part, compared as case-insensitive
+# strings.
+#
+# Returns: nothing.
+sub sort_data {
+    my ($sortkey) = @_;
+    return if (! @StatsArray);
+    #
+    # Sort the data
+    my $sortby = undef;
+    foreach my $field (@Fields) {
+        if ($sortkey eq $field->{'name'}) {
+            $sortby = $field->{'name'};
+        }
+    }
+    if (! defined($sortby) || $sortby eq '' || $sortby eq 'problem_num') {
+        $sortby = 'container';
+    }
+    if ($sortby ne 'container') {
+        # $sortby is already defined, so we can charge ahead
+        if ($sortby =~ /^(title|part)$/i) {
+            # Alpha comparison
+            @StatsArray = sort {
+                lc($a->{$sortby}) cmp lc($b->{$sortby}) ||
+                lc($a->{'title'}) cmp lc($b->{'title'}) ||
+                lc($a->{'part'}) cmp lc($b->{'part'});
+            } @StatsArray;
+        } else {
+            # Numerical comparison
+            @StatsArray = sort {
+                my $retvalue = 0;
+                # 'nan' values always sort after real numbers
+                if ($b->{$sortby} eq 'nan') {
+                    if ($a->{$sortby} ne 'nan') {
+                        $retvalue = -1;
+                    } else {
+                        $retvalue = 0;
}
}
-
- $problemData{$id.':sequenceTitle'} =
- $cache->{$sequence.':title'};
- $problemData{$id.':studentCount'} = $studentCount;
- $problemData{$id.':totalTries'} = $totalTries;
- $problemData{$id.':studentTries'} = \@studentTries;
- $problemData{$id.':totalAwarded'} = $totalAwarded;
- $problemData{$id.':correct'} = $correct;
- $problemData{$id.':correctByOverride'} = $correctByOverride;
- $problemData{$id.':wrong'} = $studentCount -
- ($correct + $correctByOverride);
- $problemData{$id.':maxTries'} = $maxTries;
- $problemData{$id.':totalFirst'} = $totalFirst;
- }
+                if ($a->{$sortby} eq 'nan') {
+                    if ($b->{$sortby} ne 'nan') {
+                        $retvalue = 1;
+                    }
+                }
+                if ($retvalue == 0) {
+                    # Title and part are strings, so the tie-break must
+                    # use cmp; <=> compared them as numbers (usually 0
+                    # against 0) and never separated equal values.
+                    $retvalue = $b->{$sortby} <=> $a->{$sortby} ||
+                        lc($a->{'title'}) cmp lc($b->{'title'}) ||
+                        lc($a->{'part'}) cmp lc($b->{'part'});
+                }
+                $retvalue;
+            } @StatsArray;
}
}
+    #
+    # Renumber the data set
+    my $count = 0;
+    foreach my $data (@StatsArray) {
+        $data->{'problem_num'} = ++$count;
+    }
+    return;
+}
- $problemData{'problemList'} = join(':::', @problemList);
-# $Discussed=0;
-# if($Discuss->{"$name:$problem"}) {
-# $TotDiscuss++;
-# $Discussed=1;
-# }
-
- return \%problemData;
-}
-
-sub SortProblems {
- my ($problemData,$sortBy,$ascend)=@_;
-
- my @problems = split(':::', $problemData->{'problemList'});
- if($sortBy eq "Homework Sets Order") {
- return \@problems;
- }
-
- my $data;
-
- if ($sortBy eq "#Stdnts") { $data = ':studentCount'; }
- elsif($sortBy eq "Tries") { $data = ':totalTries'; }
- elsif($sortBy eq "Mod") { $data = ':maxTries'; }
- elsif($sortBy eq "Mean") { $data = ':mean'; }
- elsif($sortBy eq "#YES") { $data = ':correct'; }
- elsif($sortBy eq "#yes") { $data = ':correctByOverride'; }
- elsif($sortBy eq "%Wrng") { $data = ':percentWrong'; }
- elsif($sortBy eq "DoDiff") { $data = ':degreeOfDifficulty'; }
- elsif($sortBy eq "S.D.") { $data = ':standardDeviation'; }
- elsif($sortBy eq "Skew.") { $data = ':skewness'; }
- elsif($sortBy eq "D.F.1st") { $data = ':discriminantFactor1'; }
- elsif($sortBy eq "D.F.2nd") { $data = ':discriminantFactor2'; }
- elsif($sortBy eq "Disc.") { $data = ''; }
- else { return \@problems; }
-
- my @orderedProblems =
- sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
- @problems;
- if($ascend eq 'Descending') {
- @orderedProblems = reverse(@orderedProblems);
- }
-
- return \@orderedProblems;
-}
-
-sub CalculateStatistics {
- my ($data)=@_;
-
- my @problems = split(':::', $data->{'problemList'});
- foreach(@problems) {
- # Mean
- $data->{$_.':mean'} = ($data->{$_.':studentCount'}) ?
- ($data->{$_.':totalTries'} / $data->{$_.':studentCount'}) : 0;
-
- # %Wrong
- $data->{$_.':percentWrong'} = ($data->{$_.':studentCount'}) ?
- (($data->{$_.':wrong'} / $data->{$_.':studentCount'}) * 100.0) :
- 100.0;
-
- # Degree of Difficulty
- $data->{$_.':degreeOfDifficulty'} = ($data->{$_.':totalTries'}) ?
- (1 - (($data->{$_.':correct'} + $data->{$_.':correctByOverride'}) /
- $data->{$_.':totalTries'})) : 0;
-
- # Factor in mean
- my $studentTries = $data->{$_.':studentTries'};
- foreach(my $index=0; $index < scalar(@$studentTries); $index++) {
- $studentTries->[$index] -= $data->{$_.':mean'};
- }
- my $sumSquared = 0;
- my $sumCubed = 0;
- foreach(@$studentTries) {
- my $squared = ($_ * $_);
- my $cubed = ($squared * $_);
- $sumSquared += $squared;
- $sumCubed += $cubed;
- }
-
- # Standard deviation
- $data->{$_.':standardDeviation'} = ($data->{$_.':studentCount'} - 1) ?
- ((sqrt($sumSquared)) / ($data->{$_.':studentCount'} - 1)) : 0;
-
- # Skewness
- my $standardDeviation = $data->{$_.':standardDeviation'};
- $data->{$_.':skewness'} = ($data->{$_.':standardDeviation'}) ?
- (((sqrt($sumSquared)) / $data->{$_.':studentCount'}) /
- ($standardDeviation * $standardDeviation * $standardDeviation)) :
- 0;
+########################################################
+########################################################
- # Discrimination Factor 1
- $data->{$_.':discriminationFactor1'} = 0;
+=pod
- # Discrimination Factor 2
- $data->{$_.':discriminationFactor2'} = 0;
- }
+=item &get_statistics()
- return;
+Wrapper routine for the call to loncoursedata::get_problem_statistics.
+Calls lonstathelpers::get_time_limits() to limit the data set by time
+and &compute_discrimination_factor() to add the degree of discrimination.
+
+Inputs: $sequence, $resource, $part, $problem_num
+
+Returns: Hash reference with statistics data from
+loncoursedata::get_problem_statistics.
+
+=cut
+
+########################################################
+########################################################
+# Collects the statistics record for one part of one resource: fetches
+# the numbers from loncoursedata::get_problem_statistics for the current
+# section selection, enrollment status and time limits, then adds the
+# identifying entries (part, problem_num, container, title, title.link)
+# and the degree of discrimination.
+sub get_statistics {
+    my ($sequence,$resource,$part,$problem_num) = @_;
+    #
+    # Limits on the submission times to include
+    my ($from_time,$to_time) = &Apache::lonstathelpers::get_time_limits();
+    my $resource_symb = $resource->{'symb'};
+    my $course = $ENV{'request.course.id'};
+    #
+    my $stats = &Apache::loncoursedata::get_problem_statistics
+        (\@Apache::lonstatistics::SelectedSections,
+         $Apache::lonstatistics::enrollment_status,
+         $resource_symb,$part,$course,$from_time,$to_time);
+    #
+    # Identify the record
+    @{$stats}{'part','problem_num','container','title'} =
+        ($part,$problem_num,$sequence->{'title'},$resource->{'title'});
+    my $escaped_symb = &Apache::lonnet::escape($resource->{'symb'});
+    $stats->{'title.link'} = $resource->{'src'}.'?symb='.$escaped_symb;
+    #
+    my $discrimination =
+        &compute_discrimination_factor($resource,$part,$sequence);
+    $stats->{'deg_of_disc'} = $discrimination;
+    return $stats;
}
-sub ProcessDiscriminant {
- my ($List) = @_;
- my @sortedList = sort (@$List);
- my $Count = scalar @sortedList;
- my $Problem;
- my @Dis;
- my $Slvd=0;
- my $tmp;
- my $Sum1=0;
- my $Sum2=0;
- my $nIndex=0;
- my $nStudent=0;
- my %Proc=undef;
- while ($nIndex<$Count) {
-# $jr->print(" $nIndex) $sortedList[$nIndex]");
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- my $Temp = $Problem;
- do {
- $nIndex++;
- $nStudent++;
- $Sum1 += $Dis[0];
- $Sum2 += $Dis[1];
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- } while ( $Problem eq $Temp && $nIndex < $Count );
- $Proc{$Temp}=($Sum1/$nStudent).':'.($Sum2/$nStudent);
-# $jr->print(" $nIndex) $Temp --> ($nStudent) $Proc{$Temp}");
- $Sum1=0;
- $Sum2=0;
- $nStudent=0;
- }
-
- return %Proc;
-}
-
-#------- Creating Discimination factor
-sub Discriminant {
- my ($discriminant)=@_;
- my @discriminantKeys=keys(%$discriminant);
- my $Count = scalar @discriminantKeys;
-
- my $UpCnt = int(0.27*$Count);
- my $low=0;
- my $up=$Count-$UpCnt;
- my @UpList=();
- my @LowList=();
-
- $Count=0;
- foreach my $key (sort(@discriminantKeys)) {
- $Count++;
- if($low < $UpCnt || $Count > $up) {
- $low++;
- my $str=$discriminant->{$key};
- foreach(split(/\&/,$str)){
- if($_) {
- if($low<$UpCnt) { push(@LowList,$_); }
- else { push(@UpList,$_); }
- }
- }
- }
+
+###############################################
+###############################################
+
+=pod
+
+=item &compute_discrimination_factor()
+
+Inputs: $resource, $part, $sequence
+
+Returns: a number between -1 and 1, or the string 'nan' when it cannot be computed
+
+=cut
+
+###############################################
+###############################################
+# compute_discrimination_factor($resource,$part,$sequence)
+#
+# Ranks the students by their scores on every OTHER resource of
+# $sequence, takes the lowest and the highest quarter of that ranking
+# and returns the difference between the fraction of the available
+# score the top group earned on ($resource,$part) and the fraction the
+# bottom group earned.
+#
+# Returns: a number, or the string 'nan' when a quarter of the ranking
+#          holds no students or either group has a maximum score of 0.
+sub compute_discrimination_factor {
+    my ($resource,$part,$sequence) = @_;
+    my @Resources;
+    foreach my $res (@{$sequence->{'contents'}}) {
+        next if ($res->{'symb'} eq $resource->{'symb'});
+        push (@Resources,$res->{'symb'});
+    }
+    #
+    # rank
+    my $ranking = 
+        &Apache::loncoursedata::rank_students_by_scores_on_resources
+        (\@Resources,
+         \@Apache::lonstatistics::SelectedSections,
+         $Apache::lonstatistics::enrollment_status,undef);
+    #
+    # compute their percent scores on the problems in the sequence,
+    my $num_students = (ref($ranking) eq 'ARRAY') ? scalar(@{$ranking}) : 0;
+    my $number_to_grab = int($num_students/4);
+    #
+    # With fewer than four ranked students a quarter is empty and there
+    # is nothing to compare.
+    return 'nan' if ($number_to_grab < 1);
+    #
+    # Both groups hold exactly $number_to_grab students.  (The bottom
+    # slice used to run 0..$number_to_grab, one student more than the
+    # top slice.)
+    my @BottomSet = map { $_->[&Apache::loncoursedata::RNK_student()]; 
+                      } @{$ranking}[0..($number_to_grab-1)];
+    my @TopSet    = 
+        map { 
+            $_->[&Apache::loncoursedata::RNK_student()]; 
+          } @{$ranking}[($num_students-$number_to_grab)..($num_students-1)];
+    my ($bottom_sum,$bottom_max) = 
+        &Apache::loncoursedata::get_sum_of_scores($resource,$part,\@BottomSet);
+    my ($top_sum,$top_max) = 
+        &Apache::loncoursedata::get_sum_of_scores($resource,$part,\@TopSet);
+    my $deg_of_disc;
+    if ($top_max == 0 || $bottom_max==0) {
+        $deg_of_disc = 'nan';
+    } else {
+        $deg_of_disc = ($top_sum/$top_max) - ($bottom_sum/$bottom_max);
}
- my %DisUp = &ProcessDiscriminant(\@UpList);
- my %DisLow = &ProcessDiscriminant(\@LowList);
+    #&Apache::lonnet::logthis('    '.$top_sum.'/'.$top_max.
+    #                         ' - '.$bottom_sum.'/'.$bottom_max);
+    return $deg_of_disc;
+}
+
+###############################################
+###############################################
- return (\%DisUp, \%DisLow);
-}
+=pod
-#---- END Problem Statistics Web Page ----------------------------------------
+=item ProblemStatisticsLegend
-#---- Problem Statistics Graph Web Page --------------------------------------
+=over 4
-# ------------------------------------------- Prepare data for Graphical chart
+=item #Stdnts
+Total number of students who attempted the problem.
+
+=item Tries
+Total number of tries for solving the problem.
+
+=item Max Tries
+Largest number of tries for solving the problem by a student.
+
+=item Mean
+Average number of tries. [ Tries / #Stdnts ]
+
+=item #YES
+Number of students solved the problem correctly.
+
+=item #yes
+Number of students solved the problem by override.
+
+=item %Wrong
+Percentage of students who tried to solve the problem
+but are still incorrect. [ 100*((#Stdnts-(#YES+#yes))/#Stdnts) ]
+
+=item DoDiff
+Degree of Difficulty of the problem.
+[ 1 - ((#YES+#yes) / Tries) ]
+
+=item S.D.
+Standard Deviation of the tries.
+[ sqrt(sum((Xi - Mean)^2)) / (#Stdnts-1)
+where Xi denotes every student\'s tries ]
+
+=item Skew.
+Skewness of the students tries.
+[(sqrt( sum((Xi - Mean)^3) / #Stdnts)) / (S.D.^3)]
+
+=item Dis.F.
+Discrimination Factor: A Standard for evaluating the
+problem according to a Criterion
+
+=item [Criterion to group students into 27% Upper Students -
+and 27% Lower Students]
+1st Criterion for Sorting the Students:
+Sum of Partial Credit Awarded / Total Number of Tries
+2nd Criterion for Sorting the Students:
+Total number of Correct Answers / Total Number of Tries
+
+=item Disc.
+Number of students who had at least one discussion.
+
+=back
+
+=cut
+
+
+############################################################
+############################################################
+##
+## How this all works:
+## Statistics are computed by calling &get_statistics with the sequence,
+## resource, and part id to run statistics on. At various places within
+## the loops which compute the statistics, as well as before and after
+## the entire process, subroutines can be called. The subroutines are
+## registered to the following hooks:
+##
+## hook subroutine inputs
+## ----------------------------------------------------------
+## pre $r,$count
+## pre_seq $r,$count,$seq
+## pre_res $r,$count,$seq,$res
+## calc $r,$count,$seq,$res,$part,$data
+## post_res $r,$count,$seq,$res
+## post_seq $r,$count,$seq
+## post $r,$count
+##
+## abort $r
+##
+## subroutines will be called in the order in which they are registered.
+##
+############################################################
+############################################################
+{
-sub BuildGraphicChart {
- my ($graph,$cacheDB,$courseDescription,$r)=@_;
- my %cache;
- my $max = 0;
+my %hooks;
+my $aborted = 0;
+
+# Raises the abort flag that &run_hooks and &run_statistics check
+# before doing further work.  Returns the new flag value (1).
+sub abort_computation {
+    return ($aborted = 1);
+}
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
- return 'Unable to tie database.';
+# Puts the hook machinery back into its initial state: lowers the abort
+# flag and forgets every registered hook.
+sub clear_hooks {
+    $aborted = 0;
+    return undef(%hooks);
+}
+
+# register_hook($hookname,$subref)
+#
+# Appends $subref to the list of subroutines run for $hookname.  Hooks
+# registered under one name run in registration order.
+#
+# Inputs: $hookname - one of pre, pre_seq, pre_res, calc, post_res,
+#                     post_seq, post or abort; any other name is
+#                     silently ignored.
+#         $subref   - code reference; anything else is logged and
+#                     not registered.
+# Returns: nothing.
+sub register_hook {
+    my ($hookname,$subref)=@_;
+    # 'abort' is accepted as well: &run_statistics runs the 'abort' hooks
+    # when a computation is cut short, so they have to be registerable.
+    if ($hookname !~ /^(pre|pre_seq|pre_res|post|post_seq|post_res|calc|abort)$/){
+        return;
}
-
- my @problems = split(':::', $cache{'problemList'});
- my @values = ();
- foreach (@problems) {
- my $data = 0;
- if($graph eq 'DoDiffGraph') {
- $data = sprintf("%.2f", $cache{$_.':degreeOfDifficulty'}),
+    if (ref($subref) ne 'CODE') {
+        # The message is one concatenated string; a stray comma used to
+        # pass its second half to logthis as a separate argument.
+        &Apache::lonnet::logthis('attempt to register hook to non-code: '.
+                                 $hookname.' = '.
+                                 (defined($subref) ? $subref : 'undef'));
+    } else {
+        if (exists($hooks{$hookname})) {
+            push(@{$hooks{$hookname}},$subref);
} else {
- $data = sprintf("%.1f", $cache{$_.':percentWrong'}),
- }
- if($max < $data) {
- $max = $data;
+            $hooks{$hookname} = [$subref];
}
- push(@values, $data);
}
- untie(%cache);
+    return;
+}
- my $sendValues = join(',', @values);
-# my $sendCount = $#values;
- my $sendCount = scalar(@values);
+# run_hooks($context,@args)
+#
+# Calls every subroutine registered under $context, in order, handing
+# each one the remaining arguments.  Once the abort flag is up, no
+# further hooks are called unless $context is 'abort'.  A hook that
+# returns a defined value equal to the string '0' raises the abort flag.
+sub run_hooks {
+    my $context = shift(@_);
+    for my $callback (@{$hooks{$context}}) {
+        last if ($aborted && $context ne 'abort');
+        my $result = $callback->(@_);
+        next unless (defined($result) && $result eq '0');
+        # The hook asked for the computation to stop.
+        $aborted ||= 1;
+    }
+}
- my $title = '';
- if($graph eq 'DoDiffGraph') {
- $title = 'Degree-of-Difficulty';
+sub run_statistics {
+ my ($r) = @_;
+ my $count = 0;
+ &run_hooks('pre',$r,$count);
+ foreach my $seq (&Apache::lonstatistics::Sequences_with_Assess()) {
+ last if ($aborted);
+ next if ($seq->{'num_assess'}<1);
+ &run_hooks('pre_seq',$r,$count,$seq);
+ foreach my $res (@{$seq->{'contents'}}) {
+ last if ($aborted);
+ next if ($res->{'type'} ne 'assessment');
+ &run_hooks('pre_res',$r,$count,$seq,$res);
+ foreach my $part (@{$res->{'parts'}}) {
+ last if ($aborted);
+ #
+ # This is where all the work happens
+ my $data = &get_statistics($seq,$res,$part,++$count);
+ &run_hooks('calc',$r,$count,$seq,$res,$part,$data);
+ }
+ &run_hooks('post_res',$r,$count,$seq,$res);
+ }
+ &run_hooks('post_seq',$r,$count,$seq);
+ }
+ if ($aborted) {
+ &run_hooks('abort',$r);
} else {
- $title = 'Wrong-Percentage';
+ &run_hooks('post',$r,$count);
}
- my @GData = ($courseDescription, 'Problems', $title, $max, $sendCount,
- $sendValues);
-
- $r->print(''."\n");
- $r->print('');
- $r->print('