--- loncom/interface/statistics/lonproblemstatistics.pm 2002/11/26 16:59:03 1.37 +++ loncom/interface/statistics/lonproblemstatistics.pm 2003/03/28 15:20:59 1.48 @@ -1,7 +1,6 @@ # The LearningOnline Network with CAPA -# (Publication Handler # -# $Id: lonproblemstatistics.pm,v 1.37 2002/11/26 16:59:03 minaeibi Exp $ +# $Id: lonproblemstatistics.pm,v 1.48 2003/03/28 15:20:59 matthew Exp $ # # Copyright Michigan State University Board of Trustees # @@ -26,14 +25,27 @@ # http://www.lon-capa.org/ # # (Navigate problems for statistical reports -# YEAR=2001 -# 5/5,7/9,7/25/1,8/11,9/13,9/26,10/5,10/9,10/22,10/26 Behrouz Minaei -# 11/1,11/4,11/16,12/14,12/16,12/18,12/20,12/31 Behrouz Minaei -# YEAR=2002 -# 1/22,2/1,2/6,2/25,3/2,3/26,4/7,5/6 Behrouz Minaei -# 5/12,5/26,7/16,7/29,8/5,10/31 Behrouz Minaei # -### +############################################### +############################################### + +=pod + +=head1 NAME + +lonproblemstatistics + +=head1 SYNOPSIS + +Routines to present problem statistics to instructors via tables, +Excel files, and plots. + +=over 4 + +=cut + +############################################### +############################################### package Apache::lonproblemstatistics; @@ -41,254 +53,777 @@ use strict; use Apache::lonnet(); use Apache::lonhtmlcommon; use Apache::loncoursedata; -use GDBM_File; +use Apache::lonstatistics; +use Spreadsheet::WriteExcel; +############################################### +############################################### -sub InitializeProblemStatistics { - my ($cacheDB, $students, $courseID, $c, $r)=@_; - my %cache; - - unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) { - $r->print('Unable to tie database1.'); - return ('ERROR', undef); - } - - # Remove students who don't have the proper section. 
- my @sectionsSelected = split(':',$cache{'sectionsSelected'}); - for(my $studentIndex=((scalar @$students)-1); $studentIndex>=0; - $studentIndex--) { - my $value = $cache{$students->[$studentIndex].':section'}; - my $found = 0; - foreach (@sectionsSelected) { - if($_ eq 'none') { - if($value eq '' || !defined($value) || $value eq ' ') { - $found = 1; - last; - } - } else { - if($value eq $_) { - $found = 1; - last; - } - } - } - if($found == 0) { - splice(@$students, $studentIndex, 1); - } - } +=pod - my $isNotCached = 0; - my $lastStatus = (defined($cache{'StatisticsLastStatus'})) ? - $cache{'StatisticsLastStatus'} : 'Nothing'; - my $whichStudents = join(':::',sort(@$students)); - if(!defined($cache{'StatisticsCached'}) || - $lastStatus ne $cache{'Status'} || - $whichStudents ne $cache{'StatisticsWhichStudents'}) { - $isNotCached = 1; - } +=item &CreateInterface() + +Create the main intereface for the statistics page. Allows the user to +select sections, maps, and output. + +=cut + +############################################### +############################################### +sub CreateInterface { + my $Str = ''; + $Str .= ''."\n"; + $Str .= ''; + $Str .= ''; + $Str .= ''; + $Str .= ''; + $Str .= ''."\n"; + # + $Str .= ''."\n"; + $Str .= '
SectionsSequences and FoldersOutput
'."\n"; + $Str .= &Apache::lonstatistics::SectionSelect('Section','multiple',5); + $Str .= ''; + # + my $only_seq_with_assessments = sub { + my $s=shift; + if ($s->{'num_assess'} < 1) { + return 0; + } else { + return 1; + } + }; + $Str .= &Apache::lonstatistics::MapSelect('Maps','multiple,all',5, + $only_seq_with_assessments); + $Str .= ''."\n"; + $Str .= &CreateAndParseOutputSelector(); + $Str .= '
'."\n"; + return $Str; +} - untie(%cache); - unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) { - $r->print('Unable to tie database.2'); - return ('ERROR', undef); - } - if($isNotCached && defined($cache{'StatisticsCached'})) { - my @statkeys = split(':::', $cache{'StatisticsKeys'}); - delete $cache{'StatisticsKeys'}; - delete $cache{'StatisticsCached'}; - foreach(@statkeys) { - delete $cache{$_}; - } - } +####################################################### +####################################################### - untie(%cache); - if($isNotCached) { - &Apache::loncoursedata::DownloadStudentCourseDataSeparate($students, - 'true', - $cacheDB, - 'true', - 'true', - $courseID, - $r, $c); - } - if($c->aborted()) { return ('ERROR', undef); } +=pod - unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) { - $r->print('Unable to tie database.3'); - return ('ERROR', undef); - } - my $problemData; - if($isNotCached) { - ($problemData) = &ExtractStudentData(\%cache, $students); - &CalculateStatistics($problemData, \%cache, $courseID); - } - untie(%cache); +=item &CreateAndParseOutputSelector() - unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) { - $r->print('Unable to tie database.4'); - return ('ERROR', undef); +Construct a selection list of options for output and parse output selections. +The current output selected is indicated by the values of the two package +variables $output_mode and $show. @OutputOptions holds the descriptions of +the output options and the values for $output_mode and $show. + + Based on code from lonstudentassessment.pm. 
+ +=cut + +####################################################### +####################################################### +my $output_mode; +my $show; + +my @OutputOptions = + ( + { name => 'problem statistics grouped by sequence', + value => 'HTML problem statistics grouped', + description => 'Output statistics for the problem parts.', + mode => 'html', + show => 'grouped', + }, + { name => 'problem statistics ungrouped', + value => 'HTML problem statistics ungrouped', + description => 'Output statistics for the problem parts.', + mode => 'html', + show => 'ungrouped', + }, + { name => 'problem statistics, Excel', + value => 'Excel problem statistics', + description => 'Output statistics for the problem parts '. + 'in an Excel workbook', + mode => 'excel', + show => 'all', + }, + { name => 'Degree of Difficulty Plot', + value => 'plot deg diff', + description => 'Generate a plot of the degree of difficulty of each '. + 'problem part.', + mode => 'plot', + show => 'deg of diff', + }, + { name => 'Percent Wrong Plot', + value => 'plot per wrong', + description => 'Generate a plot showing the percent of students who '. + 'were unable to complete each problem part', + mode => 'plot', + show => 'per wrong', + }, + ); + +sub OutputDescriptions { + my $Str = ''; + $Str .= "

Output Modes

\n"; + $Str .= "
\n"; + foreach my $outputmode (@OutputOptions) { + $Str .="
".$outputmode->{'name'}."
\n"; + $Str .="
".$outputmode->{'description'}."
\n"; } - if($isNotCached) { - foreach(keys(%$problemData)) { - $cache{$_} = $problemData->{$_}; + $Str .= "
\n"; + return $Str; +} + +sub CreateAndParseOutputSelector { + my $Str = ''; + my $elementname = 'statsoutputmode'; + # + # Format for output options is 'mode, restrictions'; + my $selected = 'HTML problem statistics grouped'; + if (exists($ENV{'form.'.$elementname})) { + if (ref($ENV{'form.'.$elementname} eq 'ARRAY')) { + $selected = $ENV{'form.'.$elementname}->[0]; + } else { + $selected = $ENV{'form.'.$elementname}; } - $cache{'StatisticsKeys'} = join(':::', keys(%$problemData)); - $cache{'StatisticsCached'} = 'true'; - $cache{'StatisticsLastStatus'} = $cache{'Status'}; - $cache{'StatisticsWhichStudents'} = $whichStudents; } - untie(%cache); - - unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) { - $r->print('Unable to tie database.5'); - return ('ERROR', undef); + # + # Set package variables describing output mode + $output_mode = 'html'; + $show = 'all'; + foreach my $option (@OutputOptions) { + next if ($option->{'value'} ne $selected); + $output_mode = $option->{'mode'}; + $show = $option->{'show'}; + } + # + # Build the form element + $Str = qq/"; + return $Str; +} - my $orderedProblems = &SortProblems(\%cache, - $cache{'ProblemStatisticsSort'}, - $cache{'SortProblems'}, - $cache{'ProblemStatisticsAscend'}); - untie(%cache); +############################################### +############################################### - return ('OK', $orderedProblems); -} +=pod -sub BuildProblemStatisticsPage { - my ($cacheDB, $students, $courseID, $c, $r)=@_; +=item &Gather_Student_Data() - my @Header = ("Homework Sets Order","#Stdnts","Tries","Mod", - "Mean","#YES","#yes","%Wrng","DoDiff", - "S.D.","Skew.","D.F.1st","D.F.2nd"); - my $color=&setbgcolor(0); - my %cache; +Ensures all student data is up to date. 
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) { - $r->print('Unable to tie database.6'); - return; - } - my $Ptr = ''; - $Ptr .= ''; - $Ptr .= ''."\n"; - $Ptr .= ''."\n"; - $Ptr .= ''."\n"; - $Ptr .= ''."\n"; - $Ptr .= ''."\n"; - $Ptr .= ''."\n"; - $Ptr .= &ProblemStatisticsButtons($cache{'DisplayFormat'}, - $cache{'DisplayLegend'}, - $cache{'SortProblems'}); - $Ptr .= '
Select Map'; - $Ptr .= &Apache::lonhtmlcommon::MapOptions(\%cache, 'Statistics', - 'Statistics'); - $Ptr .= '
Sorting Type:'."\n"; - $Ptr .= &Apache::lonhtmlcommon::AscendOrderOptions( - $cache{'ProblemStatisticsAscend'}, - 'ProblemStatistics', - 'Statistics'); - $Ptr .= '
Select Sections'; - $Ptr .= ''."\n"; - my @sections = split(':',$cache{'sectionList'}); - my @sectionsSelected = split(':',$cache{'sectionsSelected'}); - $Ptr .= &Apache::lonhtmlcommon::MultipleSectionSelect(\@sections, - \@sectionsSelected, - 'Statistics'); - $Ptr .= '
'; - if($cache{'DisplayLegend'} eq 'Show Legend') { - $Ptr .= &ProblemStatisticsLegend(); +=cut + +############################################### +############################################### +sub Gather_Student_Data { + my ($r) = @_; + my $c = $r->connection(); + # + my @Sequences = &Apache::lonstatistics::Sequences_with_Assess(); + # + my @Students = @Apache::lonstatistics::Students; + # + # Open the progress window + my %prog_state=&Apache::lonhtmlcommon::Create_PrgWin + ($r,'Statistics Compilation Status', + 'Statistics Compilation Progress', scalar(@Students)); + # + while (my $student = shift @Students) { + return if ($c->aborted()); + my ($status,undef) = &Apache::loncoursedata::ensure_current_data + ($student->{'username'},$student->{'domain'}, + $ENV{'request.course.id'}); + &Apache::lonhtmlcommon::Increment_PrgWin($r,\%prog_state, + 'last student'); } - $r->print($Ptr); + &Apache::lonhtmlcommon::Close_PrgWin($r,\%prog_state); $r->rflush(); - untie(%cache); +} - my ($result, $orderedProblems) = - &InitializeProblemStatistics($cacheDB, $students, $courseID, $c, $r); - if($result ne 'OK') { - return; - } +############################################### +############################################### + +=pod + +=item &BuildProblemStatisticsPage() - unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) { - $r->print('Unable to tie database.6'); +Main interface to problem statistics. + +=cut + +############################################### +############################################### +sub BuildProblemStatisticsPage { + my ($r,$c)=@_; + # + $output_mode = 'html'; + $show = 'grouped'; + # + $r->print(&CreateInterface()); + $r->print(''); + $r->print(''); + if (! exists($ENV{'form.statsfirstcall'})) { + $r->print(< + +Please make your selections in the boxes above and hit +the button marked "Update Display". + +

+ENDMSG return; } - &BuildStatisticsTable(\%cache, $cache{'DisplayFormat'}, - $cache{'SortProblems'}, $orderedProblems, - \@Header, $r, $color); - untie(%cache); - + # + &Gather_Student_Data($r); + # + # + if ($output_mode eq 'html') { + $r->print("

". + $ENV{'course.'.$ENV{'request.course.id'}.'.description'}. + "

\n"); + $r->print("

".localtime(time)."

"); + $r->rflush(); + if ($show eq 'grouped') { + &output_html_grouped_by_sequence($r); + } elsif ($show eq 'ungrouped') { + &output_html_ungrouped($r); + } + } elsif ($output_mode eq 'excel') { + $r->print("

Preparing Excel Spreadsheet

"); + &output_excel($r); + } elsif ($output_mode eq 'plot') { + if ($show eq 'deg of diff') { + &plot_statistics($r,'DoDiff'); + } elsif ($show eq 'per wrong') { + &plot_statistics($r,'%Wrng'); + } + } else { + $r->print("

Not implemented

"); + } return; } -sub BuildGraphicChart { - my ($graph,$cacheDB,$courseDescription,$students,$courseID,$r,$c)=@_; - my %cache; - my $max; - unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) { - return 'Unable to tie database.7'; - } +############################################### +############################################### - my $title = ''; - if($graph eq 'DoDiffGraph') { - $title = 'Degree-of-Difficulty'; - } else { - $title = 'Wrong-Percentage'; - } +=pod - my $currentSequence = -1; - my $sortProblems = 'Sort Within Sequence'; +=item &output_html_grouped_by_sequence() - my ($result, $orderedProblems) = - &InitializeProblemStatistics($cacheDB, $students, $courseID, $c, $r); - if($result ne 'OK') { - return; - } +Presents the statistics data as an html table organized by the order +the assessments appear in the course. - my @values = (); +=cut - foreach(@$orderedProblems) { - my ($sequence,$problem,$part)=split(':', $_); - if($cache{'StatisticsMaps'} ne 'All Maps' && - $cache{'StatisticsMaps'} ne $cache{$sequence.':title'}) { - next; +############################################### +############################################### +sub output_html_grouped_by_sequence { + my ($r) = @_; + my $problem_num = 0; + #$r->print(&ProblemStatisticsLegend()); + my @Header = ("Title","Part","#Stdnts","Tries","Mod", + "Mean","#YES","#yes","%Wrng","DoDiff", + "S.D.","Skew.");#,"D.F.1st","D.F.2nd"); + # #FFFFE6 #EEFFCC #DDFFFF FFDDDD #DDFFDD #FFDDFF + foreach my $sequence (&Apache::lonstatistics::Sequences_with_Assess()) { + next if ($sequence->{'num_assess'}<1); + $r->print("

".$sequence->{'title'}."

"); + $r->print('
'."\n"); + $r->print(''."\n"); + $r->print('\n"); + foreach my $resource (@{$sequence->{'contents'}}) { + next if ($resource->{'type'} ne 'assessment'); + foreach my $part (@{$resource->{'parts'}}) { + $problem_num++; + my ($num,$tries,$mod,$mean,$Solved,$solved,$DegOfDiff,$STD, + $SKEW) = &get_statistics($resource->{'symb'},$part); + # + $part = ' ' if ($part == 0); + # + my $wrongpercent = 0; + if (defined($num) && $num > 0) { + $wrongpercent=int(10*100*($num-$Solved+$solved)/$num)/10; + } + my $option = ''; + $r->print(''.&statistics_html_table_data + ($resource,$part,$num,$tries,$mod,$mean,$Solved, + $solved,$wrongpercent,$DegOfDiff,$STD,$SKEW, + $option). + "\n"); + } } + $r->print("
'. + join("",@Header)."
\n"); + $r->print("
\n"); + $r->rflush(); + } + # + return; +} - if( $currentSequence == -1 || - ($sortProblems eq 'Sort Within Sequence' && - $currentSequence != $sequence)) { - if($currentSequence != -1) { - &DrawGraph(\@values,$courseDescription,$title,$max,$r); - } - if($sortProblems eq 'Sort Within Sequence') { - $r->print('
'.$cache{$sequence.':title'}.''."\n"); +############################################### +############################################### + +=pod + +=item &output_html_ungrouped() + +Presents the statistics data in a single html table which can be sorted by +different columns. + +=cut + +############################################### +############################################### +sub output_html_ungrouped { + my ($r,$option) = @_; + # + my $problem_num = 0; + my $show_container = 0; + my $show_part = 0; + #$r->print(&ProblemStatisticsLegend()); + my @Header = ("Title","Part","#Stdnts","Tries","Mod", + "Mean","#YES","#yes","%Wrng","DoDiff", + "S.D.","Skew");#,"D.F.1st","D.F.2nd"); + # + my $sortby = undef; + foreach (@Header) { + if ($ENV{'form.sortby'} eq $_) { + $sortby = $_; + } + } + if (! defined($sortby) || $sortby eq '') { + $sortby = 'Container'; + } + # If there is more than one sequence, list their titles + my @Sequences = &Apache::lonstatistics::Sequences_with_Assess(); + if (@Sequences > 1) { + unshift(@Header,"Container"); + $show_container = 1; + } + # + # If the option for showing the problem number is needed, push that + # on the list too + if (defined($option) && $option =~ /show probnum/) { + unshift(@Header,"P#"); + } + # + $r->print('
'."\n"); + $r->rflush(); + # + # Compile the data + my @Statsarray; + foreach my $sequence (@Sequences) { + next if ($sequence->{'num_assess'}<1); + foreach my $resource (@{$sequence->{'contents'}}) { + next if ($resource->{'type'} ne 'assessment'); + foreach my $part (@{$resource->{'parts'}}) { + $problem_num++; + my ($num,$tries,$mod,$mean,$Solved,$solved,$DegOfDiff,$STD, + $SKEW) = &get_statistics($resource->{'symb'},$part); + # + $show_part = 1 if ($part ne '0'); + $part = ' ' if ($part == 0); + # + my $wrongpercent = 0; + if (defined($num) && $num > 0) { + $wrongpercent=int(10*100*($num-$Solved+$solved)/$num)/10; + } + push (@Statsarray, + { 'sequence' => $sequence, + 'resource' => $resource, + 'Title' => $resource->{'title'}, + 'Part' => $part, + '#Stdnts' => $num, + 'Tries' => $tries, + 'Mod' => $mod, + 'Mean' => $mean, + '#YES' => $Solved, + '#yes' => $solved, + '%Wrng' => $wrongpercent, + 'DoDiff' => $DegOfDiff, + 'S.D.' => $STD, + 'Skew' => $SKEW, + 'problem_num' => $problem_num, + }); } + } + } + # + # Table Headers + $r->print(''."\n"); + my $Str = ''; + foreach (@Header) { + next if ($_ eq 'Part' && !$show_part); + # Do not allow sorting on some fields + if ($_ eq $sortby || /^(Part|P\#)$/) { + $Str .= ''; + } else { + $Str .= ''; + } + } + $r->print(''.$Str."\n"); + # + # Sort the data + my @OutputOrder; + if ($sortby eq 'Container') { + @OutputOrder = @Statsarray; + } else { + # $sortby is already defined, so we can charge ahead + if ($sortby =~ /^(title|part)$/i) { + # Alpha comparison + @OutputOrder = sort { + lc($a->{$sortby}) cmp lc($b->{$sortby}) || + lc($a->{'Title'}) cmp lc($b->{'Title'}) || + lc($a->{'Part'}) cmp lc($b->{'Part'}); + } @Statsarray; + } else { + # Numerical comparison + @OutputOrder = sort { + my $retvalue = 0; + if ($b->{$sortby} eq 'nan') { + if ($a->{$sortby} ne 'nan') { + $retvalue = -1; + } else { + $retvalue = 0; + } + } + if ($a->{$sortby} eq 'nan') { + if ($b->{$sortby} ne 'nan') { + $retvalue = 1; + } + } + if 
($retvalue eq '0') { + $retvalue = $b->{$sortby} <=> $a->{$sortby} || + lc($a->{'Title'}) <=> lc($b->{'Title'}) || + lc($a->{'Part'}) <=> lc($b->{'Part'}); + } + $retvalue; + } @Statsarray; + } + } + $option .= ',no part' if (! $show_part); + foreach my $row (@OutputOrder) { + $r->print(''); + if (defined($option) && $option =~ /show probnum/) { + $r->print(''); + } + if ($show_container) { + $r->print(''); + } + $r->print(&statistics_html_table_data + ($row->{'resource'},$row->{'Part'},$row->{'#Stdnts'}, + $row->{'Tries'},$row->{'Mod'},$row->{'Mean'}, + $row->{'#YES'},$row->{'#yes'},$row->{"\%Wrng"}, + $row->{'DoDiff'},$row->{'S.D.'},$row->{'Skew'}, + $option)); + $r->print("\n"); + } + $r->print("
'.$_.''. + ''. + $_.'
'.$row->{'problem_num'}.'' + .$row->{'sequence'}->{'title'}.'
\n"); + $r->print("
\n"); + $r->rflush(); + # + return; +} + +############################################### +############################################### + +=pod + +=item &output_excel() - $currentSequence = $sequence; - @values = (); - $max=0; - } - my $data = 0; - if($graph eq 'DoDiffGraph') { - $data = sprintf("%.2f", $cache{$_.':degreeOfDifficulty'}), +Presents the statistical data in an Excel 95 compatable spreadsheet file. + +=cut + +############################################### +############################################### +sub output_excel { + my ($r) = @_; + my $filename = '/prtspool/'. + $ENV{'user.name'}.'_'.$ENV{'user.domain'}.'_'. + time.'_'.rand(1000000000).'.xls'; + # + my $excel_workbook = undef; + my $excel_sheet = undef; + # + my $rows_output = 0; + my $cols_output = 0; + # + # Create sheet + $excel_workbook = Spreadsheet::WriteExcel->new('/home/httpd'.$filename); + # + # Check for errors + if (! defined($excel_workbook)) { + $r->log_error("Error creating excel spreadsheet $filename: $!"); + $r->print("Problems creating new Excel file. ". + "This error has been logged. ". + "Please alert your LON-CAPA administrator"); + return ; + } + # + # The excel spreadsheet stores temporary data in files, then put them + # together. If needed we should be able to disable this (memory only). + # The temporary directory must be specified before calling 'addworksheet'. + # File::Temp is used to determine the temporary directory. 
+ $excel_workbook->set_tempdir($Apache::lonnet::tmpdir); + # + # Add a worksheet + my $sheetname = $ENV{'course.'.$ENV{'request.course.id'}.'.description'}; + if (length($sheetname) > 31) { + $sheetname = substr($sheetname,0,31); + } + $excel_sheet = $excel_workbook->addworksheet($sheetname); + # + # Put the course description in the header + $excel_sheet->write($rows_output,$cols_output++, + $ENV{'course.'.$ENV{'request.course.id'}.'.description'}); + $cols_output += 3; + # + # Put a description of the sections listed + my $sectionstring = ''; + my @Sections = @Apache::lonstatistics::SelectedSections; + if (scalar(@Sections) > 1) { + if (scalar(@Sections) > 2) { + my $last = pop(@Sections); + $sectionstring = "Sections ".join(', ',@Sections).', and '.$last; + } else { + $sectionstring = "Sections ".join(' and ',@Sections); + } + } else { + if ($Sections[0] eq 'all') { + $sectionstring = "All sections"; } else { - $data = sprintf("%.1f", $cache{$_.':percentWrong'}), + $sectionstring = "Section ".$Sections[0]; } - if($max < $data) { - $max = $data; + } + $excel_sheet->write($rows_output,$cols_output++,$sectionstring); + $cols_output += scalar(@Sections); + # + # Put the date in there too + $excel_sheet->write($rows_output,$cols_output++, + 'Compiled on '.localtime(time)); + # + $rows_output++; + $cols_output=0; + # + # Add the headers + my @Header = ("Container","Title","Part","#Stdnts","Tries","Mod", + "Mean","#YES","#yes","%Wrng","DoDiff", + "S.D.","Skew.");#,"D.F.1st","D.F.2nd"); + foreach (@Header) { + $excel_sheet->write($rows_output,$cols_output++,$_); + } + $rows_output++; + # + # Write the data + foreach my $sequence (&Apache::lonstatistics::Sequences_with_Assess()) { + next if ($sequence->{'num_assess'}<1); + foreach my $resource (@{$sequence->{'contents'}}) { + next if ($resource->{'type'} ne 'assessment'); + foreach my $part (@{$resource->{'parts'}}) { + $cols_output=0; + my ($num,$tries,$mod,$mean,$Solved,$solved,$DegOfDiff,$STD, + $SKEW) = 
&get_statistics($resource->{'symb'},$part); + # + if (!defined($part) || $part eq '') { + $part = ' '; + } + my $wrongpercent = 0; + if (defined($num) && $num > 0) { + $wrongpercent=int(10*100*($num-$Solved+$solved)/$num)/10; + } + foreach ($sequence->{'title'},$resource->{'title'},$part, + $num,$tries,$mod,$mean,$Solved,$solved,$wrongpercent, + $DegOfDiff,$STD,$SKEW) { + $excel_sheet->write($rows_output,$cols_output++,$_); + } + $rows_output++; + } } - push(@values, $data); } - untie(%cache); + # + # Write the excel file + $excel_workbook->close(); + # Tell the user where to get their excel file + $r->print('
'. + 'Your Excel spreadsheet.'."\n"); + $r->rflush(); + return; +} + +############################################### +############################################### + +=pod + +=item &statistics_html_table_data() - &DrawGraph(\@values,$courseDescription,$title,$max,$r); +Help function used to format the rows for HTML table output. +=cut + +############################################### +############################################### +sub statistics_html_table_data { + my ($resource,$part,$num,$tries,$mod,$mean,$Solved,$solved,$wrongpercent, + $DegOfDiff,$STD,$SKEW,$options) = @_; + my $row = ''; + $row .= ''. + ''. + $resource->{'title'}.''. + ''; + $row .= ''.$part.'' if ($options !~ /no part/); + foreach ($num,$tries) { + $row .= ''.$_.''; + } + foreach ($mod) { + $row .= ''.$_.''; + } + foreach ($mean) { + $row .= ''. + sprintf("%5.2f",$_).''; + } + foreach ($Solved,$solved) { + $row .= ''.$_.''; + } + foreach ($wrongpercent) { + $row .= ''. + sprintf("%5.1f",$_).''; + } + foreach ($DegOfDiff,$STD,$SKEW) { + $row .= ''. + sprintf("%5.2f",$_).''; + } + return $row; +} + +############################################### +############################################### + +=pod + +=item &plot_statistics() + +=cut + +############################################### +############################################### +sub plot_statistics { + my ($r,$datafield) = @_; + my @Data; + # + my %Fields = ('#Stdnts'=> 0, + 'Tries' => 1, + 'Mod' => 2, + 'Mean' => 3, + '#YES' => 4, + '#yes' => 5, + '%Wrng' => 9, + 'DoDiff' => 6, + 'S.D.' 
=> 7, + 'Skew' => 8,); + # + my $field = '%Wrng'; + foreach (keys(%Fields)) { + $field = $_ if ($datafield eq $_); + } + my $fieldindex = $Fields{$field}; + # + my $Max = 0; + foreach my $sequence (&Apache::lonstatistics::Sequences_with_Assess()) { + next if ($sequence->{'num_assess'}<1); + foreach my $resource (@{$sequence->{'contents'}}) { + next if ($resource->{'type'} ne 'assessment'); + foreach my $part (@{$resource->{'parts'}}) { + my @Results= &get_statistics($resource->{'symb'},$part); + my ($num,$Solved,$solved) = @Results[0,4,5]; + my $wrongpercent = 0; + if (defined($num) && $num > 0) { + $wrongpercent=int(10*100*($num-$Solved+$solved)/$num)/10; + } + push (@Results,$wrongpercent); + my $data = $Results[$fieldindex]; + $data = 0 if ($data eq 'nan'); + $Max = $data if ($Max<$data); + push (@Data,$data); + } + } + } + # + # Print out plot request + my $title = 'Percent Wrong'; + if ($field eq 'DoDiff') { + $title = 'Degree of Difficulty'; + } + my $yaxis = 'Percent'; + if ($field eq 'DoDiff') { + $yaxis = ''; + } elsif ($field ne '%Wrng') { + $yaxis = ''; + } + # + # Determine appropriate value for $Max + if ($field eq 'DoDiff') { + if ($Max > 0.5) { + $Max = 1; + } elsif ($Max > 0.2) { + $Max = 0.5; + } elsif ($Max > 0.1) { + $Max = 0.2; + } + } elsif ($field eq '%Wrng') { + if ($Max > 50) { + $Max = 100; + } elsif ($Max > 25) { + $Max = 50; + } elsif ($Max > 20) { + $Max = 25; + } elsif ($Max > 10) { + $Max = 20; + } elsif ($Max > 5) { + $Max = 10; + } else { + $Max = 5; + } + } + + $r->print("

".&DrawGraph(\@Data,$title,'Problem Number',$yaxis, + $Max)."

\n"); + # + # Print out the data + $ENV{'form.sortby'} = 'Contents'; + &output_html_ungrouped($r,'show probnum'); return; } +############################################### +############################################### + +=pod + +=item &DrawGraph() +=cut + +############################################### +############################################### sub DrawGraph { - my ($values,$courseDescription,$title,$Max,$r)=@_; + my ($values,$title,$xaxis,$yaxis,$Max)=@_; + $title = '' if (! defined($title)); + $xaxis = '' if (! defined($xaxis)); + $yaxis = '' if (! defined($yaxis)); + # my $sendValues = join(',', @$values); my $sendCount = scalar(@$values); - $r->print("
The Maximum Value is: $Max"); if ( $Max > 1 ) { if ($Max % 10) { if ( int($Max) < $Max ) { @@ -296,212 +831,39 @@ sub DrawGraph { $Max = int($Max); } } - #(10 - $Max % 10); - } else { $Max = 1; } - - my @GData = ('','Problem_number',$title,$Max,$sendCount,$sendValues); - -# $r->print(''."\n"); - $r->print('
'."\n"); - $r->print(''); -# $r->print('
'."\n"); - $r->print('
'."\n"); -} - -#---- Problem Statistics Web Page --------------------------------------- - -sub CreateProblemStatisticsTableHeading { - my ($headings,$r)=@_; - - my $Str=''; - $Str .= ''."\n"; - $Str .= 'P#'."\n"; - foreach(@$headings) { - $Str .= ''; - $Str .= ''.$_.' '."\n"; + } else { + $Max = 1; } - $Str .= "\n".''."\n"; - - return $Str; + my @GData = ($title,$xaxis,$yaxis,$Max,$sendCount,$sendValues); + return ''; } -sub BuildStatisticsTable { - my ($cache,$displayFormat,$sortProblems,$orderedProblems,$headings, - $r,$color)=@_; - - my $count = 1; - my $currentSequence = -1; - foreach(@$orderedProblems) { - my ($sequence,$problem,$part)=split(':', $_); - if($cache->{'StatisticsMaps'} ne 'All Maps' && - $cache->{'StatisticsMaps'} ne $cache->{$sequence.':title'}) { - next; - } - - if($currentSequence == -1 || - ($sortProblems eq 'Sort Within Sequence' && - $currentSequence != $sequence)) { - if($displayFormat ne 'Display CSV Format') { - if($currentSequence ne -1) { - $r->print(''); - $r->print('
'); - } - if($sortProblems eq 'Sort Within Sequence') { - $r->print(''.$cache->{$sequence.':title'}.''); - } - $r->print('
'."\n"); - $r->print(''."\n"); - $r->print(&CreateProblemStatisticsTableHeading($headings, $r)); - } else { - if($sortProblems eq 'Sort Within Sequence') { - $r->print('"'.$cache->{$sequence.':title'}.'"'); - } - $r->print('
'); - } - $currentSequence = $sequence; - } - - my $ref = ''.$cache->{$problem.':title'}.''; - my $title = $cache->{$problem.':title'}; - if($part != 0) { - $title .= ' Part '.$part; - } - my $source = $cache->{$problem.':source'}; - my $tableData = join('&', $ref, $title, $source, - $cache->{$_.':studentCount'}, - $cache->{$_.':totalTries'}, - $cache->{$_.':maxTries'}, - $cache->{$_.':mean'}, - $cache->{$_.':correct'}, - $cache->{$_.':correctByOverride'}, - $cache->{$_.':percentWrong'}, - $cache->{$_.':degreeOfDifficulty'}, - $cache->{$_.':standardDeviation'}, - $cache->{$_.':skewness'}, - $cache->{$_.':discriminationFactor1'}, - $cache->{$_.':discriminationFactor2'}); - - &TableRow($displayFormat,$tableData,$count,$r,$color); - - $count++; - } - if($displayFormat ne 'Display CSV Format') { - $r->print('
'."\n"); - $r->print('
'); - } else { - $r->print('
'); +sub get_statistics { + my ($symb,$part) = @_; + # + my $courseid = $ENV{'request.course.id'}; + # + my $students = \@Apache::lonstatistics::Students; + if ($Apache::lonstatistics::SelectedSections[0] eq 'all') { + $students = undef; } - - return; + my @Results = &Apache::loncoursedata::get_problem_statistics + ($students,$symb,$part,$courseid); + return @Results; } -sub TableRow { - my ($displayFormat,$Str,$RealIdx,$r,$color)=@_; - my($ref,$title,$source,$StdNo,$TotalTries,$MxTries,$Avg,$YES,$Override, - $Wrng,$DoD,$SD,$Sk,$_D1,$_D2)=split(/\&/,$Str); - my $Ptr; - if($displayFormat eq 'Display CSV Format') { - $Ptr='"'.$RealIdx.'",'."\n". - '"'.$title.'",'."\n". - '"'.$source.'",'."\n". - '"'.$StdNo.'",'."\n". - '"'.$TotalTries.'",'."\n". - '"'.$MxTries.'",'."\n". - '"'.$Avg.'",'."\n". - '"'.$YES.'",'."\n". - '"'.$Override.'",'."\n". - '"'.$Wrng.'",'."\n". - '"'.$DoD.'",'."\n". - '"'.$SD.'",'."\n". - '"'.$Sk.'",'."\n". - '"'.$_D1.'",'."\n". - '"'.$_D2.'"'."\n". - "
\n"; +############################################### +############################################### - $r->print("\n".$Ptr); - } else { - $Ptr=''."\n". - ''.$RealIdx.''."\n". - ''.$ref.''."\n". - ' '.$StdNo.''."\n". - ''.$TotalTries.''."\n". - ''.$MxTries.''."\n". - ''.$Avg.''."\n". - ' '.$YES.''."\n". - ' '.$Override.''."\n". - ' '.$Wrng.''."\n". - ' '.$DoD.''."\n". - ' '.$SD.''."\n". - ' '.$Sk.''."\n". - ' '.$_D1.''."\n". - ' '.$_D2.''."\n"; - $r->print($Ptr.''."\n"); - } +=pod - return; -} +=item &ProblemStatisticsLegend() -# For loading the colored table for display or un-colored for print -sub setbgcolor { - my $PrintTable=shift; - my %color; - if ($PrintTable){ - $color{"gb"}="#FFFFFF"; - $color{"red"}="#FFFFFF"; - $color{"yellow"}="#FFFFFF"; - $color{"green"}="#FFFFFF"; - $color{"purple"}="#FFFFFF"; - } else { - $color{"gb"}="#DDFFFF"; - $color{"red"}="#FFDDDD"; - $color{"yellow"}="#EEFFCC"; - $color{"green"}="#DDFFDD"; - $color{"purple"}="#FFDDFF"; - } - - return \%color; -} - -sub ProblemStatisticsButtons { - my ($displayFormat, $displayLegend, $sortProblems)=@_; - - my $Ptr = ''; - $Ptr .= '{'orderedSequences'})) { - foreach my $problemID (split(':', $cache->{$sequence.':problems'})) { - foreach my $part (split(/\:/,$cache->{$sequence.':'. - $problemID. 
- ':parts'})) { - my $id = $sequence.':'.$problemID.':'.$part; - push(@problemList, $id); - my $totalTries = 0; - my $totalAwarded = 0; - my $correct = 0; - my $correctByOverride = 0; - my $studentCount = 0; - my $maxTries = 0; - my $totalFirst = 0; - my @studentTries=(); - foreach(@$students) { - my $code = $cache->{"$_:$problemID:$part:code"}; - - if(defined($cache->{$_.':error'}) || $code eq ' ' || - $cache->{"$_:$problemID:NoVersion"} eq 'true') { - next; - } - - $studentCount++; - my $tries = $cache->{"$_:$problemID:$part:tries"}; - if($maxTries < $tries) { - $maxTries = $tries; - } - $totalTries += $tries; - push(@studentTries, $tries); - - my $awarded = $cache->{"$_:$problemID:$part:awarded"}; - $totalAwarded += $awarded; - - if($code eq '*') { - $correct++; - if($tries == 1) { - $totalFirst++; - } - } elsif($code eq '+') { - $correctByOverride++; - } - } - - my $studentTriesJoined = join(':::', @studentTries); - $problemData{$id.':sequenceTitle'} = - $cache->{$sequence.':title'}; - $problemData{$id.':studentCount'} = $studentCount; - $problemData{$id.':totalTries'} = $totalTries; - $problemData{$id.':studentTries'} = $studentTriesJoined; - $problemData{$id.':totalAwarded'} = $totalAwarded; - $problemData{$id.':correct'} = $correct; - $problemData{$id.':correctByOverride'} = $correctByOverride; - $problemData{$id.':wrong'} = $studentCount - - ($correct + $correctByOverride); - $problemData{$id.':maxTries'} = $maxTries; - $problemData{$id.':totalFirst'} = $totalFirst; - } - } - } - - my @upperStudents1=(); - my @lowerStudents1=(); - my @upperStudents2=(); - my @lowerStudents2=(); - my $upperCount = int(0.27*scalar(@$students)); - # Discriminant Factor criterion 1 - my $sortedStudents = &SortDivideByTries($students,$cache,':totalAwarded'); - - for(my $i=0; $i<$upperCount; $i++) { - push(@lowerStudents1, $sortedStudents->[$i]); - push(@upperStudents1, $sortedStudents->[(scalar(@$students)-$i-1)]); - } - - $problemData{'studentsUpperListCriterion1'}=join(':::', 
@upperStudents1);
    $problemData{'studentsLowerListCriterion1'}=join(':::', @lowerStudents1);

    # Discriminant Factor criterion 2
    $sortedStudents = &SortDivideByTries($students, $cache, ':totalSolved');

    for(my $i=0; $i<$upperCount; $i++) {
        push(@lowerStudents2, $sortedStudents->[$i]);
        push(@upperStudents2, $sortedStudents->[(scalar(@$students)-$i-1)]);
    }
    $problemData{'studentsUpperListCriterion2'}=join(':::', @upperStudents2);
    $problemData{'studentsLowerListCriterion2'}=join(':::', @lowerStudents2);

    $problemData{'problemList'} = join(':::', @problemList);

    return \%problemData;
}

###############################################
# SortDivideByTries($toSort, $data, $sortOn)
#
# Orders the names in @$toSort ascending by the ratio
#     $data->{$name.$sortOn} / $data->{$name.':totalTries'}
# A name whose ':totalTries' entry is false (0, '' or undef) is given a
# ratio of 0, so there is never a division by zero.
#
# Inputs:  $toSort  reference to an array of names
#          $data    reference to a hash keyed by "$name$suffix"
#          $sortOn  key suffix of the numerator, e.g. ':totalAwarded'
# Returns: reference to a new, sorted array; @$toSort is left untouched.
###############################################
sub SortDivideByTries {
    my ($toSort, $data, $sortOn)=@_;

    # Work out each ratio once rather than on every comparison.
    my %ratio;
    foreach my $name (@$toSort) {
        my $tries = $data->{$name.':totalTries'};
        $ratio{$name} = $tries ? ($data->{$name.$sortOn} / $tries) : 0;
    }

    # Each ratio has to be a complete operand of <=>.  Written inline as
    # "cond ? x : 0 <=> cond ? y : 0", the tighter-binding <=> grabs only
    # the 0, and the sort block yields $a's ratio instead of -1/0/1.
    my @orderedData = sort { $ratio{$a} <=> $ratio{$b} } @$toSort;

    return \@orderedData;
}

###############################################
# SortProblems($problemData, $sortBy, $sortProblems, $ascend)
#
# Returns a reference to the list of problem ids (the ':::'-separated
# $problemData->{'problemList'}) ordered numerically by one statistic.
#
# Inputs:  $problemData   hash reference produced by the statistics code
#          $sortBy        column label; labels not listed in %fieldFor
#                         (including "Homework Sets Order") leave the
#                         list in its stored order
#          $sortProblems  "Sort Within Sequence" sorts each sequence's
#                         problems separately and keeps the sequences in
#                         order of first appearance; any other value
#                         sorts the whole list at once
#          $ascend        'Descending' reverses the final list (with
#                         "Sort Within Sequence" this also reverses the
#                         order of the sequences)
###############################################
sub SortProblems {
    my ($problemData,$sortBy,$sortProblems,$ascend)=@_;

    my @problems = split(':::', $problemData->{'problemList'});

    # Column label => key suffix holding that statistic.
    my %fieldFor = (
        '#Stdnts' => ':studentCount',
        'Tries'   => ':totalTries',
        'Mod'     => ':maxTries',
        'Mean'    => ':mean',
        '#YES'    => ':correct',
        '#yes'    => ':correctByOverride',
        '%Wrng'   => ':percentWrong',
        'DoDiff'  => ':degreeOfDifficulty',
        'S.D.'    => ':standardDeviation',
        'Skew.'   => ':skewness',
        'D.F.1st' => ':discriminationFactor1',
        'D.F.2nd' => ':discriminationFactor2',
    );
    my $data = defined($sortBy) ? $fieldFor{$sortBy} : undef;
    if(!defined($data)) {
        return \@problems;
    }

    my @orderedProblems;
    if($sortProblems eq "Sort Within Sequence") {
        # Group the ids by their leading sequence component, remembering
        # the order in which the sequences were first seen.
        my %problemsIn;
        my @sequenceList;
        foreach my $id (@problems) {
            my ($sequence) = split(':', $id);
            if(!exists($problemsIn{$sequence})) {
                push(@sequenceList, $sequence);
                $problemsIn{$sequence} = [];
            }
            push(@{$problemsIn{$sequence}}, $id);
        }
        foreach my $sequence (@sequenceList) {
            push(@orderedProblems,
                 sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
                 @{$problemsIn{$sequence}});
        }
    } else {
        @orderedProblems =
            sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
            @problems;
    }

    if($ascend eq 'Descending') {
        @orderedProblems = reverse(@orderedProblems);
    }

    return \@orderedProblems;
}

###############################################
# _MeanAwarded($cache, $names, $problem, $part)
#
# Private helper: average of $cache->{"$name:$problem:$part:awarded"}
# over the names in @$names, or 0 when the list is empty.
###############################################
sub _MeanAwarded {
    my ($cache, $names, $problem, $part)=@_;

    my $count = scalar(@$names);
    if(!$count) {
        return 0;
    }

    my $sum = 0;
    foreach my $name (@$names) {
        $sum += $cache->{join(':', $name, $problem, $part, 'awarded')};
    }

    return $sum / $count;
}

###############################################
# CalculateStatistics($data, $cache, $courseID)
#
# For every id in $data->{'problemList'} (ids are
# "sequence:problem:part") derives the following entries from the raw
# counts already in %$data and writes them back into %$data:
#   :mean, :percentWrong, :degreeOfDifficulty, :standardDeviation,
#   :skewness, :discriminationFactor1, :discriminationFactor2
# When at least one student was counted for the problem, a summary
# (timestamp, student count, average tries, difficulty) is also passed
# to Apache::lonnet::put under 'nohist_resevaldata'.
#
# Inputs:  $data      hash reference of per-problem counts (modified)
#          $cache     hash reference holding "$student:..:awarded" and
#                     "$sequence:source" entries
#          $courseID  prefix used in the stored summary keys
# Returns: nothing.
###############################################
sub CalculateStatistics {
    my ($data, $cache, $courseID)=@_;

    # The upper/lower student groups do not depend on the problem, so
    # split them once instead of once per problem.
    my @upper1 = split(':::', $data->{'studentsUpperListCriterion1'});
    my @lower1 = split(':::', $data->{'studentsLowerListCriterion1'});
    my @upper2 = split(':::', $data->{'studentsUpperListCriterion2'});
    my @lower2 = split(':::', $data->{'studentsLowerListCriterion2'});

    foreach my $id (split(':::', $data->{'problemList'})) {
        my ($sequence, $problem, $part) = split(':', $id);
        my $studentCount = $data->{$id.':studentCount'};
        my $totalTries   = $data->{$id.':totalTries'};

        # Mean number of tries per student
        my $mean = $studentCount ? ($totalTries / $studentCount) : 0;
        $data->{$id.':mean'} = sprintf("%.2f", $mean);

        # %Wrong (reported as 100 when no student was counted)
        my $pw = $studentCount ?
            (($data->{$id.':wrong'} / $studentCount) * 100.0) : 100.0;
        $data->{$id.':percentWrong'} = sprintf("%.1f", $pw);

        # Degree of Difficulty: 1 - (solved / total tries)
        my $dod = $totalTries ?
            (1 - (($data->{$id.':correct'} +
                   $data->{$id.':correctByOverride'}) / $totalTries)) : 0;
        $data->{$id.':degreeOfDifficulty'} = sprintf("%.2f", $dod);

        # Second and third powers of each student's deviation from the mean
        my $sumSquared = 0;
        my $sumCubed = 0;
        foreach my $tries (split(':::', $data->{$id.':studentTries'})) {
            my $deviation = $tries - $mean;
            my $squared = $deviation * $deviation;
            $sumSquared += $squared;
            $sumCubed += $squared * $deviation;
        }

        # Standard deviation: the division by (n-1) belongs inside the
        # square root.
        my $standardDeviation = 0.0;
        if($studentCount - 1 > 0) {
            $standardDeviation = sqrt($sumSquared / ($studentCount - 1));
        }
        $data->{$id.':standardDeviation'} =
            sprintf("%.1f", $standardDeviation);

        # Skewness: mean cubed deviation over sd^3.  The numerator is
        # the sum of cubes, not the root of the sum of squares.  Left at
        # 0 when the spread is too small to divide by safely.
        my $skew = 0.0;
        if($standardDeviation > 0.0999 && $studentCount > 0) {
            $skew = ($sumCubed / $studentCount) /
                ($standardDeviation *
                 $standardDeviation *
                 $standardDeviation);
        }
        $data->{$id.':skewness'} = sprintf("%.1f", $skew);

        # Discrimination Factors: mean awarded credit of the upper group
        # minus that of the lower group, for each ranking criterion.
        my $df1 = &_MeanAwarded($cache, \@upper1, $problem, $part) -
                  &_MeanAwarded($cache, \@lower1, $problem, $part);
        $data->{$id.':discriminationFactor1'} = sprintf("%.2f", $df1);

        my $df2 = &_MeanAwarded($cache, \@upper2, $problem, $part) -
                  &_MeanAwarded($cache, \@lower2, $problem, $part);
        $data->{$id.':discriminationFactor2'} = sprintf("%.2f", $df2);

        # Summary handed to Apache::lonnet::put.
        # NOTE(review): the keys are built from the *sequence's* source
        # entry, not the problem's - confirm that this is intended.
        my $source = $cache->{$sequence.':source'};
        my $prefix = $courseID.'___'.$source;
        my %storestats = (
            $prefix.'___timestamp'  => time(),
            $prefix.'___stdno'      => $studentCount,
            $prefix.'___avetries'   => $mean,
            $prefix.'___difficulty' => $data->{$id.':degreeOfDifficulty'},
        );

        # The first two path components of the source are passed on as
        # the remaining arguments of put().  Capture them in list context
        # and skip the call when the pattern does not match, so that
        # captures left over from an earlier match are never reused.
        my @sourceParts = ($source =~ /^(\w+)\/(\w+)/);
        if($studentCount && @sourceParts) {
            &Apache::lonnet::put('nohist_resevaldata',\%storestats,
                                 @sourceParts);
        }
    }

    return;
}

#---- END Problem Statistics Web Page ----------------------------------------
1;