';
+ #
+ $Str .= '';
+ $Str .= ' 'x5;
+ $Str .= 'Plot '.&plot_dropdown().(' 'x10);
+ #
+ return $Str;
+}
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
- return 'Unable to tie database.';
- }
+###############################################
+###############################################
+
+=pod
- my @Header = ("Homework Sets Order","#Stdnts","Tries","Mod",
- "Mean","#YES","#yes","%Wrng","DoDiff",
- "S.D.","Skew.","D.F.1st","D.F.2nd","Disc.");
- my $color=&setbgcolor(0);
+=item &BuildProblemStatisticsPage()
-# my %Discuss=&Apache::loncoursedata::LoadDiscussion($courseID);
-# my ($upper, $lower) = &Discriminant(\%discriminant,$r);
- my ($problemData) = &ExtractStudentData(\%cache, $students);
- &CalculateStatistics($problemData);
- &SortProblems($problemData, $cache{'ProblemStatisticsSort'},
- $cache{'ProblemStatisticsAscend'});
- #$TempCache=
- &BuildStatisticsTable(\%cache, $cache{'DisplayFormat'},
- $problemData, \@Header, $r, $color);
- untie(%cache);
+Main interface to problem statistics.
-# foreach (keys %$TempCache) {
-# last if ($c->aborted());
-# if(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) {
-# $cache{$_}=$TempCache->{$_};
-# untie(%cache);
-# }
-# }
+=cut
-# if($c->aborted()) { return; }
-# untie(%cache);
+###############################################
+###############################################
+sub BuildProblemStatisticsPage {
+ my ($r,$c)=@_;
+ #
+ my %Saveable_Parameters = ('Status' => 'scalar',
+ 'statsoutputmode' => 'scalar',
+ 'Section' => 'array',
+ 'StudentData' => 'array',
+ 'Maps' => 'array',
+ 'fieldselections'=> 'array');
+ &Apache::loncommon::store_course_settings('statistics',
+ \%Saveable_Parameters);
+ &Apache::loncommon::restore_course_settings('statistics',
+ \%Saveable_Parameters);
+ #
+ &Apache::lonstatistics::PrepareClasslist();
+ #
+ # Clear the package variables
+ undef(@StatsArray);
+ undef(%SeqStat);
+ #
+ # Finally let the user know we are here
+ my $interface = &CreateInterface($r);
+ $r->print($interface);
+ $r->print('');
+ #
+ my @CacheButtonHTML =
+ &Apache::lonstathelpers::manage_caches($r,'Statistics','stats_status');
+ my $Str;
+ foreach my $html (@CacheButtonHTML) {
+ $Str.=$html.(' 'x5);
+ }
+ #
+ $r->print($Str);
+ if (! exists($ENV{'form.firstrun'})) {
+ $r->print('
'.
+ &mt('Press "Generate Statistics" when you are ready.').
+ '
'.
+ &mt('It may take some time to update the student data '.
+ 'for the first analysis. Future analysis this session '.
+ ' will not have this delay.').
+ '
');
+ return;
+ }
+ $r->rflush();
+ #
+ # This probably does not need to be done each time we are called, but
+ # it does not slow things down noticeably.
+ &Apache::loncoursedata::populate_weight_table();
+ #
+ if (exists($ENV{'form.Excel'})) {
+ &Excel_output($r);
+ } else {
+ $r->print(''.' 'x5);
+ $r->rflush();
+ my $count = 0;
+ foreach my $seq (&Apache::lonstatistics::Sequences_with_Assess()) {
+ $count += $seq->{'num_assess_parts'};
+ }
+ if ($count > 10) {
+ $r->print('
'.
+ &mt('Compiling statistics for [_1] problems',$count).
+ '
\n";
+ my ($starttime,$endtime) = &Apache::lonstathelpers::get_time_limits();
+ if (defined($starttime) || defined($endtime)) {
+ # Inform the user what the time limits on the data are.
+ $Str .= '
'.&mt('Statistics on submissions from [_1] to [_2]',
+ &Apache::lonlocal::locallocaltime($starttime),
+ &Apache::lonlocal::locallocaltime($endtime)
+ ).'
';
}
- $Str .= "\n".'
'."\n";
-
+ $Str .= "
".&mt('Compiled on [_1]',
+ &Apache::lonlocal::locallocaltime(time))."
";
return $Str;
}
-sub BuildStatisticsTable {
- my ($cache,$displayFormat,$data,$headings,$r,$color)=@_;
-#6666666
-# my $file="/home/httpd/perl/tmp/183d.txt";
-# open(OUT, ">$file");
-#6666666
-## &Apache::lonstatistics::Create_PrgWin($r);
-##777777
-## my (%Activity) = &LoadActivityLog();
-## $r->print('');
-## my ($doDiffFile) = &LoadDoDiffFile();
-
-##777777
-## $Str .= &Classify($discriminantFactor, $students);
-
- my %TempCache;
- my $problems = $data->{'problemList'};
- if($displayFormat ne 'Display CSV Format') {
- $r->print('
'."\n");
- $r->print('
'."\n");
- $r->print(&CreateProblemStatisticsTableHeading($headings, $r));
- } else {
- $r->print(' ');
+###############################################
+###############################################
+##
+## Misc HTML output routines
+##
+###############################################
+###############################################
+sub statistics_html_table_data {
+ my ($data,$options) = @_;
+ my $row = '';
+ foreach my $field (@Fields) {
+ next if ($options =~ /no $field->{'name'}/);
+ next if ($field->{'selected'} ne 'yes');
+ $row .= '
Total number of students attempted the problem.';
- $Ptr .= '
';
- $Ptr .= 'Tries
';
- $Ptr .= '
Total number of tries for solving the problem.';
- $Ptr .= '
';
- $Ptr .= 'Mod
';
- $Ptr .= '
Largest number of tries for solving the problem by a student.';
- $Ptr .= '
';
- $Ptr .= 'Mean
';
- $Ptr .= '
Average number of tries. [ Tries / #Stdnts ]';
- $Ptr .= '
';
- $Ptr .= '#YES
';
- $Ptr .= '
Number of students solved the problem correctly.';
- $Ptr .= '
';
- $Ptr .= '#yes
';
- $Ptr .= '
Number of students solved the problem by override.';
- $Ptr .= '
';
- $Ptr .= '%Wrong
';
- $Ptr .= '
Percentage of students who tried to solve the problem ';
- $Ptr .= 'but is still incorrect. [ 100*((#Stdnts-(#YES+#yes))/#Stdnts) ]';
- $Ptr .= '
';
- $Ptr .= 'DoDiff
';
- $Ptr .= '
Degree of Difficulty of the problem. ';
- $Ptr .= '[ 1 - ((#YES+#yes) / Tries) ]';
- $Ptr .= '
';
- $Ptr .= 'S.D.
';
- $Ptr .= '
Standard Deviation of the tries. ';
- $Ptr .= '[ sqrt(sum((Xi - Mean)^2)) / (#Stdnts-1) ';
- $Ptr .= 'where Xi denotes every student\'s tries ]';
- $Ptr .= '
';
- $Ptr .= 'Skew.
';
- $Ptr .= '
Skewness of the students tries.';
- $Ptr .= '[(sqrt( sum((Xi - Mean)^3) / #Stdnts)) / (S.D.^3)]';
- $Ptr .= '
';
- $Ptr .= 'Dis.F.
';
- $Ptr .= '
Discrimination Factor: A Standard for evaluating the ';
- $Ptr .= 'problem according to a Criterion ';
- $Ptr .= '[Applied Criterion in %27 Upper Students - ';
- $Ptr .= 'Applied the same Criterion in %27 Lower Students] ';
- $Ptr .= '1st Criterion for Sorting the Students: ';
- $Ptr .= 'Sum of Partial Credit Awarded / Total Number of Tries ';
- $Ptr .= '2nd Criterion for Sorting the Students: ';
- $Ptr .= 'Total number of Correct Answers / Total Number of Tries';
- $Ptr .= '
';
- $Ptr .= '
Disc.
';
- $Ptr .= '
Number of Students had at least one discussion.';
- $Ptr .= '
';
-
- return $Ptr;
-}
-
-#------- Processing upperlist and lowerlist according to each problem
-
-sub ExtractStudentData {
- my ($cache, $students)=@_;
-
-#$Apache::lonxml::debug=1;
-#&Apache::lonhomework::showhash(%$cache);
-#$Apache::lonxml::debug=0;
-
- my @problemList=();
- my %problemData;
- foreach my $sequence (split(':', $cache->{'orderedSequences'})) {
- if($cache->{'ProblemStatisticsMaps'} ne 'All Maps' &&
- $cache->{'ProblemStatisticsMaps'} ne $cache->{$sequence.':title'}) {
+sub plot_dropdown { # Returns the string used for the "Plot" selector in the interface.
+ my $current = ''; # value of the submitted 'plot' form field, '' when none was sent
+ # Pick up the submitted plot choice, if there is one.
+ if (defined($ENV{'form.plot'})) {
+ $current = $ENV{'form.plot'};
+ }
+ # Plot choices described by graphable/name/title entries.
+ my @Additional_Plots = (
+ { graphable=>'yes',
+ name => 'degrees',
+ title => 'Difficulty Indexes' },
+ { graphable=>'yes',
+ name => 'tries statistics',
+ title => 'Tries Statistics' });
+ # NOTE(review): as visible here neither $current nor @Additional_Plots is used and the string below holds only newlines; the selector markup looks lost - confirm against upstream.
+ my $Str= "\n".''."\n";
+ return $Str;
+}
- foreach my $problemID (split(':', $cache->{$sequence.':problems'})) {
- foreach my $part (split(/\:/,$cache->{$sequence.':'.
- $problemID.
- ':parts'})) {
- my $id = $sequence.':'.$problemID.':'.$part;
- push(@problemList, $id);
- my $totalTries = 0;
- my $totalAwarded = 0;
- my $correct = 0;
- my $correctByOverride = 0;
- my $studentCount = 0;
- my $maxTries = 0;
- my $totalFirst = 0;
- my @studentTries=();
- foreach(@$students) {
- my $code = $cache->{"$_:$problemID:$part:code"};
-
- if(defined($cache->{$_.':error'}) || $code eq ' ' ||
- $cache->{"$_:$problemID:NoVersion"} eq 'true') {
- next;
- }
+###############################################
+###############################################
+##
+## Excel output routines
+##
+###############################################
+###############################################
+##
+## &Excel_output($r)
+##
+## Computes all statistics (via &compute_all_statistics) and writes them to
+## a new Excel workbook below /home/httpd/prtspool: first a header row
+## (course description, sections, time limits, compile date), then the
+## per-sequence statistics, then the per-problem statistics.
+##
+## Inputs: $r, the request object (used for output, logging and the
+##         connection check).
+##
+## Returns: 0 if the workbook could not be created; nothing otherwise
+##          (including when the connection was aborted).
+##
+sub Excel_output {
+    my ($r) = @_;
+    $r->print('
'.&mt('Preparing Excel Spreadsheet').'
');
+    ##
+    ## Compute the statistics
+    &compute_all_statistics($r);
+    my $c = $r->connection;
+    return if ($c->aborted());
+    ##
+    ## Create the excel workbook
+    my $filename = '/prtspool/'.
+        $ENV{'user.name'}.'_'.$ENV{'user.domain'}.'_'.
+        time.'_'.rand(1000000000).'.xls';
+    my ($starttime,$endtime) = &Apache::lonstathelpers::get_time_limits();
+    #
+    # Create sheet
+    my $excel_workbook = Spreadsheet::WriteExcel->new('/home/httpd'.$filename);
+    #
+    # Check for errors
+    if (! defined($excel_workbook)) {
+        $r->log_error("Error creating excel spreadsheet $filename: $!");
+        $r->print(&mt("Problems creating new Excel file. ".
+                      "This error has been logged. ".
+                      "Please alert your LON-CAPA administrator."));
+        return 0;
+    }
+    #
+    # The excel spreadsheet stores temporary data in files, then put them
+    # together. If needed we should be able to disable this (memory only).
+    # The temporary directory must be specified before calling 'addworksheet'.
+    # File::Temp is used to determine the temporary directory.
+    $excel_workbook->set_tempdir($Apache::lonnet::tmpdir);
+    #
+    # Add a worksheet.  The sheet name is cut to 31 characters before it
+    # is cleaned up and handed to the workbook.
+    my $sheetname = $ENV{'course.'.$ENV{'request.course.id'}.'.description'};
+    if (length($sheetname) > 31) {
+        $sheetname = substr($sheetname,0,31);
+    }
+    my $excel_sheet = $excel_workbook->addworksheet(
+        &Apache::loncommon::clean_excel_name($sheetname));
+    #
+    my $format = &Apache::loncommon::define_excel_formats($excel_workbook);
+    ##
+    ## Begin creating excel sheet
+    ##
+    my ($rows_output,$cols_output) = (0,0);
+    #
+    # Put the course description in the header
+    $excel_sheet->write($rows_output,$cols_output++,
+                        $ENV{'course.'.$ENV{'request.course.id'}.'.description'},
+                        $format->{'h1'});
+    $cols_output += 3;
+    #
+    # Put a description of the sections listed
+    $excel_sheet->write($rows_output,$cols_output++,
+                        &Apache::lonstathelpers::sections_description
+                        (@Apache::lonstatistics::SelectedSections),
+                        $format->{'h3'});
+    $cols_output += scalar(@Apache::lonstatistics::SelectedSections);
+    #
+    # Time restrictions
+    my $time_string;
+    if (defined($starttime)) {
+        # call localtime but not lonlocal:locallocaltime because excel probably
+        # cannot handle localized text.  Probably.
+        # The start of the range is $starttime; formatting the (still
+        # undefined) $time_string here would always print the epoch.
+        $time_string .= 'Data collected from '.localtime($starttime);
+        if (defined($endtime)) {
+            $time_string .= ' to '.localtime($endtime);
+        }
+        $time_string .= '.';
+    } elsif (defined($endtime)) {
+        # See note above about lonlocal:locallocaltime
+        $time_string .= 'Data collected before '.localtime($endtime).'.';
+    }
+    if (defined($time_string)) {
+        $excel_sheet->write($rows_output,$cols_output++,$time_string);
+        $cols_output+= 5;
+    }
+    #
+    # Put the date in there too
+    $excel_sheet->write($rows_output,$cols_output++,
+                        'Compiled on '.localtime(time));
+    #
+    $rows_output++;
+    $cols_output=0;
+    ##
+    ## Sequence Statistics
+    ##
+    &write_headers($excel_sheet,$format,\$rows_output,\$cols_output,
+                   \@SeqFields);
+    foreach my $seq (&Apache::lonstatistics::Sequences_with_Assess()) {
+        next if ($seq->{'num_assess'} < 1);
+        my $data = $SeqStat{$seq->{'symb'}};
+        $cols_output=0;
+        foreach my $field (@SeqFields) {
+            next if ($field->{'selected'} ne 'yes');
+            my $fieldformat = undef;
+            if (exists($field->{'excel_format'})) {
+                $fieldformat = $format->{$field->{'excel_format'}};
+            }
+            $excel_sheet->write($rows_output,$cols_output++,
+                                $data->{$field->{'name'}},$fieldformat);
+        }
+        $rows_output++;
+        $cols_output=0;
+    }
+    ##
+    ## Resource Statistics
+    ##
+    $rows_output++;
+    $cols_output=0;
+    &write_headers($excel_sheet,$format,\$rows_output,\$cols_output,
+                   \@Fields);
+    #
+    foreach my $data (@StatsArray) {
+        $cols_output=0;
+        foreach my $field (@Fields) {
+            next if ($field->{'selected'} ne 'yes');
+            # problem_num gets no column, matching &write_headers
+            next if ($field->{'name'} eq 'problem_num');
+            my $fieldformat = undef;
+            if (exists($field->{'excel_format'})) {
+                $fieldformat = $format->{$field->{'excel_format'}};
+            }
+            $excel_sheet->write($rows_output,$cols_output++,
+                                $data->{$field->{'name'}},$fieldformat);
+        }
+        $rows_output++;
+        $cols_output=0;
+    }
+    #
+    $excel_workbook->close();
+    #
+    # Tell the user where to get their excel file
+    $r->print(' '.
+              ''.
+              &mt('Your Excel Spreadsheet').''."\n");
+    $r->rflush();
+    return;
+}
- $studentCount++;
- my $tries = $cache->{"$_:$problemID:$part:tries"};
- if($maxTries < $tries) {
- $maxTries = $tries;
- }
- $totalTries += $tries;
- push(@studentTries, $tries);
+##
+## &write_headers($excel_sheet,$format,$rows_output,$cols_output,$Fields)
+##
+## Writes two header rows to $excel_sheet: the long titles (an empty cell
+## where a field has none) and then the short titles, both in bold.
+## $rows_output and $cols_output are references to the caller's cursor;
+## on return the row has advanced by two and the column is back at 0.
+## Only fields marked selected are written and 'problem_num' is left out.
+##
+sub write_headers {
+    my ($excel_sheet,$format,$rows_output,$cols_output,$Fields) = @_;
+    #
+    # The columns that actually appear in the sheet
+    my @shown = grep {
+        $_->{'selected'} eq 'yes' && $_->{'name'} ne 'problem_num'
+    } @{$Fields};
+    ##
+    ## First the long titles
+    for my $column (@shown) {
+        my @cell = exists($column->{'long_title'})
+            ? ($column->{'long_title'},$format->{'bold'})
+            : ('');
+        $excel_sheet->write(${$rows_output},${$cols_output},@cell);
+        ${$cols_output} += 1;
+    }
+    ${$cols_output} = 0;
+    ${$rows_output} += 1;
+    ##
+    ## Then the short titles
+    for my $column (@shown) {
+        # Use english for excel as I am not sure how well excel handles
+        # other character sets....
+        $excel_sheet->write(${$rows_output},${$cols_output},
+                            $column->{'title'},$format->{'bold'});
+        ${$cols_output} += 1;
+    }
+    ${$cols_output} = 0;
+    ${$rows_output} += 1;
+    return;
+}
- my $awarded = $cache->{"$_:$problemID:$part:awarded"};
- $totalAwarded += $awarded;
+##################################################
+##################################################
+##
+## Statistics Gathering and Manipulation Routines
+##
+##################################################
+##################################################
+##
+## &compute_statistics_on_sequence($seq)
+##
+## Calls &get_statistics for every part of every assessment resource in
+## $seq->{'contents'}, skipping parts flagged as 'Survey'.  Each result is
+## appended to the package array @StatsArray and also returned as a list.
+##
+sub compute_statistics_on_sequence {
+    my ($seq) = @_;
+    my @collected;
+    my @assessments =
+        grep { $_->{'type'} eq 'assessment' } @{$seq->{'contents'}};
+    for my $resource (@assessments) {
+        for my $partid (@{$resource->{'parts'}}) {
+            unless ($resource->{'partdata'}->{$partid}->{'Survey'}) {
+                #
+                # This is where all the work happens.  The problem number
+                # is the 1-based position the entry will have in @StatsArray.
+                my $position = scalar(@StatsArray)+1;
+                my $stats = &get_statistics($seq,$resource,$partid,$position);
+                push(@collected,$stats);
+                push(@StatsArray,$stats);
+            }
+        }
+    }
+    return @collected;
+}
- if($code eq '*') {
- $correct++;
- if($tries == 1) {
- $totalFirst++;
- }
- } elsif($code eq '+') {
- $correctByOverride++;
+##
+## &compute_all_statistics($r)
+##
+## Fills %SeqStat and @StatsArray for every sequence that has at least one
+## assessment.  Does nothing when @StatsArray already holds data, and stops
+## early once the connection of $r reports it was aborted.
+##
+sub compute_all_statistics {
+    my ($r) = @_;
+    # Anything already in @StatsArray is assumed to be complete
+    return if (scalar(@StatsArray) > 0);
+    my $connection = $r->connection;
+    for my $sequence (&Apache::lonstatistics::Sequences_with_Assess()) {
+        if ($connection->aborted) {
+            last;
+        }
+        unless ($sequence->{'num_assess'} < 1) {
+            &compute_sequence_statistics($sequence);
+            &compute_statistics_on_sequence($sequence);
+        }
+    }
+}
+
+##
+## &sort_data($sortkey)
+##
+## Sorts the package array @StatsArray in place and renumbers the entries.
+##
+## Inputs: $sortkey, the name of one of the entries in @Fields.  An
+##         unknown or empty key, or 'problem_num', selects 'container',
+##         which leaves the current order untouched.
+##
+## 'title' and 'part' are sorted alphabetically (case-insensitive,
+## ascending).  Every other field is sorted numerically in descending
+## order, with 'nan' values placed last.  Ties are broken by title and
+## then by part, compared as text.
+##
+## Returns: nothing.  Each entry's 'problem_num' is set to its new
+##          1-based position.
+##
+sub sort_data {
+    my ($sortkey) = @_;
+    return if (! @StatsArray);
+    #
+    # Sort the data
+    my $sortby = undef;
+    foreach my $field (@Fields) {
+        if ($sortkey eq $field->{'name'}) {
+            $sortby = $field->{'name'};
+        }
+    }
+    if (! defined($sortby) || $sortby eq '' || $sortby eq 'problem_num') {
+        $sortby = 'container';
+    }
+    if ($sortby ne 'container') {
+        # $sortby is already defined, so we can charge ahead
+        if ($sortby =~ /^(title|part)$/i) {
+            # Alpha comparison
+            @StatsArray = sort {
+                lc($a->{$sortby}) cmp lc($b->{$sortby}) ||
+                    lc($a->{'title'}) cmp lc($b->{'title'}) ||
+                    lc($a->{'part'}) cmp lc($b->{'part'});
+            } @StatsArray;
+        } else {
+            # Numerical comparison
+            @StatsArray = sort {
+                my $retvalue = 0;
+                if ($b->{$sortby} eq 'nan') {
+                    if ($a->{$sortby} ne 'nan') {
+                        $retvalue = -1;
+                    } else {
+                        $retvalue = 0;
                    }
                }
-
- $problemData{$id.':sequenceTitle'} =
- $cache->{$sequence.':title'};
- $problemData{$id.':studentCount'} = $studentCount;
- $problemData{$id.':totalTries'} = $totalTries;
- $problemData{$id.':studentTries'} = \@studentTries;
- $problemData{$id.':totalAwarded'} = $totalAwarded;
- $problemData{$id.':correct'} = $correct;
- $problemData{$id.':correctByOverride'} = $correctByOverride;
- $problemData{$id.':wrong'} = $studentCount -
- ($correct + $correctByOverride);
- $problemData{$id.':maxTries'} = $maxTries;
- $problemData{$id.':totalFirst'} = $totalFirst;
- }
+                if ($a->{$sortby} eq 'nan') {
+                    if ($b->{$sortby} ne 'nan') {
+                        $retvalue = 1;
+                    }
+                }
+                if ($retvalue == 0) {
+                    # Titles and parts are text: they must be compared
+                    # with cmp.  The numeric <=> turns ordinary text
+                    # into 0 and so never breaks a tie.
+                    $retvalue = $b->{$sortby} <=> $a->{$sortby} ||
+                        lc($a->{'title'}) cmp lc($b->{'title'}) ||
+                        lc($a->{'part'}) cmp lc($b->{'part'});
+                }
+                $retvalue;
+            } @StatsArray;
        }
    }
+    #
+    # Renumber the data set
+    my $count = 0;
+    foreach my $data (@StatsArray) {
+        $data->{'problem_num'} = ++$count;
+    }
+    return;
+}
+
+########################################################
+########################################################
+
+=pod
+
+=item &get_statistics()
- $problemData{'problemList'} = \@problemList;
-# $Discussed=0;
-# if($Discuss->{"$name:$problem"}) {
-# $TotDiscuss++;
-# $Discussed=1;
-# }
+Wrapper routine for the call to loncoursedata::get_problem_statistics.
+Calls lonstathelpers::get_time_limits() to limit the data set by time
+and, when that field is selected, &compute_discrimination_factor.
- return \%problemData;
+Inputs: $sequence, $resource, $part, $problem_num
+
+Returns: Hash reference with statistics data from
+loncoursedata::get_problem_statistics.
+
+=cut
+
+########################################################
+########################################################
+sub get_statistics {
+    my ($sequence,$resource,$part,$problem_num) = @_;
+    #
+    # Fetch the statistics for this part, limited to the selected
+    # sections, enrollment status and time window.
+    my ($starttime,$endtime) = &Apache::lonstathelpers::get_time_limits();
+    my $symb = $resource->{'symb'};
+    my $courseid = $ENV{'request.course.id'};
+    #
+    my $data = &Apache::loncoursedata::get_problem_statistics
+        (\@Apache::lonstatistics::SelectedSections,
+         $Apache::lonstatistics::enrollment_status,
+         $symb,$part,$courseid,$starttime,$endtime);
+    #
+    # Add the identifying information used for display and sorting
+    $data->{'symb'} = $symb;
+    $data->{'part'} = $part;
+    $data->{'problem_num'} = $problem_num;
+    $data->{'container'} = $sequence->{'title'};
+    $data->{'title'} = $resource->{'title'};
+    $data->{'title.link'} = $resource->{'src'}.'?symb='.
+        &Apache::lonnet::escape($resource->{'symb'});
+    #
+    # The discrimination factor is only computed when that field is selected
+    if ($SelectedFields{'deg_of_disc'}) {
+        $data->{'deg_of_disc'} =
+            &compute_discrimination_factor($resource,$part,$sequence);
+    }
+    #
+    # Store in metadata when more than one student contributed data
+    if ($data->{'num_students'} > 1) {
+        my @Sections = @Apache::lonstatistics::SelectedSections;
+        my $sections = '"'.join(' ',@Sections).'"';
+        $sections =~ s/&+/_/g; # Ensure no special characters
+        $data->{'sections'}=$sections;
+        $data->{'course'} = $ENV{'request.course.id'};
+        my $urlres=(&Apache::lonnet::decode_symb($resource->{'symb'}))[2];
+        $data->{'urlres'}=$urlres;
+        my %storestats =
+            &LONCAPA::lonmetadata::dynamic_metadata_storage($data);
+        #
+        # The owner of the resource is taken from the first two path
+        # components of its URL.  If they cannot be parsed, skip the
+        # store instead of calling put with an undefined domain and user.
+        my ($dom,$user);
+        if (defined($urlres)) {
+            ($dom,$user) = $urlres=~/^(\w+)\/(\w+)/;
+        }
+        if (defined($dom) && defined($user)) {
+            &Apache::lonnet::put('nohist_resevaldata',\%storestats,
+                                 $dom,$user);
+        }
+    }
+    #
+    # Get the due date for research purposes (commented out most of the time)
+#    $data->{'duedate'} =
+#        &Apache::lonnet::EXT('resource.'.$part.'.duedate',$symb);
+#    $data->{'opendate'} =
+#        &Apache::lonnet::EXT('resource.'.$part.'.opendate',$symb);
+#    $data->{'resptypes'} = join(',',@{$resource->{'partdata'}->{$part}->{'ResponseTypes'}});
+    return $data;
}
-sub SortProblems {
- my ($problemData,$sortBy,$ascend)=@_;
+###############################################
+###############################################
- if($sortBy eq "Homework Sets Order") {
- return;
- }
+=pod
+
+=item &compute_discrimination_factor()
+
+Inputs: $resource, $part, $sequence
- my $data;
+Returns: a number between -1 and 1, or 'nan' when it cannot be computed
+
+=cut
- if ($sortBy eq "#Stdnts") { $data = ':studentCount'; }
- elsif($sortBy eq "Tries") { $data = ':totalTries'; }
- elsif($sortBy eq "Mod") { $data = ':maxTries'; }
- elsif($sortBy eq "Mean") { $data = ':mean'; }
- elsif($sortBy eq "#YES") { $data = ':correct'; }
- elsif($sortBy eq "#yes") { $data = ':correctByOverride'; }
- elsif($sortBy eq "%Wrng") { $data = ':percentWrong'; }
- elsif($sortBy eq "DoDiff") { $data = ':degreeOfDifficulty'; }
- elsif($sortBy eq "S.D.") { $data = ':standardDeviation'; }
- elsif($sortBy eq "Skew.") { $data = ':skewness'; }
- elsif($sortBy eq "D.F.1st") { $data = ':discriminantFactor1'; }
- elsif($sortBy eq "D.F.2nd") { $data = ':discriminantFactor2'; }
- elsif($sortBy eq "Disc.") { $data = ''; }
- else { return; }
-
- my $problems = $problemData->{'problemList'};
- my @orderedProblems =
- sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
- @$problems;
- if($ascend eq 'Descending') {
- @orderedProblems = reverse(@orderedProblems);
- }
-
- $problemData->{'problemList'} = \@orderedProblems;
-
- return;
-}
-
-sub CalculateStatistics {
- my ($data)=@_;
-
- my $problems = $data->{'problemList'};
- foreach(@$problems) {
- # Mean
- $data->{$_.':mean'} = ($data->{$_.':studentCount'}) ?
- ($data->{$_.':totalTries'} / $data->{$_.':studentCount'}) : 0;
-
- # %Wrong
- $data->{$_.':percentWrong'} = ($data->{$_.':studentCount'}) ?
- (($data->{$_.':wrong'} / $data->{$_.':studentCount'}) * 100.0) :
- 100.0;
-
- # Degree of Difficulty
- $data->{$_.':degreeOfDifficulty'} = ($data->{$_.':totalTries'}) ?
- (1 - (($data->{$_.':correct'} + $data->{$_.':correctByOverride'}) /
- $data->{$_.':totalTries'})) : 0;
-
- # Factor in mean
- my $studentTries = $data->{$_.':studentTries'};
- foreach(my $index=0; $index < scalar(@$studentTries); $index++) {
- $studentTries->[$index] -= $data->{$_.':mean'};
- }
- my $sumSquared = 0;
- my $sumCubed = 0;
- foreach(@$studentTries) {
- my $squared = ($_ * $_);
- my $cubed = ($squared * $_);
- $sumSquared += $squared;
- $sumCubed += $cubed;
- }
-
- # Standard deviation
- $data->{$_.':standardDeviation'} = ($data->{$_.':studentCount'} - 1) ?
- ((sqrt($sumSquared)) / ($data->{$_.':studentCount'} - 1)) : 0;
-
- # Skewness
- my $standardDeviation = $data->{$_.':standardDeviation'};
- $data->{$_.':skewness'} = ($data->{$_.':standardDeviation'}) ?
- (((sqrt($sumSquared)) / $data->{$_.':studentCount'}) /
- ($standardDeviation * $standardDeviation * $standardDeviation)) :
- 0;
-
- # Discrimination Factor 1
- $data->{$_.':discriminationFactor1'} = 0;
-
- # Discrimination Factor 2
- $data->{$_.':discriminationFactor2'} = 0;
+###############################################
+###############################################
+sub compute_discrimination_factor {
+    my ($resource,$part,$sequence) = @_;
+    #
+    # Students are ranked on every other resource in the sequence; the
+    # resource under study is left out.
+    my @Resources;
+    foreach my $res (@{$sequence->{'contents'}}) {
+        next if ($res->{'symb'} eq $resource->{'symb'});
+        push (@Resources,$res->{'symb'});
+    }
+    #
+    # rank
+    my ($starttime,$endtime) = &Apache::lonstathelpers::get_time_limits();
+    my $ranking =
+        &Apache::loncoursedata::rank_students_by_scores_on_resources
+        (\@Resources,
+         \@Apache::lonstatistics::SelectedSections,
+         $Apache::lonstatistics::enrollment_status,undef,
+         $starttime,$endtime);
+    #
+    # compute their percent scores on the problems in the sequence,
+    my $num_students = scalar(@{$ranking});
+    my $number_to_grab = int($num_students/4);
+    #
+    # With fewer than four ranked students no group can be formed, so
+    # there is nothing to compare.
+    if ($number_to_grab < 1) {
+        return 'nan';
+    }
+    #
+    # Both groups hold exactly $number_to_grab students.  The bottom
+    # slice must stop at $number_to_grab-1: running to $number_to_grab
+    # takes one student more than the top group gets.
+    # NOTE(review): assumes the ranking lists the lowest scores first,
+    # as the BottomSet/TopSet names suggest - confirm.
+    my @BottomSet = map { $_->[&Apache::loncoursedata::RNK_student()];
+                      } @{$ranking}[0..($number_to_grab-1)];
+    my @TopSet =
+        map {
+            $_->[&Apache::loncoursedata::RNK_student()];
+        } @{$ranking}[($num_students-$number_to_grab)..($num_students-1)];
+    my ($bottom_sum,$bottom_max) =
+        &Apache::loncoursedata::get_sum_of_scores($resource,$part,\@BottomSet,
+                                                  undef,$starttime,$endtime);
+    my ($top_sum,$top_max) =
+        &Apache::loncoursedata::get_sum_of_scores($resource,$part,\@TopSet,
+                                                  undef,$starttime,$endtime);
+    #
+    # Difference between the fraction of the maximum earned by the top
+    # group and by the bottom group; 'nan' when either maximum is zero.
+    my $deg_of_disc;
+    if ($top_max == 0 || $bottom_max==0) {
+        $deg_of_disc = 'nan';
+    } else {
+        $deg_of_disc = ($top_sum/$top_max) - ($bottom_sum/$bottom_max);
    }
+    #&Apache::lonnet::logthis(' '.$top_sum.'/'.$top_max.
+    #                         ' - '.$bottom_sum.'/'.$bottom_max);
+    return $deg_of_disc;
+}
+###############################################
+###############################################
+##
+## Compute KR-21
+##
+## To compute KR-21, you need the following information:
+##
+## K=the number of items in your test
+## M=the mean score on the test
+## s=the standard deviation of the scores on your test
+##
+## then:
+##
+## KR-21 rk= [K/(K-1)] * [1- (M*(K-M))/(K*s^2))]
+##
+###############################################
+###############################################
+sub compute_sequence_statistics {
+    my ($seq) = @_;
+    my $symb = $seq->{'symb'};
+    #
+    # Symbs of the assessment resources contained in this sequence
+    my @Resources = map  { $_->{'symb'} }
+                    grep { $_->{'type'} eq 'assessment' }
+                    @{$seq->{'contents'}};
+    my ($starttime,$endtime) = &Apache::lonstathelpers::get_time_limits();
+    #
+    # Both queries below take the same argument list
+    my @query = (\@Apache::lonstatistics::SelectedSections,
+                 $Apache::lonstatistics::enrollment_status,
+                 \@Resources,$starttime,$endtime,undef);
+    #
+    # First compute statistics based on student scores
+    my ($score_min,$score_max,$score_mean,$score_std,$score_count,
+        $max_possible) = &Apache::loncoursedata::score_stats(@query);
+    $SeqStat{$symb}->{'title'} = $seq->{'title'};
+    @{$SeqStat{$symb}}{'scoremax','scoremin','scoremean',
+                       'scorestd','scorecount','max_possible'} =
+        ($score_max,$score_min,$score_mean,
+         $score_std,$score_count,$max_possible);
+    #
+    # Compute statistics based on the number of correct problems
+    my ($count_min,$count_max,$count_mean,$count_std,$count_total) =
+        &Apache::loncoursedata::count_stats(@query);
+    #
+    # KR-21 needs more than one item and a non-zero standard deviation;
+    # otherwise it is reported as 'nan'.
+    my $items = $seq->{'num_assess_parts'};
+    my $kr_21 = ($items > 1 && $count_std > 0)
+        ? ($items/($items-1)) *
+              (1 - $count_mean*($items-$count_mean)/($items*$count_std**2))
+        : 'nan';
+    @{$SeqStat{$symb}}{'countmax','countmin','countstd',
+                       'countmean','count','items','KR-21'} =
+        ($count_max,$count_min,$count_std,
+         $count_mean,$count_total,$items,$kr_21);
    return;
}
-sub ProcessDiscriminant {
- my ($List) = @_;
- my @sortedList = sort (@$List);
- my $Count = scalar @sortedList;
- my $Problem;
- my @Dis;
- my $Slvd=0;
- my $tmp;
- my $Sum1=0;
- my $Sum2=0;
- my $nIndex=0;
- my $nStudent=0;
- my %Proc=undef;
- while ($nIndex<$Count) {
-# $jr->print(" $nIndex) $sortedList[$nIndex]");
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- my $Temp = $Problem;
- do {
- $nIndex++;
- $nStudent++;
- $Sum1 += $Dis[0];
- $Sum2 += $Dis[1];
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- } while ( $Problem eq $Temp && $nIndex < $Count );
- $Proc{$Temp}=($Sum1/$nStudent).':'.($Sum2/$nStudent);
-# $jr->print(" $nIndex) $Temp --> ($nStudent) $Proc{$Temp}");
- $Sum1=0;
- $Sum2=0;
- $nStudent=0;
- }
-
- return %Proc;
-}
-
-#------- Creating Discimination factor
-sub Discriminant {
- my ($discriminant)=@_;
- my @discriminantKeys=keys(%$discriminant);
- my $Count = scalar @discriminantKeys;
-
- my $UpCnt = int(0.27*$Count);
- my $low=0;
- my $up=$Count-$UpCnt;
- my @UpList=();
- my @LowList=();
-
- $Count=0;
- foreach my $key (sort(@discriminantKeys)) {
- $Count++;
- if($low < $UpCnt || $Count > $up) {
- $low++;
- my $str=$discriminant->{$key};
- foreach(split(/\&/,$str)){
- if($_) {
- if($low<$UpCnt) { push(@LowList,$_); }
- else { push(@UpList,$_); }
- }
- }
- }
- }
- my %DisUp = &ProcessDiscriminant(\@UpList);
- my %DisLow = &ProcessDiscriminant(\@LowList);
- return (\%DisUp, \%DisLow);
-}
-#---- END Problem Statistics Web Page ----------------------------------------
+=pod
-#---- Problem Statistics Graph Web Page --------------------------------------
+=item ProblemStatisticsLegend
-# ------------------------------------------- Prepare data for Graphical chart
+=over 4
-sub BuildGraphicChart {
- my ($ylab,$r,$cacheDB)=@_;
- my %cache;
- my $Col;
- my $data='';
- my $count = 0;
- my $Max = 0;
+=item #Stdnts
+Total number of students who attempted the problem.
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
- return 'Unable to tie database.';
- }
-
- my $p_count = $cache{'ProblemCount'};
+=item Tries
+Total number of tries for solving the problem.
- for ( my $k=0; $k<$p_count;$k++) {
- my @Temp=split(/\:/,$cache{'GraphGif:'.$k});
- my $inf = $Temp[$Col];
- if ( $Max < $inf ) {$Max = $inf;}
- $data .= $inf.',';
- $count++;
- }
- untie(%cache);
-# $r->print(" count=$p_count >>data= $data");
+=item Max Tries
+Largest number of tries for solving the problem by a student.
- if ( $Max > 1 ) {
- $Max += (10 - $Max % 10);
- $Max = int($Max);
- } else { $Max = 1; }
+=item Mean
+Average number of tries. [ Tries / #Stdnts ]
- my $cid=$ENV{'request.course.id'};
+=item #YES
+Number of students who solved the problem correctly.
- if ( $ylab eq 'DoDiff Graph' ) {
- $ylab = 'Degree-of-Difficulty';
- $Col = 0;
- } else {
- $ylab = 'Wrong-Percentage';
- $Col = 1;
- }
- my $Course = $ENV{'course.'.$cid.'.description'};
- $Course =~ s/\ /"_"/eg;
- my $GData=$Course.'&'.'Problems#'.'&'.$ylab.'&'.
- $Max.'&'.$count.'&'.$data;
+=item #yes
+Number of students who solved the problem by override.
- $r->print('');
+=item %Wrong
+Percentage of students who tried to solve the problem
+but are still incorrect. [ 100*((#Stdnts-(#YES+#yes))/#Stdnts) ]
- return;
-}
+=item DoDiff
+Degree of Difficulty of the problem.
+[ 1 - ((#YES+#yes) / Tries) ]
+
+=item S.D.
+Standard Deviation of the tries.
+[ sqrt(sum((Xi - Mean)^2)) / (#Stdnts-1)
+where Xi denotes each student's tries ]
+
+=item Skew.
+Skewness of the students' tries.
+[(sqrt( sum((Xi - Mean)^3) / #Stdnts)) / (S.D.^3)]
+
+=item Dis.F.
+Discrimination Factor: A Standard for evaluating the
+problem according to a Criterion
+
+=item [Criterion to group students into the upper 27% of students
+and the lower 27% of students]
+1st Criterion for Sorting the Students:
+Sum of Partial Credit Awarded / Total Number of Tries
+2nd Criterion for Sorting the Students:
+Total number of Correct Answers / Total Number of Tries
+
+=item Disc.
+Number of students who had at least one discussion.
+
+=back
+
+=cut
+
+############################################################
+############################################################
1;
__END__