--- loncom/interface/statistics/lonproblemstatistics.pm 2002/08/06 02:07:19 1.15
+++ loncom/interface/statistics/lonproblemstatistics.pm 2002/10/30 18:37:00 1.34
@@ -1,7 +1,7 @@
# The LearningOnline Network with CAPA
# (Publication Handler
#
-# $Id: lonproblemstatistics.pm,v 1.15 2002/08/06 02:07:19 minaeibi Exp $
+# $Id: lonproblemstatistics.pm,v 1.34 2002/10/30 18:37:00 minaeibi Exp $
#
# Copyright Michigan State University Board of Trustees
#
@@ -43,687 +43,415 @@ use Apache::lonhtmlcommon;
use Apache::loncoursedata;
use GDBM_File;
+my $jr;
-sub BuildProblemStatisticsPage {
+sub InitializeProblemStatistics {
my ($cacheDB, $students, $courseID, $c, $r)=@_;
my %cache;
- #my %DoDiff;
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER,0640)) {
- return '
Unable to tie database.';
+
+ $jr = $r;
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
+ $r->print('Unable to tie database1.');
+ return ('ERROR', undef);
+ }
+
+ # Remove students who don't have the proper section.
+ my @sectionsSelected = split(':',$cache{'sectionsSelected'});
+ for(my $studentIndex=((scalar @$students)-1); $studentIndex>=0;
+ $studentIndex--) {
+ my $value = $cache{$students->[$studentIndex].':section'};
+ my $found = 0;
+ foreach (@sectionsSelected) {
+ if($_ eq 'none') {
+ if($value eq '' || !defined($value) || $value eq ' ') {
+ $found = 1;
+ last;
+ }
+ } else {
+ if($value eq $_) {
+ $found = 1;
+ last;
+ }
+ }
+ }
+ if($found == 0) {
+ splice(@$students, $studentIndex, 1);
+ }
+ }
+
+ my $isNotCached = 0;
+ my $lastStatus = (defined($cache{'StatisticsLastStatus'})) ?
+ $cache{'StatisticsLastStatus'} : 'Nothing';
+ my $whichStudents = join(':::',sort(@$students));
+ if(!defined($cache{'StatisticsCached'}) ||
+ $lastStatus ne $cache{'Status'} ||
+ $whichStudents ne $cache{'StatisticsWhichStudents'}) {
+ $isNotCached = 1;
+ }
+
+ untie(%cache);
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) {
+ $r->print('Unable to tie database.2');
+ return ('ERROR', undef);
+ }
+ if($isNotCached && defined($cache{'StatisticsCached'})) {
+ my @statkeys = split(':::', $cache{'StatisticsKeys'});
+ delete $cache{'StatisticsKeys'};
+ delete $cache{'StatisticsCached'};
+ foreach(@statkeys) {
+ delete $cache{$_};
+ }
+ }
+
+ untie(%cache);
+ if($isNotCached) {
+ &Apache::loncoursedata::DownloadStudentCourseDataSeparate($students,
+ 'true',
+ $cacheDB,
+ 'true',
+ 'true',
+ $courseID,
+ $r, $c);
+ }
+ if($c->aborted()) { return ('ERROR', undef); }
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
+ $r->print('Unable to tie database.3');
+ return ('ERROR', undef);
+ }
+ my $problemData;
+ if($isNotCached) {
+ ($problemData) = &ExtractStudentData(\%cache, $students);
+ &CalculateStatistics($problemData, \%cache, $courseID);
+ }
+ untie(%cache);
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) {
+ $r->print('Unable to tie database.4');
+ return ('ERROR', undef);
+ }
+ if($isNotCached) {
+ foreach(keys(%$problemData)) {
+ $cache{$_} = $problemData->{$_};
+ }
+ $cache{'StatisticsKeys'} = join(':::', keys(%$problemData));
+ $cache{'StatisticsCached'} = 'true';
+ $cache{'StatisticsLastStatus'} = $cache{'Status'};
+ $cache{'StatisticsWhichStudents'} = $whichStudents;
+ }
+ untie(%cache);
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
+ $r->print('Unable to tie database.5');
+ return ('ERROR', undef);
}
+ my $orderedProblems = &SortProblems(\%cache,
+ $cache{'ProblemStatisticsSort'},
+ $cache{'SortProblems'},
+ $cache{'ProblemStatisticsAscend'});
+ untie(%cache);
+
+ return ('OK', $orderedProblems);
+}
+
+sub BuildProblemStatisticsPage {
+ my ($cacheDB, $students, $courseID, $c, $r)=@_;
+
+ my @Header = ("Homework Sets Order","#Stdnts","Tries","Mod",
+ "Mean","#YES","#yes","%Wrng","DoDiff",
+ "S.D.","Skew.","D.F.1st","D.F.2nd");
+ my $color=&setbgcolor(0);
+ my %cache;
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
+ $r->print('Unable to tie database.6');
+ return;
+ }
my $Ptr = '';
- $Ptr .= '';
$Ptr .= 'DoDiff | ';
$Ptr .= 'Degree of Difficulty of the problem. ';
@@ -809,8 +551,8 @@ sub ProblemStatisticsLegend {
$Ptr .= 'Dis.F. | ';
$Ptr .= 'Discrimination Factor: A Standard for evaluating the ';
$Ptr .= 'problem according to a Criterion ';
- $Ptr .= '[Applied Criterion in %27 Upper Students - ';
- $Ptr .= 'Applied the same Criterion in %27 Lower Students] ';
+ $Ptr .= '[Criterion to group students into %27 Upper Students - ';
+ $Ptr .= 'and %27 Lower Students] ';
$Ptr .= '1st Criterion for Sorting the Students: ';
$Ptr .= 'Sum of Partial Credit Awarded / Total Number of Tries ';
$Ptr .= '2nd Criterion for Sorting the Students: ';
@@ -823,148 +565,304 @@ sub ProblemStatisticsLegend {
return $Ptr;
}
-#------- Processing upperlist and lowerlist according to each problem
-sub ProcessDiscriminant {
- my ($List,$r) = @_;
- my @sortedList = sort (@$List);
- my $Count = scalar @sortedList;
- my $Problem;
- my @Dis;
- my $Slvd=0;
- my $tmp;
- my $Sum1=0;
- my $Sum2=0;
- my $nIndex=0;
- my $nStudent=0;
- my %Proc=undef;
- while ($nIndex<$Count) {
-# $r->print(" $nIndex) $sortedList[$nIndex]");
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- my $Temp = $Problem;
- do {
- $nIndex++;
- $nStudent++;
- $Sum1 += $Dis[0];
- $Sum2 += $Dis[1];
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- } while ( $Problem eq $Temp && $nIndex < $Count );
- $Proc{$Temp}=($Sum1/$nStudent).':'.($Sum2/$nStudent);
-# $r->print(" $nIndex) $Temp --> ($nStudent) $Proc{$Temp}");
- $Sum1=0;
- $Sum2=0;
- $nStudent=0;
- }
-
- return %Proc;
-}
-
-#------- Creating Discimination factor
-sub Discriminant {
- my ($discriminant,$r)=@_;
-#$Apache::lonxml::debug=1;
-#&Apache::lonhomework::showhash(%$discriminant);
-#$Apache::lonxml::debug=0;
- my @discriminantKeys=keys(%$discriminant);
- my $Count = scalar @discriminantKeys;
-
- my $UpCnt = int(0.27*$Count);
- my $low=0;
- my $up=$Count-$UpCnt;
- my @UpList=();
- my @LowList=();
-
- $Count=0;
- foreach my $key (sort(@discriminantKeys)) {
- $Count++;
- if($low < $UpCnt || $Count > $up) {
- $low++;
- my $str=$discriminant->{$key};
- foreach(split(/\&/,$str)){
- if($_) {
- if($low<$UpCnt) { push(@LowList,$_); }
- else { push(@UpList,$_); }
+sub ExtractStudentData {
+ my ($cache, $students)=@_;
+
+ my @problemList=();
+ my %problemData;
+ foreach my $sequence (split(':', $cache->{'orderedSequences'})) {
+ foreach my $problemID (split(':', $cache->{$sequence.':problems'})) {
+ foreach my $part (split(/\:/,$cache->{$sequence.':'.
+ $problemID.
+ ':parts'})) {
+ my $id = $sequence.':'.$problemID.':'.$part;
+ push(@problemList, $id);
+ my $totalTries = 0;
+ my $totalAwarded = 0;
+ my $correct = 0;
+ my $correctByOverride = 0;
+ my $studentCount = 0;
+ my $maxTries = 0;
+ my $totalFirst = 0;
+ my @studentTries=();
+ foreach(@$students) {
+ my $code = $cache->{"$_:$problemID:$part:code"};
+
+ if(defined($cache->{$_.':error'}) || $code eq ' ' ||
+ $cache->{"$_:$problemID:NoVersion"} eq 'true') {
+ next;
+ }
+
+ $studentCount++;
+ my $tries = $cache->{"$_:$problemID:$part:tries"};
+ if($maxTries < $tries) {
+ $maxTries = $tries;
+ }
+ $totalTries += $tries;
+ push(@studentTries, $tries);
+
+ my $awarded = $cache->{"$_:$problemID:$part:awarded"};
+ $totalAwarded += $awarded;
+
+ if($code eq '*') {
+ $correct++;
+ if($tries == 1) {
+ $totalFirst++;
+ }
+ } elsif($code eq '+') {
+ $correctByOverride++;
+ }
}
+
+ my $studentTriesJoined = join(':::', @studentTries);
+ $problemData{$id.':sequenceTitle'} =
+ $cache->{$sequence.':title'};
+ $problemData{$id.':studentCount'} = $studentCount;
+ $problemData{$id.':totalTries'} = $totalTries;
+ $problemData{$id.':studentTries'} = $studentTriesJoined;
+ $problemData{$id.':totalAwarded'} = $totalAwarded;
+ $problemData{$id.':correct'} = $correct;
+ $problemData{$id.':correctByOverride'} = $correctByOverride;
+ $problemData{$id.':wrong'} = $studentCount -
+ ($correct + $correctByOverride);
+ $problemData{$id.':maxTries'} = $maxTries;
+ $problemData{$id.':totalFirst'} = $totalFirst;
}
}
}
- my %DisUp = &ProcessDiscriminant(\@UpList,$r);
- my %DisLow = &ProcessDiscriminant(\@LowList,$r);
- return (\%DisUp, \%DisLow);
-}
+ my @upperStudents1=();
+ my @lowerStudents1=();
+ my @upperStudents2=();
+ my @lowerStudents2=();
+ my $upperCount = int(0.27*scalar(@$students));
+ # Discriminant Factor criterion 1
+ my $sortedStudents = &SortDivideByTries($students,$cache,':totalAwarded');
+
+ for(my $i=0; $i<$upperCount; $i++) {
+ push(@lowerStudents1, $sortedStudents->[$i]);
+ push(@upperStudents1, $sortedStudents->[(scalar(@$students)-$i-1)]);
+ }
+
+ $problemData{'studentsUpperListCriterion1'}=join(':::', @upperStudents1);
+ $problemData{'studentsLowerListCriterion1'}=join(':::', @lowerStudents1);
+
+ # Discriminant Factor criterion 2
+ $sortedStudents = &SortDivideByTries($students, $cache, ':totalSolved');
+
+ for(my $i=0; $i<$upperCount; $i++) {
+ push(@lowerStudents2, $sortedStudents->[$i]);
+ push(@upperStudents2, $sortedStudents->[(scalar(@$students)-$i-1)]);
+ }
+ $problemData{'studentsUpperListCriterion2'}=join(':::', @upperStudents2);
+ $problemData{'studentsLowerListCriterion2'}=join(':::', @lowerStudents2);
+
+ $problemData{'problemList'} = join(':::', @problemList);
+
+ return \%problemData;
+}
+
+sub SortDivideByTries {
+ my ($toSort, $data, $sortOn)=@_;
+ my @orderedData = sort { ($data->{$a.':totalTries'}) ?
+ ($data->{$a.$sortOn}/$data->{$a.':totalTries'}):0
+ <=>
+ ($data->{$b.':totalTries'}) ?
+ ($data->{$b.$sortOn}/$data->{$b.':totalTries'}):0
+ } @$toSort;
+
+ return \@orderedData;
+}
+
+sub SortProblems {
+ my ($problemData,$sortBy,$sortProblems,$ascend)=@_;
+
+ my @problems = split(':::', $problemData->{'problemList'});
+ if($sortBy eq "Homework Sets Order") {
+ return \@problems;
+ }
+
+ my $data;
+
+ if ($sortBy eq "#Stdnts") { $data = ':studentCount'; }
+ elsif($sortBy eq "Tries") { $data = ':totalTries'; }
+ elsif($sortBy eq "Mod") { $data = ':maxTries'; }
+ elsif($sortBy eq "Mean") { $data = ':mean'; }
+ elsif($sortBy eq "#YES") { $data = ':correct'; }
+ elsif($sortBy eq "#yes") { $data = ':correctByOverride'; }
+ elsif($sortBy eq "%Wrng") { $data = ':percentWrong'; }
+ elsif($sortBy eq "DoDiff") { $data = ':degreeOfDifficulty'; }
+ elsif($sortBy eq "S.D.") { $data = ':standardDeviation'; }
+ elsif($sortBy eq "Skew.") { $data = ':skewness'; }
+ elsif($sortBy eq "D.F.1st") { $data = ':discriminationFactor1'; }
+ elsif($sortBy eq "D.F.2nd") { $data = ':discriminationFactor2'; }
+ else { return \@problems; }
+
+ my %temp;
+ my @sequenceList=();
+ foreach(@problems) {
+ my ($sequence) = split(':', $_);
+
+ my @array=();
+ my $tempArray;
+ if(defined($temp{$sequence})) {
+ $tempArray = $temp{$sequence};
+ } else {
+ push(@sequenceList, $sequence);
+ $tempArray = \@array;
+ $temp{$sequence} = $tempArray;
+ }
-#---- END Problem Statistics Web Page ----------------------------------------
+ push(@$tempArray, $_);
+ }
-#---- Problem Statistics Graph Web Page --------------------------------------
+ my @orderedProblems;
+ if($sortProblems eq "Sort Within Sequence") {
+ foreach(keys(%temp)) {
+ my $tempArray = $temp{$_};
+ my @tempOrder =
+ sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
+ @$tempArray;
+ $temp{$_} = \@tempOrder;
+ }
+ foreach(@sequenceList) {
+ my $tempArray = $temp{$_};
+ @orderedProblems = (@orderedProblems, @$tempArray);
+ }
+ } else {
+ @orderedProblems =
+ sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
+ @problems;
+ }
-# ------------------------------------------- Prepare data for Graphical chart
+ if($ascend eq 'Descending') {
+ @orderedProblems = reverse(@orderedProblems);
+ }
-sub BuildDiffGraph {
- my ($r)=@_;
+ return \@orderedProblems;
+}
- my $graphData = &GetGraphData('DiffGraph', $r);
- $r->print('');
+sub CalculateStatistics {
+ my ($data, $cache, $courseID)=@_;
- return;
-}
+ my @problems = split(':::', $data->{'problemList'});
+ foreach(@problems) {
+ # Mean
+ my $mean = ($data->{$_.':studentCount'}) ?
+ ($data->{$_.':totalTries'} / $data->{$_.':studentCount'}) : 0;
+ $data->{$_.':mean'} = sprintf("%.2f", $mean);
-sub BuildWrongGraph {
- my ($r)=@_;
+ # %Wrong
+ my $pw = ($data->{$_.':studentCount'}) ?
+ (($data->{$_.':wrong'} / $data->{$_.':studentCount'}) * 100.0) :
+ 100.0;
+ $data->{$_.':percentWrong'} = sprintf("%.1f", $pw);
- my $graphData = &GetGraphData('WrongGraph', $r);
- $r->print('');
+ # Degree of Difficulty
+ my $dod = ($data->{$_.':totalTries'}) ?
+ (1 - (($data->{$_.':correct'} + $data->{$_.':correctByOverride'}) /
+ $data->{$_.':totalTries'})) : 0;
- return;
-}
+ $data->{$_.':degreeOfDifficulty'} = sprintf("%.2f", $dod);
+
+ # Factor in mean
+ my @studentTries = split(':::', $data->{$_.':studentTries'});
+ foreach(my $index=0; $index < scalar(@studentTries); $index++) {
+ $studentTries[$index] -= $mean;
+ }
+ my $sumSquared = 0;
+ my $sumCubed = 0;
+ foreach(@studentTries) {
+ my $squared = ($_ * $_);
+ my $cubed = ($squared * $_);
+ $sumSquared += $squared;
+ $sumCubed += $cubed;
+ }
+
+ # Standard deviation
+ my $standardDeviation;
+ if($data->{$_.':studentCount'} - 1 > 0) {
+ $standardDeviation = (sqrt($sumSquared)) /
+ ($data->{$_.':studentCount'} - 1);
+ } else {
+ $standardDeviation = 0.0;
+ }
+ $data->{$_.':standardDeviation'} = sprintf("%.1f", $standardDeviation);
+
+ # Skewness
+ my $skew;
+ if($standardDeviation > 0.0999 && $data->{$_.':studentCount'} > 0) {
+ $skew = (((sqrt($sumSquared)) / $data->{$_.':studentCount'}) /
+ ($standardDeviation *
+ $standardDeviation *
+ $standardDeviation));
+ } else {
+ $skew = 0.0;
+ }
+ $data->{$_.':skewness'} = sprintf("%.1f", $skew);
+
+ # Discrimination Factor 1
+ my ($sequence, $problem, $part) = split(':', $_);
+
+ my @upper1 = split(':::', $data->{'studentsUpperListCriterion1'});
+ my @lower1 = split(':::', $data->{'studentsLowerListCriterion1'});
+
+ my $upper1Sum=0;
+ foreach my $name (@upper1) {
+ $upper1Sum += $cache->{"$name:$problem:$part:awarded"};
+ }
+ $upper1Sum = (scalar(@upper1)) ? ($upper1Sum/(scalar(@upper1))) : 0;
+
+ my $lower1Sum=0;
+ foreach my $name (@lower1) {
+ $lower1Sum += $cache->{"$name:$problem:$part:awarded"};
+ }
+ $lower1Sum = (scalar(@lower1)) ? ($lower1Sum/(scalar(@lower1))) : 0;
-sub GetGraphData {
- my ($ylab,$r,$cache)=@_;
- my $Col;
- my $data='';
- my $count = 0;
- my $Max = 0;
- my $cid=$ENV{'request.course.id'};
-
- if ( $ylab eq 'DoDiff Graph' ) {
- $ylab = 'Degree-of-Difficulty';
- $Col = 0;
- }
- else {
- $ylab = 'Wrong-Percentage';
- $Col = 1;
- }
-
- my $p_count = $cache->{'ProblemCount'};
-
- for ( my $k=0; $k<$p_count;$k++) {
- my $key=$cache->{'CacheTable:'.$k};
- my @Temp=split(/\&/,$key);
- # $list[$k]=$key;
- }
-
- # foreach (sort NumericSort keys %GraphDat) {
- # my @Temp=split(/\:/,$GraphDat{$_});
- # my $inf = $Temp[$Col];
- # if ( $Max < $inf ) {$Max = $inf;}
- # $data .= $inf.',';
- # $count++;
- # }
- if ( $Max > 1 ) {
- $Max += (10 - $Max % 10);
- $Max = int($Max);
- } else { $Max = 1; }
-
- #untie(%GraphDat);
-
- my $Course = $ENV{'course.'.$cid.'.description'};
- $Course =~ s/\ /"_"/eg;
- my $GData=$Course.'&'.'Problems'.'&'.$ylab.'&'.
- $Max.'&'.$count.'&'.$data;
+ my $df1 = $upper1Sum - $lower1Sum;
+ $data->{$_.':discriminationFactor1'} = sprintf("%.2f", $df1);
+
+ # Discrimination Factor 2
+ my @upper2 = split(':::', $data->{'studentsUpperListCriterion2'});
+ my @lower2 = split(':::', $data->{'studentsLowerListCriterion2'});
+
+ my $upper2Sum=0;
+ foreach my $name (@upper2) {
+ $upper2Sum += $cache->{"$name:$problem:$part:awarded"};
+ }
+ $upper2Sum = (scalar(@upper2)) ? ($upper2Sum/(scalar(@upper2))) : 0;
+
+ my $lower2Sum=0;
+ foreach my $name (@lower2) {
+ $lower2Sum += $cache->{"$name:$problem:$part:awarded"};
+ }
+ $lower2Sum = (scalar(@lower2)) ? ($lower2Sum/(scalar(@lower2))) : 0;
+
+ my $df2 = $upper2Sum - $lower2Sum;
+ $data->{$_.':discriminationFactor2'} = sprintf("%.2f", $df2);
+
+ my %storestats;
+ my $Average = ($data->{$_.':studentCount'}) ?
+ $data->{$_.':totalTries'}/$data->{$_.':studentCount'} : 0;
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___timestamp'}=time;
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___stdno'}=$data->{$_.':studentCount'};
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___avetries'}=$Average;
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___difficulty'}=$data->{$_.':degreeOfDifficulty'};
+ $cache->{$sequence.':source'} =~ /^(\w+)\/(\w+)/;
+ if($data->{$_.':studentCount'}) {
+ &Apache::lonnet::put('nohist_resevaldata',\%storestats,$1,$2);
+ }
+ }
+
+ return;
}
+#---- END Problem Statistics Web Page ----------------------------------------
1;
__END__
|