--- loncom/interface/statistics/lonproblemstatistics.pm 2002/08/13 00:37:18 1.19
+++ loncom/interface/statistics/lonproblemstatistics.pm 2002/08/15 14:15:20 1.30
@@ -1,7 +1,7 @@
# The LearningOnline Network with CAPA
# (Publication Handler
#
-# $Id: lonproblemstatistics.pm,v 1.19 2002/08/13 00:37:18 stredwic Exp $
+# $Id: lonproblemstatistics.pm,v 1.30 2002/08/15 14:15:20 stredwic Exp $
#
# Copyright Michigan State University Board of Trustees
#
@@ -45,18 +45,132 @@ use GDBM_File;
my $jr;
-sub BuildProblemStatisticsPage {
+# Prepare (and cache) the problem statistics for the selected students.
+#
+# Inputs:
+# $cacheDB - name of the GDBM cache file to tie
+# $students - array reference of student identifiers; students outside
+# the selected sections are removed from this array in place
+# $courseID - course identifier, passed on to the download and
+# statistics helpers
+# $c - connection object; only $c->aborted() is used here
+# $r - request object, used to print error messages
+#
+# Returns ('OK', $orderedProblems) on success, where $orderedProblems is
+# whatever &SortProblems returns, or ('ERROR', undef) when the cache cannot
+# be tied or the connection was aborted.
+#
+# The cache is untied and re-tied several times so that each phase holds it
+# only in the access mode it needs (GDBM_READER or GDBM_WRCREAT).
+sub InitializeProblemStatistics {
my ($cacheDB, $students, $courseID, $c, $r)=@_;
my %cache;
$jr = $r;
unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
- return '
Unable to tie database.';
+ $r->print('Unable to tie database1.');
+ return ('ERROR', undef);
+ }
+
+ # Remove students who don't have the proper section.
+ # Walk the list backwards so that splice() never shifts an element
+ # that has not been examined yet.
+ my @sectionsSelected = split(':',$cache{'sectionsSelected'});
+ for(my $studentIndex=((scalar @$students)-1); $studentIndex>=0;
+ $studentIndex--) {
+ my $value = $cache{$students->[$studentIndex].':section'};
+ # A missing section entry is treated as an empty section; normalise
+ # it once so no string comparison below ever sees undef.
+ $value = '' unless defined($value);
+ my $found = 0;
+ foreach (@sectionsSelected) {
+ if($_ eq 'none') {
+ # 'none' selects the students that have no section.
+ if($value eq '' || $value eq ' ') {
+ $found = 1;
+ last;
+ }
+ } else {
+ if($value eq $_) {
+ $found = 1;
+ last;
+ }
+ }
+ }
+ if($found == 0) {
+ splice(@$students, $studentIndex, 1);
+ }
+ }
+
+ # The cached statistics are reusable only if they exist, the 'Status'
+ # setting is unchanged and the same set of students is selected.
+ my $isNotCached = 0;
+ my $lastStatus = (defined($cache{'StatisticsLastStatus'})) ?
+ $cache{'StatisticsLastStatus'} : 'Nothing';
+ my $whichStudents = join(':::',sort(@$students));
+ if(!defined($cache{'StatisticsCached'}) ||
+ $lastStatus ne $cache{'Status'} ||
+ $whichStudents ne $cache{'StatisticsWhichStudents'}) {
+ $isNotCached = 1;
+ }
+
+ untie(%cache);
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) {
+ $r->print('Unable to tie database.2');
+ return ('ERROR', undef);
+ }
+ # Stale statistics: drop every key recorded in 'StatisticsKeys'.
+ if($isNotCached && defined($cache{'StatisticsCached'})) {
+ my @statkeys = split(':::', $cache{'StatisticsKeys'});
+ delete $cache{'StatisticsKeys'};
+ delete $cache{'StatisticsCached'};
+ foreach(@statkeys) {
+ delete $cache{$_};
+ }
+ }
+
+ # The download helper is handed $cacheDB itself, so the cache is untied
+ # before it is called.
+ untie(%cache);
+ if($isNotCached) {
+ &Apache::loncoursedata::DownloadStudentCourseDataSeparate($students,
+ 'true',
+ $cacheDB,
+ 'true',
+ 'true',
+ $courseID,
+ $r, $c);
+ }
+ if($c->aborted()) { return ('ERROR', undef); }
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
+ $r->print('Unable to tie database.3');
+ return ('ERROR', undef);
}
+ # Recompute the statistics in memory while the cache is read-only.
+ my $problemData;
+ if($isNotCached) {
+ ($problemData) = &ExtractStudentData(\%cache, $students);
+ &CalculateStatistics($problemData, \%cache, $courseID);
+ }
+ untie(%cache);
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_WRCREAT(),0640)) {
+ $r->print('Unable to tie database.4');
+ return ('ERROR', undef);
+ }
+ # Store the fresh statistics together with the bookkeeping keys that the
+ # staleness test above reads on the next call.
+ if($isNotCached) {
+ foreach(keys(%$problemData)) {
+ $cache{$_} = $problemData->{$_};
+ }
+ $cache{'StatisticsKeys'} = join(':::', keys(%$problemData));
+ $cache{'StatisticsCached'} = 'true';
+ $cache{'StatisticsLastStatus'} = $cache{'Status'};
+ $cache{'StatisticsWhichStudents'} = $whichStudents;
+ }
+ untie(%cache);
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
+ $r->print('Unable to tie database.5');
+ return ('ERROR', undef);
+ }
+
+ # Order the problems according to the sort settings kept in the cache.
+ my $orderedProblems = &SortProblems(\%cache,
+ $cache{'ProblemStatisticsSort'},
+ $cache{'SortProblems'},
+ $cache{'ProblemStatisticsAscend'});
+ untie(%cache);
+
+ return ('OK', $orderedProblems);
+}
+
+sub BuildProblemStatisticsPage {
+ my ($cacheDB, $students, $courseID, $c, $r)=@_;
+ my @Header = ("Homework Sets Order","#Stdnts","Tries","Mod",
+ "Mean","#YES","#yes","%Wrng","DoDiff",
+ "S.D.","Skew.","D.F.1st","D.F.2nd");
+ my $color=&setbgcolor(0);
+ my %cache;
+
+ unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
+ $r->print('Unable to tie database.6');
+ return;
+ }
my $Ptr = '';
- $Ptr .= ' | ';
$Ptr .= '{'orderedSequences'})) {
- if($cache->{'ProblemStatisticsMaps'} ne 'All Maps' &&
- $cache->{'ProblemStatisticsMaps'} ne $cache->{$sequence.':title'}) {
- next;
- }
-
foreach my $problemID (split(':', $cache->{$sequence.':problems'})) {
foreach my $part (split(/\:/,$cache->{$sequence.':'.
$problemID.
@@ -492,11 +570,12 @@ sub ExtractStudentData {
}
}
+ my $studentTriesJoined = join(':::', @studentTries);
$problemData{$id.':sequenceTitle'} =
$cache->{$sequence.':title'};
$problemData{$id.':studentCount'} = $studentCount;
$problemData{$id.':totalTries'} = $totalTries;
- $problemData{$id.':studentTries'} = \@studentTries;
+ $problemData{$id.':studentTries'} = $studentTriesJoined;
$problemData{$id.':totalAwarded'} = $totalAwarded;
$problemData{$id.':correct'} = $correct;
$problemData{$id.':correctByOverride'} = $correctByOverride;
@@ -508,21 +587,55 @@ sub ExtractStudentData {
}
}
- $problemData{'problemList'} = \@problemList;
-# $Discussed=0;
-# if($Discuss->{"$name:$problem"}) {
-# $TotDiscuss++;
-# $Discussed=1;
-# }
+ my @upperStudents1=();
+ my @lowerStudents1=();
+ my @upperStudents2=();
+ my @lowerStudents2=();
+ my $upperCount = int(0.27*scalar(@$students));
+ # Discriminant Factor criterion 1
+ my $sortedStudents = &SortDivideByTries($students,$cache,':totalAwarded');
+
+ for(my $i=0; $i<$upperCount; $i++) {
+ push(@lowerStudents1, $sortedStudents->[$i]);
+ push(@upperStudents1, $sortedStudents->[(scalar(@$students)-$i-1)]);
+ }
+
+ $problemData{'studentsUpperListCriterion1'}=join(':::', @upperStudents1);
+ $problemData{'studentsLowerListCriterion1'}=join(':::', @lowerStudents1);
+
+ # Discriminant Factor criterion 2
+ $sortedStudents = &SortDivideByTries($students, $cache, ':totalSolved');
+
+ for(my $i=0; $i<$upperCount; $i++) {
+ push(@lowerStudents2, $sortedStudents->[$i]);
+ push(@upperStudents2, $sortedStudents->[(scalar(@$students)-$i-1)]);
+ }
+ $problemData{'studentsUpperListCriterion2'}=join(':::', @upperStudents2);
+ $problemData{'studentsLowerListCriterion2'}=join(':::', @lowerStudents2);
+
+ $problemData{'problemList'} = join(':::', @problemList);
return \%problemData;
}
+# Sort a list of students by a per-try ratio, lowest ratio first.
+#
+# Inputs:
+#   $toSort - reference to an array of student identifiers
+#   $data   - hash reference holding "<student><suffix>" entries
+#   $sortOn - key suffix (for example ':totalAwarded') whose value is
+#             divided by the student's ':totalTries' entry
+#
+# Returns a reference to a new array in ascending ratio order; @$toSort
+# itself is not modified.  A student whose ':totalTries' entry is missing
+# or zero gets a ratio of 0.
+sub SortDivideByTries {
+    my ($toSort, $data, $sortOn)=@_;
+
+    # Compute every ratio once, up front.  The ratios must not be written
+    # inline as "A ? x : 0 <=> B ? y : 0": <=> binds tighter than ?:, so
+    # that expression never compares the two ratios with each other.
+    my %ratio;
+    foreach my $student (@$toSort) {
+        my $tries = $data->{$student.':totalTries'};
+        $ratio{$student} = ($tries) ?
+            ($data->{$student.$sortOn}/$tries) : 0;
+    }
+
+    my @orderedData = sort { $ratio{$a} <=> $ratio{$b} } @$toSort;
+
+    return \@orderedData;
+}
+
sub SortProblems {
- my ($problemData,$sortBy,$ascend)=@_;
+ my ($problemData,$sortBy,$sortProblems,$ascend)=@_;
+ my @problems = split(':::', $problemData->{'problemList'});
if($sortBy eq "Homework Sets Order") {
- return;
+ return \@problems;
}
my $data;
@@ -537,51 +650,85 @@ sub SortProblems {
elsif($sortBy eq "DoDiff") { $data = ':degreeOfDifficulty'; }
elsif($sortBy eq "S.D.") { $data = ':standardDeviation'; }
elsif($sortBy eq "Skew.") { $data = ':skewness'; }
- elsif($sortBy eq "D.F.1st") { $data = ':discriminantFactor1'; }
- elsif($sortBy eq "D.F.2nd") { $data = ':discriminantFactor2'; }
- elsif($sortBy eq "Disc.") { $data = ''; }
- else { return; }
-
- my $problems = $problemData->{'problemList'};
- my @orderedProblems =
- sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
- @$problems;
+ elsif($sortBy eq "D.F.1st") { $data = ':discriminationFactor1'; }
+ elsif($sortBy eq "D.F.2nd") { $data = ':discriminationFactor2'; }
+ else { return \@problems; }
+
+ my %temp;
+ my @sequenceList=();
+ foreach(@problems) {
+ my ($sequence) = split(':', $_);
+
+ my @array=();
+ my $tempArray;
+ if(defined($temp{$sequence})) {
+ $tempArray = $temp{$sequence};
+ } else {
+ push(@sequenceList, $sequence);
+ $tempArray = \@array;
+ $temp{$sequence} = $tempArray;
+ }
+
+ push(@$tempArray, $_);
+ }
+
+ my @orderedProblems;
+ if($sortProblems eq "Sort Within Sequence") {
+ foreach(keys(%temp)) {
+ my $tempArray = $temp{$_};
+ my @tempOrder =
+ sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
+ @$tempArray;
+ $temp{$_} = \@tempOrder;
+ }
+ foreach(@sequenceList) {
+ my $tempArray = $temp{$_};
+ @orderedProblems = (@orderedProblems, @$tempArray);
+ }
+ } else {
+ @orderedProblems =
+ sort { $problemData->{$a.$data} <=> $problemData->{$b.$data} }
+ @problems;
+ }
+
if($ascend eq 'Descending') {
@orderedProblems = reverse(@orderedProblems);
}
- $problemData->{'problemList'} = \@orderedProblems;
-
- return;
+ return \@orderedProblems;
}
sub CalculateStatistics {
- my ($data)=@_;
+ my ($data, $cache, $courseID)=@_;
- my $problems = $data->{'problemList'};
- foreach(@$problems) {
+ my @problems = split(':::', $data->{'problemList'});
+ foreach(@problems) {
# Mean
- $data->{$_.':mean'} = ($data->{$_.':studentCount'}) ?
+ my $mean = ($data->{$_.':studentCount'}) ?
($data->{$_.':totalTries'} / $data->{$_.':studentCount'}) : 0;
+ $data->{$_.':mean'} = sprintf("%.2f", $mean);
# %Wrong
- $data->{$_.':percentWrong'} = ($data->{$_.':studentCount'}) ?
+ my $pw = ($data->{$_.':studentCount'}) ?
(($data->{$_.':wrong'} / $data->{$_.':studentCount'}) * 100.0) :
100.0;
+ $data->{$_.':percentWrong'} = sprintf("%.1f", $pw);
# Degree of Difficulty
- $data->{$_.':degreeOfDifficulty'} = ($data->{$_.':totalTries'}) ?
+ my $dod = ($data->{$_.':totalTries'}) ?
(1 - (($data->{$_.':correct'} + $data->{$_.':correctByOverride'}) /
$data->{$_.':totalTries'})) : 0;
+ $data->{$_.':degreeOfDifficulty'} = sprintf("%.2f", $dod);
+
# Factor in mean
- my $studentTries = $data->{$_.':studentTries'};
- foreach(my $index=0; $index < scalar(@$studentTries); $index++) {
- $studentTries->[$index] -= $data->{$_.':mean'};
+ my @studentTries = split(':::', $data->{$_.':studentTries'});
+ foreach(my $index=0; $index < scalar(@studentTries); $index++) {
+ $studentTries[$index] -= $mean;
}
my $sumSquared = 0;
my $sumCubed = 0;
- foreach(@$studentTries) {
+ foreach(@studentTries) {
my $squared = ($_ * $_);
my $cubed = ($squared * $_);
$sumSquared += $squared;
@@ -589,147 +736,89 @@ sub CalculateStatistics {
}
# Standard deviation
- $data->{$_.':standardDeviation'} = ($data->{$_.':studentCount'} - 1) ?
- ((sqrt($sumSquared)) / ($data->{$_.':studentCount'} - 1)) : 0;
+ my $standardDeviation;
+ if($data->{$_.':studentCount'} - 1 > 0) {
+ $standardDeviation = (sqrt($sumSquared)) /
+ ($data->{$_.':studentCount'} - 1);
+ } else {
+ $standardDeviation = 0.0;
+ }
+ $data->{$_.':standardDeviation'} = sprintf("%.1f", $standardDeviation);
# Skewness
- my $standardDeviation = $data->{$_.':standardDeviation'};
- $data->{$_.':skewness'} = ($data->{$_.':standardDeviation'}) ?
- (((sqrt($sumSquared)) / $data->{$_.':studentCount'}) /
- ($standardDeviation * $standardDeviation * $standardDeviation)) :
- 0;
+ my $skew;
+ if($standardDeviation > 0.0999 && $data->{$_.':studentCount'} > 0) {
+ $skew = (((sqrt($sumSquared)) / $data->{$_.':studentCount'}) /
+ ($standardDeviation *
+ $standardDeviation *
+ $standardDeviation));
+ } else {
+ $skew = 0.0;
+ }
- # Discrimination Factor 1
- $data->{$_.':discriminationFactor1'} = 0;
+ $data->{$_.':skewness'} = sprintf("%.1f", $skew);
- # Discrimination Factor 2
- $data->{$_.':discriminationFactor2'} = 0;
- }
+ # Discrimination Factor 1
+ my ($sequence, $problem, $part) = split(':', $_);
- return;
-}
+ my @upper1 = split(':::', $data->{'studentsUpperListCriterion1'});
+ my @lower1 = split(':::', $data->{'studentsLowerListCriterion1'});
-sub ProcessDiscriminant {
- my ($List) = @_;
- my @sortedList = sort (@$List);
- my $Count = scalar @sortedList;
- my $Problem;
- my @Dis;
- my $Slvd=0;
- my $tmp;
- my $Sum1=0;
- my $Sum2=0;
- my $nIndex=0;
- my $nStudent=0;
- my %Proc=undef;
- while ($nIndex<$Count) {
-# $jr->print(" $nIndex) $sortedList[$nIndex]");
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- my $Temp = $Problem;
- do {
- $nIndex++;
- $nStudent++;
- $Sum1 += $Dis[0];
- $Sum2 += $Dis[1];
- ($Problem,$tmp)=split(/\=/,$sortedList[$nIndex]);
- @Dis=split(/\+/,$tmp);
- } while ( $Problem eq $Temp && $nIndex < $Count );
- $Proc{$Temp}=($Sum1/$nStudent).':'.($Sum2/$nStudent);
-# $jr->print(" $nIndex) $Temp --> ($nStudent) $Proc{$Temp}");
- $Sum1=0;
- $Sum2=0;
- $nStudent=0;
- }
-
- return %Proc;
-}
-
-#------- Creating Discimination factor
-sub Discriminant {
- my ($discriminant)=@_;
- my @discriminantKeys=keys(%$discriminant);
- my $Count = scalar @discriminantKeys;
-
- my $UpCnt = int(0.27*$Count);
- my $low=0;
- my $up=$Count-$UpCnt;
- my @UpList=();
- my @LowList=();
-
- $Count=0;
- foreach my $key (sort(@discriminantKeys)) {
- $Count++;
- if($low < $UpCnt || $Count > $up) {
- $low++;
- my $str=$discriminant->{$key};
- foreach(split(/\&/,$str)){
- if($_) {
- if($low<$UpCnt) { push(@LowList,$_); }
- else { push(@UpList,$_); }
- }
- }
+ my $upper1Sum=0;
+ foreach my $name (@upper1) {
+ $upper1Sum += $cache->{"$name:$problem:$part:awarded"};
}
- }
- my %DisUp = &ProcessDiscriminant(\@UpList);
- my %DisLow = &ProcessDiscriminant(\@LowList);
-
- return (\%DisUp, \%DisLow);
-}
+ $upper1Sum = (scalar(@upper1)) ? ($upper1Sum/(scalar(@upper1))) : 0;
-#---- END Problem Statistics Web Page ----------------------------------------
+ my $lower1Sum=0;
+ foreach my $name (@lower1) {
+ $lower1Sum += $cache->{"$name:$problem:$part:awarded"};
+ }
+ $lower1Sum = (scalar(@lower1)) ? ($lower1Sum/(scalar(@lower1))) : 0;
-#---- Problem Statistics Graph Web Page --------------------------------------
+ my $df1 = $upper1Sum - $lower1Sum;
+ $data->{$_.':discriminationFactor1'} = sprintf("%.2f", $df1);
-# ------------------------------------------- Prepare data for Graphical chart
+ # Discrimination Factor 2
+ my @upper2 = split(':::', $data->{'studentsUpperListCriterion2'});
+ my @lower2 = split(':::', $data->{'studentsLowerListCriterion2'});
-sub BuildGraphicChart {
- my ($ylab,$r,$cacheDB)=@_;
- my %cache;
- my $Col;
- my $data='';
- my $count = 0;
- my $Max = 0;
+ my $upper2Sum=0;
+ foreach my $name (@upper2) {
+ $upper2Sum += $cache->{"$name:$problem:$part:awarded"};
+ }
+ $upper2Sum = (scalar(@upper2)) ? ($upper2Sum/(scalar(@upper2))) : 0;
- unless(tie(%cache,'GDBM_File',$cacheDB,&GDBM_READER(),0640)) {
- return 'Unable to tie database.';
- }
-
- my $p_count = $cache{'ProblemCount'};
+ my $lower2Sum=0;
+ foreach my $name (@lower2) {
+ $lower2Sum += $cache->{"$name:$problem:$part:awarded"};
+ }
+ $lower2Sum = (scalar(@lower2)) ? ($lower2Sum/(scalar(@lower2))) : 0;
- for ( my $k=0; $k<$p_count;$k++) {
- my @Temp=split(/\:/,$cache{'GraphGif:'.$k});
- my $inf = $Temp[$Col];
- if ( $Max < $inf ) {$Max = $inf;}
- $data .= $inf.',';
- $count++;
- }
- untie(%cache);
-# $r->print(" count=$p_count >>data= $data");
+ my $df2 = $upper2Sum - $lower2Sum;
+ $data->{$_.':discriminationFactor2'} = sprintf("%.2f", $df2);
- if ( $Max > 1 ) {
- $Max += (10 - $Max % 10);
- $Max = int($Max);
- } else { $Max = 1; }
-
- my $cid=$ENV{'request.course.id'};
-
- if ( $ylab eq 'DoDiff Graph' ) {
- $ylab = 'Degree-of-Difficulty';
- $Col = 0;
- } else {
- $ylab = 'Wrong-Percentage';
- $Col = 1;
+ my %storestats;
+ my $Average = ($data->{$_.':studentCount'}) ?
+ $data->{$_.':totalTries'}/$data->{$_.':studentCount'} : 0;
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___timestamp'}=time;
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___stdno'}=$data->{$_.':studentCount'};
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___avetries'}=$Average;
+ $storestats{$courseID.'___'.$cache->{$sequence.':source'}.
+ '___difficulty'}=$data->{$_.':degreeOfDifficulty'};
+ $cache->{$sequence.':source'} =~ /^(\w+)\/(\w+)/;
+ if($data->{$_.':studentCount'}) {
+ &Apache::lonnet::put('resevaldata',\%storestats,$1,$2);
+ }
}
- my $Course = $ENV{'course.'.$cid.'.description'};
- $Course =~ s/\ /"_"/eg;
- my $GData=$Course.'&'.'Problems#'.'&'.$ylab.'&'.
- $Max.'&'.$count.'&'.$data;
-
- $r->print('');
return;
}
+#---- END Problem Statistics Web Page ----------------------------------------
+
1;
__END__
|