Completed
Push — master ( 505b4c...62d9c0 )
by Seth
05:17 queued 03:12
created

data-collection.php ➔ collectStatistics()   F

Complexity

Conditions 23
Paths 4325

Size

Total Lines 188
Code Lines 109

Duplication

Lines 0
Ratio 0 %

Importance

Changes 0
Metric Value
cc 23
eloc 109
nc 4325
nop 4
dl 0
loc 188
rs 2
c 0
b 0
f 0

How to fix   Long Method    Complexity   

Long Method

Small methods make your code easier to understand, in particular if combined with a good name. Besides, if your method is small, finding a good name is usually much easier.

For example, if you find yourself adding comments to a method's body, this is usually a good sign to extract the commented part to a new method, and use the comment as a starting point when coming up with a good name for this new method.

Commonly applied refactorings include:

1
#!/usr/bin/env php
0 ignored issues
show
Coding Style Compatibility introduced by
For compatibility and reusability of your code, PSR1 recommends that a file should introduce either new symbols (like classes, functions, etc.) or have side-effects (like outputting something, or including other files), but not both at the same time. The first symbol is defined on line 4 and the first side effect is on line 1.

The PSR-1: Basic Coding Standard recommends that a file should either introduce new symbols, that is classes, functions, constants or similar, or have side effects. Side effects are anything that executes logic, like for example printing output, changing ini settings or writing to a file.

The idea behind this recommendation is that merely auto-loading a class should not change the state of an application. It also promotes a cleaner style of programming and makes your code less prone to errors, because the logic is not spread out all over the place.

To learn more about the PSR-1, please see the PHP-FIG site on the PSR-1.

Loading history...
2
<?php
3
4
define('DEBUGGING', DEBUGGING_LOG);
5
define('IGNORE_LTI', true);
6
7
require_once __DIR__ . '/../common.inc.php';
8
require_once __DIR__ . '/../constants.inc.php';
9
10
// http://stackoverflow.com/a/21896310
11
function hoursRange($lower = 0, $upper = 86400, $step = 3600, $keyFormat = '', $value = '', $valueIsFormat = false)
12
{
13
    $times = array();
14
15
    if (empty( $value ) && $valueIsFormat) {
16
        $value = 'g:i a';
17
    }
18
19
    if (empty($keyFormat)) {
20
        $keyFormat = 'g:i a';
21
    }
22
23
    foreach (range( $lower, $upper, $step ) as $increment) {
24
        $increment = gmdate( $keyFormat, $increment );
25
26
        list( $hour, $minutes ) = explode( ':', $increment );
27
28
        $date = new DateTime( $hour . ':' . $minutes );
29
30
        $times[(string) $increment] = ($valueIsFormat ? $date->format( $value ) : $value);
31
    }
32
33
    return $times;
34
}
35
36
function collectStatistics($term, $api, $sql, $metadata)
37
{
38
    // TODO make this configurable
39
    $courses = $api->get(
40
        '/accounts/132/courses',
41
        array(
42
            'with_enrollments' => 'true',
43
            'enrollment_term_id' => $term
44
        )
45
    );
46
47
    // so that everything has a consistent benchmark
48
    $timestamp = time();
49
50
    foreach ($courses as $course) {
51
        $statistic = array(
52
            'timestamp' => date(DATE_ISO8601, $timestamp),
53
            'course[id]' => $course['id'],
54
            'course[name]' => $course['name'],
55
            'course[account_id]' => $course['account_id'],
56
            'gradebook_url' => 'https://' . parse_url($metadata['CANVAS_API_URL'], PHP_URL_HOST) . "/courses/{$course['id']}/gradebook2",
57
            'assignments_due_count' => 0,
58
            'dateless_assignment_count' => 0,
59
            'created_after_due_count' => 0,
60
            'gradeable_assignment_count' => 0,
61
            'graded_assignment_count' => 0,
62
            'zero_point_assignment_count' => 0,
63
            'analytics_page' => $metadata['APP_URL'] . "/course-summary.php?course_id={$course['id']}"
64
        );
65
66
        $teacherIds = array();
67
        $teacherNames = array();
68
        $teachers = $api->get(
69
            "/courses/{$course['id']}/enrollments",
70
            array(
71
                'type[]' => 'TeacherEnrollment'
72
            )
73
        );
74
        foreach ($teachers as $teacher) {
75
            $teacherIds[] = $teacher['user']['id'];
76
            $teacherNames[] = $teacher['user']['sortable_name'];
77
        }
78
        $statistic['teacher[id]s'] = serialize($teacherIds);
79
        $statistic['teacher[sortable_name]s'] = serialize($teacherNames);
80
81
        $account = $api->get("/accounts/{$course['account_id']}");
82
        $statistic['account[name]'] = $account['name'];
83
84
        // ignore classes with no teachers (how do they even exist? weird.)
85
        if (count($teacherIds) != 0) {
86
            $statistic['student_count'] = 0;
87
            $students = $api->get(
88
                "/courses/{$course['id']}/enrollments",
89
                array(
90
                    'type[]' => 'StudentEnrollment'
91
                )
92
            );
93
            $statistic['student_count'] = $students->count();
94
95
            // ignore classes with no students
96
            if ($statistic['student_count'] != 0) {
97
                $assignments = $api->get(
98
                    "/courses/{$course['id']}/assignments"
99
                );
100
101
                $gradedSubmissionsCount = 0;
102
                $turnAroundTimeTally = 0;
103
                $leadTimeTally = 0;
104
                $createdModifiedHistogram = array(
105
                    HISTOGRAM_CREATED => hoursRange(0, 86400, 3600, '', 0),
106
                    HISTOGRAM_MODIFIED => hoursRange(0, 86400, 3600, '', 0)
107
                );
108
109
                foreach ($assignments as $assignment) {
110
                    // ignore unpublished assignments
111
                    if ($assignment['published'] == true) {
112
                        // check for due dates
113
                        $dueDate = new DateTime($assignment['due_at']);
114
                        $dueDate->setTimeZone(new DateTimeZone(SCHOOL_TIME_ZONE));
115
                        if (($timestamp - $dueDate->getTimestamp()) > 0) {
116
                            $statistic['assignments_due_count']++;
117
118
                            // update created_modified_histogram
119
                            $createdAt = new DateTime($assignment['created_at']);
120
                            $createdAt->setTimeZone(new DateTimeZone(SCHOOL_TIME_ZONE));
121
                            $updatedAt = new DateTime($assignment['updated_at']);
122
                            $updatedAt->setTimeZone(new DateTimeZone(SCHOOL_TIME_ZONE));
123
                            $createdModifiedHistogram[HISTOGRAM_CREATED][$createdAt->format('g:00 a')]++;
124
                            if ($createdAt != $updatedAt) {
125
                                $createdModifiedHistogram[HISTOGRAM_MODIFIED][$updatedAt->format('g:00 a')]++;
126
                            }
127
128
                            // tally lead time on the assignment
129
                            $leadTimeTally += strtotime($assignment['due_at']) - strtotime($assignment['created_at']);
130
131
                            // was the assignment created after it was due?
132
                            if (strtotime($assignment['due_at']) < strtotime($assignment['created_at'])) {
133
                                $statistic['created_after_due_count']++;
134
                            }
135
136
                            // ignore ungraded assignments
137
                            if ($assignment['grading_type'] != 'not_graded') {
138
                                $statistic['gradeable_assignment_count']++;
139
                                $hasBeenGraded = false;
140
141
                                // tally zero point assignments
142
                                if ($assignment['points_possible'] == '0') {
143
                                    $statistic['zero_point_assignment_count']++;
144
                                }
145
146
                                // build submission statistic
147
                                $submissions = $api->get(
148
                                    "/courses/{$course['id']}/assignments/{$assignment['id']}/submissions"
149
                                );
150
                                foreach ($submissions as $submission) {
151
                                    if ($submission['workflow_state'] == 'graded') {
152
                                        if ($hasBeenGraded == false) {
0 ignored issues
show
Coding Style Best Practice introduced by
It seems like you are loosely comparing two booleans. Considering using the strict comparison === instead.

When comparing two booleans, it is generally considered safer to use the strict comparison operator.

Loading history...
153
                                            $hasBeenGraded = true;
154
                                            $statistic['graded_assignment_count']++;
155
                                        }
156
                                        $gradedSubmissionsCount++;
157
                                        $turnAroundTimeTally += max(
158
                                            0,
159
                                            strtotime($submission['graded_at']) - strtotime($assignment['due_at'])
160
                                        );
161
                                    }
162
                                }
163
164
                                if (!$hasBeenGraded) {
165
                                    if (array_key_exists('oldest_ungraded_assignment_due_date', $statistic)) {
166
                                        if (strtotime($assignment['due_at']) < strtotime($statistic['oldest_ungraded_assignment_due_date'])) {
167
                                            $statistic['oldest_ungraded_assignment_due_date'] = $assignment['due_at'];
168
                                            $statistic['oldest_ungraded_assignment_url'] = $assignment['html_url'];
169
                                            $statistic['oldest_ungraded_assignment_name'] = $assignment['name'];
170
                                        }
171
                                    } else {
172
                                        $statistic['oldest_ungraded_assignment_due_date'] = $assignment['due_at'];
173
                                        $statistic['oldest_ungraded_assignment_url'] = $assignment['html_url'];
174
                                        $statistic['oldest_ungraded_assignment_name'] = $assignment['name'];
175
                                    }
176
                                }
177
                            }
178
                        } else {
179
                            $statistic['dateless_assignment_count']++;
180
                        }
181
                    }
182
                }
183
184
                $statistic['created_modified_histogram'] = serialize($createdModifiedHistogram);
185
186
                // calculate average submissions graded per assignment (if non-zero)
187
                if ($statistic['gradeable_assignment_count'] && $statistic['student_count']) {
188
                    $statistic['average_submissions_graded'] = $gradedSubmissionsCount / ($statistic['gradeable_assignment_count'] * $statistic['student_count']);
189
                }
190
191
                // calculate the average lead-time on assignments
192
                if ($statistic['assignments_due_count']) {
193
                    $statistic['average_assignment_lead_time'] = $leadTimeTally / $statistic['assignments_due_count'] / 60 / 60 / 24;
194
                }
195
196
                // calculate average grading turn-around per submission
197
                if ($gradedSubmissionsCount) {
198
                    $statistic['average_grading_turn_around'] = $turnAroundTimeTally / $gradedSubmissionsCount / 60 / 60 / 24;
199
                }
200
201
                $query = "INSERT INTO `course_statistics`";
202
                $fields = array();
203
                $values = array();
204
                while (list($field, $value) = each($statistic)) {
205
                    $fields[] = $field;
206
                    $values[] = $value;
207
                }
208
                $query .= ' (`' . implode('`, `', $fields) . "`) VALUES ('" . implode("', '", $values) . "')";
209
                $result = $sql->query($query);
0 ignored issues
show
Unused Code introduced by
$result is not used, you could remove the assignment.

This check looks for variable assignements that are either overwritten by other assignments or where the variable is not used subsequently.

$myVar = 'Value';
$higher = false;

if (rand(1, 6) > 3) {
    $higher = true;
} else {
    $higher = false;
}

Both the $myVar assignment in line 1 and the $higher assignment in line 2 are dead. The first because $myVar is never used and the second because $higher is always overwritten for every possible time line.

Loading history...
210
                /* displayError(
0 ignored issues
show
Unused Code Comprehensibility introduced by
57% of this comment could be valid code. Did you maybe forget this after debugging?

Sometimes obsolete code just ends up commented out instead of removed. In this case it is better to remove the code once you have checked you do not need it.

The code might also have been commented out for debugging purposes. In this case it is vital that someone uncomments it again or your project may behave in very unexpected ways in production.

This check looks for comments that seem to be mostly valid code and reports them.

Loading history...
211
                    array(
212
                        'gradedSubmissionsCount' => $gradedSubmissionsCount,
213
                        'turnAroundTimeTally' => $turnAroundTimeTally,
214
                        'statistic' => $statistic,
215
                        'query' => $query,
216
                        'result' => $result
217
                    ),
218
                    true
219
                ); */
220
            }
221
        }
222
    }
223
}
224
225
//debugFlag('START');
226
227
/* create an API connector if not already extant */
228
if (empty($api)) {
229
    $api = new CanvasPest($metadata['CANVAS_API_URL'], $metadata['CANVAS_API_TOKEN']);
230
}
231
232
/* collect data on terms currently in session */
233
$terms = $api->get('accounts/1/terms');
234
$now = strtotime('now');
235
foreach ($terms['enrollment_terms'] as $term) {
236
    if (isset($term['start_at']) && isset($term['end_at'])) {
237
        if ((strtotime($term['start_at']) <= $now) && ($now <= strtotime($term['end_at']))) {
238
            collectStatistics($term['id'], $api, $sql, $metadata);
239
        }
240
    }
241
}
242
243
/* check to see if this data collection has been scheduled. If it hasn't,
244
   schedule it to run nightly. */
245
/* thank you http://stackoverflow.com/a/4421284 ! */
246
$crontab = DATA_COLLECTION_CRONTAB . ' ' . realpath('.') . '/data-collection.sh';
247
$crontabs = shell_exec('crontab -l');
248
if (strpos($crontabs, $crontab) === false) {
249
    $filename = md5(time()) . '.txt';
250
    file_put_contents("/tmp/$filename", $crontabs . $crontab . PHP_EOL);
251
    shell_exec("crontab /tmp/$filename");
252
    debugFlag("added new scheduled data-collection to crontab");
253
}
254
255
//debugFlag('FINISH');
256