forked from tl-its-umich-edu/kartograafr
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.py
576 lines (421 loc) · 22.5 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
## TTD:
### set log level by property / env variable
import argparse
from datetime import datetime
import logging
logger = logging.getLogger(__name__)
loggingLevel = None
import sys
import os
import re
import arcgisUM
import dateutil.parser
import dateutil.tz
from bs4 import BeautifulSoup
from bs4.builder._htmlparser import HTMLParserTreeBuilder
import config
from CanvasAPI import CanvasAPI
# The secrets module really is used during import (to change sensitive
# properties).
import secrets #@UnusedImport
import util
##### Improved code tracebacks for exceptions
import traceback
def handleError(self, record):  # @UnusedVariable
    """Replacement for ``logging.Handler.handleError`` that prints the current call stack.

    Neither argument is used; the signature only has to match the method it
    replaces.

    :param self: the logging handler instance the method is invoked on
    :param record: the log record that was being handled
    """
    traceback.print_stack()
# Install the replacement on the base Handler class so it applies to all handlers.
logging.Handler.handleError = handleError
#####
# Timezone-aware start time of this run; the formatted form is used as a
# suffix when log files are renamed.
TIMEZONE_UTC = dateutil.tz.tzutc()
RUN_START_TIME = datetime.now(tz=TIMEZONE_UTC)
RUN_START_TIME_FORMATTED = RUN_START_TIME.strftime('%Y%m%d%H%M%S')
# Hold parsed options (assigned in main() from the command line)
options = None
# Adjustable level to use for all logging.  Falls back to the configured
# default when no level was set earlier in the module.
logger.error("loggingLevel: {}".format(loggingLevel))
if loggingLevel is None:
    loggingLevel = config.Application.Logging.DEFAULT_LOG_LEVEL
# The module logger is cleared here and rebound to the main application
# logger inside main().
logger = None  # type: logging.Logger
# Formatter for the main log; assigned in main().
logFormatter = None  # type: logging.Formatter
# Per-course caches, keyed by the course ID as a string.
courseLogHandlers = dict()
courseLoggers = dict()
def getCanvasInstance():
    """Build a CanvasAPI client from the configured base URL and authorization token."""
    baseURL = config.Canvas.API_BASE_URL
    token = config.Canvas.API_AUTHZ_TOKEN
    return CanvasAPI(baseURL, authZToken=token)
def getCourseIDsWithOutcome(canvas, courseIDs, outcome):
    """Return the IDs of the Canvas courses that are linked to the given outcome.

    A course qualifies when at least one of its outcome group links refers to
    an outcome whose ``id`` equals ``outcome.id``.

    :param canvas: object providing ``getCoursesOutcomeGroupLinksObjects(courseID)``
    :param courseIDs: iterable of course IDs to examine
    :param outcome: object with an ``id`` attribute identifying the target outcome
    :return: the matching course IDs
    :rtype: set
    """
    matchingCourseIDs = set()

    for courseID in courseIDs:
        courseOutcomeGroupLinks = \
            canvas.getCoursesOutcomeGroupLinksObjects(courseID)

        # any() stops at the first matching link, so the remaining links of a
        # course are not examined once the course is known to match.
        if any(outcomeLink.outcome.id == outcome.id
               for outcomeLink in courseOutcomeGroupLinks):
            matchingCourseIDs.add(courseID)

    return matchingCourseIDs
def getCourseAssignmentsWithOutcome(canvas, courseIDs, outcome):
    """Collect the assignments of the given courses that are tied to the outcome.

    An assignment is skipped when its lock date (or, failing that, its due
    date) is earlier than the start of this run, or when it has no rubric.
    Otherwise it is kept if any of its rubric entries references the outcome.

    :param canvas: object providing ``getCoursesAssignmentsObjects(courseID)``
    :param courseIDs: iterable of course IDs to examine
    :param outcome: object with an ``id`` attribute identifying the target outcome
    :return: list of matching assignment objects
    """
    selectedAssignments = []

    for courseID in courseIDs:
        for assignment in canvas.getCoursesAssignmentsObjects(courseID):
            expirationTimestamp = assignment.lock_at or assignment.due_at

            # An assignment without any timestamp is treated as not expired.
            if expirationTimestamp:
                expirationTime = dateutil.parser.parse(expirationTimestamp)
            else:
                expirationTime = RUN_START_TIME

            if expirationTime < RUN_START_TIME:
                logger.info('Skipping Assignment {} for Course {}, expired on: {}'
                            .format(assignment, courseID, expirationTimestamp))
                continue

            if not assignment.rubric:
                logger.info('Skipping Assignment {} for Course {}, no rubrics'
                            .format(assignment, courseID))
                continue

            # One matching rubric entry is enough; add the assignment only once.
            if any(rubric.outcome_id == outcome.id for rubric in assignment.rubric):
                selectedAssignments.append(assignment)

    return selectedAssignments
# Take two lists and separate out entries only in first list, those only in second list, and those in both.
# Uses sets to do this so duplicate entries will become singular and order in the list will be arbitrary.
def computeListDifferences(leftList, rightList):
    """Split two lists into left-only, right-only and shared entries.

    The comparison is set based: duplicates collapse to a single entry and
    the order of elements in the returned lists is not preserved.

    :param leftList: first collection of hashable items
    :param rightList: second collection of hashable items
    :return: tuple ``(leftOnly, rightOnly, both)`` of lists
    """
    leftSet = set(leftList)
    rightSet = set(rightList)
    return (list(leftSet - rightSet),
            list(rightSet - leftSet),
            list(rightSet & leftSet))
# Look at lists of users already in group and those currently in the course and return new lists
# of only the users that need to be added and need to be removed, so unchanged people remain untouched.
def minimizeUserChanges(groupUsers, courseUsers):
    """Work out the smallest set of membership changes for an ArcGIS group.

    :param groupUsers: users currently in the ArcGIS group
    :param courseUsers: users currently in the Canvas course
    :return: tuple ``(usersOnlyInGroup, usersOnlyInCourse)``; users present in
        both inputs are reported in the log but not returned
    """
    logger.debug('groupUsers input: {}'.format(groupUsers))
    logger.debug('courseUsers input: {}'.format(courseUsers))

    # Users only in the group are obsolete, users only in the course are new,
    # and users in both need no change.
    differences = computeListDifferences(groupUsers, courseUsers)
    obsoleteGroupUsers, newCourseUsers, untouchedUsers = differences

    logger.info('changedArcGISGroupUsers: {} changedCanvasUsers: {} unchanged Users {}'.format(obsoleteGroupUsers,newCourseUsers,untouchedUsers))

    return obsoleteGroupUsers, newCourseUsers
def updateGroupUsers(courseUserDictionary, course, instructorLog, groupTitle, group):
    """Add / remove users from an ArcGIS group so it matches the Canvas course.

    :param courseUserDictionary: mapping of course ID to the course's user objects
    :param course: Canvas course object; its ``id`` selects the users to sync
    :param instructorLog: text accumulated so far for the instructor's log
    :param groupTitle: title of the ArcGIS group
    :param group: ArcGIS group object to update
    :return: the instructor log as returned by the arcgisUM removal and add calls
    """
    # get the arcgis group members and the canvas course members.
    groupNameAndID = util.formatNameAndID(group)

    groupUsers = arcgisUM.getCurrentArcGISMembers(group, groupNameAndID)
    logger.debug('group users: {}'.format(groupUsers))

    # Strip everything from the first underscore onward so that ArcGIS names
    # can be compared with Canvas login IDs.  The pattern is a raw string so
    # that "\S" reaches the regex engine instead of being an invalid string escape.
    groupUsersTrimmed = [re.sub(r'_\S+$', '', gu) for gu in groupUsers]
    logger.debug('All ArcGIS users currently in Group {}: ArcGIS Users: {}'.format(groupNameAndID, groupUsers))

    canvasCourseUsers = [user.login_id for user in courseUserDictionary[course.id] if user.login_id is not None]
    logger.debug('All Canvas users in course for Group {}: Canvas Users: {}'.format(groupNameAndID, canvasCourseUsers))

    # compute the exact sets of users to change.
    changedArcGISGroupUsers, changedCourseUsers = minimizeUserChanges(groupUsersTrimmed, canvasCourseUsers)

    # fix up the user name format for ArcGIS users names
    changedArcGISGroupUsers = arcgisUM.formatUsersNamesForArcGIS(changedArcGISGroupUsers)

    logger.info('Users to remove from ArcGIS: Group {}: ArcGIS Users: {}'.format(groupNameAndID, changedArcGISGroupUsers))
    logger.info('Users to add from Canvas course for ArcGIS: Group {}: Canvas Users: {}'.format(groupNameAndID, changedCourseUsers))

    # Now update only the users in the group that have changed.  The second
    # value returned by the removal call is not needed here.
    instructorLog, _ = arcgisUM.removeSomeExistingGroupMembers(groupTitle, group, instructorLog, changedArcGISGroupUsers)
    instructorLog = arcgisUM.addCanvasUsersToGroup(instructorLog, group, changedCourseUsers)

    return instructorLog
def updateArcGISGroupForAssignment(arcGIS, courseUserDictionary, groupTags, assignment, course,instructorLog):
    """Make sure an ArcGIS group exists for this course / assignment and sync its members.

    The group title is built from the course name and ID and the assignment
    name and ID.  An existing group is reused; otherwise one is created.  The
    resulting instructor log text is written to the course's logger.

    :param arcGIS: ArcGIS connection object
    :param courseUserDictionary: mapping of course ID to the course's user objects
    :param groupTags: tags to apply when a new group is created
    :param assignment: Canvas assignment object
    :param course: Canvas course object
    :param instructorLog: text accumulated so far for the instructor's log
    """
    titleParts = (course.name, course.id, assignment.name, assignment.id)
    groupTitle = '%s_%s_%s_%s' % titleParts

    group = arcgisUM.lookForExistingArcGISGroup(arcGIS, groupTitle)
    if group is None:
        group, instructorLog = arcgisUM.createNewArcGISGroup(arcGIS, groupTags, groupTitle,instructorLog)

    if group is not None:
        # Have a group (new or pre-existing): bring its membership up to date.
        instructorLog = updateGroupUsers(courseUserDictionary, course, instructorLog, groupTitle, group)
    else:
        # Neither lookup nor creation produced a group; record the failure.
        logger.info('Problem creating or updating ArcGIS group "{}": Missing group object.'.format(groupTitle))
        instructorLog += 'Problem creating or updating ArcGIS group "{}"\n'.format(groupTitle)

    courseLogger = getCourseLogger(course.id, course.name)
    logger.debug("update group instructor log: {}".format(instructorLog))
    courseLogger.info(instructorLog)
# For all the assignments and their courses update the ArcGIS group.
def updateArcGISGroupsForAssignments(arcGIS, assignments, courseDictionary,courseUserDictionary):
    """Ensure every listed assignment has a matching, up-to-date ArcGIS group.

    :param arcGIS: ArcGIS connection object
    :param assignments: iterable of Canvas assignment objects
    :param courseDictionary: mapping of course ID to Canvas course object
    :param courseUserDictionary: mapping of course ID to the course's user objects
    """
    groupTags = ','.join(('kartograafr', 'umich'))
    logger.debug("groupTags: {}".format(groupTags))

    for assignment in assignments:
        owningCourse = courseDictionary[assignment.course_id]
        # Each assignment starts with an empty instructor log.
        updateArcGISGroupForAssignment(arcGIS, courseUserDictionary, groupTags,
                                       assignment, owningCourse, '')
def getCoursesByID(canvas, courseIDs):
    """Fetch the Canvas course object for each listed course ID.

    :param canvas: object providing ``getCourseObject(courseID)``
    :param courseIDs: iterable of course IDs
    :return: dictionary mapping each course ID to its course object
    """
    coursesByID = dict()
    for courseID in courseIDs:
        logger.info("getCoursesById: courseId: {}".format(courseID))
        courseObject = canvas.getCourseObject(courseID)
        coursesByID[courseID] = courseObject
    return coursesByID
def getCoursesUsersByID(canvas, courseIDs, enrollmentType=None):
    """Fetch the members of each listed Canvas course, optionally filtered by role.

    Every request asks Canvas to include the users' email addresses.

    :param canvas: Canvas API client
    :type canvas: CanvasAPI
    :param courseIDs: IDs of the courses to query
    :type courseIDs: set or list
    :param enrollmentType: (optional) Canvas user enrollment type: 'student', 'teacher', etc.
    :type enrollmentType: str
    :return: dictionary mapping each course ID to the result of the users query
    """
    return {
        courseID: canvas.getCoursesUsersObjects(
            courseID,
            enrollmentType=enrollmentType,
            params={'include[]': 'email'},
        )
        for courseID in courseIDs
    }
def getCourseLogFilePath(courseID):
    """Return the resolved path of the log file belonging to one course.

    :param courseID: course ID as a string (it is concatenated with the
        configured log filename extension)
    :return: normalized real path inside the configured course log directory
    """
    courseLogDirectory = config.Application.Logging.COURSE_DIRECTORY
    fileName = courseID + config.Application.Logging.LOG_FILENAME_EXTENSION
    joinedPath = os.path.join(courseLogDirectory, fileName)
    return os.path.realpath(os.path.normpath(joinedPath))
def getMainLogFilePath(nameSuffix=None):
    """Return the resolved path/filename of the main log file.

    :param nameSuffix: (optional) value appended to the base name after a
        hyphen, e.g. a timestamp used when the log is renamed
    :return: normalized real path inside the configured log directory
    """
    baseName = config.Application.Logging.MAIN_LOG_BASENAME
    if nameSuffix is not None:
        baseName = baseName + '-' + str(nameSuffix)

    logDirectory = config.Application.Logging.DIRECTORY
    fileName = baseName + config.Application.Logging.LOG_FILENAME_EXTENSION
    joinedPath = os.path.join(logDirectory, fileName)
    return os.path.realpath(os.path.normpath(joinedPath))
def logToStdOut():
    """Attach a stdout handler to the root logger, in addition to any file logging.

    Both the root logger and the new handler use the module's logging level.
    """
    rootLogger = logging.getLogger()
    rootLogger.setLevel(loggingLevel)

    stdoutHandler = logging.StreamHandler(sys.stdout)
    stdoutHandler.setLevel(loggingLevel)
    stdoutHandler.setFormatter(
        logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s'))

    rootLogger.addHandler(stdoutHandler)
def getCourseLogger(courseID, courseName):
    """Return the logger dedicated to one course, creating and caching it on first use.

    A newly created logger writes, with a human-friendly format, to both the
    main log file and the course's own log file.

    :param courseID: ID number of the course
    :type courseID: str or int
    :param courseName: Name of the course (not used by this function)
    :type courseName: str
    :return: The logger for the specific course
    :rtype: logging.Logger
    """
    loggerKey = str(courseID)

    if loggerKey not in courseLoggers:
        friendlyFormatter = logging.Formatter('Running at: %(asctime)s\n\n%(message)s', '%I:%M:%S %p on %B %d, %Y')

        mainFileHandler = logging.FileHandler(getMainLogFilePath())
        mainFileHandler.setFormatter(friendlyFormatter)

        courseFileHandler = logging.FileHandler(getCourseLogFilePath(loggerKey))
        courseFileHandler.setFormatter(friendlyFormatter)

        newLogger = logging.getLogger(loggerKey)  # type: logging.Logger
        newLogger.setLevel(loggingLevel)
        for fileHandler in (mainFileHandler, courseFileHandler):
            newLogger.addHandler(fileHandler)

        courseLoggers[loggerKey] = newLogger

    return courseLoggers[loggerKey]
def getCourseLogHandler(courseID, courseName):
    """Return the file handler for one course's log, creating and caching it on first use.

    A newly created handler uses the module-level log formatter.

    :param courseID: ID number of the course
    :type courseID: str or int
    :param courseName: Name of the course (not used by this function)
    :type courseName: str
    :return: A logging handler for a specific course's log file
    :rtype: logging.FileHandler
    """
    handlerKey = str(courseID)

    if handlerKey not in courseLogHandlers:
        newHandler = logging.FileHandler(getCourseLogFilePath(handlerKey))
        newHandler.setFormatter(logFormatter)
        courseLogHandlers[handlerKey] = newHandler

    return courseLogHandlers[handlerKey]
def closeAllCourseLoggerHandlers():
    """Close every handler attached to each cached course logger."""
    for cachedLogger in courseLoggers.values():  # type: logging.Logger
        for attachedHandler in cachedLogger.handlers:  # type: logging.Handler
            attachedHandler.close()
def closeAllCourseLogHandlers():
    """Close every cached course log file handler."""
    for cachedHandler in courseLogHandlers.values():
        cachedHandler.close()
def getCourseIDsFromConfigCoursePage(canvas, courseID):
    """Read the hand-edited list of Canvas course IDs from a specific Canvas course page.

    The page named 'course-ids' of the given course is parsed as HTML, and
    every link whose ``href`` is a course URL on umich.instructure.com
    contributes the numeric ID at the end of that URL.

    :param canvas: object providing ``getCoursesPagesByNameObjects(courseID, name)``
    :param courseID: ID of the course that holds the configuration page
    :return: list of course IDs (duplicates removed, order arbitrary), or
        ``None`` when the page is missing or contains no valid course links
    """
    # Raw string: the backslashes must reach the regex engine unchanged
    # rather than being treated as (invalid) string escape sequences.
    VALID_COURSE_URL_REGEX = r'^https://umich\.instructure\.com/courses/[0-9]+$'

    pages = canvas.getCoursesPagesByNameObjects(courseID, 'course-ids')  # type: list of CanvasObject
    courseIDs = None

    if pages:
        configCoursePage = pages.pop()
        configCoursePageTree = BeautifulSoup(configCoursePage.body, builder=HTMLParserTreeBuilder())

        # A set removes links that appear more than once on the page.
        courseURLs = {a['href'] for a in
                      configCoursePageTree.find_all('a', href=re.compile(VALID_COURSE_URL_REGEX))}
        if courseURLs:
            # The ID is the last path segment of the matched URL.
            courseIDs = [int(url.split('/').pop()) for url in courseURLs]

    return courseIDs
def renameLogForCourseID(courseID=-1):
    """Rename a log file by adding this run's start timestamp to its name.

    :param courseID: a course ID to rename that course's log, or ``None`` to
        rename the main log; the default ``-1`` means "not specified"
    :return: tuple ``(oldLogName, newLogName)``; the file is only renamed if
        the old one exists
    :raises RuntimeError: when no argument (i.e. ``-1``) is given
    """
    if courseID == -1:
        raise RuntimeError('Renaming logs requires either a course ID number to rename the log for that course, '
                           'or the None value to rename the main log.')

    if courseID is None:
        oldLogName = getMainLogFilePath()
        newLogName = getMainLogFilePath(nameSuffix=RUN_START_TIME_FORMATTED)
    else:
        courseKey = str(courseID)
        oldLogName = getCourseLogFilePath(courseKey)
        newLogName = getCourseLogFilePath(courseKey + '-' + RUN_START_TIME_FORMATTED)

    if os.path.isfile(oldLogName):
        os.rename(oldLogName, newLogName)

    return (oldLogName, newLogName)
def emailLogForCourseID(courseID, recipients):
    """Email the log file of one course to its recipients, then rename that log.

    Nothing is sent or renamed when the course has no log file or the file
    cannot be read.  When the ``printEmail`` option is set, the message is
    written to the log instead of being sent.

    Several messages are built with ``.format(**locals())``, so the names of
    the local variables in this function are part of its behavior.

    :param courseID: ID of the course whose log is mailed
    :param recipients: a single recipient or a list of recipient addresses
    """
    import smtplib
    from email.mime.text import MIMEText
    from email.header import Header
    # Accept a single recipient as well as a list.
    if not isinstance(recipients, list):
        recipients = [recipients]
    courseID = str(courseID)
    logContent = None
    # File may not exist if no changes were made to group.
    if os.path.isfile(getCourseLogFilePath(courseID)) is not True:
        logger.debug('No logfile {} for course: {}'.format(getCourseLogFilePath(courseID),courseID))
        return
    try:
        READ_BINARY_MODE = 'rb'
        logfile = open(getCourseLogFilePath(courseID), mode=READ_BINARY_MODE)
        logContent = logfile.read()
        logfile.close()
    except Exception as exception:
        # An unreadable log means there is nothing to send; give up on this course.
        logger.warning('Exception while trying to read logfile for course {courseID}: {exception}'
                       .format(**locals()))
        return
    message = MIMEText(logContent,'plain','utf-8')
    message['From'] = Header(config.Application.Email.SENDER_ADDRESS,'utf-8')
    message['To'] = Header(', '.join(recipients),'utf-8')
    # The configured subject is a template filled in from this function's locals.
    message['Subject'] = Header(config.Application.Email.SUBJECT.format(**locals()),'utf-8')
    if options.printEmail is True:
        logger.info("email message: {}".format(message))
    else:
        try:
            server = smtplib.SMTP(config.Application.Email.SMTP_SERVER)
            logger.debug("mail server: " + config.Application.Email.SMTP_SERVER)
            server.set_debuglevel(config.Application.Email.DEBUG_LEVEL)
            server.sendmail(config.Application.Email.SENDER_ADDRESS, recipients, message.as_string())
            server.quit()
            logger.info('Email sent to {recipients} for course {courseID}'.format(**locals()))
        except Exception as exception:
            # A failed send is logged with its traceback but does not stop the run.
            logger.exception('Failed to send email to {recipients} for course {courseID}. Exception: {exception}'
                             .format(**locals()))
    # NOTE(review): the rename is assumed to run whether the message was
    # printed, sent, or failed to send - confirm against the intended nesting.
    try:
        (oldLogName, newLogName) = renameLogForCourseID(courseID)
        logger.info('Renamed course log "{oldLogName}" to "{newLogName}"'.format(**locals()))
    except Exception as exception:
        logger.exception('Failed to rename log file for course {courseID}. Exception: {exception}'
                         .format(**locals()))
def emailCourseLogs(courseInstructors):
    """Email each course's log to the instructors of that course.

    Recipient addresses are formed from each instructor's SIS login ID
    followed by the configured recipient domain.

    :param courseInstructors: Dictionary of courses to list of their instructors
    :type courseInstructors: dict
    """
    logger.info('Preparing to send email to instructors...')

    # Iterate over a snapshot of the dictionary's items.
    for courseID, instructors in list(courseInstructors.items()):
        recipients = []
        for instructor in instructors:
            address = instructor.sis_login_id + config.Application.Email.RECIPIENT_AT_DOMAIN
            recipients.append(address)
        emailLogForCourseID(courseID, recipients)
def main():
    """Setup and run Canvas / ArcGIS group sync.

    * parse command line arguments.
    * setup loggers.
    * connect to Canvas and ArcGIS instances.
    * get list of relevant assignments from Canvas courses listed on a hand-edited Canvas page.
    * update membership of ArcGIS groups corresponding to Canvas course / assignments.

    Several log messages are built with ``.format(**locals())``, so the names
    of the local variables in this function are part of its behavior.

    :raises RuntimeError: when the configured outcome is not found, or when no
        course is linked to it
    """
    global logger
    global logFormatter
    global options
    # Main log file: pipe-separated fields, formatted by the util formatter.
    logFormatter = util.Iso8601UTCTimeFormatter('%(asctime)s|%(levelname)s|%(name)s|%(message)s')
    logHandler = logging.FileHandler(getMainLogFilePath())
    logHandler.setFormatter(logFormatter)
    logger = logging.getLogger(config.Application.Logging.MAIN_LOGGER_NAME)  # type: logging.Logger
    logger.setLevel(loggingLevel)
    logger.addHandler(logHandler)
    # Add logging to stdout for OpenShift.
    logToStdOut()
    logger.info("Starting kartograafr")
    argumentParser = argparse.ArgumentParser()
    argumentParser.add_argument('--mail', '--email', dest='sendEmail',
                                action=argparse._StoreTrueAction,
                                help='email all available course logs to instructors, then rename all logs.')
    argumentParser.add_argument('--printMail', '--printEmail', dest='printEmail',
                                action=argparse._StoreTrueAction,
                                help='print emails to log instead of sending them.')
    # Unknown arguments are reported below rather than aborting the run.
    options, unknownOptions = argumentParser.parse_known_args()
    logger.info('kart sys args: {} '.format(sys.argv[1:]))
    if unknownOptions:
        unknownOptionMessage = 'unrecognized arguments: %s' % ' '.join(unknownOptions)
        usageMessage = argumentParser.format_usage()
        logger.warning(unknownOptionMessage)
        logger.warning(usageMessage)
        # Also print usage error messages so they will appear in email to sysadmins, sent from crond
        print(unknownOptionMessage)
        print(usageMessage)
    logger.info('{} email to instructors with logs after courses are processed'
                .format('Sending' if options.sendEmail else 'Not sending'))
    canvas = getCanvasInstance()
    arcGIS = arcgisUM.getArcGISConnection(config.ArcGIS.SECURITYINFO)
    # The configured outcome must exist before any course is examined.
    outcomeID = config.Canvas.TARGET_OUTCOME_ID
    logger.info('Config -> Outcome ID to find: {}'.format(outcomeID))
    validOutcome = canvas.getOutcomeObject(outcomeID)
    if validOutcome is None:
        raise RuntimeError('Outcome ID {} was not found'.format(outcomeID))
    logger.info('Config -> Found valid Outcome: {}'.format(validOutcome))
    configCourseID = config.Canvas.CONFIG_COURSE_ID
    configCoursePageName = config.Canvas.CONFIG_COURSE_PAGE_NAME
    logger.info('Config -> Attempting to get course IDs from page '
                '"{configCoursePageName}" of course {configCourseID}...'
                .format(**locals()))
    courseIDs = getCourseIDsFromConfigCoursePage(canvas, configCourseID)
    if courseIDs is None:
        # Fall back to the course IDs from the configuration.
        logger.warning('Warning: Config -> Course IDs not found in page '
                       '"{configCoursePageName}" of course {configCourseID}. '
                       'Using default course IDs instead.'
                       .format(**locals()))
        courseIDs = config.Canvas.COURSE_ID_SET
    else:
        logger.info('Config -> Found Course IDs in page '
                    '"{configCoursePageName}" of course {configCourseID}.'
                    .format(**locals()))
    logger.info('Config -> Course IDs to check for Outcome {}: {}'.format(validOutcome,
                                                                           list(courseIDs)))
    matchingCourseIDs = getCourseIDsWithOutcome(canvas, courseIDs,
                                                validOutcome)
    if len(matchingCourseIDs) == 0:
        raise RuntimeError('No Courses linked to Outcome {} were found'.format(validOutcome))
    logger.info('Config -> Found Course IDs for Outcome {}: {}'.format(validOutcome,
                                                                        list(matchingCourseIDs)))
    logger.info('Searching specified Courses for Assignments linked to Outcome {}'.format(validOutcome))
    matchingCourseAssignments = getCourseAssignmentsWithOutcome(
        canvas, matchingCourseIDs, validOutcome)
    if not matchingCourseAssignments:
        # Nothing to sync; this is a normal way for the run to end.
        logger.info('No valid Assignments linked to Outcome {} were found'.format(validOutcome))
        return
    logger.info('Found Assignments linked to Outcome {}: {}'.format(validOutcome,
                                                                     ', '.join(map(str, matchingCourseAssignments))))
    # Course objects, all course users, and the teachers of each matching course.
    courseDictionary = getCoursesByID(canvas, matchingCourseIDs)
    courseUserDictionary = getCoursesUsersByID(canvas, matchingCourseIDs)
    courseInstructorDictionary = getCoursesUsersByID(canvas, matchingCourseIDs, 'teacher')
    updateArcGISGroupsForAssignments(arcGIS, matchingCourseAssignments, courseDictionary, courseUserDictionary)
    # Close the course log handlers before the logs are mailed and renamed.
    closeAllCourseLoggerHandlers()
    # NOTE(review): the main-log rename is assumed to belong to the --mail
    # branch (the option's help text says logs are renamed after emailing) - confirm.
    if options.sendEmail:
        emailCourseLogs(courseInstructorDictionary)
        renameLogForCourseID(None)
    logger.info("current kartograaf run finished.")
# Script entry point: run the sync, report any failure, and always log the duration.
if __name__ == '__main__':
    kartStartTime = datetime.now()
    try:
        main()
    except Exception as exp:
        # main() binds the module-level logger only after the main log file is
        # opened, so fall back to a plain module logger if it failed earlier.
        (logger or logging.getLogger(__name__)).error("abnormal ending: {}".format(exp))
        # print_exc() takes no exception argument (its first parameter is a
        # frame limit); it reports the exception currently being handled.
        traceback.print_exc()
    finally:
        # Report real seconds rather than the timedelta's H:MM:SS rendering.
        kartDurationSeconds = (datetime.now() - kartStartTime).total_seconds()
        (logger or logging.getLogger(__name__)).info(
            "Stopping kartograafr. Duration: {} seconds".format(kartDurationSeconds))