-
Notifications
You must be signed in to change notification settings - Fork 289
/
utils.py
510 lines (366 loc) · 15 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
from flask import session, request, make_response
from website.flask_helpers import render_template
from bs4 import BeautifulSoup
import contextlib
import datetime
import time
import functools
import os
from io import StringIO
from os import path
import re
import string
import random
import uuid
import unicodedata
import sys
import traceback
import collections
from email_validator import EmailNotValidError, validate_email
from flask_babel import format_date, format_datetime, format_timedelta
from website.flask_helpers import gettext_with_fallback as gettext
from ruamel import yaml
import commonmark
commonmark_parser = commonmark.Parser()
commonmark_renderer = commonmark.HtmlRenderer()
IS_WINDOWS = os.name == 'nt'
prefixes_dir = path.join(path.dirname(__file__), 'prefixes')
# Define code that will be used if some turtle command is present
with open(f'{prefixes_dir}/turtle.py', encoding='utf-8') as f:
TURTLE_PREFIX_CODE = f.read()
# Preamble that will be used for non-Turtle programs
# numerals list generated from: https://replit.com/@mevrHermans/multilangnumerals
with open(f'{prefixes_dir}/normal.py', encoding='utf-8') as f:
NORMAL_PREFIX_CODE = f.read()
# Define code that will be used if a pressed command is used
with open(f'{prefixes_dir}/pressed.py', encoding='utf-8') as f:
PRESSSED_PREFIX_CODE = f.read()
# Define code that will be used if music code is used
with open(f'{prefixes_dir}/music.py', encoding='utf-8') as f:
MUSIC_PREFIX_CODE = f.read()
class Timer:
"""A quick and dirty timer."""
def __init__(self, name):
self.name = name
def __enter__(self):
self.start = time.time()
def __exit__(self, type, value, tb):
delta = time.time() - self.start
print(f'{self.name}: {delta}s')
def timer(fn):
"""Decoractor for fn."""
@functools.wraps(fn)
def wrapper(*args, **kwargs):
with Timer(fn.__name__):
return fn(*args, **kwargs)
return wrapper
def timems():
"""Return the UNIX timestamp in milliseconds.
You only need to use this function if you are doing performance-sensitive
timing. Otherwise, `times` (which returns second-resolution) is probably
a better choice.
"""
return int(round(time.time() * 1000))
def times():
"""Return the UNIX timestamp in seconds.
If you need to store a date/time in the database, prefer this function.
"""
return int(round(time.time()))
DEBUG_MODE = False
def is_debug_mode():
"""Return whether or not we're in debug mode.
We do more expensive things that are better for development in debug mode.
"""
return DEBUG_MODE
def is_offline_mode():
"""Return whether or not we're in offline mode.
Offline mode is a special build of Hedy that teachers can download and run
on their own computers.
"""
return getattr(sys, 'frozen', False) and offline_data_dir() is not None
def offline_data_dir():
"""Return the data directory in offline mode."""
return getattr(sys, '_MEIPASS')
def set_debug_mode(debug_mode):
"""Switch debug mode to given value."""
global DEBUG_MODE
DEBUG_MODE = debug_mode
def rt_yaml():
y = yaml.YAML(typ='rt')
# Needs to match the Weblate YAML settings for all components
y.indent = 4
y.preserve_quotes = True
y.width = 30000
return y
def load_yaml_rt(filename):
"""Load YAML with the round trip loader."""
try:
rt = rt_yaml()
with open(filename, 'r', encoding='utf-8') as f:
return rt.load(f)
except IOError:
return {}
def dump_yaml_rt(data):
"""Dump round-tripped YAML."""
out = StringIO()
rt_yaml().dump(data, out)
return out.getvalue()
def slash_join(*args):
ret = []
for arg in args:
if not arg:
continue
if ret and not ret[-1].endswith('/'):
ret.append('/')
ret.append(arg.lstrip('/') if ret else arg)
return ''.join(ret)
def is_testing_request(request):
"""Whether the current request is a test request.
Test requests are performed by the e2e tests and have special privileges
to do things other requests cannot do.
Test requests are only allowed on non-Heroku instances.
"""
return not is_heroku() and bool('X-Testing' in request.headers and request.headers['X-Testing'])
def extract_bcrypt_rounds(hash):
return int(re.match(r'\$2b\$\d+', hash)[0].replace('$2b$', ''))
def isoformat(timestamp):
"""Turn a timestamp into an ISO formatted string."""
dt = datetime.datetime.utcfromtimestamp(timestamp)
return dt.isoformat() + 'Z'
def is_production():
"""Whether we are serving production traffic."""
return os.getenv('IS_PRODUCTION', '') != ''
def is_heroku():
"""Whether we are running on Heroku.
Only use this flag if you are making a decision that really has to do with
Heroku-based hosting or not.
If you are trying to make a decision whether something needs to be done
"for real" or not, prefer using:
- `is_production()` to see if we're serving customer traffic and trying to
optimize for safety and speed.
- `is_debug_mode()` to see if we're on a developer machine and we're trying
to optimize for developer productivity.
"""
return os.getenv('DYNO', '') != ''
def version():
# """Get the version from the Heroku environment variables."""
if not is_heroku():
return 'DEV'
vrz = os.getenv('HEROKU_RELEASE_CREATED_AT')
the_date = datetime.date.fromisoformat(vrz[:10]) if vrz else datetime.date.today()
commit = os.getenv('HEROKU_SLUG_COMMIT', '????')[0:6]
return the_date.strftime('%Y %b %d') + f'({commit})'
def valid_email(s):
try:
_ = validate_email(s, check_deliverability=False)
return True
except EmailNotValidError:
return False
@contextlib.contextmanager
def atomic_write_file(filename, mode='wb'):
"""Write to a filename atomically.
First write to a unique tempfile, then rename the tempfile into
place. Use replace instead of rename to make it atomic on windows as well.
Use as a context manager:
with atomic_write_file('file.txt') as f:
f.write('hello')
"""
tmp_file = f'{filename}.{os.getpid()}'
with open(tmp_file, mode) as f:
yield f
os.replace(tmp_file, filename)
# This function takes a date in milliseconds from the Unix epoch and transforms it into a printable date
# It operates by converting the date to a string, removing its last 3 digits, converting it back to an int
# and then invoking the `isoformat` date function on it
def mstoisostring(date):
return datetime.datetime.fromtimestamp(int(str(date)[:-3])).isoformat()
def string_date_to_date(date):
return datetime.datetime.strptime(date, "%Y-%m-%d")
def timestamp_to_date(timestamp, short_format=False):
try:
if short_format:
return datetime.datetime.fromtimestamp(int(str(timestamp)))
else:
return datetime.datetime.fromtimestamp(int(str(timestamp)[:-3]))
except BaseException:
return None
def delta_timestamp(date, short_format=False):
if short_format:
delta = datetime.datetime.now() - datetime.datetime.fromtimestamp(int(str(date)))
else:
delta = datetime.datetime.now() - datetime.datetime.fromtimestamp(int(str(date)[:-3]))
return format_timedelta(delta)
def stoisostring(date):
return datetime.datetime.fromtimestamp(date)
def localized_date_format(date, short_format=False):
# Improve the date by using the Flask Babel library and return timestamp as expected by language
if short_format:
timestamp = datetime.datetime.fromtimestamp(int(str(date)))
else:
timestamp = datetime.datetime.fromtimestamp(int(str(date)[:-3]))
return format_date(timestamp, format='medium') + " " + format_datetime(timestamp, "H:mm")
def datetotimeordate(date):
print(date)
return date.replace("T", " ")
# https://stackoverflow.com/a/2257449
def random_id_generator(
size=6,
chars=string.ascii_uppercase +
string.ascii_lowercase +
string.digits):
return ''.join(random.choice(chars) for _ in range(size))
def markdown_to_html_tags(markdown):
"""
This function takes a Markdown string and returns a list with each of the HTML elements obtained
by rendering the Markdown into HTML.
"""
_html = commonmark_renderer.render(commonmark_parser.parse(markdown))
soup = BeautifulSoup(_html, 'html.parser')
return soup.find_all()
MarkdownCode = collections.namedtuple('MarkdownCode', ('code', 'info'))
def code_blocks_from_markdown(markdown):
"""
Takes a MarkDown string and returns a list of code blocks, along with their metadata.
Returns pairs of `(code, info)`, where 'info' is the text that appears after the three
backticks (usually used to indicate the programming language).
"""
md = commonmark_parser.parse(markdown)
for node, _ in md.walker():
# We will only ever see '_entered == True' for CodeBlock nodes.
if node.t == 'code_block':
yield MarkdownCode(node.literal.strip(), node.info)
def error_page(error=404, page_error=None, ui_message=None, menu=True, iframe=None, exception=None):
if error not in [400, 403, 404, 500, 401]:
error = 404
default = gettext('default_404')
error_image = error
if error == 401:
default = gettext('default_401')
error_image = 403
if error == 403:
default = gettext('default_403')
elif error == 500:
default = gettext('default_500')
hx_request = bool(request.headers.get('Hx-Request'))
if hx_request:
# For HTMX-request, just return the error as plain text body
return make_response(f'{default} {exception}', error)
if request.accept_mimetypes.accept_json and not request.accept_mimetypes.accept_html:
# Produce a JSON response instead of an HTML response
return make_response({"code": error,
"error": default,
"exception": traceback.format_exception(type(exception), exception, exception.__traceback__) if exception else None}, error)
return render_template("error-page.html", menu=menu, error_image=error_image, iframe=iframe,
page_error=page_error or ui_message or default or '', default=default), error
def session_id():
"""Returns or sets the current session ID."""
if 'session_id' not in session:
if os.getenv('IS_TEST_ENV') and 'X-session_id' in request.headers:
session['session_id'] = request.headers['X-session_id']
else:
session['session_id'] = uuid.uuid4().hex
return session['session_id']
# https://github.com/python-babel/babel/issues/454
def customize_babel_locale(custom_locales: dict):
from babel.core import get_global
db = get_global('likely_subtags')
for custom_name in custom_locales:
db[custom_name] = custom_name
import babel.localedata
o_exists, o_load = babel.localedata.exists, babel.localedata.load
if o_exists.__module__ != __name__:
def exists(name):
name = custom_locales.get(name, name)
return o_exists(name)
def load(name, merge_inherited=True):
name = custom_locales.get(name, name)
return o_load(name, merge_inherited)
babel.localedata.exists = exists
babel.localedata.load = load
def strip_accents(s):
return ''.join(c for c in unicodedata.normalize('NFD', s)
if unicodedata.category(c) != 'Mn')
def base_url():
"""Return the base URL, excluding the leading slash
Returns either from configuration or otherwise from Flask.
"""
url = os.getenv('BASE_URL')
if not url:
url = request.host_url
return url if not url.endswith('/') else url[:-1]
def can_edit_class(user, Class):
"""
Check if a given user has the permission to edit a class.
Returns:
bool: True if the user has edit permission, False otherwise.
"""
return Class["teacher"] == user["username"] or \
any(second_teacher["username"] == user["username"] and second_teacher["role"] == "teacher"
for second_teacher in Class.get("second_teachers", []))
def get_unanswered_questions(survey, new_questions):
unanswered_questions = []
db = survey.get('responses')
if not db:
return new_questions, ""
for key, value in db.items():
if value['answer'] == '':
unanswered_questions.append(new_questions[int(key)-1])
i = 0
for key, value in db.items():
if value['answer'] == '':
value['question'] = unanswered_questions[i]
i += 1
return unanswered_questions, db
def find_prev_next_levels(level_list, target_level):
sorted_levels = level_list
index = sorted_levels.index(target_level)
prev_level = sorted_levels[index - 1] if index > 0 else None
next_level = sorted_levels[index + 1] if index < len(sorted_levels) - 1 else None
return prev_level, next_level
def preserve_html_tags(content):
"""
Transforms HTML tags in the content.
"""
# Define patterns to match target tags
tag_pattern = r"<(?P<tag_name>[^>]+)(?P<attributes>.*?)>(?P<inner_content>.*?)</(?P=tag_name)>"
def replace(match):
tag_name = match.group("tag_name")
attributes = match.group("attributes")
inner_content = match.group("inner_content")
return f"<{tag_name}{attributes}>{inner_content}</{tag_name}>"
return re.sub(tag_pattern, replace, content, flags=re.DOTALL)
def transform_encoded_tags_secure(content):
"""
Transforms encoded HTML tags in adventure content, removing any script tags.
This is an extra step on top of the DOMPurify when saving an adventure.
"""
def pre_process(content):
# Remove script tags and their content using regular expression
script_pattern = r"<script(?:\s[^>]*?)?>(?P<content>.*?)</script>"
return re.sub(script_pattern, "", content, flags=re.DOTALL)
# Pre-process the input to remove scripts
processed_content = pre_process(content)
transformed_content = preserve_html_tags(processed_content)
return transformed_content
def prepare_content_for_ckeditor(content):
"""
Adds code tags to pre blocks that don't have them, reserving existing attributes as well.
"""
pattern = r"<pre(?P<attributes>.*?)>(?P<inner_content>.*?)</pre>"
def replace(match):
attributes = match.group("attributes")
inner_content = match.group("inner_content").strip() # Strip leading/trailing whitespaces
if not inner_content.startswith("<code>"):
inner_content = f"<code>{inner_content}</code>"
return f"<pre{attributes}>{inner_content}</pre>"
content = transform_encoded_tags_secure(content)
content = re.sub(pattern, replace, content, flags=re.DOTALL)
# Add "<p> </p>" (an extra line) if not exists
if len(content) and not content.endswith("<p> </p>"):
content += "<p> </p>"
return content
def remove_class_preview():
try:
del session["preview_class"]
except KeyError:
pass