This repository has been archived by the owner on Feb 23, 2022. It is now read-only.
forked from hedyorg/hedy
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathutils.py
327 lines (263 loc) · 10.7 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
import datetime
import time
from config import config
import boto3
import functools
import os
import re
from ruamel import yaml
from website import querylog
class Timer:
    """A quick and dirty timer, usable as a context manager.

    When the ``with`` block is left, ``<name>: <elapsed>s`` is printed to
    stdout, where the elapsed time is the difference between two
    ``time.time()`` readings taken on entry and on exit.
    """

    def __init__(self, name):
        # Label printed in front of the measured duration.
        self.name = name

    def __enter__(self):
        self.start = time.time()
        # Hand back the timer so `with Timer('x') as t:` binds the instance.
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        delta = time.time() - self.start
        print(f'{self.name}: {delta}s')
        # Implicitly returns None, so exceptions raised in the block propagate.
def timer(fn):
    """Decorator that times every call to fn.

    Each invocation of the wrapped function runs inside a Timer labelled
    with the function's name; the function's return value is passed through.
    """
    def timed_call(*args, **kwargs):
        stopwatch = Timer(fn.__name__)
        with stopwatch:
            outcome = fn(*args, **kwargs)
        return outcome

    # Copy fn's name, docstring and other metadata onto the wrapper.
    return functools.wraps(fn)(timed_call)
def type_check(val, Type):
    """Tell whether val matches the type named by the string Type.

    Recognised names are 'dict', 'list', 'str', 'int', 'tuple', 'fun'
    (anything callable) and 'bool'. Any other name yields None.
    """
    # bool is a subclass of int, so True/False also pass the 'int' check,
    # while the 'bool' check accepts exact bools only.
    checks = (
        ('dict', lambda candidate: isinstance(candidate, dict)),
        ('list', lambda candidate: isinstance(candidate, list)),
        ('str', lambda candidate: isinstance(candidate, str)),
        ('int', lambda candidate: isinstance(candidate, int)),
        ('tuple', lambda candidate: isinstance(candidate, tuple)),
        ('fun', callable),
        ('bool', lambda candidate: type(candidate) == bool),
    )
    for label, predicate in checks:
        if Type == label:
            return predicate(val)
    return None
def object_check(obj, key, Type):
    """Tell whether obj is a dict that holds key with a value of the type named Type.

    Returns False when obj is not a dict or lacks key; otherwise returns
    whatever type_check reports for obj[key].
    """
    is_dict_with_key = type_check(obj, 'dict') and key in obj
    if is_dict_with_key:
        return type_check(obj[key], Type)
    return False
def timems():
    """Return the current time.time() value in milliseconds, rounded to an int."""
    milliseconds = time.time() * 1000
    return int(round(milliseconds))
def times():
    """Return the current time.time() value in whole seconds, rounded to an int."""
    seconds = time.time()
    return int(round(seconds))
# Module-wide debug switch; read it through is_debug_mode() and change it
# through set_debug_mode().
DEBUG_MODE = False


def is_debug_mode():
    """Report the current value of the module-wide debug switch.

    In debug mode we do more expensive things that are better for
    development.
    """
    return DEBUG_MODE


def set_debug_mode(debug_mode):
    """Set the module-wide debug switch to debug_mode."""
    global DEBUG_MODE
    DEBUG_MODE = debug_mode
# Parsed YAML documents, keyed by the filename they were loaded from.
YAML_CACHE = {}


@querylog.timed
def load_yaml(filename):
    """Load the given YAML file, using an in-memory cache outside debug mode.

    When is_debug_mode() is false, a file that was loaded before is served
    from YAML_CACHE. In debug mode the file is re-read on every call (the
    cache entry is still refreshed). If the file cannot be opened or read,
    an empty dict is returned and nothing is cached.
    """
    # Bypass the cache in debug mode so edits show up without a restart.
    cache_allowed = not is_debug_mode()
    if cache_allowed and filename in YAML_CACHE:
        return YAML_CACHE[filename]

    try:
        with open(filename, 'r', encoding='utf-8') as stream:
            document = yaml.safe_load(stream)
    except IOError:
        return {}

    YAML_CACHE[filename] = document
    return document
def load_yaml_rt(filename):
    """Load a YAML file with the round-trip loader, preserving quotes.

    Returns an empty dict if the file cannot be opened or read.
    """
    try:
        with open(filename, 'r', encoding='utf-8') as stream:
            document = yaml.round_trip_load(stream, preserve_quotes=True)
    except IOError:
        return {}
    return document
def dump_yaml_rt(data):
    """Dump data with the round-trip dumper, using indent=4 and width=999."""
    dump_options = {'indent': 4, 'width': 999}
    return yaml.round_trip_dump(data, **dump_options)
# *** DYNAMO DB ***
# https://boto3.amazonaws.com/v1/documentation/api/latest/reference/services/dynamodb.html

# DynamoDB client created at import time; the region comes from the config
# and the credentials from environment variables.
db = boto3.client(
    'dynamodb',
    region_name=config['dynamodb']['region'],
    aws_access_key_id=os.getenv('AWS_DYNAMODB_ACCESS_KEY'),
    aws_secret_access_key=os.getenv('AWS_DYNAMODB_SECRET_KEY'),
)

# Table-name prefix; tables are addressed as '<prefix>-<table>'.
# This is None when the environment variable is not set.
db_prefix = os.getenv('AWS_DYNAMODB_TABLE_PREFIX')
# Encode a dict so that it has the format expected by DynamoDB
def db_encode(data):
    """Encode a plain dict as DynamoDB attribute values.

    Strings become ``{'S': value}``, ints become ``{'N': str(value)}`` and
    None becomes ``{'NULL': True}``.

    Raises:
        ValueError: if a value is not a str, an int or None.
    """
    processed_data = {}
    for key, value in data.items():
        if isinstance(value, str):
            processed_data[key] = {'S': value}
        elif isinstance(value, int):
            # Numbers are sent as strings.
            # NOTE: bool is a subclass of int, so True/False are encoded
            # here as 'True'/'False'.
            processed_data[key] = {'N': str(value)}
        elif value is None:
            processed_data[key] = {'NULL': True}
        else:
            raise ValueError('Unsupported type passed to db_put')
    return processed_data
# Encode a dict of changes so that it has the AttributeUpdates format used by db_update
def db_encode_updates(data):
    """Encode a plain dict of changes as DynamoDB attribute updates.

    Strings become ``{'Value': {'S': value}}``, ints become
    ``{'Value': {'N': str(value)}}`` and None becomes
    ``{'Action': 'DELETE'}``, i.e. a None value removes the attribute.

    Raises:
        ValueError: if a value is not a str, an int or None.
    """
    processed_data = {}
    for key, value in data.items():
        if isinstance(value, str):
            processed_data[key] = {'Value': {'S': value}}
        elif isinstance(value, int):
            # Numbers are sent as strings.
            # NOTE: bool is a subclass of int, so True/False are encoded
            # here as 'True'/'False'.
            processed_data[key] = {'Value': {'N': str(value)}}
        elif value is None:
            processed_data[key] = {'Action': 'DELETE'}
        else:
            raise ValueError('Unsupported type passed to db_put')
    return processed_data
# Decode data in DynamoDB format to a plain dict
def db_decode(data):
    """Turn a dict of DynamoDB attribute values back into plain Python values.

    'S' attributes yield their string, 'N' attributes are converted with
    int(), and 'NULL' attributes yield None. The markers are tested in that
    order.

    Raises:
        ValueError: if an attribute carries none of those markers.
    """
    def decode_attribute(attribute):
        if 'S' in attribute:
            return attribute['S']
        if 'N' in attribute:
            return int(attribute['N'])
        if 'NULL' in attribute:
            return None
        raise ValueError('Unsupported type passed to db_put')

    return {name: decode_attribute(data[name]) for name in data}
# Name of the index key field for each table.
db_main_indexes = dict(
    users='username',
    tokens='id',
    programs='id',
)
# This function takes a dict `data` and returns a new dict with only the key/value for the index key for the table.
# If remove is truthy, then the index key is removed instead, leaving the rest of the keys intact.
def db_key(table, data, remove=False):
    """Split data around the table's index key.

    With remove falsy, return a one-entry dict holding just the index key
    and its value. With remove truthy, return a copy of data without the
    index key. The input dict is not modified.
    """
    if not remove:
        index_field = db_main_indexes[table]
        return {index_field: data[index_field]}
    return {
        field: data[field]
        for field in data
        if field != db_main_indexes[table]
    }
# Gets an item by index from the database. If not_primary is truthy, the search is done by a field that should be set as a secondary index.
@querylog.timed
def db_get(table, data, not_primary=False):
    """Fetch a single item as a plain dict, or None when nothing matches.

    With not_primary falsy the item is looked up by the table's index key
    taken from data. With not_primary truthy, data is expected to hold a
    single field; that field's '<field>-index' index is queried with the
    value sent as a string, and the first match is returned.
    """
    querylog.log_counter('db_get:' + table)

    if not not_primary:
        response = db.get_item(
            TableName=db_prefix + '-' + table,
            Key=db_encode(db_key(table, data)),
        )
        return db_decode(response['Item']) if 'Item' in response else None

    # Searching by something other than the primary key: the first field of
    # data is the one to search on, and it must have an index.
    field = list(data.keys())[0]
    response = db.query(
        TableName=db_prefix + '-' + table,
        IndexName=field + '-index',
        KeyConditionExpression=field + ' = :value',
        ExpressionAttributeValues={':value': {'S': data[field]}},
    )
    matches = response['Items']
    if len(matches):
        return db_decode(matches[0])
    return None
# Gets multiple items from the database. If not_primary is truthy, the search is done by a field that should be set as a secondary index.
@querylog.timed
def db_get_many(table, data, not_primary=False):
    """Return the items matching data as a list of plain dicts.

    With not_primary truthy, data is expected to hold a single field; that
    field's '<field>-index' index is queried with the value sent as a
    string, in descending sort order. Otherwise the table itself is queried
    by its index key taken from data.

    Only the items of a single query response are returned; a
    LastEvaluatedKey in the response is not followed.
    """
    querylog.log_counter('db_get_many:' + table)
    if not_primary:
        field = list(data.keys())[0]
        # We use ScanIndexForward = False to get the latest items from the Programs table
        result = db.query(
            TableName=db_prefix + '-' + table,
            IndexName=field + '-index',
            KeyConditionExpression=field + ' = :value',
            ExpressionAttributeValues={':value': {'S': data[field]}},
            ScanIndexForward=False,
        )
    else:
        # Query takes no `Key` argument (that belongs to get_item), so the
        # primary key has to be expressed as a key condition instead.
        key_field = db_main_indexes[table]
        encoded_key = db_encode(db_key(table, data))
        result = db.query(
            TableName=db_prefix + '-' + table,
            KeyConditionExpression='#key = :value',
            ExpressionAttributeNames={'#key': key_field},
            ExpressionAttributeValues={':value': encoded_key[key_field]},
        )
    querylog.log_counter('db_get_many_items', len(result['Items']))
    return [db_decode(item) for item in result['Items']]
# Creates an item.
@querylog.timed
def db_create(table, data):
    """Store data as an item in the table and return the put_item response."""
    querylog.log_counter('db_create:' + table)
    table_name = db_prefix + '-' + table
    encoded_item = db_encode(data)
    return db.put_item(TableName=table_name, Item=encoded_item)
# Updates an item by primary key.
@querylog.timed
def db_update(table, data):
    """Update the item identified by the table's index key in data.

    Every other field of data is sent as an attribute update; a None value
    removes that attribute. Returns the update_item response.
    """
    querylog.log_counter('db_update:' + table)
    table_name = db_prefix + '-' + table
    item_key = db_encode(db_key(table, data))
    # Everything except the index key is what gets changed.
    changes = db_encode_updates(db_key(table, data, True))
    return db.update_item(
        TableName=table_name,
        Key=item_key,
        AttributeUpdates=changes,
    )
# Deletes an item by primary key.
@querylog.timed
def db_del(table, data):
    """Delete the item identified by the table's index key in data.

    Returns the delete_item response.
    """
    querylog.log_counter('db_del:' + table)
    table_name = db_prefix + '-' + table
    item_key = db_encode(db_key(table, data))
    return db.delete_item(TableName=table_name, Key=item_key)
# Deletes multiple items.
@querylog.timed
def db_del_many(table, data, not_primary=False):
    """Delete every item that db_get_many finds for the given arguments.

    Items are fetched and deleted one batch at a time until a fetch comes
    back empty. Returns None.
    """
    querylog.log_counter('db_del_many:' + table)
    # A single call to db_get_many may not return every match when the
    # number of results is very large, so keep fetching until none are left.
    # This is a loop rather than recursion so that the number of batches is
    # not bounded by the interpreter's recursion limit.
    while True:
        to_delete = db_get_many(table, data, not_primary)
        if not to_delete:
            return
        for item in to_delete:
            db_del(table, db_key(table, item))
# Searches for items.
@querylog.timed
def db_scan(table):
    """Return every item of the table as a list of plain dicts.

    A single Scan response can stop short of the end of the table, in which
    case it carries a LastEvaluatedKey. The scan is repeated from that key
    until no such key is returned, so the result is not silently truncated.
    """
    querylog.log_counter('db_scan:' + table)
    scan_args = {'TableName': db_prefix + '-' + table}
    output = []
    while True:
        result = db.scan(**scan_args)
        output.extend(db_decode(item) for item in result['Items'])
        last_key = result.get('LastEvaluatedKey')
        if not last_key:
            break
        # Resume where the previous page stopped.
        scan_args['ExclusiveStartKey'] = last_key
    querylog.log_counter('db_scan_items', len(output))
    return output
@querylog.timed
def db_describe(table):
    """Return the describe_table response for the given table."""
    querylog.log_counter('db_describe:' + table)
    table_name = db_prefix + '-' + table
    return db.describe_table(TableName=table_name)
def slash_join(*args):
    """Join the given string pieces with exactly one '/' between them.

    Falsy pieces (empty strings, None) are skipped. The first kept piece is
    used verbatim, so a leading slash survives; leading slashes of later
    pieces are dropped. A piece made only of slashes contributes just the
    separator and never produces a doubled '/'.
    """
    ret = []
    for arg in args:
        if not arg:
            continue
        if not ret:
            ret.append(arg)
            continue
        if not ret[-1].endswith('/'):
            ret.append('/')
        piece = arg.lstrip('/')
        # Skip pieces that were nothing but slashes: appending '' would hide
        # the trailing '/' from the next iteration and double the separator.
        if piece:
            ret.append(piece)
    return ''.join(ret)
def is_testing_request(request):
    """Tell whether the request carries a truthy 'X-Testing' header."""
    headers = request.headers
    if 'X-Testing' not in headers:
        return False
    return bool(headers['X-Testing'])
def extract_bcrypt_rounds(hash):
    """Return the number that follows the '$2b$' prefix of a bcrypt hash, as an int.

    Raises:
        TypeError: if hash does not start with '$2b$' followed by digits
            (the failed match is None and cannot be subscripted).
    """
    # Raw string: '\$' and '\d' are not valid escapes in a normal literal.
    # The parameter name shadows the builtin but is kept for keyword callers.
    return int(re.match(r'\$2b\$(\d+)', hash)[1])
def isoformat(timestamp):
    """Turn a Unix timestamp into an ISO formatted UTC string ending in 'Z'.

    For example, 0 becomes '1970-01-01T00:00:00Z'.
    """
    # utcfromtimestamp() is deprecated; convert with an explicit UTC timezone
    # and then drop the tzinfo so isoformat() does not append '+00:00'.
    dt = datetime.datetime.fromtimestamp(timestamp, tz=datetime.timezone.utc)
    return dt.replace(tzinfo=None).isoformat() + 'Z'
def is_production():
    """Whether we are serving production traffic.

    True when the IS_PRODUCTION environment variable is set to a non-empty
    value.
    """
    flag = os.getenv('IS_PRODUCTION', '')
    return bool(flag)
def is_heroku():
    """Whether we are running on Heroku.

    True when the DYNO environment variable is set to a non-empty value.

    Only use this flag for decisions that really depend on Heroku-based
    hosting. To decide whether something needs to be done "for real",
    prefer:

    - `is_production()` to see if we're serving customer traffic and trying
      to optimize for safety and speed.
    - `is_debug_mode()` to see if we're on a developer machine and trying to
      optimize for developer productivity.
    """
    dyno = os.getenv('DYNO', '')
    return bool(dyno)
def version():
    """Build a version label from the Heroku environment variables.

    Returns 'DEV' when not running on Heroku. Otherwise returns the date
    taken from HEROKU_RELEASE_CREATED_AT (today's date if that is unset),
    formatted as '%b %d', followed by the first six characters of
    HEROKU_SLUG_COMMIT ('????' if unset) in parentheses.
    """
    if not is_heroku():
        return 'DEV'

    released_at = os.getenv('HEROKU_RELEASE_CREATED_AT')
    if released_at:
        # Only the first ten characters (the date part) are parsed.
        release_date = datetime.date.fromisoformat(released_at[:10])
    else:
        release_date = datetime.date.today()

    short_commit = os.getenv('HEROKU_SLUG_COMMIT', '????')[0:6]
    return release_date.strftime('%b %d') + f' ({short_commit})'
def valid_email(s):
    """Tell whether s looks like an e-mail address.

    Accepted shape: a local part of letters, digits and ``_ + . -``, an
    ``@``, a domain of letters, digits, dots and dashes, a final dot and a
    2-6 character ending of letters or dots. Trailing whitespace is allowed.
    """
    # Raw string: '\.', '\-', '\d' and '\s' are not valid escapes in a
    # normal string literal. The pattern itself is unchanged.
    pattern = r'^(([a-zA-Z0-9_+\.\-]+)@([\da-zA-Z\.\-]+)\.([a-zA-Z\.]{2,6})\s*)$'
    return bool(re.match(pattern, s))