This repository has been archived by the owner on Jun 8, 2022. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 124
/
hash.py
151 lines (115 loc) · 3.86 KB
/
hash.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
# Generates a content hash of the source_path, which is used to determine if
# the Lambda code has changed, ignoring file modification and access times.
#
# Outputs a filename and a command to run if the archive needs to be built.
import datetime
import errno
import hashlib
import json
import os
import sys
def abort(message):
    """
    Report a fatal error and stop the program.

    The message, followed by a newline, is written to standard error and
    the process then terminates with exit status 1.
    """
    line = message + '\n'
    sys.stderr.write(line)
    # Equivalent to sys.exit(1): unwinds the interpreter with status 1.
    raise SystemExit(1)
def delete_old_archives():
    """
    Deletes previously created archives.

    Scans the "builds" directory (relative to the current working
    directory) and removes every ".zip" file in it whose modification time
    is more than 7 days in the past. Files with other extensions are left
    untouched.

    Raises OSError for any filesystem failure other than an archive
    disappearing between being listed and being inspected or removed.
    """
    builds_dir = 'builds'
    now = datetime.datetime.now()
    delete_older_than = now - datetime.timedelta(days=7)

    for name in os.listdir(builds_dir):
        if not name.endswith('.zip'):
            continue
        # os.listdir() yields bare file names, so each one has to be joined
        # with the directory before it can be inspected or removed. Using
        # the bare name would look in the working directory instead, fail
        # with ENOENT, and silently never delete anything.
        path = os.path.join(builds_dir, name)
        try:
            file_modified = datetime.datetime.fromtimestamp(
                os.path.getmtime(path)
            )
            if file_modified < delete_older_than:
                os.remove(path)
        except OSError as error:
            # Ignore "not found" errors as they are probably race
            # conditions between multiple usages of this module.
            if error.errno != errno.ENOENT:
                raise
def list_files(top_path):
    """
    Collect the paths of all files found beneath top_path.

    The directory tree is walked recursively. Files that sit directly in a
    directory whose path ends with "__pycache__" are left out. Each path is
    the walked directory joined with the file name, and the returned list
    is sorted.
    """
    found = []
    for current_dir, _subdirs, file_names in os.walk(top_path):
        if not current_dir.endswith("__pycache__"):
            found.extend(
                os.path.join(current_dir, entry) for entry in file_names
            )
    return sorted(found)
def generate_content_hash(source_paths):
    """
    Build a SHA-256 hash object covering every given source path.

    A path that is a directory contributes each file returned by
    list_files(), hashed relative to that directory. Any other path is
    hashed as a single file relative to its parent directory. The hashlib
    object itself is returned, so callers can keep feeding it data.
    """
    digest = hashlib.sha256()
    for path in source_paths:
        if not os.path.isdir(path):
            # Single file: hash it relative to the directory containing it.
            update_hash(digest, os.path.dirname(path), path)
            continue
        for member in list_files(path):
            update_hash(digest, path, member)
    return digest
def update_hash(hash_obj, file_root, file_path):
    """
    Feed one file into a hashlib object.

    The path of the file relative to file_root is hashed first (encoded to
    bytes), followed by the file's contents, which are read in binary mode
    in 1024-byte chunks.
    """
    name_bytes = os.path.relpath(file_path, file_root).encode()
    hash_obj.update(name_bytes)
    with open(file_path, 'rb') as stream:
        # iter() with a sentinel stops at the first empty read (end of file).
        for chunk in iter(lambda: stream.read(1024), b''):
            hash_obj.update(chunk)
# Parse the query. It arrives as a JSON object on stdin; build_paths is
# itself a JSON-encoded list inside that object.
query = json.load(sys.stdin)
build_command = query['build_command']
build_paths = json.loads(query['build_paths'])
module_relpath = query['module_relpath']
runtime = query['runtime']
raw_source_path = query['source_path']

# Validate the query. The check has to look at the raw value, because
# os.path.abspath() turns an empty string into the current working
# directory, so a check made after the conversion could never fail.
if not raw_source_path:
    abort('source_path must be set.')

# Resolve the source path before changing directory, so that a relative
# source_path is interpreted against the original working directory.
source_path = os.path.abspath(raw_source_path)

# Change working directory to the module path
# so references to build.py will work.
os.chdir(module_relpath)

# Generate a hash based on file names and content. Also use the
# runtime value, build command, and content of the build paths
# because they can have an effect on the resulting archive.
content_hash = generate_content_hash([source_path] + build_paths)
content_hash.update(runtime.encode())
content_hash.update(build_command.encode())

# Generate a unique filename based on the hash.
filename = 'builds/{content_hash}.zip'.format(
    content_hash=content_hash.hexdigest(),
)

# Replace variables in the build command with calculated values.
# The hash above was taken from the command before substitution.
replacements = {
    '$filename': filename,
    '$runtime': runtime,
    '$source': source_path,
}
for old, new in replacements.items():
    build_command = build_command.replace(old, new)

# Delete previous archives.
delete_old_archives()

# Output the result to Terraform.
json.dump({
    'filename': filename,
    'build_command': build_command,
}, sys.stdout, indent=2)
sys.stdout.write('\n')