-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathaddone.py
executable file
·51 lines (39 loc) · 1.23 KB
/
addone.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
#!/usr/bin/env python3
#
# hack to add a file to the collection manually
#
from sys import argv
import os
from datetime import datetime
import logging
import hashlib
import canonicaljson
headers_dir = "collection/log/"
resource_dir = "collection/resource/"
def save(path, data):
logging.info(path)
os.makedirs(os.path.dirname(path), exist_ok=True)
with open(path, "wb") as f:
f.write(data)
def addone(dataset, organisation, path):
headers = {
"dataset": dataset,
"organisation": organisation,
"datetime": datetime.utcnow().isoformat(),
}
headers_key = hashlib.sha256(path.encode("utf-8")).hexdigest()
headers_path = os.path.join(
headers_dir, headers["datetime"][:10], headers_key + ".json"
)
with open(path, mode="rb") as f:
content = f.read()
resource = hashlib.sha256(content).hexdigest()
headers["resource"] = resource
save(os.path.join(resource_dir, resource), content)
headers_json = canonicaljson.encode_canonical_json(headers)
save(headers_path, headers_json)
if __name__ == "__main__":
logging.basicConfig(
level=logging.INFO, format="%(asctime)s %(levelname)s %(message)s"
)
addone(argv[1], argv[2], argv[3])