-
Notifications
You must be signed in to change notification settings - Fork 1
/
generate_qa_json.py
96 lines (75 loc) · 2.85 KB
/
generate_qa_json.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
#!/bin/env python3.9
import base64
import json
import os
from PIL import Image
from pyzbar.pyzbar import decode
import zlib
from base45 import b45decode
from cbor2 import loads
from cose.messages import Sign1Message
from datetime import datetime
# Files starting with these prefixes will be skipped
EXCLUDED_PREFIXES = ('.', '_', '@')
# Only files with these extensions will be processed
ALLOWED_EXT = ['.PNG']
def read_file(file: str) -> str:
"""
Reads the given file and returns the contents as a base64 string
@param file: Path to a file
@return: base64 string containing the file bytes
"""
with open(file, "rb") as f:
return base64.b64encode(f.read()).decode()
def read_qr(file: str) -> str:
"""
Scans the barcode and returns the contents as a string
@param file: Path to the QR file
@return: Barcode string
"""
barcode = decode(Image.open(file))[0]
return barcode.data.decode("utf-8")
def read_dcc_payload(hcert):
base45 = hcert[4:]
compressed_bytes = b45decode(base45)
cose_bytes = zlib.decompress(compressed_bytes)
cose_message = Sign1Message.decode(cose_bytes)
cbor_message = loads(cose_message.payload)
return cbor_message[-260][1]
def relative_path_unc(root_dir: str, full_path: str) -> str:
"""
Converts a full path to a relative path and normalizes to unix notation.
@param root_dir: Root directory using OS-specific notation
@param full_path: Full path to file using OS-specific notation
@return: Path to file relative to *root_dir* using unix/posix notation
"""
if root_dir == ".":
return full_path.replace("\\", "/")[2:]
else:
return full_path[:](root_dir, "").replace("\\", "/")[1:]
def date_time_serializer(obj):
# It's sad that this is needed, but hey!
if isinstance(obj, datetime):
return obj.isoformat()
return None
def process(source_dir: str) -> str:
"""
Creates a JSON containing all of the QRs in the repository in b64 form and as hcert string form.
@param source_dir: Directory containing the QR codes
@return: Results encoded as an JSON string
"""
result = list()
for dir_path, dir_names, filenames in os.walk(source_dir):
dir_names[:] = [dir_name for dir_name in dir_names if not dir_name.startswith(EXCLUDED_PREFIXES)]
for filename in filenames:
if os.path.splitext(filename)[1].upper() in ALLOWED_EXT:
source_file = os.path.join(dir_path, filename)
hcert = read_qr(source_file)
result.append({
"path": relative_path_unc(source_dir, source_file),
"data": read_file(source_file),
"hcert": hcert,
"dcc": read_dcc_payload(hcert)
})
return json.dumps(result, default=date_time_serializer)
print(process("."))