aboutsummaryrefslogtreecommitdiff
path: root/test/gorilla.py
blob: 5bf64f5cde9d2f8d4657314f3ecc90882367d075 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
#!/usr/bin/env python3
#
# Copyright (C) 2021 jahoti <jahoti@tilde.team>
# Licensing information is collated in the `copyright` file

"""
A partial re-implementation of Hydrilla in Python, for testing purposes.

This will eventually be replaced with a build of the actual thing.
"""

import json, os, sys

def load_db(path):
	"""
	Load a Hydrilla content directory into an in-memory database.

	Each immediate subdirectory of `path` must contain an `index.json` holding
	a JSON object with a `type` key ('script', 'bag' or 'page') and a naming
	key ('pattern' for pages, 'name' for everything else). Entries of `path`
	that are not directories are ignored.

	Returns a dict with:
	  'script', 'bag', 'page' -- maps from item name (or page pattern) to the
	      item's definition. The `type` and naming keys are stripped from the
	      definition, and a `file` key holding the subdirectory name is added.
	      Script definitions also get a `text` key with the contents of the
	      file named by their `location` key.
	  'path' -- `path` itself, guaranteed to end with the path separator.

	Raises OSError if a subdirectory has no readable `index.json` (or a script
	file is unreadable) and KeyError if a definition lacks a required key.
	"""
	DB = {'script': {}, 'bag': {}, 'page': {}}
	if path[-1] != os.sep:
		path += os.sep
	
	DB['path'] = path
	for file in os.listdir(path):
		subdir = path + file
		
		# Use the public os.path API instead of the undocumented `os.st`
		# alias; this also skips dangling symlinks rather than crashing.
		if not os.path.isdir(subdir):
			continue
		
		# JSON is UTF-8 by specification; do not depend on the locale.
		with open(subdir + os.sep + 'index.json', encoding='utf-8') as f:
			data = json.load(f)
		
		type_, data['file'] = data['type'], file
		name_key = 'pattern' if type_ == 'page' else 'name'
		
		# Index the definition by its name, then drop the keys that are now
		# implied by its position in the database.
		DB[type_][data[name_key]] = data
		del data['type'], data[name_key]
		if type_ == 'script':
			with open(subdir + os.sep + data['location'], encoding='utf-8') as f:
				data['text'] = f.read()
	
	return DB


def mkhachette(patterns):
	"""
	Build the list of items needed to serve the given page patterns.

	`patterns` is an iterable of page patterns to look up in the module-level
	`DB` (as produced by load_db()); the special pattern '*' stands for every
	page in the database. Duplicates are ignored.

	Starting from each page's payload, bags are followed transitively so that
	every script and bag reachable from the requested pages is included once.

	Returns a list of single-key dicts, scripts first, then bags, then pages:
	  {'s' + name: {'hash': <sha256>, 'text': <script source>}}
	  {'b' + name: [[<'s' or 'b'>, <component name>], ...]}
	  {'p' + pattern: {'components': [<'s' or 'b'>, <payload name>]}}
	Items appear in the order they were first encountered, so the output is
	stable for a given argument list.

	Raises KeyError if a pattern, script or bag is not in the database.
	"""
	from collections import deque
	
	# A dict keeps first-seen order while removing duplicates; iterating a set
	# would make the output order vary with string hash randomization.
	wanted = {}
	for pattern in patterns:
		if pattern == '*':
			wanted.update(dict.fromkeys(DB['page']))
		else:
			wanted[pattern] = None
	
	scripts, bags, pages, new_bags = {}, {}, {}, deque()
	for pattern in wanted:
		pages[pattern] = data = DB['page'][pattern]
		type_, name = data['payload']
		if type_ == 'script':
			scripts[name] = DB['script'][name]
		else:
			new_bags.append(name)
	
	# Breadth-first walk over bags; the `bags` check stops cycles and repeats.
	while new_bags:
		bag_name = new_bags.popleft()
		if bag_name in bags:
			continue
		
		bags[bag_name] = components = DB['bag'][bag_name]['components']
		for type_, name in components:
			if type_ == 'script':
				scripts[name] = DB['script'][name]
			else:
				new_bags.append(name)
	
	items, path = [], DB['path']
	for script, data in scripts.items():
		# load_db() already stores each script's source under 'text'; only go
		# back to disk for databases that were built without it.
		text = data.get('text')
		if text is None:
			with open(path + data['file'] + os.sep + data['location'], encoding='utf-8') as f:
				text = f.read()
		
		items.append({'s' + script: {'hash': data['sha256'], 'text': text}})
	
	# Component types are abbreviated to their first letter ('s' or 'b').
	for bag, data in bags.items():
		items.append({'b' + bag: [[type_[0], name] for type_, name in data]})
	
	for page, data in pages.items():
		type_, name = data['payload']
		items.append({'p' + page: {'components': [type_[0], name]}})
	
	return items


if __name__ == '__main__':
	# Require an existing content directory and at least one page pattern.
	if len(sys.argv) < 3 or not os.path.isdir(sys.argv[1]):
		# End the message with a newline so the shell prompt is not glued
		# onto the usage text.
		sys.stderr.write('Usage: %s [hydrilla content path] (page pattern (page pattern (...)))\n' % sys.argv[0])
		sys.exit(1)
	
	# mkhachette() reads the database through this module-level name.
	DB = load_db(sys.argv[1])
	print(json.dumps(mkhachette(sys.argv[2:])))