-
Notifications
You must be signed in to change notification settings - Fork 61
/
Copy pathdocker-entrypoint.py
73 lines (58 loc) · 4.53 KB
/
docker-entrypoint.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
#!/usr/bin/env python
import json
from os import environ,system,path
from ast import literal_eval
from shutil import copyfile
def loadConfig(filename):
with open(filename, "r+") as filecontent:
data = json.load(filecontent)
return data
def setConfig(setting, value, configdata, section=None):
if section is not None:
if section not in configdata:
configdata[section] = {}
configdata[section][setting] = value
else:
configdata[setting] = value
def writeConfig(filename,configdata):
with open(filename, 'w') as f:
f.write(json.dumps(configdata, indent=2))
def strToBool(string):
if string in ["true", "True", "yes", "y", "1"]:
return True
else:
return False
configfile = "/app/config/config.json"
if not path.exists(configfile):
copyfile("/app/config.sample/config.json.example", configfile)
configdata = loadConfig(configfile)
if "HYPHE_MONGODB_HOST" in environ: setConfig("host", environ["HYPHE_MONGODB_HOST"],configdata,"mongo-scrapy")
if "HYPHE_MONGODB_PORT" in environ: setConfig("mongo_port", int(environ["HYPHE_MONGODB_PORT"]),configdata,"mongo-scrapy")
if "HYPHE_MONGODB_DBNAME" in environ: setConfig("db_name", environ["HYPHE_MONGODB_DBNAME"],configdata,"mongo-scrapy")
if "HYPHE_CRAWLER_PORT" in environ: setConfig("scrapy_port", int(environ["HYPHE_CRAWLER_PORT"]),configdata,"mongo-scrapy")
if "HYPHE_PROXY_HOST" in environ: setConfig("proxy_host", environ["HYPHE_PROXY_HOST"],configdata,"mongo-scrapy")
if "HYPHE_PROXY_PORT" in environ: setConfig("proxy_port", int(environ["HYPHE_PROXY_PORT"]),configdata,"mongo-scrapy")
if "HYPHE_MAXDEPTH" in environ: setConfig("max_depth", int(environ["HYPHE_MAXDEPTH"]),configdata,"mongo-scrapy")
if "HYPHE_DOWNLOAD_DELAY" in environ: setConfig("download_delay", float(environ["HYPHE_DOWNLOAD_DELAY"]),configdata,"mongo-scrapy")
if "HYPHE_STORE_CRAWLED_HTML" in environ: setConfig("store_crawled_html_content", strToBool(environ["HYPHE_STORE_CRAWLED_HTML"]),configdata,"mongo-scrapy")
if "HYPHE_IGNORE_INTERNAL_LINKS" in environ: setConfig("ignore_internal_links", strToBool(environ["HYPHE_IGNORE_INTERNAL_LINKS"]),configdata,"mongo-scrapy")
if "HYPHE_MAX_SIM_REQ" in environ: setConfig("max_simul_requests", int(environ["HYPHE_MAX_SIM_REQ"]),configdata,"mongo-scrapy")
if "HYPHE_HOST_MAX_SIM_REQ" in environ: setConfig("max_simul_requests_per_host", int(environ["HYPHE_HOST_MAX_SIM_REQ"]),configdata,"mongo-scrapy")
if "HYPHE_OBEY_ROBOTS" in environ: setConfig("obey_robots", strToBool(environ["HYPHE_OBEY_ROBOTS"]),configdata,"mongo-scrapy")
if "HYPHE_TRAPH_KEEPALIVE" in environ: setConfig("keepalive", int(environ["HYPHE_TRAPH_KEEPALIVE"]),configdata,"traph")
if "HYPHE_TRAPH_DATAPATH" in environ: setConfig("data_path", environ["HYPHE_TRAPH_DATAPATH"],configdata,"traph")
if "HYPHE_TRAPH_MAX_SIM_PAGES" in environ: setConfig("max_simul_pages_indexing", int(environ["HYPHE_TRAPH_MAX_SIM_PAGES"]),configdata,"traph")
if "HYPHE_DEFAULT_STARTPAGES_MODE" in environ: setConfig("defaultStartpagesMode", literal_eval(environ["HYPHE_DEFAULT_STARTPAGES_MODE"]),configdata)
if "HYPHE_DEFAULT_CREATION_RULE" in environ: setConfig("defaultCreationRule", environ["HYPHE_DEFAULT_CREATION_RULE"],configdata)
if "HYPHE_CREATION_RULES" in environ: setConfig("creationRules", literal_eval(environ["HYPHE_CREATION_RULES"]),configdata)
if "HYPHE_FOLLOW_REDIRECTS" in environ: setConfig("discoverPrefixes", literal_eval(environ["HYPHE_FOLLOW_REDIRECTS"]),configdata)
# TODO: Phantom config
if "HYPHE_WEBARCHIVES_OPTIONS" in environ: setConfig("options", literal_eval(environ["HYPHE_WEBARCHIVES_OPTIONS"] or '[]'),configdata, "webarchives")
if "HYPHE_WEBARCHIVES_DATE" in environ: setConfig("date", environ["HYPHE_WEBARCHIVES_DATE"],configdata or "", "webarchives")
if "HYPHE_WEBARCHIVES_DAYSRANGE" in environ: setConfig("days_range", int(environ["HYPHE_WEBARCHIVES_DAYSRANGE"] or 0),configdata, "webarchives")
if "HYPHE_WEBARCHIVES_PASSWORD" in environ: setConfig("password", environ["HYPHE_WEBARCHIVES_PASSWORD"] or "",configdata, "webarchives")
if "HYPHE_ADMIN_PASSWORD" in environ: setConfig("ADMIN_PASSWORD", environ["HYPHE_ADMIN_PASSWORD"] or "",configdata)
if "HYPHE_OPEN_CORS_API" in environ: setConfig("OPEN_CORS_API", strToBool(environ["HYPHE_OPEN_CORS_API"]),configdata)
if "HYPHE_DEBUG" in environ: setConfig("DEBUG", int(environ["HYPHE_DEBUG"]),configdata)
writeConfig(configfile, configdata)
system("/app/hyphe_backend/core.tac")