forked from elixir-europe/plant-brapi-etl-faidare
-
Notifications
You must be signed in to change notification settings - Fork 0
/
main.py
executable file
·62 lines (46 loc) · 1.83 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
#!/usr/bin/env python
import os
import signal
import sys
import etl.extract.brapi
import etl.load.elasticsearch
import etl.load.virtuoso
import etl.transform.elasticsearch
import etl.transform.jsonld
import etl.transform.rdf
from etl.cli import parse_cli_arguments
from etl.config import load_file_config, extend_config
from etl.common.utils import get_folder_path
def main():
def handler(*_):
sys.exit(0)
# Trap SIGINT to force exit the program
signal.signal(signal.SIGINT, handler)
# Initialize defaults
config = dict()
config['root-dir'] = os.path.dirname(__file__)
config['default-data-dir'] = os.path.join(config['root-dir'], 'data')
config['conf-dir'] = os.path.join(config['root-dir'], 'config')
config['log-dir'] = get_folder_path([config['root-dir'], 'log'], create=True)
# Load file configs
config = load_file_config(config)
# Parse command line arguments
options = parse_cli_arguments(config)
# Extend config with CLI arguments
config = extend_config(config, options)
# Execute ETL actions based on CLI arguments:
if 'extract' in options or 'etl_es' in options or 'etl_virtuoso' in options:
etl.extract.brapi.main(config)
if 'transform_elasticsearch' in options or 'etl_es' in options:
etl.transform.elasticsearch.main(config)
if 'transform_jsonld' in options or 'transform_rdf' in options or 'etl_virtuoso' in options:
etl.transform.jsonld.main(config)
if 'transform_rdf' in options or 'etl_virtuoso' in options:
etl.transform.rdf.main(config)
if 'load_elasticsearch' in options or 'etl_es' in options:
etl.load.elasticsearch.main(config)
if 'load_virtuoso' in options or 'etl_virtuoso' in options:
etl.load.virtuoso.main(config)
# If used directly in command line
if __name__ == "__main__":
main()