-
Notifications
You must be signed in to change notification settings - Fork 1
/
devops_template.py
155 lines (122 loc) · 5.17 KB
/
devops_template.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
import argparse
import contextlib
import importlib.metadata
import json
import logging
import sys
logger = logging.getLogger(__name__)
def arguments() -> dict:
"""create parameters and parse arguments
:return: script arguments
:rtype: dict
"""
parser = argparse.ArgumentParser(
prog='devops_template.py',
description='template script for developer operations tasks',
epilog='Developed by Gabriele Ron ([email protected])'
)
parser_output = parser.add_argument_group(title='output arguments')
parser_output.add_argument('-o', '--outfile', help='output to a file')
parser_output_format = parser_output.add_mutually_exclusive_group()
parser_output_format.add_argument('--csv', help='output in CSV format',
action='store_const', const='csv', dest='format')
parser_output_format.add_argument('--json', help='output in JSON format',
action='store_const', const='json', dest='format')
parser_output_format.add_argument('--pandas-parquet', help='output a Pandas dataframe to a parquet',
action='store_const', const='pandas-parquet', dest='format')
parser_output_format.add_argument('--python', help='output a Python dict',
action='store_const', const='python', dest='format')
parser_output_format.add_argument('--text', help='output in a human readable format',
action='store_const', const='text', dest='format')
parser_logging = parser.add_argument_group(title='logging arguments')
parser_logging.add_argument('-v', '--verbose', help='get verbose output', action='count', default=0)
parser_logging.add_argument('-q', '--quiet', help='suppress output', action='count', default=0)
if len(sys.argv) == 1:
parser.print_help()
sys.exit(1)
args = vars(parser.parse_args())
if not args.get('format'):
args['format'] = 'text'
elif args['format'] in ['csv', 'pandas-parquet']:
try:
pandas_version = importlib.metadata.version('pandas')
logger.info('Found Pandas version %s', pandas_version)
except importlib.metadata.PackageNotFoundError as exc:
logger.error('An output mode that requires pandas was specified, but pandas is not available')
sys.exit(1)
if args['format'] == 'pandas-parquet':
try:
parquet_version = importlib.metadata.version('pyarrow')
logger.info('Found PyArrow version %s', parquet_version)
except importlib.metadata.PackageNotFoundError as exc:
try:
parquet_version = importlib.metadata.version('fastparquet')
logger.info('Found FastParquet version %s', parquet_version)
except importlib.metadata.PackageNotFoundError as exc:
logger.error('Parquet output was specified, but no parquet backend was found')
sys.exit(1)
if not args.get('outfile'):
logger.error('The parquet format requires an output file to be specified')
sys.exit(1)
return args
def generate_output(data: dict, *, outfile: str = None, format: str = None, **_) -> int:
"""generate and write output of dependency data
:param data: data
:type data: dict
:param outfile: output file
:type outfile: str
:param format: output format
:type format: str
:return: exit code
:rtype: int
"""
if not format:
format = 'text'
out = ''
# This allows for the file to be written as a string or binary, that way it can handle
# data like parquets. NOTE: sys.stdout __cannot__ accept binary so you must check that
# you're not writing to sys.stdout.
flags = 'w'
if format == 'text':
out = str(data)
elif format == 'json':
out = json.dumps(data)
elif format in ['csv', 'pandas-parquet']:
from pandas import DataFrame
rows = []
for k, v in data.items():
rows.append(v)
df = DataFrame.from_dict(rows)
if format == 'csv':
out = df.to_csv(index=False)
elif format == 'pandas-parquet':
flags += 'b'
out = df.to_parquet(index=False)
try:
with open(outfile, flags) if outfile else contextlib.nullcontext(sys.stdout) as f:
f.write(out)
except FileNotFoundError as exc:
logger.error(exc)
return exc.errno
return 0
def main() -> int:
args = arguments()
if verbose := args.get('verbose'):
if verbose >= 2:
logger.setLevel(logging.DEBUG)
else:
logger.setLevel(logging.INFO)
elif quiet := args.get('quiet'):
if quiet >= 2:
logger.setLevel(logging.FATAL)
else:
logger.setLevel(logging.ERROR)
else:
logger.setLevel(logging.WARNING)
logger.debug('args: %s', args)
data = {}
ret = generate_output(data, **args)
return ret
if __name__ == '__main__':
logging.basicConfig(format="[%(asctime)s] %(levelname)s -- %(message)s")
sys.exit(main())