#! /usr/bin/env python3 # remarshal, a utility to convert between serialization formats. # Copyright (c) 2014, 2015, 2016, 2017, 2018, 2019 dbohdan # License: MIT # Originally from: # https://github.com/dbohdan/remarshal from __future__ import print_function import argparse import datetime # import dateutil.parser import io import json import os.path import re import string import sys from ansible.module_utils.pytoml import loads as pytoml_loads from ansible.module_utils.pytoml import dumps as pytoml_dumps from ansible.module_utils.pytoml import TomlError # import umsgpack # import yaml from collections import OrderedDict __version__ = '0.11.2' FORMATS = ['json', 'msgpack', 'toml', 'yaml'] # === JSON === if hasattr(json, 'JSONDecodeError'): JSONDecodeError = json.JSONDecodeError else: JSONDecodeError = ValueError def json_default(obj): if isinstance(obj, datetime.datetime): return obj.isoformat() raise TypeError("{0} is not JSON-serializable".format(repr(obj))) # === CLI === def argv0_to_format(argv0): possible_format = '(' + '|'.join(FORMATS) + ')' match = re.search('^' + possible_format + '2' + possible_format, argv0) if match: from_, to = match.groups() return True, from_, to else: return False, None, None def extension_to_format(path): _, ext = os.path.splitext(path) ext = ext[1:] if ext == 'yml': ext = 'yaml' return ext if ext in FORMATS else None def parse_command_line(argv): me = os.path.basename(argv[0]) format_from_argv0, argv0_from, argv0_to = argv0_to_format(me) parser = argparse.ArgumentParser( description='Convert between TOML, MessagePack, YAML, and JSON.' ) input_group = parser.add_mutually_exclusive_group() input_group.add_argument( 'input', nargs='?', default='-', help='input file' ) input_group.add_argument( '-i', '--input', dest='input_flag', metavar='input', default=None, help='input file' ) output_group = parser.add_mutually_exclusive_group() output_group.add_argument( 'output', nargs='?', default='-', help='input file' ) output_group.add_argument( '-o', '--output', dest='output_flag', metavar='output', default=None, help='output file' ) if not format_from_argv0: parser.add_argument( '--if', '-if', '--input-format', dest='input_format', help="input format", choices=FORMATS ) parser.add_argument( '--of', '-of', '--output-format', dest='output_format', help="output format", choices=FORMATS ) if not format_from_argv0 or argv0_to == 'json': parser.add_argument( '--indent-json', dest='indent_json', metavar='n', type=int, default=None, help='indent JSON output' ) if not format_from_argv0 or argv0_to == 'yaml': parser.add_argument( '--yaml-style', dest='yaml_style', default=None, help='YAML formatting style', choices=['', '\'', '"', '|', '>'] ) parser.add_argument( '--wrap', dest='wrap', metavar='key', default=None, help='wrap the data in a map type with the given key' ) parser.add_argument( '--unwrap', dest='unwrap', metavar='key', default=None, help='only output the data stored under the given key' ) parser.add_argument( '-p', '--preserve-key-order', dest='ordered', action='store_true', help='preserve the order of dictionary/mapping keys' ) parser.add_argument( '-v', '--version', action='version', version=__version__ ) args = parser.parse_args(args=argv[1:]) # Use the positional input and output arguments. if args.input_flag is not None: args.input = args.input_flag if args.output_flag is not None: args.output = args.output_flag # Determine the implicit input and output format if possible. if format_from_argv0: args.input_format = argv0_from args.output_format = argv0_to if argv0_to != 'json': args.__dict__['indent_json'] = None if argv0_to != 'yaml': args.__dict__['yaml_style'] = None else: if args.input_format is None: args.input_format = extension_to_format(args.input) if args.input_format is None: parser.error('Need an explicit input format') if args.output_format is None: args.output_format = extension_to_format(args.output) if args.output_format is None: parser.error('Need an explicit output format') # Wrap yaml_style. args.__dict__['yaml_options'] = {'default_style': args.yaml_style} del args.__dict__['yaml_style'] return args # === Parser/serializer wrappers === def decode_json(input_data, ordered): try: pairs_hook = OrderedDict if ordered else dict return json.loads( input_data.decode('utf-8'), object_pairs_hook=pairs_hook ) except JSONDecodeError as e: raise ValueError('Cannot parse as JSON ({0})'.format(e)) def decode_msgpack(input_data, ordered): try: return umsgpack.unpackb(input_data, use_ordered_dict=ordered) except umsgpack.UnpackException as e: raise ValueError('Cannot parse as MessagePack ({0})'.format(e)) def decode_toml(input_data, ordered): try: pairs_hook = OrderedDict if ordered else dict return pytoml_loads( input_data, object_pairs_hook=pairs_hook ) except TomlError as e: raise ValueError('Cannot parse as TOML ({0})'.format(e)) def decode(input_format, input_data, ordered): decoder = { 'json': decode_json, 'msgpack': decode_msgpack, 'toml': decode_toml, } if input_format not in decoder: raise ValueError('Unknown input format: {0}'.format(input_format)) return decoder[input_format](input_data, ordered) def encode_json(data, ordered, indent): if indent is True: indent = 2 if indent: separators = (',', ': ') else: separators = (',', ':') try: return json.dumps( data, default=json_default, ensure_ascii=False, indent=indent, separators=separators, sort_keys=not ordered ) + "\n" except TypeError as e: raise ValueError('Cannot convert data to JSON ({0})'.format(e)) def traverse( col, dict_callback=lambda x: x, list_callback=lambda x: x, key_callback=lambda x: x, value_callback=lambda x: x ): if isinstance(col, dict): return dict_callback(col.__class__([ (key_callback(k), traverse( v, dict_callback, list_callback, key_callback, value_callback )) for (k, v) in col.items() ])) elif isinstance(col, list): return list_callback([traverse( x, dict_callback, list_callback, key_callback, value_callback ) for x in col]) else: return value_callback(col) def encode_msgpack(data): try: return umsgpack.packb(data) except umsgpack.UnsupportedTypeException as e: raise ValueError('Cannot convert data to MessagePack ({0})'.format(e)) def encode_toml(data, ordered): try: return pytoml_dumps(data, sort_keys=not ordered) except AttributeError as e: if str(e) == "'list' object has no attribute 'keys'": raise ValueError( 'Cannot convert non-dictionary data to ' 'TOML; use "wrap" to wrap it in a ' 'dictionary' ) else: raise e except TypeError as e: if str(e) == "'in ' requires string as left operand, not int": raise ValueError('Cannot convert binary to TOML') else: raise ValueError('Cannot convert data to TOML ({0})'.format(e)) # === Main === def run(argv): args = parse_command_line(argv) remarshal( args.input, args.output, args.input_format, args.output_format, args.wrap, args.unwrap, args.indent_json, args.yaml_options, args.ordered ) def remarshal( input, output, input_format, output_format, wrap=None, unwrap=None, indent_json=None, yaml_options={}, ordered=False, transform=None, ): try: if input == '-': input_file = getattr(sys.stdin, 'buffer', sys.stdin) else: input_file = open(input, 'rb') if output == '-': output_file = getattr(sys.stdout, 'buffer', sys.stdout) else: output_file = open(output, 'wb') input_data = input_file.read() parsed = decode(input_format, input_data, ordered) if unwrap is not None: parsed = parsed[unwrap] if wrap is not None: temp = {} temp[wrap] = parsed parsed = temp if transform: parsed = transform(parsed) if output_format == 'json': output_data = encode_json(parsed, ordered, indent_json) elif output_format == 'msgpack': output_data = encode_msgpack(parsed) elif output_format == 'toml': output_data = encode_toml(parsed, ordered) else: raise ValueError( 'Unknown output format: {0}'.format(output_format) ) if output_format == 'msgpack': encoded = output_data else: encoded = output_data.encode('utf-8') output_file.write(encoded) output_file.close() finally: if 'input_file' in locals(): input_file.close() if 'output_file' in locals(): output_file.close() def main(): try: run(sys.argv) except KeyboardInterrupt as e: pass except (IOError, ValueError) as e: print('Error: {0}'.format(e), file=sys.stderr) sys.exit(1) if __name__ == '__main__': main()