forked from numat/EQeq
-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathjson_formatter.py
84 lines (72 loc) · 2.96 KB
/
json_formatter.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
"""
Some small edits to json output.
* Float decimals are truncated to three digits
* [x, y, z] vectors are displayed on one line
* Converts numpy arrays to lists and defined objects to dictionaries
* Removes internal parent references in objects
* Atoms and bonds are on one line each (looks more like other chem formats)
"""
from itertools import takewhile
import re
import json
from json import encoder
encoder.FLOAT_REPR = lambda o: format(o, '.6f')
import numpy as np
load = json.load
loads = json.loads
def compress(obj):
"""Outputs json without whitespace + object handling."""
return json.dumps(obj, sort_keys=True, separators=(",", ":"),
cls=CustomEncoder)
def dumps(obj):
"""Outputs json with formatting edits + object handling."""
return json.dumps(obj, indent=4, sort_keys=True, cls=CustomEncoder)
class CustomEncoder(json.JSONEncoder):
def default(self, obj):
"""Fired when an unserializable object is hit."""
if hasattr(obj, '__dict__'):
d = obj.__dict__.copy()
d.pop("parent_block", None)
return d
elif isinstance(obj, np.ndarray):
return obj.copy().tolist()
else:
raise TypeError(("Object of type %s with value of %s is not JSON "
"serializable") % (type(obj), repr(obj)))
def encode(self, obj):
"""Fired for every object."""
if hasattr(obj, "history"):
del obj.history
s = super(CustomEncoder, self).encode(obj)
# If uncompressed, postprocess for formatting
if len(s.splitlines()) > 1:
s = self.postprocess(s)
return s
def postprocess(self, json_string):
"""Display float lists as one line in json. Useful for vectors."""
# As a general rule, all three-element float lists are on one line
json_string = re.sub("\[\s*([-+]?\d*\.?\d*), \s*([-+]?\d*\.?\d*),"
"\s*([-+]?\d*\.?\d*)\s*\]", r"[ \1, \2, \3 ]",
json_string)
# This further compresses atoms and bonds to be on one line
is_compressing = False
compressed = []
spaces = 0
for row in json_string.split("\n"):
if is_compressing:
if row.strip() == "{":
compressed.append(row.rstrip())
elif row.rstrip() == " " * spaces + "],":
compressed.append(row.rstrip())
is_compressing = False
else:
compressed[-1] += " " + row.strip()
else:
compressed.append(row.rstrip())
if any(a in row for a in ["atoms", "bonds"]):
# Fix to handle issues that arise with empty lists
if "[]" in row:
continue
spaces = sum(1 for _ in takewhile(str.isspace, row))
is_compressing = True
return "\n".join(compressed)