-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathmisc.py
241 lines (178 loc) · 6.62 KB
/
misc.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
'''
Miscellaneous helper functions
'''
import re
from . import lut
def _Z_from_str(s):
if s.isdecimal():
return int(s)
else:
return lut.element_Z_from_sym(s)
def transpose_matrix(mat):
'''Transposes a matrix (list of lists) commonly done do coefficients'''
return list(map(list, zip(*mat)))
def max_am(shells):
'''Determine the maximum angular momentum of a list of shells or potentials'''
all_am = [max(x['angular_momentum']) for x in shells]
return max(all_am)
def contraction_string(element):
"""
Forms a string specifying the contractions for an element
ie, (16s,10p) -> [4s,3p]
"""
# Does not have electron shells (ECP only?)
if 'electron_shells' not in element:
return ""
cont_map = dict()
for sh in element['electron_shells']:
nprim = len(sh['exponents'])
ngeneral = len(sh['coefficients'])
# is a combined general contraction (sp, spd, etc)
is_spdf = len(sh['angular_momentum']) > 1
for am in sh['angular_momentum']:
# If this a general contraction (and not combined am), then use that
ncont = ngeneral if not is_spdf else 1
if am not in cont_map:
cont_map[am] = (nprim, ncont)
else:
cont_map[am] = (cont_map[am][0] + nprim, cont_map[am][1] + ncont)
primstr = ""
contstr = ""
for am in sorted(cont_map.keys()):
nprim, ncont = cont_map[am]
if am != 0:
primstr += ','
contstr += ','
primstr += str(nprim) + lut.amint_to_char([am])
contstr += str(ncont) + lut.amint_to_char([am])
return "({}) -> [{}]".format(primstr, contstr)
def compact_elements(elements):
"""
Create a string (with ranges) given a list of element numbers
For example, [1, 2, 3, 6, 7, 8, 10] will return "H-Li,C-O,Ne"
"""
if not elements:
return
# We have to convert to integers for this function
elements = [int(el) for el in elements]
# Just to be safe, sort the list
el = sorted(set(elements))
ranges = []
i = 0
while i < len(el):
start_el = el[i]
end_el = start_el
i += 1
while i < len(el):
if el[i] != end_el + 1:
break
end_el += 1
i += 1
if start_el == end_el:
ranges.append([start_el])
else:
ranges.append([start_el, end_el])
# Convert to elemental symbols
range_strs = []
for r in ranges:
sym = lut.element_sym_from_Z(r[0], True)
if len(r) == 1:
range_strs.append(sym)
elif len(r) == 2 and r[1] == r[0] + 1:
sym2 = lut.element_sym_from_Z(r[1], True)
range_strs.append(sym + "," + sym2)
else:
sym2 = lut.element_sym_from_Z(r[1], True)
range_strs.append(sym + "-" + sym2)
return ",".join(range_strs)
def expand_elements(compact_el, as_str=False):
"""
Create a list of integers given a string or list of compacted elements
This is partly the opposite of compact_elements, but is more flexible.
compact_el can be a list or a string. If compact_el is a list, each element is processed individually
as a string (meaning list elements can contain commas, ranges, etc)
If compact_el is a string, it is split by commas and then each section is processed.
In all cases, element symbols (case insensitive) and Z numbers (as integers or strings)
can be used interchangeably. Ranges are also allowed in both lists and strings.
Some examples:
"H-Li,C-O,Ne" will return [1, 2, 3, 6, 7, 8, 10]
"H-N,8,Na-12" will return [1, 2, 3, 4, 5, 6, 7, 8, 11, 12]
['C', 'Al-15,S', 17, '18'] will return [6, 13, 14, 15, 16, 17, 18]
If as_str is True, the list will contain strings of the integers
(ie, the first example above will return ['1', '2', '3', '6', '7', '8', '10']
"""
# If an integer, just return it
if isinstance(compact_el, int):
if as_str:
return [str(compact_el)]
else:
return [compact_el]
# If compact_el is a list, make it a comma-separated string
if isinstance(compact_el, list):
compact_el = [str(x) for x in compact_el]
compact_el = [x for x in compact_el if x]
compact_el = ','.join(compact_el)
# Find multiple - or ,
# Also replace all whitespace with spaces
compact_el = re.sub(r',+', ',', compact_el)
compact_el = re.sub(r'-+', '-', compact_el)
compact_el = re.sub(r'\s+', '', compact_el)
# Find starting with or ending with comma and strip them
compact_el = compact_el.strip(',')
# Check if I was passed an empty string or list
if not compact_el:
return []
# Find some erroneous patterns
# -, and ,-
if '-,' in compact_el:
raise RuntimeError("Malformed element string")
if ',-' in compact_el:
raise RuntimeError("Malformed element string")
# Strings ends or begins with -
if compact_el.startswith('-') or compact_el.endswith('-'):
raise RuntimeError("Malformed element string")
# x-y-z
if re.search(r'\w+-\w+-\w+', compact_el):
raise RuntimeError("Malformed element string")
# Split on commas
tmp_list = compact_el.split(',')
# Now go over each one and replace elements with ints
el_list = []
for el in tmp_list:
if '-' not in el:
el_list.append(_Z_from_str(el))
else:
begin, end = el.split('-')
begin = _Z_from_str(begin)
end = _Z_from_str(end)
el_list.extend(list(range(begin, end + 1)))
if as_str:
return [str(x) for x in el_list]
else:
return el_list
def transform_basis_name(name):
"""
Transforms the name of a basis set to an internal representation
This makes comparison of basis set names easier by, for example,
converting the name to all lower case.
"""
name = name.lower()
name = name.replace('/', '_sl_')
name = name.replace('*', '_st_')
return name
def basis_name_to_filename(name):
'''
Given a basis set name, transform it into a valid filename
This makes sure filenames don't contain invalid characters
'''
return transform_basis_name(name)
def basis_name_from_filename(filename):
'''
Given a basis set name that was part of a filename, determine the basis set name
This is opposite of :func:`transform_basis_name`
Pass only the part of the filename that contains the basis set name
'''
name = filename.lower()
name = name.replace('_sl_', '/')
name = name.replace('_st_', '*')
return name