-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathdoc2ahelp.py
executable file
·375 lines (292 loc) · 11 KB
/
doc2ahelp.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
#!/usr/bin/env python
"""
Usage:
./doc2ahelp.py outdir [names]
--debug
--sxml
--models
--annotations keep | delete
Aim:
Extract the docstring information from Sherpa and create ahelp XML
files for these symbols (functions, objects that we treat as
strings/functions in Sherpa, meta data created from these symbols).
The --sxml flag means that the output will use the "SXML" DTD
instead of the AHELP one (at present this only changes the name of
the root element, so there is no attempt to take advantage of the
extra functionality provided by the SXML DTD).
The script requires that a CIAO installation has been initialized,
since it is used to access the Sherpa documentation from
sherpa.astro.ui
sherpa.stats CURRENTLY UNUSED
sherpa.optmethods CURRENTLY UNUSED
The ahelp files in the CIAO documentation are used to create the
ahelp metadata.
The following files are auto-created:
models
xs
The output is to outdir/<key>.<suffix> where <key> is based on the
"ahelp key" (it should be the same but may be different), and
<suffix> is 'xml' or 'sxml' depending on the DTD.
The script will over-write any existing file.
TODO:
- indicate new/missing files
- how to handle the known problem cases?
- NEED TO ENSURE DO NOT OVERWRITE EXISTING AHELP FILES (THAT ARE
NOT SHERPA)
"""
from collections import defaultdict
import os
from sherpa.astro import ui
from parsers.ahelp import find_metadata
from parsers.sherpa import unwanted, find_synonyms
from helpers import save_doc, list_xspec_models, \
list_sherpa_models, process_symbol
def convert(outdir, dtd='ahelp', modelsonly=False,
skip_synonyms=False,
handle_annotations="keep",
debug=False, restrict=None):
"""Convert the symbols.
Parameters
----------
outdir : string
The output directory, which must already exist.
dtd : {'ahelp', 'sxml'}, optional
The DTD to use for the output
modelsonly : bool, optional
Only process Sherpa models (this will subset any values given
in the restrict parameter if both are specified).
skip_synonyms : bool, optional
Should synonyms be skipped or not?
handle_annotations : str, optional
Options are "keep", "delete"
debug : optional, boool
If True then print out parsed versions of the symbols
(expected to be used when restrict is not None but this
is not enforced).
restrict : optional, None or list of str
The set of symbols to use (if not all).
"""
if not os.path.isdir(outdir):
sys.stderr.write("ERROR: outdir={} does not exist\n".format(outdir))
sys.exit(1)
if dtd not in ['ahelp', 'sxml']:
raise ValueError("Invalid dtd argument")
synonyms, originals = find_synonyms()
# Restrict the symbols that get processed
#
names = sorted(list(ui.__all__))
to_process = []
for name in names:
if restrict is not None and name not in restrict:
continue
print("# {}".format(name))
sym = getattr(ui, name)
if modelsonly and not isinstance(sym, ModelWrapper):
print(" - skipping as not a model")
continue
if unwanted(name, sym):
print(" - skipping as unwanted")
continue
if name in synonyms and skip_synonyms:
print(" - skipping as a synonym for {}".format(synonyms[name]))
continue
# Skip AbsorptionVoigt and EmissionVoigt from the list
#
if name in ['absorptionvoigt', 'emissionvoigt']:
print(' - skipping absorption/emissionvoigt symbols')
continue
to_process.append(name)
# Find potential mappings to identify multi-keyword files.
# We could store the find_metadata call to avoid calling it twice,
# but let's not bother.
#
filemaps = defaultdict(set)
for name in to_process:
sym = getattr(ui, name)
try:
syn_names = originals[name]
except KeyError:
syn_names = None
if name in synonyms:
# We want to treat this as if the synonym is the
# other way around (to get the 'Synonym: ...' output
# included).
#
assert syn_names is None
syn_names = [synonyms[name]]
try:
ahelp = find_metadata(name, synonyms=syn_names)
except ValueError as exc:
continue
# we want to store a mapping from the keyword to this file
#
for key in ahelp['refkeywords'].split(' '):
key = key.lower()
if key in to_process and key != name:
filemaps[key].add(name)
nproc = 0
error_list = []
# Count the number of commands with some level of annotation
# support.
#
annotations = {"none": 0, # \ is this worth tracking
"missing": 0, # / seprately?
"return-only": 0,
"argument-only": 0,
"both": 0}
for name in to_process:
print("## {}".format(name))
sym = getattr(ui, name)
try:
syn_names = originals[name]
except KeyError:
syn_names = None
if name in synonyms:
# We want to treat this as if the synonym is the
# other way around (to get the 'Synonym: ...' output
# included).
#
assert syn_names is None
syn_names = [synonyms[name]]
try:
ahelp = find_metadata(name, synonyms=syn_names)
except ValueError as exc:
# See if we can use the "parent" ahelp file. This is based on
# the assumption that for multi-command ahelp files the
# refkeywords would contain the "other" commands (those
# extra ones documented in the file), and so hopefully
# we can use the mapping we created to identify these
# commands.
#
fmaps = list(filemaps[name])
if len(fmaps) == 1:
ahelp = find_metadata(fmaps[0])
if ahelp is None:
raise ValueError("Expected to have a usable metadata copy!")
else:
print(f" - using metadata from {fmaps[0]}")
ahelp['key'] = name # important!
else:
print(" - ahelp metadata skipped as {}".format(exc))
ahelp = None
try:
xml = process_symbol(name, sym, dtd=dtd, ahelp=ahelp,
synonyms=syn_names,
annotations=handle_annotations,
debug=debug)
except Exception as exc:
print(" - ERROR PROCESSING: {}".format(exc))
error_list.append(name)
continue
if xml is None:
continue
# track the annotations (ony do this once we created the
# XML version).
#
if hasattr(sym, "__annotations__"):
nann = len(sym.__annotations__)
if nann == 0:
label = 'none'
elif nann == 1 and "return" in sym.__annotations__:
label = 'return-only'
elif "return" in sym.__annotations__:
label = 'both'
else:
label = 'argument-only'
else:
label = 'missing'
annotations[label] += 1
out_name = 'group_sherpa' if name == 'group' else name
suffix = 'sxml' if dtd == 'sxml' else 'xml'
outfile = os.path.join(outdir, '{}.{}'.format(out_name, suffix))
save_doc(outfile, xml)
print("Created: {}".format(outfile))
nproc += 1
nskip = len(names) - nproc
print("\nProcessed {} files, skipped {}.".format(nproc, nskip))
if error_list != []:
print("Errored out: {}".format(error_list))
# Create the model lists:
# models.suffix
# xs.suffix
#
print("\nAlso:")
for outfile in [list_sherpa_models(outdir, dtd=dtd),
list_xspec_models(outdir, dtd=dtd)]:
print(f" {outfile}")
print("")
# Dump the annotations
nann = sum([v for v in annotations.values()])
print(f"Files checked: {nann}")
def rep(label: str, val: int) -> None:
pcen = 100 * val / nann
print(f" {label:18s} : {val:3d} {pcen:4.1f}%")
rep("no __annotations__", annotations['missing'])
rep("empty", annotations['none'])
rep(" <sum> ", annotations['missing'] + annotations['none'])
print(" ---")
rep("return only", annotations['return-only'])
rep("argument only", annotations['argument-only'])
rep("both", annotations['both'])
rep(" <sum> ", annotations['return-only'] +
annotations['argument-only'] + annotations['both'])
print("")
"""
# extra symbols
# statistics
# optimisers
#
# Be very-restrictive on the accepted symbols
#
statnames = ui.list_stats()
statnames.remove('userstat') # explicitly remove
for name in dir(sherpa.stats):
if not name[0].isupper():
# this check is only realy needed for methods but include it
continue
lname = name.lower()
if lname not in statnames:
continue
symbol = getattr(sherpa.stats, name)
doit(lname, symbol)
optnames = ui.list_methods()
for name in dir(sherpa.optmethods):
if not name[0].isupper():
continue
lname = name.lower()
if lname not in optnames:
continue
symbol = getattr(sherpa.optmethods, name)
doit(lname, symbol)
"""
help_str = """Convert Sherpa docstrings into CIAO ahelp files."""
if __name__ == "__main__":
import argparse
import sys
import stk
parser = argparse.ArgumentParser(description=help_str,
prog=sys.argv[0])
parser.add_argument("outdir",
help="Files are written to this directory (must exist)")
parser.add_argument("names", nargs='?', default=None,
help="Restrict to these names (stack syntax)")
parser.add_argument("--debug", action="store_true",
help="Print out parsed output")
parser.add_argument("--sxml", action="store_true",
help="Use the SXML rather than AHELp dtd")
parser.add_argument("--models", action="store_true",
help="Restrict to Sherpa models only")
parser.add_argument("--annotations", "-a",
default="keep",
choices=["keep", "delete"],
help="What to do with annotations?")
args = parser.parse_args(sys.argv[1:])
restrict = args.names
if restrict is not None:
restrict = stk.build(restrict)
dtd = 'sxml' if args.sxml else 'ahelp'
print(f"Annotation handling: {args.annotations}")
convert(args.outdir, dtd=dtd, modelsonly=args.models,
handle_annotations=args.annotations,
debug=args.debug,
restrict=restrict)