Skip to content

data_structure_dicts

Access the dictionaries for variable information.

This ultimately provides access to variable information that is included in the python source (e.g. docstrings) or that cannot be dynamically accessed (e.g. variable initial values).

INPUT_TYPE_MAP = {int: 'int', float: 'real', str: 'string'} module-attribute

NON_F_VALUES = ['f_j_cs_start_pulse_end_flat_top', 'f_c_plasma_non_inductive', 'feffcd', 'f_a_tf_turn_cable_copper'] module-attribute

output_dict = {} module-attribute

Dictionary

Source code in process/core/io/data_structure_dicts.py
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
class Dictionary:
    # Base Dictionary class for all dicts
    def __init__(self, name):
        self.name = name  # Dict name
        self.dict = {}  # Contains the dict
        self.dict[self.name] = {}  # Structures this dict: key = dict name,
        # value = nested dict of variable info

    def make_dict(self):
        # Make the dictionary
        pass

    def post_process(self):
        # Perform any processing after making the dict
        pass

    def publish(self):
        # Add the finished dictionary to the output dict
        output_dict.update(self.dict)

name = name instance-attribute

dict = {} instance-attribute

make_dict()

Source code in process/core/io/data_structure_dicts.py
48
49
50
def make_dict(self):
    # Make the dictionary
    pass

post_process()

Source code in process/core/io/data_structure_dicts.py
52
53
54
def post_process(self):
    # Perform any processing after making the dict
    pass

publish()

Source code in process/core/io/data_structure_dicts.py
56
57
58
def publish(self):
    # Add the finished dictionary to the output dict
    output_dict.update(self.dict)

SourceDictionary

Bases: Dictionary

Source code in process/core/io/data_structure_dicts.py
61
62
63
64
65
66
67
68
69
70
class SourceDictionary(Dictionary):
    # Dictionary created from Fortran source
    def __init__(self, name, dict_creator_func):
        Dictionary.__init__(self, name)
        # Function that creates the dict
        self.dict_creator_func = dict_creator_func

    def make_dict(self):
        # Make entire nested dict from function
        self.dict[self.name] = self.dict_creator_func()

dict_creator_func = dict_creator_func instance-attribute

make_dict()

Source code in process/core/io/data_structure_dicts.py
68
69
70
def make_dict(self):
    # Make entire nested dict from function
    self.dict[self.name] = self.dict_creator_func()

HardcodedDictionary

Bases: Dictionary

Source code in process/core/io/data_structure_dicts.py
73
74
75
76
77
78
79
80
81
82
83
84
class HardcodedDictionary(Dictionary):
    # Dictionary created from a hardcoded dict in this file
    def __init__(self, name, hardcoded_dict):
        Dictionary.__init__(self, name)
        self.dict[self.name] = None
        # Hardcoded value isn't always a dict; override to None to allow the
        # value to be set to any type
        self.hardcoded_dict = hardcoded_dict

    def make_dict(self):
        # Set the nested value to a hardcoded int, list or dict
        self.dict[self.name] = self.hardcoded_dict

hardcoded_dict = hardcoded_dict instance-attribute

make_dict()

Source code in process/core/io/data_structure_dicts.py
82
83
84
def make_dict(self):
    # Set the nested value to a hardcoded int, list or dict
    self.dict[self.name] = self.hardcoded_dict

to_type(string)

Given a string, attempts to convert the string to a numerical value. If the string can't be simply converted, the function looks to see if it begins with a integer and returns that (since some lines have clarification text after the number). If this also fails, return string.strip()

Parameters:

Name Type Description Default
string
required

Returns:

Type Description

Either a float, int or string depending on input

Source code in process/core/io/data_structure_dicts.py
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
def to_type(string):
    """Given a string, attempts to convert the string to a numerical
    value. If the string can't be simply converted, the function
    looks to see if it begins with a integer and returns that (since
    some lines have clarification text after the number). If this
    also fails, return string.strip()

    Parameters
    ----------
    string :


    Returns
    -------
    :
        Either a float, int or string depending on input
    """

    try:
        if "." in string:
            # try a float conversion
            string_mod = string.strip().lower().replace("d", "e")
            return float(string_mod)
        # try an int conversion
        return int(string.strip())
    except ValueError:
        match = re.match(r"\s*(\d+)", string)
        if match:
            # if the string starts with an integer return that
            return int(match.group(1))

        # otherwise return the string unchanged but with whitespace removed
        return string.strip()

grep(file, regexp, flags=re.UNICODE)

Implements an in-python grep. Returns the lines that match as a list.

Parameters:

Name Type Description Default
file

Name of file to be read

required
regexp

Regular expression to search for

required
flags

re flags to use in search. Default is re.U which has

UNICODE

Returns:

Name Type Description
lines

List of matching lines

Source code in process/core/io/data_structure_dicts.py
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
def grep(file, regexp, flags=re.UNICODE):
    """Implements an in-python grep. Returns the lines that match
    as a list.

    Parameters
    ----------
    file:
        Name of file to be read
    regexp:
        Regular expression to search for
    flags:
        re flags to use in search. Default is re.U which has

    Returns
    -------
    lines:
        List of matching lines
    """

    lines = []

    try:
        with open(file, encoding="utf-8") as file_open:
            lines = [line for line in file_open if re.search(regexp, line, flags)]

    except OSError:
        logger.warning("File : %s not found\n", file)
    return lines

slice_file(file, re1, re2)

Returns a slice of a file that is bounded by lines containing a substring matching the given regular expressions. The first match to re1 in the file marks the start of the slice, the first match to re2 after that marks the end of the slice. The list of lines returned includes the two bounding lines.

Parameters:

Name Type Description Default
file

Name of file to read through

required
re1

Starting regular expression

required
re2

Ending regular expression

required

Returns:

Type Description

lines:List of lines from file between re1 and re2 inclusive

Source code in process/core/io/data_structure_dicts.py
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
def slice_file(file, re1, re2):
    """Returns a slice of a file that is bounded by lines containing a
    substring matching the given regular expressions. The first match
    to re1 in the file marks the start of the slice, the first match
    to re2 after that marks the end of the slice. The list of lines
    returned includes the two bounding lines.

    Parameters
    ----------
    file :
        Name of file to read through
    re1 :
        Starting regular expression
    re2 :
        Ending regular expression

    Returns
    -------
    :
        lines:List of lines from file between re1 and re2 inclusive
    """

    with open(file, encoding="utf-8") as file:
        filetext = file.readlines()
    start = None
    for i in range(len(filetext)):
        # look for first match
        if re.search(re1, filetext[i]):
            start = i
            break
    if start is None:
        logger.warning("Could not match %s in file %s\n", re1, file)
        return ""
    end = None
    for i in range(start, len(filetext)):
        # look for second match
        if re.search(re2, filetext[i]):
            end = i
            break
    if end is None:
        logger.warning("Could not match %s in file %s\n", re2, file)
        return ""
    # return slice
    return filetext[start : end + 1]

remove_comments(line)

Function to remove comments from a fortran line. Works by simply removing everything after the first '!' in the line. This will cause problems in the case of '!' characters contained within strings so am assuming this won't happen. Need to change this.

Parameters:

Name Type Description Default
line

Line to strip comments from

required

Returns:

Name Type Description
modified_line

Line with comments removed

Source code in process/core/io/data_structure_dicts.py
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
def remove_comments(line):
    """Function to remove comments from a fortran line. Works by simply
    removing everything after the first '!' in the line. This will
    cause problems in the case of '!' characters contained within strings
    so am assuming this won't happen. Need to change this.

    Parameters
    ----------
    line:
        Line to strip comments from

    Returns
    -------
    modified_line:
        Line with comments removed

    """
    if "!" in line:
        line = line[: line.find("!")]
    line = line.strip()
    if line == "":
        return line
    if line[-1] == "&":
        line = line[:-1]
    return line

dict_ixc2nsweep()

Returns a dict mapping ixc_no to nsweep_no, if both exist for a particular variable.

Example dictionary entry: DICT_IXC2NSWEEP['1'] = '1'

Source code in process/core/io/data_structure_dicts.py
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
def dict_ixc2nsweep():
    """Returns a dict mapping ixc_no to nsweep_no, if both exist for a
    particular variable.

    Example dictionary entry:
        DICT_IXC2NSWEEP['1'] = '1'
    """

    name_to_nsweep = {
        sv.value.variable_name: sv.value.variable_num for sv in ScanVariables
    }

    # create a dictionary that maps iteration variable names to ixc_no
    ixc_full = dict_ixc_full()
    name_to_ixc = {
        name: ixc
        for ixc, data in ixc_full.items()
        if (name := data["name"]) in name_to_nsweep
    }

    return {ixc: name_to_nsweep[name] for name, ixc in name_to_ixc.items()}

dict_nsweep2ixc()

Returns a dict mapping nsweep_no to ixc_no; the inverse of dict_ixc2nsweep

Source code in process/core/io/data_structure_dicts.py
248
249
250
251
252
253
254
255
def dict_nsweep2ixc():
    """Returns a dict mapping nsweep_no to ixc_no; the inverse of
    dict_ixc2nsweep
    """

    # Use dict_ixc2nsweep from output_dict to produce dict_nsweep2ixc
    ixc2nsweep = output_dict["DICT_IXC2NSWEEP"]
    return {b: a for a, b in ixc2nsweep.items()}

dict_var_type()

Function to return a dictionary mapping variable name to variable type eg. 'real_variable' or 'int_array'. Looks in input.f90 at the process functions that read in variables from IN.DAT.

Example of line we are looking for: call parse_real_variable('BETA', beta, 0.0D0, 1.0D0, &

Example dictionary entry: DICT_VAR_TYPE['beta'] = 'real_variable'

Source code in process/core/io/data_structure_dicts.py
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
def dict_var_type():
    """Function to return a dictionary mapping variable name to variable type
    eg. 'real_variable' or 'int_array'. Looks in input.f90 at the process
    functions that read in variables from IN.DAT.

    Example of line we are looking for:
        call parse_real_variable('BETA', beta, 0.0D0, 1.0D0, &

    Example dictionary entry:
        DICT_VAR_TYPE['beta'] = 'real_variable'
    """
    di = {}

    for var_name, config in INPUT_VARIABLES.items():
        var_type = (
            f"{INPUT_TYPE_MAP[config.type]}_{'array' if config.array else 'variable'}"
        )

        di[var_name] = var_type

    return di

dict_input_bounds()

Returns a dictionary matching variable names to dictionary containing upper and lower bounds that PROCESS checks variable lies between when reading IN.DAT. Looks in input.f90 for parse_real_variable and parse_int_variable.

Example of a line we are looking for: call parse_real_variable('BETA', beta, 0.0D0, 1.0D0, &

Example dictionary entry: DICT_INPUT_BOUNDS['beta'] = {'lb' : 0.0, 'ub' : 1.0}

Source code in process/core/io/data_structure_dicts.py
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
def dict_input_bounds():
    """Returns a dictionary matching variable names to dictionary containing
    upper and lower bounds that PROCESS checks variable lies between when
    reading IN.DAT. Looks in input.f90 for parse_real_variable and
    parse_int_variable.

    Example of a line we are looking for:
         call parse_real_variable('BETA', beta, 0.0D0, 1.0D0, &

    Example dictionary entry:
         DICT_INPUT_BOUNDS['beta'] = {'lb' : 0.0, 'ub' : 1.0}
    """
    di = {}

    for var_name, config in INPUT_VARIABLES.items():
        lb, ub = None, None
        if config.range is not None:
            lb, ub = config.range

        elif config.choices is not None and config.type in [int, float]:
            lb = min(config.choices)
            ub = max(config.choices)

        if lb is not None:
            di[var_name] = {"lb": lb, "ub": ub}

    return di

dict_nsweep2varname()

Source code in process/core/io/data_structure_dicts.py
310
311
def dict_nsweep2varname():
    return {sv.value.variable_num: sv.value.variable_name for sv in ScanVariables}

dict_ixc_full()

Function to return a dictionary matching str(ixc_no) to a dictionary containing the name, lower and upper bounds of that variable.

Example dictionary entry: DICT_IXC_FULL['5'] = {'name' : 'beta', 'lb' : 0.001, 'ub' : 1.0}

Source code in process/core/io/data_structure_dicts.py
314
315
316
317
318
319
320
321
322
323
324
325
def dict_ixc_full():
    """Function to return a dictionary matching str(ixc_no) to a dictionary
    containing the name, lower and upper bounds of that variable.

    Example dictionary entry:
        DICT_IXC_FULL['5'] = {'name' : 'beta', 'lb' : 0.001, 'ub' : 1.0}
    """

    return {
        str(k): {"name": v.name, "lb": v.lower_bound, "ub": v.upper_bound}
        for k, v in ITERATION_VARIABLES.items()
    }

dict_ixc_bounds()

Source code in process/core/io/data_structure_dicts.py
328
329
330
331
332
333
334
335
336
337
338
def dict_ixc_bounds():
    # Returns dictionary mapping iteration variable name to bounds
    ixc_full = output_dict["DICT_IXC_FULL"]
    ixc_bounds = {}
    for value in ixc_full.values():
        lb = value["lb"]
        ub = value["ub"]
        temp = {"lb": lb, "ub": ub}
        ixc_bounds[value["name"]] = temp

    return ixc_bounds

dict_ixc_simple()

Source code in process/core/io/data_structure_dicts.py
341
342
343
344
345
346
347
348
def dict_ixc_simple():
    # Returns dictionary mapping ixc no to iteration variable name
    ixc_simple = {}
    ixc_full = output_dict["DICT_IXC_FULL"]
    for key, value in ixc_full.items():
        ixc_simple[key] = value["name"]

    return ixc_simple

dict_ixc_simple_rev()

Source code in process/core/io/data_structure_dicts.py
351
352
353
354
def dict_ixc_simple_rev():
    # Returns dictionary mapping iteration variable name to ixc no
    ixc_simple = output_dict["DICT_IXC_SIMPLE"]
    return {b: a for a, b in ixc_simple.items()}

get_dicts() cached

Constructs the dictionaries which contain information about every PROCESS variable.

WARNING: this function must be used carefully because it re-initialises the PROCESS state

Source code in process/core/io/data_structure_dicts.py
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
@cache
def get_dicts():
    """Constructs the dictionaries which contain information about every PROCESS variable.

    WARNING: this function must be used carefully because it re-initialises the PROCESS state
    """
    dict_objects = []
    # Different dict objects, e.g. variable descriptions

    init_all_module_vars()
    # Make dict objects
    # Some dicts depend on other dicts already existing in output_dicts, so
    # be careful if changing the order!
    dict_objects.extend([
        HardcodedDictionary("NON_F_VALUES", NON_F_VALUES),
        HardcodedDictionary("DICT_DEFAULT", {}),
        HardcodedDictionary("DICT_MODULE", {}),
        HardcodedDictionary("DICT_DESCRIPTIONS", {}),
        SourceDictionary("DICT_INPUT_BOUNDS", dict_input_bounds),
        SourceDictionary("DICT_NSWEEP2VARNAME", dict_nsweep2varname),
        SourceDictionary("DICT_VAR_TYPE", dict_var_type),
        SourceDictionary("DICT_IXC2NSWEEP", dict_ixc2nsweep),
        SourceDictionary("DICT_NSWEEP2IXC", dict_nsweep2ixc),
        SourceDictionary("DICT_IXC_FULL", dict_ixc_full),
        SourceDictionary("DICT_IXC_BOUNDS", dict_ixc_bounds),
        SourceDictionary("DICT_IXC_SIMPLE", dict_ixc_simple),
        SourceDictionary("DICT_IXC_SIMPLE_REV", dict_ixc_simple_rev),
    ])

    # Make individual dicts within dict objects, process, then add to output_dict
    for dict_object in dict_objects:
        dict_object.make_dict()
        dict_object.post_process()
        dict_object.publish()

    for module_name in import_module("process.data_structure").__all__:
        if module_name == "__init__.py":
            continue
        module = import_module(f"process.data_structure.{module_name.split('.', 1)[0]}")

        module_tree = ast.parse(inspect.getsource(module))
        initial_values_dict = {}
        variable_names = []
        var_names_and_descriptions = {}
        dict_module_entry = {}
        variable_types = {}

        # get the variable names and initial values
        for node in ast.walk(module_tree):
            if isinstance(node, ast.AnnAssign):
                # for each variable in the file, get the initial value
                # (either is None, or value initialised in init_variables fn)
                # set default to be None if variable is not being initialised eg if you
                # just have `example_double: float` instead of `example_double: float = None`
                initial_value = getattr(module, node.target.id)
                # JSON doesn't like np arrays
                if type(initial_value) is np.ndarray:
                    initial_value = initial_value.tolist()
                initial_values_dict[node.target.id] = initial_value
                # get the variable name and add to variable_names list
                var_name = node.target.id
                variable_names.append(var_name)
                # Now want to get the types of these variables
                if isinstance(node.annotation, ast.Subscript):
                    if node.annotation.value.id == "list":
                        if node.annotation.slice.id == "str":
                            var_type = "string_array"
                        elif node.annotation.slice.id == "float":
                            var_type = "real_array"
                        elif node.annotation.slice.id == "int":
                            var_type = "int_array"
                        elif node.annotation.slice.id == "bool":
                            var_type = "bool_array"
                        else:
                            raise TypeError(
                                f"The type annotation of variable {node.target.id} is "
                                f"{node.annotation.value.id}[{node.annotation.slice.id}], and "
                                "this is not recognised. Please change your type annotation for "
                                "this variable. PROCESS recognises the following type annotations: "
                                "list[float], list[int], list[str], list[bool]."
                            )
                else:
                    if node.annotation.id == "float":
                        var_type = "real_variable"
                    elif node.annotation.id == "int":
                        var_type = "int_variable"
                    elif node.annotation.id == "str":
                        var_type = "str_variable"
                    elif node.annotation.id == "bool":
                        var_type = "bool_variable"
                    else:
                        raise TypeError(
                            f"The type annotation of variable {node.target.id} is "
                            f"{node.annotation.id}, and this is not recognised. Please change your "
                            "type annotation for this variable. PROCESS recognises the following "
                            "type annotations: float, int, str, bool."
                        )

                variable_types[node.target.id] = var_type
        # get the variable descriptions
        # need to check for pairs of ast.AnnAssign followed by an ast.Expr - this is the form of
        # a variable being declared followed by a docstring expression. can get these var descriptions
        # from here, and if there is no ast.Expr immediately after an ast.AnnAssign then this var does not
        # have a docstring and so set the description to be ""
        for node1, node2 in pairwise(module_tree.body):
            if isinstance(node1, ast.AnnAssign) and isinstance(node2, ast.Expr):
                # if docstring immediately follows the variable declaration, add docstring to descriptions dict
                var_names_and_descriptions[node1.target.id] = node2.value.value
            if isinstance(node1, ast.AnnAssign) and not isinstance(node2, ast.Expr):
                # if no docstring for variable, have a blank description
                var_names_and_descriptions[node1.target.id] = ""
        # check if last entry of ast.body is declaring a var. if it is then this var has no description and will be missing
        # from var_names_and_descriptions. need to add to var_names_and_descriptions dict
        lastvar = module_tree.body[-1]

        if (
            isinstance(lastvar, ast.AnnAssign)
            and lastvar not in var_names_and_descriptions
        ):
            var_names_and_descriptions[lastvar.target.id] = ""

        dict_module_entry[module_name] = variable_names

        output_dict["DICT_MODULE"].update(dict_module_entry)
        output_dict["DICT_DEFAULT"].update(initial_values_dict)
        output_dict["DICT_DESCRIPTIONS"].update(var_names_and_descriptions)
        output_dict["DICT_VAR_TYPE"].update(variable_types)

    return output_dict