test_parsing.py 9.92 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
# Copyright 2018 Markus Scheidgen
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

15
import os
16
17
18
from io import StringIO
import json
import pytest
19
20

from nomadcore.local_meta_info import loadJsonFile
21
import nomad_meta_info
22

23
from nomad import utils
24
from nomad.parsing import JSONStreamWriter, parser_dict
25
from nomad.parsing import LocalBackend, BadContextURI
26

27
# (parser name, mainfile path) pairs; used to parametrize ``parsed_example``
# and ``test_parser``.
parser_examples = [
    # NOTE(review): this path starts with 'test/' while every other entry uses
    # 'tests/' -- confirm whether that is intentional before changing it.
    ('parsers/random', 'test/data/parsers/random_0'),
    ('parsers/template', 'tests/data/parsers/template.json'),
    ('parsers/exciting', 'tests/data/parsers/exciting/Ag/INFO.OUT'),
    ('parsers/exciting', 'tests/data/parsers/exciting/GW/INFO.OUT'),
    ('parsers/vasp', 'tests/data/parsers/vasp.xml'),
    ('parsers/fhi-aims', 'tests/data/parsers/aims.out'),
    ('parsers/cp2k', 'tests/data/parsers/cp2k/si_bulk8.out'),
    ('parsers/crystal', 'tests/data/parsers/crystal/si.out'),
    ('parsers/cpmd', 'tests/data/parsers/cpmd/geo_output.out'),
    ('parsers/nwchem', 'tests/data/parsers/nwchem/md/output.out'),
    ('parsers/bigdft', 'tests/data/parsers/bigdft/n2_output.out'),
]

41
42
43
44
# (parser name, mainfile path) pairs; used as the params of the
# ``parsed_faulty_unknown_matid_example`` fixture.
faulty_unknown_one_d_matid_example = [
    (
        'parsers/template',
        'tests/data/normalizers/no_sim_cell_boolean_positions.json',
    ),
]

45
46
47
48
49

class TestLocalBackend(object):
    """Tests for the section, value and context API of ``LocalBackend``."""

    @pytest.fixture(scope='session')
    def meta_info(self):
        """Load ``all.nomadmetainfo.json`` from the ``nomad_meta_info`` package directory."""
        file_dir = os.path.dirname(os.path.abspath(nomad_meta_info.__file__))
        path = os.path.join(file_dir, 'all.nomadmetainfo.json')
        meta_info, _ = loadJsonFile(path)
        return meta_info

    @pytest.fixture(scope='function')
    def backend(self, meta_info):
        """Provide a new ``LocalBackend`` (``debug=True``) for every test function."""
        return LocalBackend(meta_info, debug=True)

    def test_meta_info(self, meta_info, no_warn):
        """The loaded meta info contains the ``section_topology`` definition."""
        assert 'section_topology' in meta_info

    def test_metadata(self, backend, no_warn):
        """``backend.metadata()`` is JSON serializable after filling the info sections."""
        g_index = backend.openSection('section_calculation_info')
        assert g_index == 0
        backend.addValue('calc_id', 't0')
        backend.closeSection('section_calculation_info', 0)

        backend.openSection('section_repository_info')
        backend.addValue('repository_calc_id', 1)
        backend.closeSection('section_repository_info', 0)

        assert json.dumps(backend.metadata()) is not None

    def test_section(self, backend, no_warn):
        """Repeated ``openSection`` calls return 0, 1, 2 and values are addressable by index."""
        g_index = backend.openSection('section_run')
        assert g_index == 0
        backend.addValue('program_name', 't0')
        backend.closeSection('section_run', 0)

        g_index = backend.openSection('section_run')
        assert g_index == 1

        g_index = backend.openSection('section_run')
        assert g_index == 2

        # Both sections are still open here; the third argument selects the target.
        backend.addValue('program_name', 't1', 1)
        backend.addValue('program_name', 't2', 2)

        backend.closeSection('section_run', 1)
        backend.closeSection('section_run', 2)

        assert backend.get_sections('section_run') == [0, 1, 2]
        for i in range(0, 3):
            assert backend.get_value('program_name', i) == 't%d' % i

    def test_two_sections(self, backend, no_warn):
        """Two different section types each start at index 0 and both end up in the JSON."""
        g_index = backend.openSection('section_run')
        assert g_index == 0
        backend.addValue('program_name', 't0')
        backend.closeSection('section_run', 0)

        g_index = backend.openSection('section_calculation_info')
        assert g_index == 0
        backend.addValue('parser_name', 'p0')
        backend.closeSection('section_calculation_info', 0)

        assert backend.get_sections('section_run') == [0]
        assert backend.get_sections('section_calculation_info') == [0]

        output = StringIO()
        backend.write_json(output)
        archive = json.loads(output.getvalue())
        assert 'section_run' in archive
        assert 'section_calculation_info' in archive

    def test_subsection(self, backend: LocalBackend, no_warn):
        """``section_method`` sections are stored under ``section_run`` entries.

        The asserts expect two methods under the first run and one under the second.
        """
        # NOTE(review): -1 presumably addresses the most recently opened section
        # of that type -- confirm against LocalBackend.closeSection.
        backend.openSection('section_run')
        backend.openSection('section_method')
        backend.closeSection('section_method', -1)

        backend.openSection('section_method')
        backend.closeSection('section_method', -1)

        backend.openSection('section_run')
        backend.closeSection('section_run', 0)
        backend.closeSection('section_run', 1)

        # Opened after both runs were closed; the asserts below expect it under run 1.
        backend.openSection('section_method')
        backend.closeSection('section_method', -1)

        runs = backend.data['section_run']
        assert len(runs) == 2
        assert len(runs[0]['section_method']) == 2
        assert len(runs[1]['section_method']) == 1

    def test_context(self, backend: LocalBackend, no_warn):
        """Values added inside an opened context land in the section the URI names."""
        backend.openSection('section_run')
        backend.openSection('section_method')
        backend.closeSection('section_method', -1)
        backend.closeSection('section_run', -1)

        backend.openSection('section_run')
        backend.closeSection('section_run', -1)

        backend.openContext('/section_run/0')
        backend.addValue('program_name', 't1')
        backend.closeContext('/section_run/0')

        backend.openContext('/section_run/1')
        backend.addValue('program_name', 't2')
        backend.closeContext('/section_run/1')

        # A nested URI must be accepted as well; nothing is written through it.
        backend.openContext('/section_run/0/section_method/0')
        backend.closeContext('/section_run/0/section_method/0')

        runs = backend.data['section_run']
        assert runs[0]['program_name'] == 't1'
        assert runs[1]['program_name'] == 't2'

    def test_multi_context(self, backend: LocalBackend, no_warn):
        """The same context is opened twice, each time adding a ``section_method``."""
        backend.openSection('section_run')
        backend.closeSection('section_run', -1)

        backend.openContext('/section_run/0')
        backend.openSection('section_method')
        backend.closeSection('section_method', -1)
        backend.closeContext('/section_run/0')

        backend.openContext('/section_run/0')
        backend.openSection('section_method')
        backend.closeSection('section_method', -1)
        backend.closeContext('/section_run/0')

        assert len(backend.data['section_method']) == 1

    def test_bad_context(self, backend: LocalBackend, no_warn):
        """``openContext`` raises ``BadContextURI`` for these two malformed URIs."""
        # Unlike the URIs used in the other tests, neither starts with '/'.
        for bad_uri in ('section_run/0', 'dsfds'):
            with pytest.raises(BadContextURI):
                backend.openContext(bad_uri)

187
188
189
190
191
192
193
194
195

def create_reference(data, pretty):
    """Serialize ``data`` to the JSON text the stream writer is compared against.

    Args:
        data: JSON-serializable object.
        pretty: If truthy, indent with two spaces; otherwise emit the most
            compact form (no whitespace after ``,`` and ``:``).

    Returns:
        The JSON string produced by ``json.dumps``.
    """
    dump_options = {'indent': 2} if pretty else {'separators': (',', ':')}
    return json.dumps(data, **dump_options)


@pytest.mark.parametrize("pretty", [False, True])
def test_stream_generator(pretty, no_warn):
    """``JSONStreamWriter`` output equals ``json.dumps`` of the same structure.

    The writer calls below build, event by event, exactly the structure held
    in ``example_data``; the result is compared with ``create_reference``.
    """
    example_data = [
        {
            'key1': 'value',
            'key2': 1
        },
        {
            'key': {
                'key': 'value'
            }
        }
    ]

    out = StringIO()
    writer = JSONStreamWriter(out, pretty=pretty)
    writer.open_array()

    # First array element: {'key1': 'value', 'key2': 1}
    writer.open_object()
    writer.key('key1')
    writer.value('value')
    writer.key('key2')
    writer.value(1)
    writer.close_object()

    # Second array element: {'key': {'key': 'value'}}
    writer.open_object()
    writer.key('key')
    writer.open_object()
    writer.key('key')
    writer.value('value')
    writer.close_object()
    writer.close_object()

    writer.close_array()
    writer.close()

    assert create_reference(example_data, pretty) == out.getvalue()

230

231
232
def assert_parser_result(backend):
    """Assert that a parser run succeeded and reported no errors.

    Args:
        backend: Object whose ``status`` attribute unpacks into a
            ``(status, errors)`` pair.

    Raises:
        AssertionError: If the status is not ``'ParseSuccess'`` or if
            ``errors`` is neither ``None`` nor empty.
    """
    status, errors = backend.status
    assert status == 'ParseSuccess', 'unexpected parser status: %r' % (status,)
    assert errors is None or len(errors) == 0, 'parser reported errors: %r' % (errors,)
235
236


237
238
def run_parser(parser_name, mainfile):
    """Run the named parser on ``mainfile`` and return the annotated result.

    Args:
        parser_name: Key into ``parser_dict`` selecting the parser.
        mainfile: Path handed to the parser's ``run`` method.

    Returns:
        The parser's result after ``add_calculation_info`` has been applied.
    """
    parser = parser_dict[parser_name]
    result = parser.run(mainfile, logger=utils.get_logger(__name__))
    return add_calculation_info(result)
Markus Scheidgen's avatar
Markus Scheidgen committed
241
242


243
244
245
246
@pytest.fixture
def parsed_vasp_example() -> LocalBackend:
    """Result of ``run_parser`` for 'parsers/vasp' on the perovskite.xml example."""
    mainfile = '.dependencies/parsers/vasp/test/examples/xml/perovskite.xml'
    return run_parser('parsers/vasp', mainfile)
Markus Scheidgen's avatar
Markus Scheidgen committed
247
248


249
250
251
252
253
254
@pytest.fixture
def parsed_template_example() -> LocalBackend:
    """Result of ``run_parser`` for 'parsers/template' on the template.json example."""
    mainfile = 'tests/data/parsers/template.json'
    return run_parser('parsers/template', mainfile)


255
256
257
258
259
260
261
@pytest.fixture(
    params=faulty_unknown_one_d_matid_example, ids=lambda spec: '%s-%s' % spec)
def parsed_faulty_unknown_matid_example(caplog, request) -> LocalBackend:
    """Parsed result for each entry of ``faulty_unknown_one_d_matid_example``.

    ``caplog`` is requested but not used inside the fixture body.
    """
    example_parser, example_mainfile = request.param
    parsed = run_parser(example_parser, example_mainfile)
    return parsed


262
263
264
@pytest.fixture(params=parser_examples, ids=lambda spec: '%s-%s' % spec)
def parsed_example(request) -> LocalBackend:
    """Parsed result for each ``(parser name, mainfile)`` entry of ``parser_examples``."""
    parser_name, mainfile = request.param
    return run_parser(parser_name, mainfile)
267
268


269
270
271
def add_calculation_info(backend: LocalBackend) -> LocalBackend:
    """Add a ``section_calculation_info`` section filled with fixed test values.

    Args:
        backend: The backend to extend; it is modified in place.

    Returns:
        The same ``backend`` object that was passed in.
    """
    backend.openNonOverlappingSection('section_calculation_info')
    backend.addValue('upload_id', 'test_upload_id')
    backend.addValue('calc_id', 'test_calc_id')
    backend.addValue('calc_hash', 'test_calc_hash')
    backend.addValue('main_file', 'test/mainfile.txt')
    backend.addValue('parser_name', 'testParser')
    backend.closeNonOverlappingSection('section_calculation_info')
    return backend
278
279


280
281
282
@pytest.mark.parametrize('parser_name, mainfile', parser_examples)
def test_parser(parser_name, mainfile, caplog):
    """Each example parses successfully and the parser logs 'received logger'.

    The second check scans the DEBUG records captured during the call phase;
    each such record's message is decoded as JSON and its ``'event'`` compared.
    """
    # Named ``backend`` so the module-level ``parsed_example`` fixture is not shadowed.
    backend = run_parser(parser_name, mainfile)
    assert_parser_result(backend)

    logger_received = False
    for record in caplog.get_records(when='call'):
        if record.levelname != 'DEBUG':
            continue
        # Every DEBUG record is decoded, also after a match has been found.
        if json.loads(record.msg)['event'] == 'received logger':
            logger_received = True

    assert logger_received, "no DEBUG record with event 'received logger' was captured"

Markus Scheidgen's avatar
Markus Scheidgen committed
291

292
def test_match(no_warn):
    """Count the (file, parser) pairs under the match directory that are mainfiles.

    Every file below ``tests/data/proc/match`` is offered to every parser in
    ``parser_dict``; exactly six positive ``is_mainfile`` answers are expected.
    """
    directory = 'tests/data/proc/match'

    count = 0
    for dirpath, _, filenames in os.walk(directory):
        for filename in filenames:
            fullname = os.path.join(dirpath, filename)
            for parser in parser_dict.values():
                # The second argument is the callable the parser uses to open the file.
                if parser.is_mainfile(fullname, lambda fn: open(fn)):
                    count += 1

    assert count == 6, 'expected 6 mainfile matches, found %d' % count