Source code for spec2nexus.plugins.spec_common

#!/usr/bin/env python
# -*- coding: utf-8 -*-

# -----------------------------------------------------------------------------
# :author:    Pete R. Jemian
# :email:     prjemian@gmail.com
# :copyright: (c) 2014-2020, Pete R. Jemian
#
# Distributed under the terms of the Creative Commons Attribution 4.0 International Public License.
#
# The full license is in the file LICENSE.txt, distributed with this software.
# -----------------------------------------------------------------------------

"""
SPEC data file standard control lines

:see: SPEC manual, *Standard Data File Format*,
   http://www.certif.com/spec_manual/user_1_4_1.html

"""

from collections import OrderedDict
import datetime
import six
import time

from ..diffractometers import get_geometry_catalog, Diffractometer
from ..eznx import write_dataset, makeGroup, openGroup, makeLink
from ..plugin import AutoRegister, ControlLineHandler
from ..scanf import scanf
from ..spec import (
    SpecDataFileHeader,
    SpecDataFileScan,
    DuplicateSpecScanNumber,
    MCA_DATA_KEY,
)
from ..utils import (
    strip_first_word,
    iso8601,
    split_column_labels,
    clean_name,
)
from ..writer import CONTAINER_CLASS


SCAN_DATA_KEY = "scan_data"

# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

# header block


[docs]@six.add_metaclass(AutoRegister)
class SPEC_File(ControlLineHandler):

    """
    **#F** -- original data file name (starts a file header block)

    Module :mod:`spec2nexus.spec` is responsible for handling this control line.

    IN-MEMORY REPRESENTATION

    * (SpecDataFile): **fileName**
    * (SpecDataFileHeader) : **file**

    HDF5/NeXus REPRESENTATION

    * file root-level attribute: **SPEC_file**
    """

    key = r"#F"
    # do NOT add F to scan_attributes_defined

[docs]    def process(self, text, spec_file_obj, *args, **kws):
        if not hasattr(spec_file_obj, "specFile"):
            spec_file_obj.specFile = None
        if spec_file_obj.specFile in (None, ""):
            spec_file_obj.specFile = strip_first_word(text)


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Epoch(ControlLineHandler):

    """
    **#E** -- the UNIX epoch (seconds from 00:00 GMT 1/1/70)

    In SPEC data files, the ``#E`` control line indicates the
    start of a *header* block.

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader): **epoch** *int*

    HDF5/NeXus REPRESENTATION

    * file root-level attribute: **SPEC_epoch** *int*
    """

    key = r"#E"
    # do NOT add E to scan_attributes_defined

[docs]    def process(self, buf, sdf_object, *args, **kws):
        matches = [
            h for h in sdf_object.headers if h.raw.strip() == buf.strip()
        ]
        if len(matches) > 0:
            # this header exists, nothing to do
            return
        header = SpecDataFileHeader(buf, parent=sdf_object)
        line = buf.splitlines()[0].strip()
        if line.find(".") > -1:
            header.epoch = float(strip_first_word(line))
        else:
            header.epoch = int(strip_first_word(line))
        sdf_object.headers.append(header)
        header.interpret()  # parse the full header


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Date(ControlLineHandler):

    """
    **#D** -- date/time stamp

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader): **date** *str*, ISO8601 format

    HDF5/NeXus REPRESENTATION

    * file root-level attribute: **SPEC_date** *str* (value for 1st header block is used)
    """

    key = r"#D"
    # do NOT add epoch and date to scan_attributes_defined

[docs]    def process(self, text, sdf_object, *args, **kws):
        text = strip_first_word(text)
        # if isinstance(sdf_object, SpecDataFileScan):
        #     sdf_object = sdf_object.header
        sp = text.split(" ")
        if len(sp) == 1:
            sdf_object.epoch = int(float(text))
            text = datetime.datetime.fromtimestamp(float(text))
            text = text.strftime("%c")
        sdf_object.date = text
        if not hasattr(sdf_object, "epoch"):
            # Mon Jul 08 13:35:50 2019
            spec_fmt = "%a %b %d %H:%M:%S %Y"
            ts = time.strptime(text, spec_fmt)
            sdf_object.epoch = time.mktime(ts)
        if isinstance(sdf_object, SpecDataFileScan):
            sdf_object.addH5writer(self.key, self.writer)
            if len(sdf_object.header.date.strip()) == 0:
                sdf_object.header.date = text
                sdf_object.header.epoch = sdf_object.epoch
            # TODO: what if header date is greater than this scan's date?

[docs]    def writer(self, h5parent, writer, sdf_object, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        write_dataset(h5parent, "date", iso8601(sdf_object.date))


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Comment(ControlLineHandler):

    """
    **#C** -- any comment either in the scan header or somewhere in the scan

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader): **comments**
    * (SpecDataFileScan):  **comments**

    HDF5/NeXus REPRESENTATION

    * file root-level attribute: **SPEC_comments** :
      string array of all comments from first header block
    * dataset named **comments** under */NXentry* group, such as */S1/comments* :
      string array of all comments from this scan block

    """

    key = r"#C"
    scan_attributes_defined = ["comments"]

[docs]    def process(self, text, scan, *args, **kws):
        scan.comments.append(strip_first_word(text))
        pos = text.find("Scan aborted after ")
        if pos > 0:
            scan._aborted_ = text[pos:]
        if isinstance(scan, SpecDataFileScan):
            scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        write_dataset(
            h5parent, "comments", "\n".join(list(map(str, scan.comments)))
        )


# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

# scan block


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Scan(ControlLineHandler):

    """
    **#S** -- SPEC scan

    In SPEC data files, the ``#S`` control line indicates the
    start of a *scan* block.  Each scan will be written to a
    separate **NXentry** group in the HDF5 file.

    **NXentry**:
        "The top-level NeXus group which contains all the data
        and associated information that comprise a single measurement."

        -- http://download.nexusformat.org/doc/html/classes/base_classes/NXentry.html

    IN-MEMORY REPRESENTATION

    * (SpecDataFile):
    * (SpecDataFileHeader):

    HDF5/NeXus REPRESENTATION

    * */NXentry* group named 'S%d` scan_number at root
      level, such as */S1*

    """

    key = r"#S"
    # do NOT add S to scan_attributes_defined

[docs]    def process(self, part, sdf, *args, **kws):
        if len(sdf.headers) == 0:
            # make a header if none exists now
            raw = ""  # TODO: what default content to use?
            header = SpecDataFileHeader(raw, parent=sdf)
            sdf.headers.append(header)
        else:
            header = sdf.headers[-1]  # pick the most recent header

        matches = [
            (k, s)
            for k, s in sdf.scans.items()
            if s.raw.strip() == part.strip()
        ]

        if len(matches) > 0 and sdf.last_scan is not None:
            if sdf.getScan(sdf.last_scan).raw != part:
                return

        scan = SpecDataFileScan(header, part, parent=sdf)
        if sdf.last_scan is not None:
            # We know that `part` does not match any existing scan.
            # Do the first few lines match (#S and #D in particular)?
            # If so, then that scan has been updated with more data.
            def beginning(buf):
                "return a string with first few lines of buf"
                return "\n".join(
                    [
                        line
                        for line in buf.strip().splitlines()[:5]
                        if line.startswith("#")
                    ]
                )

            # TODO: replace beginning() with new algorithm
            # if new_scan.raw.startswith(last_scan.raw), that's it!

            if beginning(part) == beginning(
                sdf.getScan(sdf.last_scan).raw
            ):
                # remove the last scan
                del sdf.scans[sdf.last_scan]
                sdf.last_scan = None

        scan.S = strip_first_word(part.splitlines()[0].strip())
        scan.scanNum = scan.S.split()[0]
        scan.scanCmd = strip_first_word(scan.S)

        if scan.scanNum in sdf.scans:
            # Before raising an exception,
            #    Check for duplicate scan number and create alternate name
            #    write as "%d.%d" % (scan.scanNum, index+1)
            #    where index is the lowest integer in
            #    range(really big) that is not already in use.
            # really_big <= len(total number of scans in data file)
            # Will a non-integer scanNum break anything?  [note: It *has* caused troubles.]
            for i in range(len(scan.parent.scans)):
                new_scanNum = "%s.%d" % (scan.scanNum, i + 1)
                if new_scanNum not in sdf.scans:
                    scan.scanNum = new_scanNum
                    break
        scan.scanNum = str(scan.scanNum)
        if scan.scanNum in sdf.scans:
            msg = str(scan.scanNum) + " in " + sdf.fileName
            raise DuplicateSpecScanNumber(msg)
        sdf.scans[scan.scanNum] = scan


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Geometry(ControlLineHandler):

    """
    **#G** -- diffractometer geometry (numbered rows: #G0, #G1, ...)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **G**

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **G** in the *NXentry* group, such as */S1/G*

      * Datasets created from dictionary <scan>.G
        (indexed by number from the scan block, such as ``G0``, ``G1``, ...).
        Meaning of contents for each index are defined by geometry-specific
        SPEC diffractometer support.

    * *NXinstrument* & *NXsample* groups for interpreted information
    """

    key = r"#G\d+"
    scan_attributes_defined = ["G", "diffractometer"]

[docs]    def process(self, text, scan, *args, **kws):
        subkey = text.split()[0].lstrip("#")
        scan.G[subkey] = strip_first_word(text)
        scan.addPostProcessor("diffractometer geometry", self.postprocess)

[docs]    def postprocess(self, scan, *args, **kws):
        if len(scan.G) > 0:
            scan.addH5writer("diffractometer geometry", self.writer)

        dgc = get_geometry_catalog()
        geometry = dgc.match(scan)
        diffractometer = Diffractometer(geometry)
        if diffractometer is None:
            scan.geometry = {}
        else:
            diffractometer.parse(scan)
            scan.diffractometer = diffractometer

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        # e.g.: SPECD/four.mac
        # http://certif.com/spec_manual/fourc_4_9.html
        desc = "SPEC geometry arrays, meanings defined by SPEC diffractometer support"
        group = makeGroup(h5parent, "G", nxclass, description=desc)
        dd = {}
        for item, value in scan.G.items():
            dd[item] = list(map(float, value.split()))
        writer.save_dict(group, dd)

        gpar = scan.diffractometer.geometry_parameters
        if len(gpar) > 0:
            nxinstrument = openGroup(
                h5parent, "instrument", "NXinstrument"
            )
            write_dataset(
                nxinstrument,
                "name",
                scan.diffractometer.geometry_name_full,
            )
            if scan.diffractometer.lattice is not None:
                nxsample = openGroup(h5parent, "sample", "NXsample")
                abc = [
                    scan.diffractometer.lattice.a,
                    scan.diffractometer.lattice.b,
                    scan.diffractometer.lattice.c,
                ]
                angles = [
                    scan.diffractometer.lattice.alpha,
                    scan.diffractometer.lattice.beta,
                    scan.diffractometer.lattice.gamma,
                ]
                write_dataset(
                    nxsample, "unit_cell_abc", abc, units="angstrom",
                )
                write_dataset(
                    nxsample,
                    "unit_cell_alphabetagamma",
                    angles,
                    units="degrees",
                )
                write_dataset(  # ah, NeXus ... so many ways ...
                    nxsample, "unit_cell", abc + angles,
                )
            if "ub_matrix" in gpar:
                nxsample = openGroup(h5parent, "sample", "NXsample")
                ub = gpar["ub_matrix"].value
                write_dataset(nxsample, "ub_matrix", ub)
            if scan.diffractometer.mode is not None:
                nxsample = openGroup(h5parent, "sample", "NXsample")
                write_dataset(
                    nxsample,
                    "diffractometer_mode",
                    scan.diffractometer.mode,
                )
            if scan.diffractometer.sector is not None:
                nxsample = openGroup(h5parent, "sample", "NXsample")
                write_dataset(
                    nxsample,
                    "diffractometer_sector",
                    scan.diffractometer.sector,
                )
            if len(scan.diffractometer.reflections) > 0:
                nxsample = openGroup(h5parent, "sample", "NXsample")
                for i, ref in enumerate(scan.diffractometer.reflections):
                    nm = "or%d" % i
                    nxnote = openGroup(
                        nxsample,
                        nm,
                        "NXnote",
                        description=nm + ": orientation reflection",
                    )
                    write_dataset(nxnote, "h", ref.h)
                    write_dataset(nxnote, "k", ref.k)
                    write_dataset(nxnote, "l", ref.l)
                    write_dataset(
                        nxnote,
                        "wavelength",
                        ref.wavelength,
                        units="Angstrom",
                    )
                    for k, a in ref.angles.items():
                        write_dataset(
                            nxnote,
                            k,
                            a,
                            units="degrees",
                            description="diffractometer angle",
                        )
            if scan.diffractometer.wavelength is not None:
                # see: http://download.nexusformat.org/doc/html/strategies.html#strategies-wavelength
                nxmono = openGroup(
                    nxinstrument, "monochromator", "NXmonochromator"
                )
                ds = write_dataset(
                    nxmono,
                    "wavelength",
                    scan.diffractometer.wavelength,
                    units="angstrom",
                )
                # and: http://download.nexusformat.org/doc/html/classes/base_classes/NXbeam.html#nxbeam
                nxsample = openGroup(h5parent, "sample", "NXsample")
                nxbeam = openGroup(nxsample, "beam", "NXbeam")
                # link them
                makeLink(
                    nxsample, ds, nxbeam.name + "/incident_wavelength"
                )

            nxnote = openGroup(
                nxinstrument,
                "geometry_parameters",
                nxclass,
                description="SPEC geometry arrays, interpreted",
            )
            for kdv in gpar.values():
                d = kdv.description
                if len(d) == 0:
                    write_dataset(nxnote, kdv.key, kdv.value)
                else:
                    write_dataset(
                        nxnote, kdv.key, kdv.value, description=d
                    )


[docs]@six.add_metaclass(AutoRegister)
class SPEC_NormalizingFactor(ControlLineHandler):

    """
    **#I** -- intensity normalizing factor

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **I**

    HDF5/NeXus REPRESENTATION

    * Dataset named **intensity_factor** in the *NXentry* group, such as */S1/intensity_factor*
    """

    key = r"#I"
    scan_attributes_defined = ["I"]

[docs]    def process(self, text, scan, *args, **kws):
        scan.I = float(strip_first_word(text))

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if hasattr(scan, "I"):
            writer.write_dataset(h5parent, "intensity_factor", scan.I)


[docs]@six.add_metaclass(AutoRegister)
class SPEC_CounterNames(ControlLineHandler):

    """
    **#J** -- names of counters (each separated by two spaces) (new with SPEC v6)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader): **J** : mnemonics

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **counter_cross_reference** in the *NXentry* group, such as */S1/counter_cross_reference*

      * datasets with names supplied as SPEC counter mnemonics, string values supplied as SPEC counter names

    """

    key = r"#J\d+"
    scan_attributes_defined = ["J"]

[docs]    def process(self, text, header, *args, **kws):
        if not hasattr(header, "J"):
            header.J = []
        header.J.append(strip_first_word(text).split())
        header.addPostProcessor(
            "counter cross-referencing", self.postprocess
        )

[docs]    def postprocess(self, header, *args, **kws):
        counter_xref_postprocessing(header)
        header.addH5writer("counter cross-referencing", self.writer)

[docs]    def writer(self, h5parent, writer, header, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if not hasattr(header, "counter_xref"):
            header.counter_xref = {}  # mnemonic:name
        desc = "cross-reference SPEC counter mnemonics and names"
        comment = "keys are SPEC counter mnemonics, values are SPEC counter names"
        if nxclass is None:
            nxclass = CONTAINER_CLASS
        group = makeGroup(
            h5parent,
            "counter_cross_reference",
            nxclass,
            description=desc,
            comment=comment,
        )
        for key, value in sorted(header.counter_xref.items()):
            write_dataset(group, key, value)


[docs]@six.add_metaclass(AutoRegister)
class SPEC_CounterMnemonics(ControlLineHandler):

    """
    **#j** -- mnemonics of counter  (new with SPEC v6)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader): **j** : mnemonics

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **counter_cross_reference** in the *NXentry* group, such as */S1/counter_cross_reference*

      * datasets with names supplied as SPEC counter mnemonics, string values supplied as SPEC counter names

    """

    key = r"#j\d+"
    scan_attributes_defined = ["j"]

[docs]    def process(self, text, header, *args, **kws):
        if not hasattr(header, "j"):
            header.j = []
        header.j.append(strip_first_word(text).split())
        header.addPostProcessor(
            "counter cross-referencing", self.postprocess
        )

[docs]    def postprocess(self, header, *args, **kws):
        counter_xref_postprocessing(header)
        header.addH5writer("counter cross-referencing", self.writer)

[docs]    def writer(self, h5parent, writer, header, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if not hasattr(header, "counter_xref"):
            header.counter_xref = {}  # mnemonic:name
        desc = "cross-reference SPEC counter mnemonics and names"
        comment = "keys are SPEC counter mnemonics, values are SPEC counter names"
        if nxclass is None:
            nxclass = CONTAINER_CLASS
        group = makeGroup(
            h5parent,
            "counter_cross_reference",
            nxclass,
            description=desc,
            comment=comment,
        )
        for key, value in sorted(header.counter_xref.items()):
            write_dataset(group, key, value)


def counter_xref_postprocessing(header):
    if not hasattr(header, "j") or not hasattr(header, "J"):
        return
    if not hasattr(header, "counter_xref"):
        header.counter_xref = {}  # mnemonic:name
    for row_number, mne_row in enumerate(header.j):
        name_row = header.J[row_number]
        for column_number, mne in enumerate(mne_row):
            header.counter_xref[mne] = name_row[column_number]


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Labels(ControlLineHandler):

    """
    **#L** -- data column labels

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **L** : labels
    * (SpecDataFileScan): **data** : {labels: values}

    HDF5/NeXus REPRESENTATION

    * *NXdata* group named **data** in the *NXentry* group,
      such as */S1/data*
    * datasets with names supplied in **L**, array values
      collected in **data_lines**

    """

    key = r"#L"
    scan_attributes_defined = ["L", "column_first", "column_last"]

[docs]    def process(self, text, scan, *args, **kws):
        # Some folks use more than two spaces!  Use regular expression(re) module
        scan.L = split_column_labels(strip_first_word(text))

        if len(scan.L) == 1 and hasattr(scan, "N") and scan.N[0] > 1:
            # BUT: some folks only use a single-space as a separator!
            # perhaps #L was written with single-space separators.?
            # Unusual for scan to have only 1 column, but possible
            labels = strip_first_word(text).split()
            if len(labels) == scan.N[0]:
                scan.L = labels

        scan.column_first = scan.L[0]
        scan.column_last = scan.L[-1]


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Monitor(ControlLineHandler):

    """
    **#M** -- counting against this constant monitor count (see #T)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **M**

    HDF5/NeXus REPRESENTATION

    * Dataset named **M** in the *NXentry* group, such as */S1/M*
    * Dataset named **counting_basis** in the *NXentry* group with
      value *SPEC scan with constant monitor count*, such as */S1/counting_basis*

    """

    key = r"#M"
    scan_attributes_defined = ["M", "monitor_name"]

[docs]    def process(self, text, scan, *args, **kws):
        text = strip_first_word(text)
        pos = text.find(" ")
        scan.M = text[:pos]
        scan.monitor_name = text[pos:].strip().lstrip("(").rstrip(")")

        scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        desc = "SPEC scan with constant monitor count"
        write_dataset(h5parent, "counting_basis", desc)
        write_dataset(
            h5parent, "M", float(scan.M), units="counts", description=desc
        )


[docs]@six.add_metaclass(AutoRegister)
class SPEC_NumColumns(ControlLineHandler):

    """
    **#N** -- number of columns of data [ num2 sets per row ]

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **N** : [int]

    HDF5/NeXus REPRESENTATION

    * not written to file
    """

    key = r"#N"
    # TODO: Needs an example data file to test (issue #8)
    scan_attributes_defined = ["N"]

[docs]    def process(self, text, scan, *args, **kws):
        scan.N = list(map(int, strip_first_word(text).split()))


[docs]@six.add_metaclass(AutoRegister)
class SPEC_PositionerNames(ControlLineHandler):

    """
    **#O** -- positioner names (numbered rows: #O0, #O1, ...)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader) : **O** : label
    * (SpecDataFileScan): **positioner** : {label: value}

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **positioners** in the *NXentry* group, such as */S1/positioners*

      * datasets created from dictionary <scan>.positioner

    * *NXnote* group named **positioner_cross_reference** in the *NXentry* group, such as */S1/positioner_cross_reference*

      * datasets with names supplied as SPEC positioner mnemonics, string values supplied as SPEC positioner names

    """

    key = r"#O\d+"
    scan_attributes_defined = ["O"]

[docs]    def process(self, text, sdf_object, *args, **kws):
        if isinstance(sdf_object, SpecDataFileScan):
            sdf_object = sdf_object.header
        key = text.split()[0]
        if key == "#O0":
            sdf_object.O = []  # TODO: What if motor names are different?
        content = strip_first_word(text).strip()
        if content == "":
            content = []
        else:
            content = split_column_labels(content)
        sdf_object.O.append(content)


[docs]@six.add_metaclass(AutoRegister)
class SPEC_PositionerMnemonics(ControlLineHandler):

    """
    **#o** -- positioner mnemonics (new with SPEC v6)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader): **o** : mnemonics

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **positioner_cross_reference** in the *NXentry* group, such as */S1/positioner_cross_reference*

      * datasets with names supplied as SPEC positioner mnemonics, string values supplied as SPEC positioner names

    """

    key = r"#o\d+"
    scan_attributes_defined = ["o"]

[docs]    def process(self, text, header, *args, **kws):
        if not hasattr(header, "o"):
            header.o = []
        content = strip_first_word(text).strip()
        if content == "":
            content = []
        else:
            content = content.split()
        header.o.append(content)
        header.addPostProcessor(
            "positioner cross-referencing", self.postprocess
        )

[docs]    def postprocess(self, header, *args, **kws):
        positioner_xref_postprocessing(header)
        header.addH5writer("positioner cross-referencing", self.writer)

[docs]    def writer(self, h5parent, writer, header, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if not hasattr(header, "positioner_xref"):
            header.counter_xref = {}  # mnemonic:name
        desc = "cross-reference SPEC positioner mnemonics and names"
        comment = "keys are SPEC positioner mnemonics, values are SPEC positioner names"
        if nxclass is None:
            nxclass = CONTAINER_CLASS
        group = makeGroup(
            h5parent,
            "positioner_cross_reference",
            nxclass,
            description=desc,
            comment=comment,
        )
        for key, value in sorted(header.positioner_xref.items()):
            write_dataset(group, key, value)


def positioner_xref_postprocessing(header):
    if not hasattr(header, "o") or not hasattr(header, "O"):
        return
    if not hasattr(header, "positioner_xref"):
        header.positioner_xref = {}  # mnemonic:name
    for row_number, mne_row in enumerate(header.o):
        name_row = header.O[row_number]
        for column_number, mne in enumerate(mne_row):
            header.positioner_xref[mne] = name_row[column_number]


[docs]@six.add_metaclass(AutoRegister)
class SPEC_Positioners(ControlLineHandler):

    """
    **#P** -- positioner values at start of scan (numbered rows: #P0, #P1, ...)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader) : **O** : label
    * (SpecDataFileScan): **positioner** : {label: value}

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **positioners** in the *NXentry* group, such as */S1/positioners*

      * datasets created from dictionary <scan>.positioner

    """

    key = r"#P\d+"
    scan_attributes_defined = ["P", "positioner"]

[docs]    def process(self, text, scan, *args, **kws):
        if isinstance(scan, SpecDataFileHeader):
            scan = scan.getLatestScan()
        content = strip_first_word(text)
        if content == "":
            content = []
        else:
            content = content.split()
        scan.P.append(content)
        scan.addPostProcessor("motor_positions", self.postprocess)

[docs]    def postprocess(self, scan, *args, **kws):
        """
        interpret the motor positions from the scan header

        :param SpecDataFileScan scan: data from a single SPEC scan
        """
        scan.positioner = OrderedDict()
        for row, values in enumerate(scan.P):
            if row >= len(scan.header.O):
                scan.add_interpreter_comment(
                    "#P%d found without #O%d" % (row, row)
                )
                continue
            for col, val in enumerate(values):
                if col >= len(scan.header.O[row]):
                    scan.add_interpreter_comment(
                        "extra value in #P%d position %d, no matching label in #O%d"
                        % (row, col + 1, row)
                    )
                    continue
                mne = scan.header.O[row][col]
                scan.positioner[mne] = float(val)
        if len(scan.positioner) > 0:
            scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        desc = "SPEC positioners (#P & #O lines)"
        group = makeGroup(
            h5parent, "positioners", nxclass, description=desc
        )
        # writer.save_dict(group, scan.positioner)
        for k, v in scan.positioner.items():
            safe_name = clean_name(k)
            pg = openGroup(group, safe_name, "NXpositioner")
            write_dataset(pg, "name", safe_name, spec_name=k)
            write_dataset(pg, "value", v, spec_name=k)
        nxinstrument = openGroup(h5parent, "instrument", "NXinstrument")
        makeLink(h5parent, group, nxinstrument.name + "/positioners")


[docs]@six.add_metaclass(AutoRegister)
class SPEC_HKL(ControlLineHandler):

    """
    **#Q** -- :math:`Q` (:math:`hkl`) at start of scan

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **Q**

    HDF5/NeXus REPRESENTATION

    * Dataset named **Q** in the *NXentry* group, such as */S1/M*
    """

    key = r"#Q"
    scan_attributes_defined = ["Q"]

[docs]    def process(self, text, scan, *args, **kws):
        s = strip_first_word(text)
        if len(s) > 0:
            scan.Q = list(map(float, s.split()))
            scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        desc = "hkl at start of scan"
        write_dataset(h5parent, "Q", scan.Q, description=desc)


[docs]@six.add_metaclass(AutoRegister)
class SPEC_CountTime(ControlLineHandler):

    """
    **#T** -- counting against this constant number of seconds (see #M)

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **T**

    HDF5/NeXus REPRESENTATION

    * Dataset named **T** in the *NXentry* group, such as */S1/T*
    * Dataset named **counting_basis** in the *NXentry* group with
      value *SPEC scan with constant counting time*, such as */S1/counting_basis*

    """

    key = r"#T"
    scan_attributes_defined = ["T", "time_name"]

[docs]    def process(self, text, scan, *args, **kws):
        text = strip_first_word(text)
        pos = text.find(" ")
        scan.T = text[:pos]
        scan.time_name = text[pos:].strip().lstrip("(").rstrip(")")

        scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        desc = "SPEC scan with constant counting time"
        write_dataset(h5parent, "counting_basis", desc)
        write_dataset(
            h5parent, "T", float(scan.T), units="s", description=desc
        )


[docs]@six.add_metaclass(AutoRegister)
class SPEC_UserReserved(ControlLineHandler):

    """
    **#U** -- Reserved for user

    IN-MEMORY REPRESENTATION

    * (SpecDataFileHeader): **U**, [*str*]
    * (SpecDataFileScan): **U**, [*str*]

    HDF5/NeXus REPRESENTATION

    * Within a group named **UserReserved** in the *NXentry* group:
      dataset(s) named **header_##** (from the SPEC data file header
      section) or **item_##** (from the SPEC data file scan section),
      such as */S1/UserReserved/header_1* and  */S1/UserReserved/item_5*
    """

    key = r"#U"
    scan_attributes_defined = ["U"]

[docs]    def process(self, text, sdf_object, *args, **kws):
        text = strip_first_word(text)
        if not hasattr(sdf_object, "U"):
            sdf_object.U = []
        sdf_object.U.append(text.strip())

        sdf_object.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, sdf_object, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        desc = 'SPEC control line "#U: Reserved for user"'
        group = openGroup(
            h5parent, "UserReserved", "NXnote", description=desc
        )
        if isinstance(sdf_object, SpecDataFileHeader):
            tag = "header"
        else:
            tag = "item"
        for i, text in enumerate(sdf_object.U):
            key = "%s_%d" % (tag, i + 1)
            write_dataset(
                group, key, text, description="#U line %d" % (i + 1)
            )


[docs]@six.add_metaclass(AutoRegister)
class SPEC_TemperatureSetPoint(ControlLineHandler):

    """
    **#X** -- Temperature Set Point (desired temperature)

    The default declaration of the #X control line is written::

         def Fheader '_cols++;printf("#X %gKohm (%gC)\\n",TEMP_SP,DEGC_SP)'

    The supplied macro alters this slightly (replacing %g with %f)
    and uses the :meth:`spec2nexus.scanf.scanf` implementation with this format::

        fmt = "#X %fKohm (%fC)"

    Depending on the circumstances, this might be a good candidate to override
    with a custom *ControlLineHandler* that parses the data as written.
    If the conversion process fails for any reason in this implementation, the *#X* line is ignored.

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **TEMP_SP**
    * (SpecDataFileScan): **DEGC_SP**

    HDF5/NeXus REPRESENTATION

    * Dataset named **TEMP_SP** in the *NXentry* group, such as */S1/TEMP_SP*
    * Dataset named **DEGC_SP** in the *NXentry* group, such as */S1/DEGC_SP*
    """

    key = r"#X"
    scan_attributes_defined = ["TEMP_SP", "DEGC_SP"]

[docs]    def process(self, text, scan, *args, **kws):
        # Try a list of formats until one succeeds
        format_list = [
            "#X %fKohm (%fC)",
            # "#X %g %g",        # note: %g specifier is not available
            "#X %f %f",
        ]
        for fmt in format_list:
            result = scanf(fmt, text)
            if result is not None:
                scan.TEMP_SP, scan.DEGC_SP = result
                scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        # consider putting this info under NXsample or NXentry/metadata
        if hasattr(scan, "TEMP_SP"):
            write_dataset(
                h5parent,
                "TEMP_SP",
                scan.TEMP_SP,
                description="temperature set point",
            )
        if hasattr(scan, "DEGC_SP"):
            write_dataset(
                h5parent,
                "DEGC_SP",
                scan.DEGC_SP,
                units="C",
                description="temperature set point (C)",
            )


[docs]@six.add_metaclass(AutoRegister)
class SPEC_DataLine(ControlLineHandler):

    """
    **(scan_data)** -- scan data line

    Scan data could include interspersed MCA data or
    even describe 2-D or 3-D data.  T
    his method reads the data lines and
    buffers them for post-processing in
    :meth:`spec2nexus.plugins.spec_common_spec2nexus.data_lines_postprocessing`.

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **data_lines** : values
    * (SpecDataFileScan): **data** : {labels: values}

    HDF5/NeXus REPRESENTATION

    * *NXdata* group named **data** in the *NXentry* group,
      such as */S1/data*

    * datasets with names supplied in **L**, array values
      collected in **data_lines**

    """

    # key = r'[+-]?\d*\.?\d?'
    # use custom key match since regexp for floats is tedious!
    key = SCAN_DATA_KEY
    scan_attributes_defined = ["data", "data_lines"]

[docs]    def match_key(self, text):
        """
        Easier to try conversion to number than construct complicated regexp
        """
        try:
            float(text.strip().split()[0])
            return True
        except ValueError:
            return False

[docs]    def process(self, text, scan, *args, **kws):
        scan.data_lines.append(text)

        # defer processing since comments and MCA data may
        # intersperse the scan data
        scan.addPostProcessor(SCAN_DATA_KEY, self.postprocess)

[docs]    def postprocess(self, scan, *args, **kws):
        data_lines_postprocessing(scan)


# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

# MCA: multi-channel analyzer

# see ESRF BLISS group: http://www.esrf.eu/blissdb/macros/getsource.py?macname=mca.mac


[docs]@six.add_metaclass(AutoRegister)
class SPEC_MCA(ControlLineHandler):

    """
    **#@MCA** -- MCA data formatting declaration (ignored for now)

    declares this scan contains MCA data (SPEC's array_dump() format, such as ``"#@MCA 16C"``)

    From documentation provided by the ESRF BLISS group:
    (http://www.esrf.eu/blissdb/macros/getsource.py?macname=mca.mac)

        #@MCA 16C
        Format string passed to data_dump() function.
        This format string is held by the global variable "MCA_FMT" and can then been adapted to particular needs.
        "%%16C" is the default. It dumps data on 1 line, cut every 16 points::

            @A 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\\
             0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\\
             0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\\
             0 0 0 0 0 0 0 0 0 0 0 ...

        "%%16" would do the same without any backslash
        "1" would dump 1 point per line, ...

    """

    key = r"#@MCA"

[docs]    def process(self, text, scan, *args, **kws):
        # #@MCA 16C
        # Isn't this only informative to how the data is presented in the file?
        pass  # not sure how to handle this, ignore it for now


[docs]@six.add_metaclass(AutoRegister)
class SPEC_MCA_Array(ControlLineHandler):

    """
    **@A** -- MCA Array data

    MCA data. Each value is the content of one channel, or an
    integrated value over several channels if a reduction was applied.

    Since the MCA Array data is interspersed with scan data,
    this method reads the data lines and buffers them for post-processing in
    :meth:`spec2nexus.plugins.spec_common_spec2nexus.data_lines_postprocessing`.

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **data_lines** : values
    * (SpecDataFileScan): **data** : {labels: values}

    HDF5/NeXus REPRESENTATION

    * *NXdata* group named **data** in the *NXentry* group, such as */S1/data*

      * Dataset **_mca_** : *float* MCA data reported on *@A* lines
      * Dataset **_mca_channel_**: provided as HDF5 dimension scale for **_mca_** dataset
          * if CALIB data specified: *float* scaled MCA channels -- :math:`x_k = a +bk + ck^2`
          * if CALIB data not specified: *int* MCA channel numbers

    """

    key = r"@A\d*"
    # continued lines will be matched by SPEC_DataLine
    # process these lines only after all lines have been read
    scan_attributes_defined = ["data_lines"]

    # TODO: need more examples of MCA spectra in SPEC files to improve this
    # Are there any other MCA spectra (such as @B) possible?

[docs]    def process(self, text, scan, *args, **kws):
        # acquire like numerical data, handle in postprocessing
        scan.data_lines.append(text)
        scan.addPostProcessor(SCAN_DATA_KEY, self.postprocess)

[docs]    def postprocess(self, scan, *args, **kws):
        data_lines_postprocessing(scan)


[docs]@six.add_metaclass(AutoRegister)
class SPEC_MCA_Calibration(ControlLineHandler):

    """
    **#@CALIB** -- coefficients to compute a scale based on the MCA channel number

    :math:`x_k = a +bk + ck^2` for MCA data, :math:`k` is channel number

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **MCA['CALIB']** = ``dict(a, b, c)``

    HDF5/NeXus REPRESENTATION

    * defines a dimension scale for MCA data
    * *NXnote* group named **MCA** in the *NXentry* group, such as */S1/MCA*

      * Dataset **calib_a** : *float*
      * Dataset **calib_b** : *float*
      * Dataset **calib_c** : *float*

    """

    # key = r'#@CALIB'
    # accept upper or lower case variants
    # https://certif.com/spec_help/scans.html
    key = r"#@[cC][aA][lL][iI][bB]"
    scan_attributes_defined = ["MCA"]

[docs]    def process(self, text, scan, *args, **kws):
        # #@CALIB a b c
        # #@Calib 0.0501959 0.0141105 0 mca1
        s = strip_first_word(text).split()
        a, b, c = list(map(float, s[0:3]))

        if not hasattr(scan, "MCA"):
            scan.MCA = {}
        if "CALIB" not in scan.MCA:
            scan.MCA["CALIB"] = {}

        scan.MCA["CALIB"]["a"] = a
        scan.MCA["CALIB"]["b"] = b
        scan.MCA["CALIB"]["c"] = c
        scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if hasattr(scan, "MCA"):
            if "CALIB" in scan.MCA:
                mca_group = openGroup(
                    h5parent, "MCA", nxclass, description="MCA metadata"
                )
                calib_dict = scan.MCA["CALIB"]
                for key in "a b c".split():
                    if key in calib_dict:
                        write_dataset(
                            mca_group, "calib_" + key, calib_dict[key]
                        )


[docs]@six.add_metaclass(AutoRegister)
class SPEC_MCA_ChannelInformation(ControlLineHandler):

    """
    **#@CHANN** -- MCA channel information

    number_saved, first_saved, last_saved, reduction_coef

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **MCA['CALIB']** = ``dict(number_saved, first_saved, last_saved, reduction_coef)``

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **MCA** in the *NXentry* group, such as */S1/MCA*

      * Dataset **number_saved** : *int* number of channels saved
      * Dataset **first_saved** : *int* first channel saved
      * Dataset **first_saved** : *int* last channel saved
      * Dataset **reduction_coef** : *float* reduction coefficient

    """

    key = r"#@CHANN"
    scan_attributes_defined = ["MCA"]

[docs]    def process(self, text, scan, *args, **kws):
        # #@CHANN 1201 1110 1200 1
        s = strip_first_word(text).split()
        number_saved, first_saved, last_saved = list(map(int, s[0:3]))
        reduction_coef = float(s[-1])

        if not hasattr(scan, "MCA"):
            scan.MCA = {}

        scan.MCA["number_saved"] = number_saved
        scan.MCA["first_saved"] = first_saved
        scan.MCA["last_saved"] = last_saved
        scan.MCA["reduction_coef"] = reduction_coef
        scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if hasattr(scan, "MCA"):
            mca_group = openGroup(
                h5parent, "MCA", nxclass, description="MCA metadata"
            )
            mca = scan.MCA
            for (
                key
            ) in "number_saved  first_saved  last_saved  reduction_coef".split():
                if key in mca:
                    write_dataset(mca_group, key, mca[key])

            # make link in NXinstrument group
            nxinstrument = openGroup(
                h5parent, "instrument", "NXinstrument"
            )
            if "MCA" not in nxinstrument:
                makeLink(h5parent, mca_group, nxinstrument.name + "/MCA")


[docs]@six.add_metaclass(AutoRegister)
class SPEC_MCA_CountTime(ControlLineHandler):

    """
    **#@CTIME** -- MCA count times

    preset_time, elapsed_live_time, elapsed_real_time

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **MCA['CALIB']** = ``dict(preset_time, elapsed_live_time, elapsed_real_time)``

    HDF5/NeXus REPRESENTATION

    * *NXnote* group named **MCA** in the *NXentry* group, such as */S1/MCA*

      * Dataset **preset_time** : *float*
      * Dataset **elapsed_live_time** : *float*
      * Dataset **elapsed_real_time** : *float*

    """

    key = r"#@CTIME"
    scan_attributes_defined = ["MCA"]

[docs]    def process(self, text, scan, *args, **kws):
        s = strip_first_word(text).split()
        preset_time, elapsed_live_time, elapsed_real_time = list(
            map(float, s)
        )

        if not hasattr(scan, "MCA"):
            scan.MCA = {}

        scan.MCA["preset_time"] = preset_time
        scan.MCA["elapsed_live_time"] = elapsed_live_time
        scan.MCA["elapsed_real_time"] = elapsed_real_time
        scan.addH5writer(self.key, self.writer)

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if hasattr(scan, "MCA"):
            mca_group = openGroup(
                h5parent, "MCA", nxclass, description="MCA metadata"
            )
            mca = scan.MCA
            for (
                key
            ) in (
                "preset_time  elapsed_live_time  elapsed_real_time".split()
            ):
                if key in mca:
                    write_dataset(mca_group, key, mca[key], units="s")

            # make link in NXinstrument group
            nxinstrument = openGroup(
                h5parent, "instrument", "NXinstrument"
            )
            if "MCA" not in nxinstrument:
                makeLink(h5parent, mca_group, nxinstrument.name + "/MCA")


[docs]@six.add_metaclass(AutoRegister)
class SPEC_MCA_RegionOfInterest(ControlLineHandler):

    """
    **#@ROI** -- MCA ROI (Region Of Interest) channel information

    ROI_name, first_chan, last_chan

    IN-MEMORY REPRESENTATION

    * (SpecDataFileScan): **MCA['ROI']** = {ROI_name:dict(first_chan, last_chan)}

    HDF5/NeXus REPRESENTATION

    * *NXnote* group **ROI** in
      in *NXnote* group named **MCA**
      in the *NXentry* group, such as */S1/MCA/ROI*

      * Dataset **{ROI_name}** : *int* [first_chan, last_chan]

    """

    key = r"#@ROI"
    scan_attributes_defined = ["MCA"]

[docs]    def process(self, text, scan, *args, **kws):
        text = strip_first_word(text)

        pos = text.rfind(" ")
        last_chan = int(text[pos:])
        text = text[:pos]

        pos = text.rfind(" ")
        first_chan = int(text[pos:])
        ROI_name = text[:pos].strip()

        if not hasattr(scan, "MCA"):
            scan.MCA = {}
        if "ROI" not in scan.MCA:
            scan.MCA["ROI"] = {}

        scan.MCA["ROI"][ROI_name] = {}
        scan.MCA["ROI"][ROI_name]["first_chan"] = first_chan
        scan.MCA["ROI"][ROI_name]["last_chan"] = last_chan

[docs]    def writer(self, h5parent, writer, scan, nxclass=None, *args, **kws):
        """Describe how to store this data in an HDF5 NeXus file"""
        if hasattr(scan, "MCA"):
            if hasattr(scan.MCA, "ROI"):
                mca_group = openGroup(
                    h5parent, "MCA", nxclass, description="MCA metadata"
                )
                roi_group = openGroup(
                    mca_group,
                    "ROI",
                    nxclass,
                    description="Regions Of Interest",
                )
                roi_dict = scan.MCA["ROI"]
                for key, roi in roi_dict.items():
                    dataset = [roi["first_chan"], roi["last_chan"]]
                    desc = "first_chan, last_chan"
                    write_dataset(
                        roi_group,
                        key,
                        dataset,
                        description=desc,
                        units="channel",
                    )

            # make link in NXinstrument group
            nxinstrument = openGroup(
                h5parent, "instrument", "NXinstrument"
            )
            if "MCA" not in nxinstrument:
                makeLink(h5parent, mca_group, nxinstrument.name + "/MCA")


# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -


[docs]def combine_split_NM_lines(nm, data_lines):
    """
    combine split lines of data

        #N N [M]

    Indicates there are N columns of data.
    If M is present, it indicates there
    are M sets of data columns on each line.
    """
    if len(nm) == 1:
        # no split lines indicated
        return data_lines
    dl = []
    N, M = nm
    buf = ""
    for line in data_lines:
        if line.startswith("@A"):
            if len(buf) > 0:
                dl.append(buf)
            buf = []
            dl.append(line)
        else:
            if len(buf) > 0 and buf[-1] != " ":
                buf += " "  # ensure whitespace delimiter
            buf += line
            if len(buf.split()) == N:  # assumption here!
                dl.append(buf)
                buf = ""

    return dl


[docs]def data_lines_postprocessing(scan):
    """
    interpret the data lines from the body of the scan

    :param SpecDataFileScan scan: data from a single SPEC scan
    """
    if len(scan.L) == 1 and scan.L[0].split(" ") == scan.N[0]:
        # https://github.com/prjemian/spec2nexus/issues/216#issuecomment-569745297
        raise ValueError(
            "file {}: "
            "#S {}: "
            "#L lines must use two (2) spaces between labels".format(
                scan.specFile, scan.S
            )
        )

    if len(scan.L) != scan.N[0]:
        # https://github.com/prjemian/spec2nexus/issues/216
        raise ValueError(
            "file {}: "
            "#S {}: "
            "# of given column labels in #L ({}) "
            "does not match # specified in #N ({})".format(
                scan.specFile, scan.S, len(scan.L), scan.N[0]
            )
        )

    # first, get the column labels, rename redundant labels to be unique
    # the unique labels will be the scan.data dictionary keys
    scan.data = {}
    for col in range(len(scan.L)):
        label = scan._unique_key(scan.L[col], scan.data.keys())
        # need to guard when same column label is used more than once
        if label != scan.L[col]:
            scan.L[col] = label  # rename this column's label
        scan.data[label] = []  # list for the column's data
    num_columns = len(scan.data)

    # any MCA spectra?
    data_lines = scan.data_lines
    if "@A" in [line[:2] for line in data_lines if len(line) > 2]:
        # There can be more than 1 MCA spectrum specified
        # scan.data[MCA_DATA_KEY] = {}  keys: mca or mca1, mca2, ...
        scan.data[MCA_DATA_KEY] = {}

    data_lines = combine_split_NM_lines(scan.N, data_lines)

    # interpret the data lines from the body of the scan
    for values in data_lines:
        if values.startswith("@A"):
            # which MCA spectrum is THIS one?
            parts = values.split()
            if parts[0] == "@A":  # @A: mca
                key = r"mca"
            else:
                key = r"mca" + parts[0][2:]  # @A1: mca1, @A2: mca2, ...
            if key not in scan.data[MCA_DATA_KEY]:
                scan.data[MCA_DATA_KEY][key] = []
            # accumulate this spectrum
            mca_spectrum = list(map(float, parts[1:]))
            scan.data[MCA_DATA_KEY][key].append(mca_spectrum)
        else:
            try:
                buf = scan._interpret_data_row(values)
                if len(buf) == num_columns:
                    # only keep complete rows
                    for label, val in buf.items():
                        scan.data[label].append(val)
            except ValueError as _exc:
                pass  # ignore bad data lines (could save it as such ...)
    scan.addH5writer(SCAN_DATA_KEY, data_lines_writer)


[docs]def data_lines_writer(h5parent, writer, scan, *args, **kws):
    """Describe how to store scan data in an HDF5 NeXus file"""
    desc = "SPEC scan data"
    nxdata = makeGroup(h5parent, "data", "NXdata", description=desc)
    writer.save_data(nxdata, scan)