mne-tools · drammock · Jun 26, 2025 · Jun 26, 2025 · Jul 1, 2025 · Jul 4, 2025
@@ -43,6 +43,7 @@ __all__ = [
     "read_raw_nihon",
     "read_raw_nirx",
     "read_raw_nsx",
+    "read_raw_otb",
     "read_raw_persyst",
     "read_raw_snirf",
     "show_fiff",
@@ -87,5 +88,6 @@ from .nicolet import read_raw_nicolet
 from .nihon import read_raw_nihon
 from .nirx import read_raw_nirx
 from .nsx import read_raw_nsx
+from .otb import read_raw_otb
 from .persyst import read_raw_persyst
 from .snirf import read_raw_snirf
diff --git a/mne/io/otb/__init__.py b/mne/io/otb/__init__.py
@@ -0,0 +1,7 @@
+"""OTB module for reading EMG data in OTB4 and OTB+ formats."""
+
+# Authors: The MNE-Python contributors.
+# License: BSD-3-Clause
+# Copyright the MNE-Python contributors.
+
+from .otb import read_raw_otb
diff --git a/mne/io/otb/otb.py b/mne/io/otb/otb.py
@@ -0,0 +1,308 @@
+# Authors: The MNE-Python contributors.
+# License: BSD-3-Clause
+# Copyright the MNE-Python contributors.
+
+import tarfile
+from collections import Counter
+from datetime import datetime, timezone
+from pathlib import Path
+
+import numpy as np
+from defusedxml import ElementTree as ET
+
+from ..._fiff.meas_info import create_info
+from ...utils import _check_fname, fill_doc, logger, verbose, warn
+from ..base import BaseRaw
+
+
+def _parse_patient_xml(tree):
+    """Convert an ElementTree to a dict."""
+
+    def _parse_sex(sex):
+        # TODO For devices that generate `.otb+` files, the recording GUI only has M or
+        # F options and choosing one is mandatory. For `.otb4` the field is optional.
+        return dict(m=1, f=2)[sex.lower()[0]] if sex else 0  # 0 means "unknown"
+
+    def _parse_date(dt):
+        return datetime.fromisoformat(dt).date()
+
+    subj_info_mapping = (
+        ("family_name", "last_name", str),
+        ("first_name", "first_name", str),
+        ("weight", "weight", float),
+        ("height", "height", float),
+        ("sex", "sex", _parse_sex),
+        ("birth_date", "birthday", _parse_date),
+    )
+    subject_info = dict()
+    for source, target, func in subj_info_mapping:
+        value = tree.find(source)
+        if value is not None:
+            subject_info[target] = func(value.text)
+    return subject_info
+
+
+@fill_doc
+class RawOTB(BaseRaw):
+    """Raw object from an OTB file.
+
+    Parameters
+    ----------
+    fname : path-like
+        Path to the OTB file.
+    %(verbose)s
+
+    See Also
+    --------
+    mne.io.Raw : Documentation of attributes and methods.
+    """
+
+    @verbose
+    def __init__(self, fname, *, verbose=None):
+        # Adapted from the MATLAB code at:
+        # https://github.com/OTBioelettronica/OTB-Matlab/tree/main/MATLAB%20Open%20and%20Processing%20OTBFiles
+        # with permission to relicense as BSD-3 granted here:
+        # https://github.com/OTBioelettronica/OTB-Python/issues/2#issuecomment-2979135882
+        fname = str(_check_fname(fname, "read", True, "fname"))
+        if fname.endswith(".otb4"):
+            raise NotImplementedError(".otb4 format is not yet supported")
+        logger.info(f"Loading {fname}")
+
+        self.preload = True  # lazy loading not supported
+
+        highpass = list()
+        lowpass = list()
+        ch_names = list()
+        ch_types = list()
+
+        # TODO verify these are the only non-data channel IDs (other than "AUX*" which
+        # are handled separately via glob)
+        NON_DATA_CHS = ("Quaternion", "BufferChannel", "RampChannel", "LoadCellChannel")
+        POWER_SUPPLY = 3.3  # volts
+
+        with tarfile.open(fname, "r") as fid:
+            fnames = fid.getnames()
+            # the .sig file is the binary channel data
+            sig_fname = [_fname for _fname in fnames if _fname.endswith(".sig")]
+            if len(sig_fname) != 1:
+                raise NotImplementedError(
+                    "multiple .sig files found in the OTB+ archive. Probably this "
+                    "means that an acquisition was imported into another session. "
+                    "This is not yet supported; please open an issue at "
+                    "https://github.com/mne-tools/mne-emg/issues if you want us to add "
+                    "such support."
+                )
+            sig_fname = sig_fname[0]
+            data_size_bytes = fid.getmember(sig_fname).size
+            # the .xml file with the matching basename contains signal metadata
+            metadata_fname = str(Path(sig_fname).with_suffix(".xml"))
+            metadata = ET.fromstring(fid.extractfile(metadata_fname).read())
+            # patient info
+            patient_info_xml = ET.fromstring(fid.extractfile("patient.xml").read())
+        # structure of `metadata` is:
+        # Device
+        # └ Channels
+        #   ├ Adapter
+        #   │ ├ Channel
+        #   │ ├ ...
+        #   │ └ Channel
+        #   ├ ...
+        #   └ Adapter
+        #     ├ Channel
+        #     ├ ...
+        #     └ Channel
+        assert metadata.tag == "Device"
+        sfreq = float(metadata.attrib["SampleFrequency"])
+        n_chan = int(metadata.attrib["DeviceTotalChannels"])
+        bit_depth = int(metadata.attrib["ad_bits"])
+        model = metadata.attrib["Name"]
+
+        # TODO we may not need this? only relevant for Quattrocento device, and `n_chan`
+        # defined above should already be correct/sufficient
+        # if model := metadata.attrib.get("Model"):
+        #     max_n_chan = int(model[-3:])
+        if bit_depth == 16:
+            _dtype = np.int16
+        elif bit_depth == 24:  # EEG data recorded on OTB devices do this
+            # this is possible but will be a bit tricky, see:
+            # https://stackoverflow.com/a/34128171
+            # https://stackoverflow.com/a/11967503
+            raise NotImplementedError(
+                "OTB+ files with 24-bit data are not yet supported."
+            )
+        else:
+            raise NotImplementedError(
+                f"expected 16- or 24-bit data, but file metadata says {bit_depth}-bit. "
+                "If this file can be successfully read with other software (i.e. it is "
+                "not corrupted), please open an issue at "
+                "https://github.com/mne-tools/mne-emg/issues so we can add support for "
+                "your use case."
+            )
+        gains = np.full(n_chan, np.nan)
+        # check in advance where we'll need to append indices to uniquify ch_names
+        n_ch_by_type = Counter([ch.get("ID") for ch in metadata.iter("Channel")])
+        dupl_ids = [k for k, v in n_ch_by_type.items() if v > 1]
+        # iterate over adapters & channels to extract gain, filters, names, etc
+        for adapter_ix, adapter in enumerate(metadata.iter("Adapter")):
+            adapter_ch_offset = int(adapter.get("ChannelStartIndex"))
+            adapter_gain = float(adapter.get("Gain"))
+            # we only care about lowpass/highpass on the data channels
+            # TODO verify these two are the only non-data adapter types
+            if adapter.get("ID") not in ("AdapterQuaternions", "AdapterControl"):
+                highpass.append(float(adapter.get("HighPassFilter")))
+                lowpass.append(float(adapter.get("LowPassFilter")))
+
+            for ch in adapter.iter("Channel"):
+                ix = int(ch.get("Index"))
+                ch_id = ch.get("ID")
+                # # see if we can parse the adapter name to get row,col info
+                # pattern = re.compile(
+                #     # connector type   inter-elec dist    grid rows    grid cols
+                #     r"(?:[a-zA-Z]+)(?:(?P<ied>\d+)MM)(?P<row>\d{2})(?P<col>\d{2})"
+                # )
+                # if match := pattern.match(ch_id):
+                #     col = ix % int(match["col"])
+                #     row = ix // int(match["row"])
+                #     ch_name = f"EMG_{adapter_ix}({row:02},{col:02})"
+                # elif ch_id
+                # else:
+                #     ch_name = f"EMG_{ix + adapter_ch_offset:03}"
+                # ch_names.append(ch_name)
+                ch_names.append(f"{ch_id}_{ix}" if ch_id in dupl_ids else ch_id)
+                # store gains
+                gains[ix + adapter_ch_offset] = float(ch.get("Gain")) * adapter_gain
+                # TODO verify ch_type for quats, buffer channel, and ramp channel
+                ch_types.append(
+                    "misc"
+                    if ch_id in NON_DATA_CHS or ch_id.lower().startswith("aux")
+                    else "emg"
+                )
+        assert np.isfinite(gains).all()
+
+        # compute number of samples
+        n_samples, extra = divmod(data_size_bytes, (bit_depth // 8) * n_chan)
+        if extra != 0:
+            warn(
+                f"Number of bytes in file ({data_size_bytes}) not evenly divided by "
+                f"number of channels ({n_chan}). File may be corrupted or truncated."
+            )
+        n_samples = int(n_samples)
+
+        # check filter freqs.
+        # TODO filter freqs can vary by adapter, so in theory we might get different
+        # filters for different *data* channels (not just different between data and
+        # misc/aux/whatever).
+        if len(highpass) > 1:
+            warn(
+                "More than one highpass frequency found in file; choosing lowest "
+                f"({min(highpass)})"
+            )
+        if len(lowpass) > 1:
+            warn(
+                "More than one lowpass frequency found in file; choosing highest "
+                f"({max(lowpass)})"
+            )
+        highpass = min(highpass)
+        lowpass = max(lowpass)
+
+        # create info
+        info = create_info(ch_names=ch_names, ch_types=ch_types, sfreq=sfreq)
+        subject_info = _parse_patient_xml(patient_info_xml)
+        device_info = dict(type="OTB", model=model)  # TODO type, model, serial, site
+        site = patient_info_xml.find("place")
+        if site is not None:
+            device_info.update(site=site.text)
+        info.update(subject_info=subject_info, device_info=device_info)
+        with info._unlock():
+            info["highpass"] = highpass
+            info["lowpass"] = lowpass
+            for _ch in info["chs"]:
+                cal = 1 / 2**bit_depth / gains[ix + adapter_ch_offset]
+                _ch.update(cal=cal, range=POWER_SUPPLY)
+            meas_date = patient_info_xml.find("time")
+            if meas_date is not None:
+                info["meas_date"] = datetime.fromisoformat(meas_date.text).astimezone(
+                    timezone.utc
+                )
+
+        # sanity check
+        dur = patient_info_xml.find("duration")
+        if dur is not None:
+            np.testing.assert_almost_equal(
+                float(dur.text), n_samples / sfreq, decimal=3
+            )
+
+        # TODO other fields in patient_info_xml:
+        # protocol_code, pathology, commentsPatient, comments
+
+        # TODO parse files markers_0.xml, markers_1.xml as annotations?
+
+        # populate raw_extras
+        raw_extras = dict(dtype=_dtype, sig_fname=sig_fname)
+        FORMAT_MAPPING = dict(
+            d="double",
+            f="single",
+            i="int",
+            h="short",
+        )
+        orig_format = FORMAT_MAPPING[_dtype().dtype.char]
+
+        super().__init__(
+            info,
+            preload=True,
+            last_samps=(n_samples - 1,),
+            filenames=[fname],
+            orig_format=orig_format,
+            # orig_units="V",  # TODO maybe not needed
+            raw_extras=[raw_extras],
+            verbose=verbose,
+        )
+
+    def _preload_data(self, preload):
+        """Load raw data from an OTB+ file."""
+        _extras = self._raw_extras[0]
+        sig_fname = _extras["sig_fname"]
+
+        with tarfile.open(self.filenames[0], "r") as fid:
+            _data = (
+                np.frombuffer(
+                    fid.extractfile(sig_fname).read(),
+                    dtype=_extras["dtype"],
+                )
+                .reshape(-1, self.info["nchan"])
+                .T
+            )
+        cals = np.array(
+            [
+                _ch["cal"] * _ch["range"] * _ch.get("scale", 1.0)
+                for _ch in self.info["chs"]
+            ]
+        )
+        self._data = _data * cals[:, np.newaxis]
+
+
+@fill_doc
+def read_raw_otb(fname, verbose=None) -> RawOTB:
+    """Reader for an OTB (.otb4/.otb+) recording.
+
+    Parameters
+    ----------
+    fname : path-like
+        Path to the OTB file.
+    %(verbose)s
+
+    Returns
+    -------
+    raw : instance of RawOTB
+        A Raw object containing OTB data.
+        See :class:`mne.io.Raw` for documentation of attributes and methods.
+
+    See Also
+    --------
+    mne.io.Raw : Documentation of attributes and methods of RawPersyst.
+
+    Notes
+    -----
+    ``preload=False`` is not supported for this file format.
+    """
+    return RawOTB(fname, verbose=verbose)