From a4e4439916a2a789cc721b8e0a8a52fb0dc52772 Mon Sep 17 00:00:00 2001 From: Ben Dichter Date: Mon, 12 Aug 2024 12:24:49 -0400 Subject: [PATCH 1/5] add new TimeIntervalsInterface --- src/neuroconv/datainterfaces/__init__.py | 2 + .../text/csv/csvtimeintervalsinterface.py | 4 +- .../text/excel/exceltimeintervalsinterface.py | 4 +- .../text/time_intervals.schema.json | 50 +++++++++++++++++ .../text/timeintervalsinterface.py | 55 ++++++++++++++++++- tests/test_text/test_time_intervals.py | 38 +++++++++++++ 6 files changed, 147 insertions(+), 6 deletions(-) create mode 100644 src/neuroconv/datainterfaces/text/time_intervals.schema.json diff --git a/src/neuroconv/datainterfaces/__init__.py b/src/neuroconv/datainterfaces/__init__.py index 9028c1d42..f45a78639 100644 --- a/src/neuroconv/datainterfaces/__init__.py +++ b/src/neuroconv/datainterfaces/__init__.py @@ -94,6 +94,7 @@ # Text from .text.csv.csvtimeintervalsinterface import CsvTimeIntervalsInterface from .text.excel.exceltimeintervalsinterface import ExcelTimeIntervalsInterface +from .text.timeintervalsinterface import TimeIntervalsInterface interface_list = [ # Ecephys @@ -162,6 +163,7 @@ # Text CsvTimeIntervalsInterface, ExcelTimeIntervalsInterface, + TimeIntervalsInterface, ] interfaces_by_category = dict( diff --git a/src/neuroconv/datainterfaces/text/csv/csvtimeintervalsinterface.py b/src/neuroconv/datainterfaces/text/csv/csvtimeintervalsinterface.py index 4904e1c19..b1ce92fcd 100644 --- a/src/neuroconv/datainterfaces/text/csv/csvtimeintervalsinterface.py +++ b/src/neuroconv/datainterfaces/text/csv/csvtimeintervalsinterface.py @@ -1,10 +1,10 @@ import pandas as pd -from ..timeintervalsinterface import TimeIntervalsInterface +from ..timeintervalsinterface import BaseTimeIntervalsInterface from ....utils.types import FilePathType -class CsvTimeIntervalsInterface(TimeIntervalsInterface): +class CsvTimeIntervalsInterface(BaseTimeIntervalsInterface): """Interface for adding data from a .csv file as a TimeIntervals object.""" display_name = "CSV time interval table" diff --git a/src/neuroconv/datainterfaces/text/excel/exceltimeintervalsinterface.py b/src/neuroconv/datainterfaces/text/excel/exceltimeintervalsinterface.py index 96a375d50..5851af99e 100644 --- a/src/neuroconv/datainterfaces/text/excel/exceltimeintervalsinterface.py +++ b/src/neuroconv/datainterfaces/text/excel/exceltimeintervalsinterface.py @@ -2,11 +2,11 @@ import pandas as pd -from ..timeintervalsinterface import TimeIntervalsInterface +from ..timeintervalsinterface import BaseTimeIntervalsInterface from ....utils.types import FilePathType -class ExcelTimeIntervalsInterface(TimeIntervalsInterface): +class ExcelTimeIntervalsInterface(BaseTimeIntervalsInterface): """Interface for adding data from an Excel file to NWB as a TimeIntervals object.""" display_name = "Excel time interval table" diff --git a/src/neuroconv/datainterfaces/text/time_intervals.schema.json b/src/neuroconv/datainterfaces/text/time_intervals.schema.json new file mode 100644 index 000000000..ba3667be0 --- /dev/null +++ b/src/neuroconv/datainterfaces/text/time_intervals.schema.json @@ -0,0 +1,50 @@ +{ + "type": "object", + "patternProperties": { + "^[a-zA-Z0-9_]+$": { + "type": "object", + "properties": { + "description": { + "type": "string" + }, + "columns": { + "type": "array", + "items": { + "type": "object", + "properties": { + "name": { + "type": "string" + }, + "description": { + "type": "string" + } + }, + "required": [ + "name" + ], + "additionalProperties": false + } + }, + "data": { + "type": "array", + "items": { + "type": "object", + "properties": { + "start_time": { + "type": "number" + }, + "stop_time": { + "type": "number" + } + }, + "required": [ + "start_time", + "stop_time" + ], + "additionalProperties": true + } + } + } + } + } +} \ No newline at end of file diff --git a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py index dd7f491f8..d35286c60 100644 --- a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py +++ b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py @@ -4,14 +4,15 @@ import numpy as np from pynwb import NWBFile +from pynwb.epoch import TimeIntervals from ...basedatainterface import BaseDataInterface from ...tools.text import convert_df_to_time_intervals -from ...utils.dict import load_dict_from_file +from ...utils.dict import load_dict_from_file, DeepDict from ...utils.types import FilePathType -class TimeIntervalsInterface(BaseDataInterface): +class BaseTimeIntervalsInterface(BaseDataInterface): """Abstract Interface for time intervals.""" keywords = ("table", "trials", "epochs", "time intervals") @@ -154,3 +155,53 @@ def add_to_nwbfile( @abstractmethod def _read_file(self, file_path: FilePathType, **read_kwargs): pass + + +class TimeIntervalsInterface(BaseDataInterface): + + @classmethod + def add_to_nwbfile(cls, nwbfile: NWBFile, metadata: DeepDict) -> None: + + for table_name, table_metadata in metadata["TimeIntervals"].items(): + time_intervals = TimeIntervals( + name=table_name, + description=table_metadata.get("description", "no description") + ) + + # add custom columns + for column_name, column_metadata in table_metadata["columns"].items(): + if column_name not in ("start_time", "stop_time"): + time_intervals.add_column(name=column_name, description=column_metadata.get("description", "no description")) + # handle any custom columns that were not defined in columns object + for column_name in table_metadata["data"][0]: + if column_name not in time_intervals.colnames + ("start_time", "stop_time"): + time_intervals.add_column(name=key, description="no description") + # add data + for row in table_metadata["data"]: + time_intervals.add_interval(**row) + + # add to nwbfile + if table_name == "trials": + nwbfile.trials = time_intervals + else: + nwbfile.add_time_intervals(time_intervals) + + + def get_metadata_schema(self) -> dict: + metadata_schema = super().get_metadata_schema() + + time_intervals_schema = load_dict_from_file(Path(__file__).parent / "time_intervals.schema.json") + metadata_schema["properties"]["TimeIntervals"] = time_intervals_schema + return metadata_schema + + def get_metadata(self) -> dict: + metadata = super().get_metadata() + metadata["TimeIntervals"]["trials"] = dict( + columns=dict( + start_time=dict(description="start time of the trial"), + stop_time=dict(description="stop time of the trial"), + ), + data=[], + ) + + return metadata diff --git a/tests/test_text/test_time_intervals.py b/tests/test_text/test_time_intervals.py index 761879bd8..e624828bb 100644 --- a/tests/test_text/test_time_intervals.py +++ b/tests/test_text/test_time_intervals.py @@ -8,6 +8,7 @@ from neuroconv.datainterfaces import ( CsvTimeIntervalsInterface, ExcelTimeIntervalsInterface, + TimeIntervalsInterface, ) from neuroconv.tools.nwb_helpers import make_nwbfile_from_metadata from neuroconv.tools.text import convert_df_to_time_intervals @@ -96,3 +97,40 @@ def test_csv_round_trip_rename(tmp_path): def test_get_metadata_schema(): interface = CsvTimeIntervalsInterface(trials_csv_path) interface.get_metadata_schema() + + +def test_trials(): + metadata = dict( + NWBFile=dict( + session_start_time=datetime.now().astimezone(), + ), + TimeIntervals=dict( + trials=dict( + columns=dict( + start_time=dict(description="start time of the trial"), + stop_time=dict(description="stop time of the trial"), + correct=dict(description="correct or not"), + ), + data=[ + dict(start_time=0.0, stop_time=1.0, correct=True), + dict(start_time=1.0, stop_time=2.0, correct=False), + ], + ), + new_table=dict( + columns=dict( + stim_id=dict(description="stimulus ID"), + ), + data=[ + dict(start_time=0.0, stop_time=1.0, stim_id=0), + dict(start_time=1.0, stop_time=2.0, stim_id=1), + ], + ) + ), + ) + + nwbfile = TimeIntervalsInterface().create_nwbfile(metadata) + assert nwbfile.trials.correct.description == "correct or not" + assert_array_equal(nwbfile.trials.correct[:], [True, False]) + assert_array_equal(nwbfile.trials.start_time[:], [0.0, 1.0]) + + assert_array_equal(nwbfile.intervals["new_table"].stim_id[:], [0, 1]) From 22d6aff3c93af9dc04bba51a7b59552b67f01e73 Mon Sep 17 00:00:00 2001 From: Ben Dichter Date: Mon, 12 Aug 2024 12:25:54 -0400 Subject: [PATCH 2/5] add metadata --- src/neuroconv/datainterfaces/text/timeintervalsinterface.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py index d35286c60..80fa1ca71 100644 --- a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py +++ b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py @@ -159,6 +159,9 @@ def _read_file(self, file_path: FilePathType, **read_kwargs): class TimeIntervalsInterface(BaseDataInterface): + display_name = "Time Intervals" + keywords = ("table", "trials", "epochs", "time intervals") + @classmethod def add_to_nwbfile(cls, nwbfile: NWBFile, metadata: DeepDict) -> None: From 1b8012f97bda16b16e995e956adc363e539a9ed7 Mon Sep 17 00:00:00 2001 From: "pre-commit-ci[bot]" <66853113+pre-commit-ci[bot]@users.noreply.github.com> Date: Mon, 12 Aug 2024 16:29:53 +0000 Subject: [PATCH 3/5] [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci --- .../datainterfaces/text/time_intervals.schema.json | 2 +- .../datainterfaces/text/timeintervalsinterface.py | 10 +++++----- tests/test_text/test_time_intervals.py | 4 ++-- 3 files changed, 8 insertions(+), 8 deletions(-) diff --git a/src/neuroconv/datainterfaces/text/time_intervals.schema.json b/src/neuroconv/datainterfaces/text/time_intervals.schema.json index ba3667be0..32c3a891a 100644 --- a/src/neuroconv/datainterfaces/text/time_intervals.schema.json +++ b/src/neuroconv/datainterfaces/text/time_intervals.schema.json @@ -47,4 +47,4 @@ } } } -} \ No newline at end of file +} diff --git a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py index 80fa1ca71..8f9970460 100644 --- a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py +++ b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py @@ -8,7 +8,7 @@ from ...basedatainterface import BaseDataInterface from ...tools.text import convert_df_to_time_intervals -from ...utils.dict import load_dict_from_file, DeepDict +from ...utils.dict import DeepDict, load_dict_from_file from ...utils.types import FilePathType @@ -167,14 +167,15 @@ def add_to_nwbfile(cls, nwbfile: NWBFile, metadata: DeepDict) -> None: for table_name, table_metadata in metadata["TimeIntervals"].items(): time_intervals = TimeIntervals( - name=table_name, - description=table_metadata.get("description", "no description") + name=table_name, description=table_metadata.get("description", "no description") ) # add custom columns for column_name, column_metadata in table_metadata["columns"].items(): if column_name not in ("start_time", "stop_time"): - time_intervals.add_column(name=column_name, description=column_metadata.get("description", "no description")) + time_intervals.add_column( + name=column_name, description=column_metadata.get("description", "no description") + ) # handle any custom columns that were not defined in columns object for column_name in table_metadata["data"][0]: if column_name not in time_intervals.colnames + ("start_time", "stop_time"): @@ -189,7 +190,6 @@ def add_to_nwbfile(cls, nwbfile: NWBFile, metadata: DeepDict) -> None: else: nwbfile.add_time_intervals(time_intervals) - def get_metadata_schema(self) -> dict: metadata_schema = super().get_metadata_schema() diff --git a/tests/test_text/test_time_intervals.py b/tests/test_text/test_time_intervals.py index e624828bb..698dde9a1 100644 --- a/tests/test_text/test_time_intervals.py +++ b/tests/test_text/test_time_intervals.py @@ -115,7 +115,7 @@ def test_trials(): dict(start_time=0.0, stop_time=1.0, correct=True), dict(start_time=1.0, stop_time=2.0, correct=False), ], - ), + ), new_table=dict( columns=dict( stim_id=dict(description="stimulus ID"), @@ -124,7 +124,7 @@ def test_trials(): dict(start_time=0.0, stop_time=1.0, stim_id=0), dict(start_time=1.0, stop_time=2.0, stim_id=1), ], - ) + ), ), ) From e6ecf69962957c8eb0e73b85722588727595fb84 Mon Sep 17 00:00:00 2001 From: Ben Dichter Date: Mon, 12 Aug 2024 14:41:26 -0400 Subject: [PATCH 4/5] add class attributes --- src/neuroconv/datainterfaces/text/timeintervalsinterface.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py index 80fa1ca71..188b3e05c 100644 --- a/src/neuroconv/datainterfaces/text/timeintervalsinterface.py +++ b/src/neuroconv/datainterfaces/text/timeintervalsinterface.py @@ -161,6 +161,8 @@ class TimeIntervalsInterface(BaseDataInterface): display_name = "Time Intervals" keywords = ("table", "trials", "epochs", "time intervals") + associated_suffixes = () + info = "Interface for time intervals data added to metadata." @classmethod def add_to_nwbfile(cls, nwbfile: NWBFile, metadata: DeepDict) -> None: From 4576bc412797db2a92b2c1dd1cfead74aef7a636 Mon Sep 17 00:00:00 2001 From: Ben Dichter Date: Mon, 12 Aug 2024 17:20:12 -0400 Subject: [PATCH 5/5] rmv test that ensures associated_suffixes and keywords have length > 0. I think they should be allowed to be 0-length --- tests/test_minimal/test_tools/test_importing.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/tests/test_minimal/test_tools/test_importing.py b/tests/test_minimal/test_tools/test_importing.py index 9f800f0e7..1fcff6c45 100644 --- a/tests/test_minimal/test_tools/test_importing.py +++ b/tests/test_minimal/test_tools/test_importing.py @@ -27,5 +27,3 @@ def test_guide_attributes(): assert isinstance( value, tuple ), f"{name} incorrectly specified GUIDE-related attribute 'associated_suffixes' (must be tuple)." - if isinstance(value, tuple): - assert len(value) > 0, f"{name} is missing entries in GUIDE related attribute {key}."