From ebfd471672eafb223fc103652b56e680f18c5063 Mon Sep 17 00:00:00 2001 From: Johanna Senk Date: Fri, 13 Sep 2019 13:52:00 +0200 Subject: [PATCH 1/7] Rename nestio.py to nest2io.py (support for output from NEST2.x) --- neo/io/{nestio.py => nest2io.py} | 1 + 1 file changed, 1 insertion(+) rename neo/io/{nestio.py => nest2io.py} (99%) diff --git a/neo/io/nestio.py b/neo/io/nest2io.py similarity index 99% rename from neo/io/nestio.py rename to neo/io/nest2io.py index 972ac8ced..5aa9594f8 100644 --- a/neo/io/nestio.py +++ b/neo/io/nest2io.py @@ -1,6 +1,7 @@ # -*- coding: utf-8 -*- """ Class for reading output files from NEST simulations +using NEST versions 2.x ( http://www.nest-simulator.org/ ). Tested with NEST2.10.0 From 6f3ff8b5790cc9b48f8d0f7d7d121a2542f1c59c Mon Sep 17 00:00:00 2001 From: Johanna Senk Date: Fri, 13 Sep 2019 14:12:57 +0200 Subject: [PATCH 2/7] Start nest3io supporting NEST3 --- neo/io/__init__.py | 12 +- neo/io/nest3io.py | 31 ++++ neo/rawio/__init__.py | 2 + neo/rawio/nest3rawio.py | 380 ++++++++++++++++++++++++++++++++++++++++ 4 files changed, 422 insertions(+), 3 deletions(-) create mode 100644 neo/io/nest3io.py create mode 100644 neo/rawio/nest3rawio.py diff --git a/neo/io/__init__.py b/neo/io/__init__.py index f4923ab5d..6f902b131 100644 --- a/neo/io/__init__.py +++ b/neo/io/__init__.py @@ -133,7 +133,11 @@ .. autoattribute:: extensions -.. autoclass:: neo.io.NestIO +.. autoclass:: neo.io.Nest2IO + + .. autoattribute:: extensions + +.. autoclass:: neo.io.Nest3IO .. autoattribute:: extensions @@ -243,7 +247,8 @@ from neo.io.micromedio import MicromedIO from neo.io.hdf5io import NeoHdf5IO from neo.io.neomatlabio import NeoMatlabIO -from neo.io.nestio import NestIO +from neo.io.nest2io import Nest2IO +from neo.io.nest3io import Nest3IO from neo.io.neuralynxio import NeuralynxIO from neo.io.neuralynxio_v1 import NeuralynxIO as OldNeuralynxIO from neo.io.neuroexplorerio import NeuroExplorerIO @@ -285,7 +290,8 @@ NixIO, # place NixIO before NeoHdf5IO to make it the default for .h5 files NeoHdf5IO, NeoMatlabIO, - NestIO, + Nest2IO, + Nest3IO, NeuralynxIO, NeuroExplorerIO, NeuroScopeIO, diff --git a/neo/io/nest3io.py b/neo/io/nest3io.py new file mode 100644 index 000000000..43dbfb523 --- /dev/null +++ b/neo/io/nest3io.py @@ -0,0 +1,31 @@ +# -*- coding: utf-8 -*- +""" +neo.io have been split in 2 level API: + * neo.io: this API give neo object + * neo.rawio: this API give raw data as they are in files. + +Developper are encourage to use neo.rawio. + +When this is done the neo.io is done automagically with +this king of following code. + +Author: sgarcia + +""" + +from neo.io.basefromrawio import BaseFromRaw +from neo.rawio.nest3rawio import Nest3RawIO + + +class Nest3IO(Nest3RawIO, BaseFromRaw): + name = 'Nest3IO' + description = "Fake IO" + + # This is an inportant choice when there are several channels. 
+    # 'split-all' : 1 AnalogSignal each 1 channel
+    # 'group-by-same-units' : one 2D AnalogSignal for each group of channel with same units
+    _prefered_signal_group_mode = 'group-by-same-units'
+
+    def __init__(self, filename=''):
+        Nest3RawIO.__init__(self, filename=filename)
+        BaseFromRaw.__init__(self, filename)
diff --git a/neo/rawio/__init__.py b/neo/rawio/__init__.py
index 3ad1de370..7747026c9 100644
--- a/neo/rawio/__init__.py
+++ b/neo/rawio/__init__.py
@@ -121,6 +121,7 @@
 from neo.rawio.examplerawio import ExampleRawIO
 from neo.rawio.intanrawio import IntanRawIO
 from neo.rawio.micromedrawio import MicromedRawIO
+from neo.rawio.nest3rawio import Nest3RawIO
 from neo.rawio.neuralynxrawio import NeuralynxRawIO
 from neo.rawio.neuroexplorerrawio import NeuroExplorerRawIO
 from neo.rawio.neuroscoperawio import NeuroScopeRawIO
@@ -142,6 +143,7 @@
     ElanRawIO,
     IntanRawIO,
     MicromedRawIO,
+    Nest3RawIO,
     NeuralynxRawIO,
     NeuroExplorerRawIO,
     NeuroScopeRawIO,
diff --git a/neo/rawio/nest3rawio.py b/neo/rawio/nest3rawio.py
new file mode 100644
index 000000000..5a68a9fe4
--- /dev/null
+++ b/neo/rawio/nest3rawio.py
@@ -0,0 +1,380 @@
+# -*- coding: utf-8 -*-
+"""
+Nest3RawIO is a class for reading output files from NEST simulations
+( http://www.nest-simulator.org/ ) written with the library SIONlib.
+SIONlib ( http://www.fz-juelich.de/jsc/sionlib ) is a scalable I/O library for
+parallel access to task-local files.
+
+Author: Johanna Senk
+"""
+from __future__ import unicode_literals, print_function, division, absolute_import
+
+from .baserawio import (BaseRawIO, _signal_channel_dtype, _unit_channel_dtype,
+                        _event_channel_dtype)
+
+import numpy as np
+
+import nestio # TODO from https://github.com/apeyser/nestio-tools (bring to setup.py, maybe change of name?)
+
+
+class Nest3RawIO(BaseRawIO):
+    """
+    Class for reading output data from NEST simulations recorded with the
+    SIONlib backend.
+
+    For the user, it gives access to the raw data (spikes, analog signals) as
+    they are stored in the .sion file.
+
+    Two rules for developers:
+      * Respect the Neo RawIO API (:ref:`_neo_rawio_API`)
+      * Follow :ref:`_io_guiline`
+
+    This IO maps the content of one .sion file to:
+        * one block with one segment
+        * one unit channel per neuron recorded by a spike_detector
+        * signal channels for the observables recorded by a multimeter
+          (work in progress)
+
+    Usage:
+        >>> import neo.rawio
+        >>> r = neo.rawio.Nest3RawIO(filename='output.sion')
+        >>> r.parse_header()
+        >>> print(r)
+        >>> raw_chunk = r.get_analogsignal_chunk(block_index=0, seg_index=0,
+                            i_start=0, i_stop=1024, channel_names=channel_names)
+        >>> float_chunk = r.rescale_signal_raw_to_float(raw_chunk, dtype='float64',
+                            channel_indexes=[0, 3, 6])
+        >>> spike_timestamp = r.spike_timestamps(unit_index=0, t_start=None, t_stop=None)
+        >>> spike_times = r.rescale_spike_timestamp(spike_timestamp, 'float64')
+        >>> ev_timestamps, _, ev_labels = r.event_timestamps(event_channel_index=0)
+
+    """
+    name = 'Nest3RawIO'
+    description = ''
+    extensions = ['sion']
+    rawmode = 'one-file'
+
+    def __init__(self, filename=''):
+        BaseRawIO.__init__(self)
+        self.filename = filename
+
+    def _source_name(self):
+        return self.filename
+
+    def _parse_header(self):
+
+        self.description = '' # TODO
+        self.header = {}
+
+        # access the .sion file with the reader from nestio-tools
+        self.reader = nestio.NestReader(self.filename)
+
+        # one block with one segment per .sion file
+        self.header['nb_block'] = 1
+        self.header['nb_segment'] = [1]
+
+        # block annotations: global information on simulation
+        block_ann = { 'nest_version': self.reader.nest_version,
+                     'sionlib_rec_backend_version' : self.reader.sionlib_rec_backend_version }
+
+        # segment annotations: global information on simulation
+        seg_ann = { 'sim_resolution' : self.reader.resolution * 1e-3, # in s
+                    'sim_t_start' : self.reader.t_start * 1e-3, # in s
+                    'sim_t_stop' : self.reader.t_end * 1e-3, # in s
+                    'sim_unit' : 'seconds' }
+
+        # loop through data
+        unit_channels = []
+        sig_channels = []
+        for rec_dev in self.reader:
+            neuron_ids = np.unique(np.array(self.reader[rec_dev.gid])['f0'])
+            for nid in neuron_ids:
+
+                # spike data as units
+                if rec_dev.name == u'spike_detector':
+                    unit_name = 'unit{}'.format(c)
+                    unit_id = '#{}'.format(c)
+                    wf_units = 'uV'
+                    wf_gain = 1000. / 2 ** 16
+                    wf_offset = 0.
+                    wf_left_sweep = 20
+                    wf_sampling_rate = 10000.
+ unit_channels.append((unit_name, unit_id, wf_units, wf_gain, + wf_offset, wf_left_sweep, wf_sampling_rate)) + + # analog data as signals + elif rec_dev.name == u'multimeter': + ch_name + chan_id + sr + dtype + units + gain + offset + group_id + sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) + + + + + + + #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, i.rows, i.dtype, i.t_start, i.t_stop + + + + + + + + + # minimal annotations from BaseRawIO + self._generate_minimal_annotations() + + + + + + # # global information on simulation + # self.nest_version = self.reader.nest_version + # self.sionlib_rec_backend_version = self.reader.sionlib_rec_backend_version + # self.sim_resolution = self.reader.resolution * 1e-3 # in s + # self.sim_t_start = self.reader.t_start * 1e-3 # in s + # self.sim_t_stop = self.reader.t_end * 1e-3 # in s + + # # set number of blocks and segments + # self.header['nb_block'] = 0 + # self.header['nb_segment'] = [] + # for rec_dev in self.reader: + # # one block per recording device + # self.header['nb_block'] += 1 + # # one segment per observable (at least one per block) + # self.header['nb_segment'].append( + # np.max([1, rec_dev.double_n_val + rec_dev.long_n_val])) + + # # signals and units are not global but specific to to the recording devices + # self.header['signal_channels'] = np.array([], dtype=_signal_channel_dtype) + # self.header['unit_channels'] = np.array([], dtype=_unit_channel_dtype) + + # # no events or epochs + # self.header['event_channels'] = np.array([], dtype=_event_channel_dtype) + + # # minimal annotations from BaseRawIO + # self._generate_minimal_annotations() + + # # annotate blocks with information on the recording device + # for block_index,rec_dev in enumerate(self.reader): + # ba = self.raw_annotations['blocks'][block_index] + # ba['gid'] = rec_dev.gid + # ba['rec_dev'] = rec_dev.name + # ba['label'] = rec_dev.label + + # # annotate segments: specify data columns + # seg_index = 0 + # double_index = 0 + # long_index = 0 + # while seg_index < self.header['nb_segment'][block_index]: + # sa = ba['segments'][seg_index] + # sa['data'] = {} + # sa['data'].update({'gids': ['f0'], + # 'times': ['f1']}) + + # if double_index < rec_dev.double_n_val: + # sa['data'].update({rec_dev.double_observables[double_index]: ['f3', double_index]}) + # double_index += 1 + + # if long_index < rec_dev.long_n_val and double_index >= rec_dev.double_n_val: + # sa['data'].update({rec_dev.long_observables[long_index]: ['f4', long_index]}) + # long_index += 1 + # seg_index += 1 + + + def _segment_t_start(self, block_index, seg_index): + # DONE + # INDEPENDENT OF SEG_INDEX + + # this must return an float scale in second + # this t_start will be shared by all object in the segment + # except AnalogSignal + gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] + t_start_rec_dev = self.reader[gid_rec_dev].t_start * self.sim_resolution + t_start = np.max([self.sim_t_start, t_start_rec_dev]) + return t_start + + + def _segment_t_stop(self, block_index, seg_index): + # DONE + # INDEPENDENT OF SEG_INDEX + + # this must return an float scale in second + gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] + t_stop_rec_dev = self.reader[gid_rec_dev].t_stop * self.sim_resolution + t_stop = np.min([self.sim_t_stop, t_stop_rec_dev]) + return t_stop + + + def _get_signal_size(self, block_index, seg_index, channel_indexes=None): + # TODO + # + # we are lucky: signals in 
all segment have the same shape!! (10.0 seconds) + # it is not always the case + # this must return an int = the number of sample + + # Note that channel_indexes can be ignored for most cases + # except for several sampling rate. + return rows + + + def _get_signal_t_start(self, block_index, seg_index, channel_indexes): + # DONE + # same as _segment_t_start + # + # This give the t_start of signals. + # Very often this equal to _segment_t_start but not + # always. + # this must return an float scale in second + + # Note that channel_indexes can be ignored for most cases + # except for several sampling rate. + + # Here this is the same. + # this is not always the case + return self._segment_t_start(block_index, seg_index) + + + def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, channel_indexes): + # TODO + # this must return a signal chunk limited with + # i_start/i_stop (can be None) + # channel_indexes can be None (=all channel) or a list or numpy.array + # This must return a numpy array 2D (even with one channel). + # This must return the orignal dtype. No conversion here. + # This must as fast as possible. + # Everything that can be done in _parse_header() must not be here. + + # Here we are lucky: our signals is always zeros!! + # it is not always the case + # internally signals are int16 + # convertion to real units is done with self.header['signal_channels'] + + if i_start is None: + i_start = 0 + if i_stop is None: + i_stop = 100000 + + assert i_start >= 0, "I don't like your jokes" + assert i_stop <= 100000, "I don't like your jokes" + + if channel_indexes is None: + nb_chan = 16 + else: + nb_chan = len(channel_indexes) + raw_signals = np.zeros((i_stop - i_start, nb_chan), dtype='int16') + return raw_signals + + + def _spike_count(self, block_index, seg_index, unit_index): + # DONE + + # Must return the nb of spike for given (block_index, seg_index, unit_index) + + rec_dev = self.raw_annotations['blocks'][block_index]['rec_dev'] + assert rec_dev == b'spike_detector', \ + 'This block does not contain data from a spike_detector!' + + gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] + gids_nrns = np.asarray(self.reader[gid_rec_dev])['f0'] + + nb_spikes = sum(gids_nrns == unit_index) + return nb_spikes + + + def _get_spike_timestamps(self, block_index, seg_index, unit_index, t_start, t_stop): + # DONE + # ALREADY IN S + + # the same clip t_start/t_start must be used in _spike_raw_waveforms() + + + rec_dev = self.raw_annotations['blocks'][block_index]['rec_dev'] + assert rec_dev == b'spike_detector', \ + 'This block does not contain data from a spike_detector!' + + gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] + data = np.asarray(self.reader[gid_rec_dev]) + + idx = np.argwhere(data['f0'] == unit_index) + + # TODO: IS THIS CORRECT? 
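+        # Hedged note (assuming nestio-tools field semantics): NEST stores each
+        # event as an integer time step ('f1') plus a float offset in ms ('f2',
+        # used by precise-spike-time models). With resolution = 0.1 ms, a spike
+        # at step 1500 with offset 0.05 ms would map to
+        # 1500 * 1e-4 s + 0.05 * 1e-3 s = 0.15005 s, which is what the line
+        # below computes.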
+ # step * resolution + offset, result in s + all_spike_timestamps = data['f1'][idx] * self.sim_resolution + data['f2'][idx] * 1e-3 + + mask = (all_spike_timestamps >= t_start) & (all_spike_timestamps <= t_stop) + spike_timestamps = all_spike_timestamps[mask] + + return spike_timestamps + + + def _rescale_spike_timestamp(self, spike_timestamps, dtype): + # DONE + # SPIKE_TIMESTAMPS ARE ALREADY IN S BECAUSE OF STEP AND OFFSET, THIS CHANGES ONLY DTYPE + + spike_times = spike_timestamps.astype(dtype) + return spike_times + + + def _get_spike_raw_waveforms(self, block_index, seg_index, unit_index, t_start, t_stop): + # this must return a 3D numpy array (nb_spike, nb_channel, nb_sample) + # in the original dtype + # this must be as fast as possible. + # the same clip t_start/t_start must be used in _spike_timestamps() + + # If there there is no waveform supported in the + # IO them _spike_raw_waveforms must return None + + # In our IO waveforms come from all channels + # they are int16 + # convertion to real units is done with self.header['unit_channels'] + # Here, we have a realistic case: all waveforms are only noise. + # it is not always the case + # we 20 spikes with a sweep of 50 (5ms) + + # trick to get how many spike in the slice + ts = self._get_spike_timestamps(block_index, seg_index, unit_index, t_start, t_stop) + nb_spike = ts.size + + np.random.seed(2205) # a magic number (my birthday) + waveforms = np.random.randint(low=-2**4, high=2**4, size=nb_spike * 50, dtype='int16') + waveforms = waveforms.reshape(nb_spike, 1, 50) + return None + + + def _event_count(self, block_index, seg_index, event_channel_index): + return 0 + + + def _get_event_timestamps(self, block_index, seg_index, event_channel_index, t_start, t_stop): + #return timestamp, durations, labels + return None + + + def _rescale_event_timestamp(self, event_timestamps, dtype): + # must rescale to second a particular event_timestamps + # with a fixed dtype so the user can choose the precisino he want. + + # really easy here because in our case it is already seconds + event_times = event_timestamps.astype(dtype) + return event_times + + + def _rescale_epoch_duration(self, raw_duration, dtype): + # really easy here because in our case it is already seconds + durations = raw_duration.astype(dtype) + return durations From a89ce61c2d824afee572b3817bfe240369e2a024 Mon Sep 17 00:00:00 2001 From: Julia Sprenger Date: Fri, 13 Sep 2019 16:44:58 +0200 Subject: [PATCH 3/7] [Nest3IO] Add spike reading capabilities --- neo/io/nest2io.py | 2 +- neo/io/nest3io.py | 6 +- neo/rawio/nest3rawio.py | 173 +++++++++++++++++++--------------------- 3 files changed, 84 insertions(+), 97 deletions(-) diff --git a/neo/io/nest2io.py b/neo/io/nest2io.py index 5aa9594f8..8eb2c6b93 100644 --- a/neo/io/nest2io.py +++ b/neo/io/nest2io.py @@ -31,7 +31,7 @@ 'no type': pq.dimensionless} -class NestIO(BaseIO): +class Nest2IO(BaseIO): """ Class for reading NEST output files. GDF files for the spike data and DAT files for analog signals are possible. diff --git a/neo/io/nest3io.py b/neo/io/nest3io.py index 43dbfb523..b9d7c5c15 100644 --- a/neo/io/nest3io.py +++ b/neo/io/nest3io.py @@ -4,12 +4,12 @@ * neo.io: this API give neo object * neo.rawio: this API give raw data as they are in files. -Developper are encourage to use neo.rawio. +Developer are encourage to use neo.rawio. When this is done the neo.io is done automagically with this king of following code. 
-Author: sgarcia +Author: Johanna Senk, Julia Sprenger """ @@ -21,7 +21,7 @@ class Nest3IO(Nest3RawIO, BaseFromRaw): name = 'Nest3IO' description = "Fake IO" - # This is an inportant choice when there are several channels. + # This is an important choice when there are several channels. # 'split-all' : 1 AnalogSignal each 1 channel # 'group-by-same-units' : one 2D AnalogSignal for each group of channel with same units _prefered_signal_group_mode = 'group-by-same-units' diff --git a/neo/rawio/nest3rawio.py b/neo/rawio/nest3rawio.py index 5a68a9fe4..9d19ec4f8 100644 --- a/neo/rawio/nest3rawio.py +++ b/neo/rawio/nest3rawio.py @@ -82,13 +82,11 @@ def _parse_header(self): # block annotations: global information on simulation block_ann = { 'nest_version': self.reader.nest_version, - 'sionlib_rec_backend_version' : self.reader.sionlib_rec_backend_version } + 'sionlib_rec_backend_version' : self.reader.sionlib_rec_backend_version, + 'sim_resolution': self.reader.resolution * 1e-3} # in s # segment annotations: global information on simulation - seg_ann = { 'sim_resolution' : self.reader.resolution * 1e-3, # in s - 'sim_t_start' : self.reader.t_start * 1e-3, # in s - 'sim_t_stop' : self.reader.t_end * 1e-3, # in s - 'sim_unit' : 'seconds' } + seg_ann = {} # loop through data unit_channels = [] @@ -98,49 +96,51 @@ def _parse_header(self): for nid in neuron_ids: # spike data as units - if rec_dev.name == u'spike_detector': - unit_name = 'unit{}'.format(c) - unit_id = '#{}'.format(c) - wf_units = 'uV' - wf_gain = 1000. / 2 ** 16 - wf_offset = 0. - wf_left_sweep = 20 - wf_sampling_rate = 10000. + if rec_dev.name == b'spike_detector': + unit_name = 'sd{}unit{}'.format(rec_dev.gid, nid) + unit_id = '{}#{}'.format(rec_dev.gid, nid) + wf_units = '' + wf_gain = 0.0 + wf_offset = 0.0 + wf_left_sweep = 0 + wf_sampling_rate = 0.0 unit_channels.append((unit_name, unit_id, wf_units, wf_gain, wf_offset, wf_left_sweep, wf_sampling_rate)) # analog data as signals - elif rec_dev.name == u'multimeter': - ch_name - chan_id - sr - dtype - units - gain - offset - group_id - sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) + # elif rec_dev.name == b'multimeter': + # ch_name = + # chan_id + # sr + # dtype + # units + # gain + # offset + # group_id + # sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) - - - #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, i.rows, i.dtype, i.t_start, i.t_stop - + #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, i.rows, i.dtype, i.t_start, i.t_stop + unit_channels = np.array(unit_channels, dtype=_unit_channel_dtype) + self.header['unit_channels'] = unit_channels + # # signals and units are not global but specific to to the recording devices + self.header['signal_channels'] = np.array([], dtype=_signal_channel_dtype) + # self.header['unit_channels'] = np.array([], dtype=_unit_channel_dtype) + # # no events or epochs + self.header['event_channels'] = np.array([], dtype=_event_channel_dtype) # minimal annotations from BaseRawIO self._generate_minimal_annotations() - - - + self.raw_annotations['blocks'][0].update(block_ann) # # global information on simulation # self.nest_version = self.reader.nest_version @@ -159,19 +159,17 @@ def _parse_header(self): # self.header['nb_segment'].append( # np.max([1, rec_dev.double_n_val + rec_dev.long_n_val])) - # # signals and units are not global but specific to to the recording 
devices - # self.header['signal_channels'] = np.array([], dtype=_signal_channel_dtype) - # self.header['unit_channels'] = np.array([], dtype=_unit_channel_dtype) - # # no events or epochs - # self.header['event_channels'] = np.array([], dtype=_event_channel_dtype) - # # minimal annotations from BaseRawIO + # minimal annotations from BaseRawIO # self._generate_minimal_annotations() + # bl_ann = self.raw_annotations['blocks'][block_index] + # # annotate blocks with information on the recording device # for block_index,rec_dev in enumerate(self.reader): # ba = self.raw_annotations['blocks'][block_index] + # ba['gid'] = rec_dev.gid # ba['rec_dev'] = rec_dev.name # ba['label'] = rec_dev.label @@ -203,10 +201,11 @@ def _segment_t_start(self, block_index, seg_index): # this must return an float scale in second # this t_start will be shared by all object in the segment # except AnalogSignal - gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] - t_start_rec_dev = self.reader[gid_rec_dev].t_start * self.sim_resolution - t_start = np.max([self.sim_t_start, t_start_rec_dev]) - return t_start + # gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] + # t_start_rec_dev = self.reader[gid_rec_dev].t_start * self.sim_resolution + # t_start = np.max([self.sim_t_start, t_start_rec_dev]) + # return t_start + return self.reader.t_start * 1e-3 def _segment_t_stop(self, block_index, seg_index): @@ -214,10 +213,12 @@ def _segment_t_stop(self, block_index, seg_index): # INDEPENDENT OF SEG_INDEX # this must return an float scale in second - gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] - t_stop_rec_dev = self.reader[gid_rec_dev].t_stop * self.sim_resolution - t_stop = np.min([self.sim_t_stop, t_stop_rec_dev]) - return t_stop + # gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] + # t_stop_rec_dev = self.reader[gid_rec_dev].t_stop * self.sim_resolution + # t_stop = np.min([self.sim_t_stop, t_stop_rec_dev]) + # return t_stop + + return self.reader.t_end * 1e-3 def _get_signal_size(self, block_index, seg_index, channel_indexes=None): @@ -246,8 +247,9 @@ def _get_signal_t_start(self, block_index, seg_index, channel_indexes): # Here this is the same. # this is not always the case - return self._segment_t_start(block_index, seg_index) - + return 0 + # return self._segment_t_start(block_index, seg_index) + def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, channel_indexes): # TODO @@ -255,7 +257,7 @@ def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, chann # i_start/i_stop (can be None) # channel_indexes can be None (=all channel) or a list or numpy.array # This must return a numpy array 2D (even with one channel). - # This must return the orignal dtype. No conversion here. + # This must return the original dtype. No conversion here. # This must as fast as possible. # Everything that can be done in _parse_header() must not be here. @@ -281,41 +283,51 @@ def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, chann def _spike_count(self, block_index, seg_index, unit_index): - # DONE - # Must return the nb of spike for given (block_index, seg_index, unit_index) + sd_id, nid = self.header['unit_channels'][unit_index][1].split('#') + sd_id, nid = int(sd_id), int(nid) - rec_dev = self.raw_annotations['blocks'][block_index]['rec_dev'] - assert rec_dev == b'spike_detector', \ - 'This block does not contain data from a spike_detector!' 
+ assert self.reader[sd_id].name == b'spike_detector', \ + 'This unit was not recorded by a spike_detector!' - gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] - gids_nrns = np.asarray(self.reader[gid_rec_dev])['f0'] + data = np.asarray(self.reader[sd_id]) + return np.sum(data['f0'] == nid) - nb_spikes = sum(gids_nrns == unit_index) - return nb_spikes def _get_spike_timestamps(self, block_index, seg_index, unit_index, t_start, t_stop): - # DONE - # ALREADY IN S + sim_resolution = self.raw_annotations['blocks'][block_index]['sim_resolution'] + # extract spike detector id and n.... + sd_id, nid = self.header['unit_channels'][unit_index][1].split('#') + sd_id, nid = int(sd_id), int(nid) - # the same clip t_start/t_start must be used in _spike_raw_waveforms() + assert self.reader[sd_id].name == b'spike_detector', \ + 'This unit was not recorded by a spike_detector!' + data = np.asarray(self.reader[sd_id]) + idx = np.argwhere(data['f0'] == nid) - rec_dev = self.raw_annotations['blocks'][block_index]['rec_dev'] - assert rec_dev == b'spike_detector', \ - 'This block does not contain data from a spike_detector!' + # TODO: Check if first and last possible spike is within the limits below + sd_t_start = self.reader[sd_id].t_start * sim_resolution + sd_t_stop = self.reader[sd_id].t_stop * sim_resolution - gid_rec_dev = self.raw_annotations['blocks'][block_index]['gid'] - data = np.asarray(self.reader[gid_rec_dev]) + spike_start = max(sd_t_start, self.segment_t_start(block_index, seg_index)) + spike_stop = min(sd_t_stop, self.segment_t_stop(block_index, seg_index)) - idx = np.argwhere(data['f0'] == unit_index) + if t_start is None: + t_start = spike_start + if t_stop is None: + t_stop = spike_stop - # TODO: IS THIS CORRECT? - # step * resolution + offset, result in s - all_spike_timestamps = data['f1'][idx] * self.sim_resolution + data['f2'][idx] * 1e-3 + assert sd_t_start <= t_start, 't_start ({}) must be larger than or equal to beginning of spike recording ({}).' \ + ''.format(t_start,spike_start) + assert sd_t_stop >= t_stop, 't_stop ({}) must be smaller than or equal to end of spike recording ({}).' \ + ''.format(t_stop, spike_stop) + # # TODO: IS THIS CORRECT? + # # step * resolution + offset, result in s + all_spike_timestamps = data['f1'][idx] * sim_resolution + data['f2'][idx] * 1e-3 + # mask = (all_spike_timestamps >= t_start) & (all_spike_timestamps <= t_stop) spike_timestamps = all_spike_timestamps[mask] @@ -323,36 +335,12 @@ def _get_spike_timestamps(self, block_index, seg_index, unit_index, t_start, t_s def _rescale_spike_timestamp(self, spike_timestamps, dtype): - # DONE # SPIKE_TIMESTAMPS ARE ALREADY IN S BECAUSE OF STEP AND OFFSET, THIS CHANGES ONLY DTYPE - spike_times = spike_timestamps.astype(dtype) return spike_times def _get_spike_raw_waveforms(self, block_index, seg_index, unit_index, t_start, t_stop): - # this must return a 3D numpy array (nb_spike, nb_channel, nb_sample) - # in the original dtype - # this must be as fast as possible. - # the same clip t_start/t_start must be used in _spike_timestamps() - - # If there there is no waveform supported in the - # IO them _spike_raw_waveforms must return None - - # In our IO waveforms come from all channels - # they are int16 - # convertion to real units is done with self.header['unit_channels'] - # Here, we have a realistic case: all waveforms are only noise. 
- # it is not always the case - # we 20 spikes with a sweep of 50 (5ms) - - # trick to get how many spike in the slice - ts = self._get_spike_timestamps(block_index, seg_index, unit_index, t_start, t_stop) - nb_spike = ts.size - - np.random.seed(2205) # a magic number (my birthday) - waveforms = np.random.randint(low=-2**4, high=2**4, size=nb_spike * 50, dtype='int16') - waveforms = waveforms.reshape(nb_spike, 1, 50) return None @@ -361,7 +349,6 @@ def _event_count(self, block_index, seg_index, event_channel_index): def _get_event_timestamps(self, block_index, seg_index, event_channel_index, t_start, t_stop): - #return timestamp, durations, labels return None From 5adb5bc04ebb05a766aca80d3c4c782d64a62266 Mon Sep 17 00:00:00 2001 From: Julia Sprenger Date: Mon, 16 Sep 2019 10:45:12 +0200 Subject: [PATCH 4/7] [NestIO] Add test structure for nest3io --- neo/rawio/nest3rawio.py | 31 +++++------ neo/test/iotest/test_nest3io.py | 98 +++++++++++++++++++++++++++++++++ 2 files changed, 112 insertions(+), 17 deletions(-) create mode 100644 neo/test/iotest/test_nest3io.py diff --git a/neo/rawio/nest3rawio.py b/neo/rawio/nest3rawio.py index 9d19ec4f8..85b22bafe 100644 --- a/neo/rawio/nest3rawio.py +++ b/neo/rawio/nest3rawio.py @@ -108,23 +108,20 @@ def _parse_header(self): wf_offset, wf_left_sweep, wf_sampling_rate)) # analog data as signals - # elif rec_dev.name == b'multimeter': - # ch_name = - # chan_id - # sr - # dtype - # units - # gain - # offset - # group_id - # sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) - - - - - - - #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, i.rows, i.dtype, i.t_start, i.t_stop + elif rec_dev.name == b'multimeter': + for obs in rec_dev.double_observables + rec_dev.long_observables: + ch_name = 'sd{}unit{}'.format(rec_dev.gid, nid) + chan_id = '{}#{}'.format(rec_dev.gid, nid) + sr = 0 + dtype = float if obs in rec_dev.double_observables else int # or rec_dev.dtype + units = 0 + gain = 0 + offset = 0 + group_id = 0 + sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) + + #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, + # i.rows, i.dtype, i.t_start, i.t_stop unit_channels = np.array(unit_channels, dtype=_unit_channel_dtype) self.header['unit_channels'] = unit_channels diff --git a/neo/test/iotest/test_nest3io.py b/neo/test/iotest/test_nest3io.py new file mode 100644 index 000000000..176e688eb --- /dev/null +++ b/neo/test/iotest/test_nest3io.py @@ -0,0 +1,98 @@ +# -*- coding: utf-8 -*- +""" +Tests of neo.io.nest3io +""" + +# needed for python 3 compatibility +from __future__ import unicode_literals, print_function, division, absolute_import + +import unittest + +from neo.io.nest3io import Nest3IO # , HAVE_SCIPY +from neo.test.iotest.common_io_test import BaseTestIO +from neo.io.proxyobjects import (AnalogSignalProxy, + SpikeTrainProxy, EventProxy, EpochProxy) +from neo import (AnalogSignal, SpikeTrain) + +import quantities as pq +import numpy as np + + +# This run standart tests, this is mandatory for all IO + + +class TestExampleIO(BaseTestIO, unittest.TestCase): + ioclass = Nest3IO + files_to_test = ['fake1', + 'fake2', + ] + files_to_download = [] + + +class Specific_TestNest3IO(unittest.TestCase): + # def test_read_segment_lazy(self): + # r = ExampleIO(filename=None) + # seg = r.read_segment(lazy=True) + # for ana in seg.analogsignals: + # assert isinstance(ana, AnalogSignalProxy) + # 
ana = ana.load() + # assert isinstance(ana, AnalogSignal) + # for st in seg.spiketrains: + # assert isinstance(st, SpikeTrainProxy) + # st = st.load() + # assert isinstance(st, SpikeTrain) + # + # seg = r.read_segment(lazy=False) + # for anasig in seg.analogsignals: + # assert isinstance(ana, AnalogSignal) + # self.assertNotEqual(anasig.size, 0) + # for st in seg.spiketrains: + # assert isinstance(st, SpikeTrain) + # self.assertNotEqual(st.size, 0) + # + # # annotations + # assert 'seg_extra_info' in seg.annotations + # assert seg.name == 'Seg #0 Block #0' + # for anasig in seg.analogsignals: + # assert anasig.name is not None + # for st in seg.spiketrains: + # assert st.name is not None + # for ev in seg.events: + # assert ev.name is not None + # for ep in seg.epochs: + # assert ep.name is not None + # + # def test_read_block(self): + # r = ExampleIO(filename=None) + # bl = r.read_block(lazy=True) + # assert len(bl.list_units) == 3 + # assert len(bl.channel_indexes) == 1 + 3 # signals grouped + units + # + # def test_read_segment_with_time_slice(self): + # r = ExampleIO(filename=None) + # seg = r.read_segment(time_slice=None) + # shape_full = seg.analogsignals[0].shape + # spikes_full = seg.spiketrains[0] + # event_full = seg.events[0] + # + # t_start, t_stop = 260 * pq.ms, 1.854 * pq.s + # seg = r.read_segment(time_slice=(t_start, t_stop)) + # shape_slice = seg.analogsignals[0].shape + # spikes_slice = seg.spiketrains[0] + # event_slice = seg.events[0] + # + # assert shape_full[0] > shape_slice[0] + # + # assert spikes_full.size > spikes_slice.size + # assert np.all(spikes_slice >= t_start) + # assert np.all(spikes_slice <= t_stop) + # assert spikes_slice.t_start == t_start + # assert spikes_slice.t_stop == t_stop + # + # assert event_full.size > event_slice.size + # assert np.all(event_slice.times >= t_start) + # assert np.all(event_slice.times <= t_stop) + + +if __name__ == "__main__": + unittest.main() From 810830c59674dea7e7ac3c7226c3acdd4ba78295 Mon Sep 17 00:00:00 2001 From: Julia Sprenger Date: Wed, 18 Sep 2019 16:12:43 +0200 Subject: [PATCH 5/7] [Nest3IO] Add rudimentary AnalogSignal generation --- neo/rawio/nest3rawio.py | 119 ++++++++++++++++++++++++++++++++-------- 1 file changed, 95 insertions(+), 24 deletions(-) diff --git a/neo/rawio/nest3rawio.py b/neo/rawio/nest3rawio.py index 85b22bafe..6af14165e 100644 --- a/neo/rawio/nest3rawio.py +++ b/neo/rawio/nest3rawio.py @@ -61,6 +61,8 @@ class Nest3RawIO(BaseRawIO): extensions = ['sion'] rawmode = 'one-file' + _obs_colid_mapping = {} # {gid: column_id] + def __init__(self, filename=''): BaseRawIO.__init__(self) self.filename = filename @@ -88,6 +90,8 @@ def _parse_header(self): # segment annotations: global information on simulation seg_ann = {} + # TODO: Create one Channel_Index per recording device. 
Add 'label' annotation (rec_dev.label) + # loop through data unit_channels = [] sig_channels = [] @@ -97,7 +101,7 @@ def _parse_header(self): # spike data as units if rec_dev.name == b'spike_detector': - unit_name = 'sd{}unit{}'.format(rec_dev.gid, nid) + unit_name = 'rd{}unit{}'.format(rec_dev.gid, nid) unit_id = '{}#{}'.format(rec_dev.gid, nid) wf_units = '' wf_gain = 0.0 @@ -109,25 +113,33 @@ def _parse_header(self): # analog data as signals elif rec_dev.name == b'multimeter': - for obs in rec_dev.double_observables + rec_dev.long_observables: - ch_name = 'sd{}unit{}'.format(rec_dev.gid, nid) - chan_id = '{}#{}'.format(rec_dev.gid, nid) - sr = 0 - dtype = float if obs in rec_dev.double_observables else int # or rec_dev.dtype - units = 0 - gain = 0 - offset = 0 - group_id = 0 - sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) + gid = rec_dev.gid + self._obs_colid_mapping[gid] = {} + sampling_rate = self._get_sampling_rate(rec_dev) # in s + for cols, observables in zip(['f3', 'f4'], [rec_dev.double_observables, rec_dev.long_observables]): + for col_id, obs in enumerate(observables): + ch_name = 'rd{}unit{}signal{}'.format(rec_dev.gid, nid, obs.decode()) + chan_id = nid #'{}#{}#{}'.format(rec_dev.gid, nid, obs.decode()) + sr = sampling_rate + dtype = np.asarray(self.reader[gid])[cols].dtype # float if obs in rec_dev.double_observables else int # or + units = self._get_signal_unit(obs) + gain = 1. + offset = 0. + group_id = 0 # TODO: should this be recording device specific? + sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) + + self._obs_colid_mapping[gid][obs.decode()] = (cols, col_id) #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, # i.rows, i.dtype, i.t_start, i.t_stop + + unit_channels = np.array(unit_channels, dtype=_unit_channel_dtype) self.header['unit_channels'] = unit_channels # # signals and units are not global but specific to to the recording devices - self.header['signal_channels'] = np.array([], dtype=_signal_channel_dtype) + self.header['signal_channels'] = np.array(sig_channels, dtype=_signal_channel_dtype) # self.header['unit_channels'] = np.array([], dtype=_unit_channel_dtype) # # no events or epochs @@ -139,6 +151,29 @@ def _parse_header(self): self.raw_annotations['blocks'][0].update(block_ann) + seg_ann = self.raw_annotations['blocks'][0]['segments'][0] + seg_ann['name'] = 'Seg #{} Block #{}'.format(0, 0) + seg_ann['seg_extra_info'] = 'This is the seg {} of block {}'.format(0, 0) + + # for rec_dev in self.reader: + # neuron_ids = np.unique(np.array(self.reader[rec_dev.gid])['f0']) + # for nid in neuron_ids: + # + # + # for c in range(len(sig_channels)): + # anasig_an = seg_ann['signals'][c] + # anasig_an['info'] = 'This is a good signals' + # for c in range(3): + # spiketrain_an = seg_ann['units'][c] + # spiketrain_an['quality'] = 'Good!!' 
+ # for c in range(2): + # event_an = seg_ann['events'][c] + # if c == 0: + # event_an['nickname'] = 'Miss Event 0' + # elif c == 1: + # event_an['nickname'] = 'MrEpoch 1' + + # # global information on simulation # self.nest_version = self.reader.nest_version # self.sionlib_rec_backend_version = self.reader.sionlib_rec_backend_version @@ -253,6 +288,7 @@ def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, chann # this must return a signal chunk limited with # i_start/i_stop (can be None) # channel_indexes can be None (=all channel) or a list or numpy.array + # This must return a numpy array 2D (even with one channel). # This must return the original dtype. No conversion here. # This must as fast as possible. @@ -263,20 +299,36 @@ def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, chann # internally signals are int16 # convertion to real units is done with self.header['signal_channels'] - if i_start is None: - i_start = 0 - if i_stop is None: - i_stop = 100000 + # TODO: This needs performance optimization + res = [] + for channel_index in channel_indexes: + rd_id, nid, signal = self.header['signal_channels'][channel_index][1].split('#') + rd_id, nid = int(rd_id), int(nid) - assert i_start >= 0, "I don't like your jokes" - assert i_stop <= 100000, "I don't like your jokes" + col, col_id = self._obs_colid_mapping[rd_id][signal] - if channel_indexes is None: - nb_chan = 16 - else: - nb_chan = len(channel_indexes) - raw_signals = np.zeros((i_stop - i_start, nb_chan), dtype='int16') - return raw_signals + data = np.asarray(self.reader[rd_id]) + idx = np.argwhere(data['f0'] == nid) + + if i_start is None: + i_start = 0 + if i_stop is None: + i_stop = sum(idx) + + res.append(np.sort(data[idx])[i_start: i_stop][col][col_id]) + + return np.asarray(res) + + + # assert i_start >= 0, "I don't like your jokes" + # assert i_stop <= 100000, "I don't like your jokes" + + # if channel_indexes is None: + # nb_chan = 16 + # else: + # nb_chan = len(channel_indexes) + # raw_signals = np.zeros((i_stop - i_start, nb_chan), dtype='int16') + # return raw_signals def _spike_count(self, block_index, seg_index, unit_index): @@ -362,3 +414,22 @@ def _rescale_epoch_duration(self, raw_duration, dtype): # really easy here because in our case it is already seconds durations = raw_duration.astype(dtype) return durations + + def _get_sampling_rate(self, rec_dev): + gid = rec_dev.gid + data = np.asarray(self.reader[gid]) + + sampling_rate = np.unique(np.diff(np.sort(np.unique(data['f1'])))) * self.reader.resolution * 1e-3 + # TODO: Does the offset (data['f2']) play a role here? 
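+        # Hedged worked example: recording every 1 ms at a resolution of
+        # 0.1 ms yields steps [10, 20, 30, ...]; np.diff over the sorted unique
+        # steps gives {10}, and 10 * 0.1 * 1e-3 = 1e-3 s. Strictly this is the
+        # sampling *interval* in s; the sampling *rate* would be its inverse
+        # (here 1000 Hz).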
+ + # sanity check + assert len(sampling_rate)==1, 'Inconsistent sampling times of recording device {}'.format(gid) + + return sampling_rate # in s + + def _get_signal_unit(self, obs): + if obs==b'V_m': + return 'mV' + if obs in [b'I_syn_ex', b'I_syn_in']: + return 'pA' + raise ValueError('Unit can not be extracted from recordable name {}'.format(obs)) \ No newline at end of file From 207bc032526de4e28efd2f47fe2047ca9354ef11 Mon Sep 17 00:00:00 2001 From: Julia Sprenger Date: Mon, 23 Sep 2019 09:20:14 +0200 Subject: [PATCH 6/7] Rewrite RawIO mechanics --- neo/rawio/nest3rawio.py | 186 ++++++++++++++++++++++---------- neo/test/iotest/test_nest3io.py | 10 +- 2 files changed, 138 insertions(+), 58 deletions(-) diff --git a/neo/rawio/nest3rawio.py b/neo/rawio/nest3rawio.py index 6af14165e..d117dbff0 100644 --- a/neo/rawio/nest3rawio.py +++ b/neo/rawio/nest3rawio.py @@ -62,6 +62,8 @@ class Nest3RawIO(BaseRawIO): rawmode = 'one-file' _obs_colid_mapping = {} # {gid: column_id] + signal_recording_devices = [b'multimeter'] + spike_recording_devices = [b'spike_detector'] def __init__(self, filename=''): BaseRawIO.__init__(self) @@ -91,19 +93,35 @@ def _parse_header(self): seg_ann = {} # TODO: Create one Channel_Index per recording device. Add 'label' annotation (rec_dev.label) - + # TODO: Pre-sort data now already for faster time range selection later # loop through data unit_channels = [] sig_channels = [] + + # usefull to get local channel index in nsX from the global channel index + local_sig_indexes = [] + self._nids_per_rec_dev = {} + + # sorting data for faster access later + self._sorted_data = {} for rec_dev in self.reader: - neuron_ids = np.unique(np.array(self.reader[rec_dev.gid])['f0']) - for nid in neuron_ids: - - # spike data as units - if rec_dev.name == b'spike_detector': - unit_name = 'rd{}unit{}'.format(rec_dev.gid, nid) - unit_id = '{}#{}'.format(rec_dev.gid, nid) - wf_units = '' + gid = rec_dev.gid + original_data = np.asarray(self.reader[gid]) + sorting_order = np.lexsort((original_data['f0'],original_data['f1'])) + self._sorted_data[gid] = original_data[sorting_order,...] # primary sorting time, secondary sorting channels + + for rec_dev in self.reader: + gid = rec_dev.gid + data = self._sorted_data[gid] + + + # spike data as units + if rec_dev.name in self.spike_recording_devices: + neuron_ids = np.unique(data['f0']) + for nid in neuron_ids: + unit_name = 'rd{}unit{}'.format(gid, nid) + unit_id = '{}#{}'.format(gid, nid) + wf_units = '' # There are no waveforms recorded in this format. 
wf_gain = 0.0 wf_offset = 0.0 wf_left_sweep = 0 @@ -111,39 +129,47 @@ def _parse_header(self): unit_channels.append((unit_name, unit_id, wf_units, wf_gain, wf_offset, wf_left_sweep, wf_sampling_rate)) - # analog data as signals - elif rec_dev.name == b'multimeter': - gid = rec_dev.gid + # analog data as signals + elif rec_dev.name in self.signal_recording_devices: + samples_per_timestep = np.searchsorted(self._sorted_data['f0'], self._sorted_data['f0'][0], + side='right', sorter=None) + neuron_ids = self._sorted_data['f1'][:samples_per_timestep] + for nid in neuron_ids: self._obs_colid_mapping[gid] = {} sampling_rate = self._get_sampling_rate(rec_dev) # in s for cols, observables in zip(['f3', 'f4'], [rec_dev.double_observables, rec_dev.long_observables]): for col_id, obs in enumerate(observables): - ch_name = 'rd{}unit{}signal{}'.format(rec_dev.gid, nid, obs.decode()) + ch_name = 'rd{}unit{}signal{}'.format(gid, nid, obs.decode()) chan_id = nid #'{}#{}#{}'.format(rec_dev.gid, nid, obs.decode()) sr = sampling_rate - dtype = np.asarray(self.reader[gid])[cols].dtype # float if obs in rec_dev.double_observables else int # or + dtype = data[cols].dtype # float if obs in rec_dev.double_observables else int # or units = self._get_signal_unit(obs) gain = 1. offset = 0. - group_id = 0 # TODO: should this be recording device specific? + group_id = gid sig_channels.append((ch_name, chan_id, sr, dtype, units, gain, offset, group_id)) - self._obs_colid_mapping[gid][obs.decode()] = (cols, col_id) + # self._obs_colid_mapping[gid][obs.decode()] = (cols, col_id) - #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, - # i.rows, i.dtype, i.t_start, i.t_stop + local_sig_indexes.append((cols, col_id)) + self._nids_per_rec_dev[gid] = neuron_ids + self._local_sig_indexes = np.array(local_sig_indexes) + #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, + # i.rows, i.dtype, i.t_start, i.t_stop + # finalize header unit_channels = np.array(unit_channels, dtype=_unit_channel_dtype) - self.header['unit_channels'] = unit_channels - - # # signals and units are not global but specific to to the recording devices - self.header['signal_channels'] = np.array(sig_channels, dtype=_signal_channel_dtype) - # self.header['unit_channels'] = np.array([], dtype=_unit_channel_dtype) + event_channels = np.array([], dtype=_event_channel_dtype) + sig_channels = np.array(sig_channels, dtype=_signal_channel_dtype) - # # no events or epochs - self.header['event_channels'] = np.array([], dtype=_event_channel_dtype) + self.header = {} + self.header['nb_block'] = 1 + self.header['nb_segment'] = [1] + self.header['signal_channels'] = sig_channels + self.header['unit_channels'] = unit_channels + self.header['event_channels'] = event_channels # minimal annotations from BaseRawIO @@ -254,18 +280,19 @@ def _segment_t_stop(self, block_index, seg_index): def _get_signal_size(self, block_index, seg_index, channel_indexes=None): - # TODO - # - # we are lucky: signals in all segment have the same shape!! (10.0 seconds) - # it is not always the case - # this must return an int = the number of sample + # the channel_indexes belong to the same recording device (checked by baserawio) + # number of samples available in requested channels + rd_id, _ = self._get_gid_and_local_indexes(channel_indexes) - # Note that channel_indexes can be ignored for most cases - # except for several sampling rate. 
- return rows + # all channels for this recording device have the same number of samples + # the samples per channel are therefore the total samples / number of channels (nids) + return len(self._sorted_data[rd_id]) / self._nids_per_rec_dev[rd_id] def _get_signal_t_start(self, block_index, seg_index, channel_indexes): + + rd_id, local_ids = self._get_gid_and_local_indexes(channel_indexes) + # DONE # same as _segment_t_start # @@ -284,7 +311,8 @@ def _get_signal_t_start(self, block_index, seg_index, channel_indexes): def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, channel_indexes): - # TODO + # channel_indexes is checked by BaseRawIO to belong to a single group_id and characteristics + # this must return a signal chunk limited with # i_start/i_stop (can be None) # channel_indexes can be None (=all channel) or a list or numpy.array @@ -300,24 +328,52 @@ def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, chann # convertion to real units is done with self.header['signal_channels'] # TODO: This needs performance optimization - res = [] - for channel_index in channel_indexes: - rd_id, nid, signal = self.header['signal_channels'][channel_index][1].split('#') - rd_id, nid = int(rd_id), int(nid) - col, col_id = self._obs_colid_mapping[rd_id][signal] - data = np.asarray(self.reader[rd_id]) - idx = np.argwhere(data['f0'] == nid) - if i_start is None: - i_start = 0 - if i_stop is None: - i_stop = sum(idx) + rd_id, local_ids = self._get_gid_and_local_indexes(channel_indexes) + # local_ids = col, col_id + + # all signals have the same number of samples for a signal recording device + samples_per_nid = self._get_signal_size(block_index, seg_index, channel_indexes = [0]) + nids = self.header['signal_channels'][channel_indexes][:,1] + + if i_start is None: + i_start = 0 + if i_stop is None: + i_stop = samples_per_nid + + mask_per_time_step = np.where(self._nids_per_rec_dev[rd_id]==nids)[0] + nid_mask = np.repeat(mask_per_time_step, samples_per_nid) + time_mask = slice(i_start*samples_per_nid, i_stop*samples_per_nid) + mask = np.logical_and(nid_mask, time_mask) + + data = self._sorted_data[mask].reshape((samples_per_nid,len(nids))) + + return data + + # data = np.asarray(self.reader[rd_id]) # sorted by time, nid + # + # # Extract signal values of all selected nids + # + # + # for channel_index in channel_indexes: + # rd_id, nid, signal = self.header['signal_channels'][channel_index][1].split('#') + # rd_id, nid = int(rd_id), int(nid) + # + # + # + # + # idx = np.argwhere(data['f0'] == nid) - res.append(np.sort(data[idx])[i_start: i_stop][col][col_id]) + # if i_start is None: + # i_start = 0 + # if i_stop is None: + # i_stop = sum(idx) - return np.asarray(res) + # res.append(np.sort(data[idx])[i_start: i_stop][col][col_id]) + # + # return np.asarray(res) # assert i_start >= 0, "I don't like your jokes" @@ -336,8 +392,8 @@ def _spike_count(self, block_index, seg_index, unit_index): sd_id, nid = self.header['unit_channels'][unit_index][1].split('#') sd_id, nid = int(sd_id), int(nid) - assert self.reader[sd_id].name == b'spike_detector', \ - 'This unit was not recorded by a spike_detector!' + assert self.reader[sd_id].name in self.spike_recording_devices, \ + 'This unit was not recorded by a spike detector!' 
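+        # Hedged illustration of the counting below: unit_id was encoded as
+        # '<device_gid>#<neuron_id>' in _parse_header, so e.g. unit_id '12#4'
+        # selects device 12 and neuron 4, and with data['f0'] == [4, 7, 4, 4]
+        # the comparison against nid == 4 sums to 3 spikes.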
         data = np.asarray(self.reader[sd_id])
         return np.sum(data['f0'] == nid)
 
@@ -350,8 +406,8 @@ def _get_spike_timestamps(self, block_index, seg_index, unit_index, t_start, t_s
         sd_id, nid = self.header['unit_channels'][unit_index][1].split('#')
         sd_id, nid = int(sd_id), int(nid)
 
-        assert self.reader[sd_id].name == b'spike_detector', \
-            'This unit was not recorded by a spike_detector!'
+        assert self.reader[sd_id].name in self.spike_recording_devices, \
+            'This unit was not recorded by a spike detector!'
 
         data = np.asarray(self.reader[sd_id])
         idx = np.argwhere(data['f0'] == nid)
@@ -416,15 +472,16 @@ def _rescale_epoch_duration(self, raw_duration, dtype):
         return durations
 
     def _get_sampling_rate(self, rec_dev):
+
+        assert rec_dev.name in self.signal_recording_devices, \
+            'Recording device {} does not have a sampling rate'.format(rec_dev.name)
+
         gid = rec_dev.gid
-        data = np.asarray(self.reader[gid])
+        data = self._sorted_data[gid]
 
-        sampling_rate = np.unique(np.diff(np.sort(np.unique(data['f1'])))) * self.reader.resolution * 1e-3
+        samples_per_nid = len(data['f1']) / len(self._nids_per_rec_dev[gid])
+        sampling_rate = (data['f1'][-1] - data['f1'][0]) / (samples_per_nid - 1) * self.reader.resolution * 1e-3
         # TODO: Does the offset (data['f2']) play a role here?
 
-        # sanity check
-        assert len(sampling_rate)==1, 'Inconsistent sampling times of recording device {}'.format(gid)
-
         return sampling_rate # in s
 
     def _get_signal_unit(self, obs):
@@ -432,4 +489,19 @@ def _get_signal_unit(self, obs):
         return 'mV'
     if obs in [b'I_syn_ex', b'I_syn_in']:
         return 'pA'
-    raise ValueError('Unit can not be extracted from recordable name {}'.format(obs))
\ No newline at end of file
+    raise ValueError('Unit can not be extracted from recordable name {}'.format(obs))
+
+
+    # helper adapted from other RawIOs
+
+    def _get_gid_and_local_indexes(self, channel_indexes):
+        # internal helper: map global channel indexes to the recording-device gid
+        # and the local channel indexes within that device; when this is called,
+        # channel_indexes always belong to the same group_id (checked at BaseRawIO level)
+        if channel_indexes is None:
+            channel_indexes = slice(None)
+        gid = self.header['signal_channels'][channel_indexes]['group_id'][0]
+        local_indexes = self._local_sig_indexes[channel_indexes]
+        return gid, local_indexes
\ No newline at end of file
diff --git a/neo/test/iotest/test_nest3io.py b/neo/test/iotest/test_nest3io.py
index 176e688eb..4497c1d9c 100644
--- a/neo/test/iotest/test_nest3io.py
+++ b/neo/test/iotest/test_nest3io.py
@@ -18,7 +18,7 @@
 import numpy as np
 
 
-# This run standart tests, this is mandatory for all IO
+# This runs standard tests, which are mandatory for all IOs
 
 
 class TestExampleIO(BaseTestIO, unittest.TestCase):
@@ -30,6 +30,14 @@ class TestExampleIO(BaseTestIO, unittest.TestCase):
 
 
 class Specific_TestNest3IO(unittest.TestCase):
+
+    def test_dummy(self):
+        # smoke test against a local example file; the path is machine-specific
+        io = Nest3IO(filename='/home/julia/repositories/python/nestio_sionlib/output_event_time.sion')
+        bl = io.read_block()
+        print(bl.segments[0].spiketrains[10].times)
+        print(bl.segments[0].analogsignals)
+
+
     # def test_read_segment_lazy(self):
     #     r = ExampleIO(filename=None)
     #     seg = r.read_segment(lazy=True)
From 87b82f3d9e37d3756553b4521d8ce2bbd1d831e7 Mon Sep 17 00:00:00 2001
From: Julia Sprenger
Date: Wed, 25 Sep 2019 11:27:12 +0200
Subject: [PATCH 7/7] Structural rewrite

---
 neo/rawio/nest3rawio.py | 80 ++++++++++++++++++++++++++++++++++------
 1 file changed, 68 insertions(+), 12 deletions(-)

diff --git a/neo/rawio/nest3rawio.py
b/neo/rawio/nest3rawio.py index d117dbff0..93a4a5fe2 100644 --- a/neo/rawio/nest3rawio.py +++ b/neo/rawio/nest3rawio.py @@ -16,7 +16,14 @@ import numpy as np -import nestio # TODO from https://github.com/apeyser/nestio-tools (bring to setup.py, maybe change of name?) + +try: + import nestio # TODO from https://github.com/apeyser/nestio-tools (bring to setup.py, maybe change of name?) + HAVE_NESTIO = True +except ImportError: + HAVE_NESTIO = False + nestio = None + class Nest3RawIO(BaseRawIO): @@ -131,9 +138,10 @@ def _parse_header(self): # analog data as signals elif rec_dev.name in self.signal_recording_devices: - samples_per_timestep = np.searchsorted(self._sorted_data['f0'], self._sorted_data['f0'][0], - side='right', sorter=None) - neuron_ids = self._sorted_data['f1'][:samples_per_timestep] + samples_per_timestep = np.searchsorted(data['f1'], data['f1'][0], side='right', sorter=None) + neuron_ids = data['f0'][:samples_per_timestep] + self._nids_per_rec_dev[gid] = neuron_ids + for nid in neuron_ids: self._obs_colid_mapping[gid] = {} sampling_rate = self._get_sampling_rate(rec_dev) # in s @@ -153,7 +161,7 @@ def _parse_header(self): local_sig_indexes.append((cols, col_id)) - self._nids_per_rec_dev[gid] = neuron_ids + self._local_sig_indexes = np.array(local_sig_indexes) #i.gid, i.name, i.label, i.double_n_val, i.double_observables, i.long_n_val, i.long_observables, i.origin, @@ -286,7 +294,9 @@ def _get_signal_size(self, block_index, seg_index, channel_indexes=None): # all channels for this recording device have the same number of samples # the samples per channel are therefore the total samples / number of channels (nids) - return len(self._sorted_data[rd_id]) / self._nids_per_rec_dev[rd_id] + sig_size = len(self._sorted_data[rd_id]) / len(self._nids_per_rec_dev[rd_id]) + assert sig_size == int(sig_size), 'Error in signal size extraction' + return int(sig_size) def _get_signal_t_start(self, block_index, seg_index, channel_indexes): @@ -334,21 +344,67 @@ def _get_analogsignal_chunk(self, block_index, seg_index, i_start, i_stop, chann rd_id, local_ids = self._get_gid_and_local_indexes(channel_indexes) # local_ids = col, col_id + # checking for consistent col, as this defines the dtype of the signal + assert all(local_ids[:,0]==local_ids[0,0]), 'Attempting to load signals with different data types into single AnalogSignal' + datacolumn_id = local_ids[0,0] + # all signals have the same number of samples for a signal recording device - samples_per_nid = self._get_signal_size(block_index, seg_index, channel_indexes = [0]) - nids = self.header['signal_channels'][channel_indexes][:,1] + samples_per_nid = self._get_signal_size(block_index, seg_index, channel_indexes=[0]) + nids = self.header['signal_channels'][channel_indexes]['id'] if i_start is None: i_start = 0 if i_stop is None: i_stop = samples_per_nid - mask_per_time_step = np.where(self._nids_per_rec_dev[rd_id]==nids)[0] - nid_mask = np.repeat(mask_per_time_step, samples_per_nid) - time_mask = slice(i_start*samples_per_nid, i_stop*samples_per_nid) + # extracting all rows containing requested times and nids + # mask_per_time_step = np.in1d(self._nids_per_rec_dev[rd_id], nids) + # nid_mask = np.repeat(mask_per_time_step, samples_per_nid) + nid_mask = True + time_mask = np.zeros(self._sorted_data[rd_id].shape[0], dtype=bool) + time_mask[i_start*samples_per_nid: i_stop*samples_per_nid] = True mask = np.logical_and(nid_mask, time_mask) - data = self._sorted_data[mask].reshape((samples_per_nid,len(nids))) + # Extract relevant data packets + 
data = self._sorted_data[rd_id][mask]  # .reshape((samples_per_nid,len(nids)))  # (t, nid)
+
+        # unfolding the flat record structure using advanced indexing: nid -> channel_index
+        m = np.searchsorted(self._nids_per_rec_dev[rd_id], nids)  # this has len(channel_indexes)
+        n_steps = len(data) // len(self._nids_per_rec_dev[rd_id])  # number of recorded time steps
+        ma = np.array([m + i * len(self._nids_per_rec_dev[rd_id]) for i in range(n_steps)])
+        data_signals = data[datacolumn_id][ma]
+
+        return data_signals.reshape((samples_per_nid, len(channel_indexes)))
+
+
+        def get_local_signal(data, local_id):
+            col, col_id = local_id
+            return data[col][col_id]
+
+        vget_local = np.vectorize(get_local_signal)
+
+        data = vget_local(data, local_ids)
+        # Problem: indexing into an array with a named dtype is not compatible with advanced indexing.
+        # New approach: use a flattened representation of the original data and apply advanced indexing there.
+
+        # Update:
+        # signals will be separated for int and float dtype (as defined by the baserawio common characteristics check)
+
+        # Extract relevant data columns from packets
+        # note: nids can have more than one signal recorded per row, see col and col_id;
+        # this function should be vectorized
+        # for col, col_id in local_ids:
+        #     data[col][col_id]
         return data
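
--
Appendix: the lexsort-and-reshape idea behind PATCH 7's _get_analogsignal_chunk
can be illustrated in isolation. The following is a minimal, self-contained
sketch under stated assumptions -- toy records and hypothetical field names
('nid', 'step', 'val') stand in for the 'f0'/'f1'/value columns used by
nestio-tools; it is not part of the patch series.

    import numpy as np

    # toy multimeter records: 2 neurons (ids 3 and 7) x 3 time steps, unordered
    records = np.array(
        [(7, 20, 0.2), (3, 10, 1.1), (7, 10, 0.1),
         (3, 30, 3.3), (7, 30, 0.3), (3, 20, 2.2)],
        dtype=[('nid', 'i8'), ('step', 'i8'), ('val', 'f8')])

    # sort primarily by time step, secondarily by neuron id
    # (np.lexsort treats its *last* key as the primary one)
    order = np.lexsort((records['nid'], records['step']))
    srt = records[order]

    n_channels = np.unique(records['nid']).size   # 2 neurons -> 2 channels
    n_samples = records.size // n_channels        # 3 time steps

    # one row per time step, one column per neuron (ascending nid)
    signals = srt['val'].reshape(n_samples, n_channels)
    print(signals)
    # [[1.1 0.1]
    #  [2.2 0.2]
    #  [3.3 0.3]]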