%load_ext autoreload
%autoreload 2

import os
import expipe
import pathlib
import numpy as np
import septum_mec.analysis.data_processing as dp
from septum_mec.analysis.registration import store_notebook
import re
import joblib
import multiprocessing
import shutil
import psutil
import pandas as pd
import matplotlib.pyplot as plt
import quantities as pq
import exdir
from distutils.dir_util import copy_tree
from datetime import timedelta
from tqdm import tqdm_notebook as tqdm
from septum_mec.analysis.trackunitmulticomparison import TrackMultipleSessions
import networkx as nx
from nxpd import draw
%matplotlib inline

13:25:38 [I] klustakwik KlustaKwik2 version 0.2.6
/home/mikkel/.virtualenvs/expipe/lib/python3.6/importlib/_bootstrap.py:219: RuntimeWarning: numpy.ufunc size changed, may indicate binary incompatibility. Expected 192 from C header, got 216 from PyObject
  return f(*args, **kwds)
/home/mikkel/.virtualenvs/expipe/lib/python3.6/importlib/_bootstrap.py:219: RuntimeWarning: numpy.ufunc size changed, may indicate binary incompatibility. Expected 192 from C header, got 216 from PyObject
  return f(*args, **kwds)

project_path = dp.project_path()

project = expipe.get_project(project_path)
actions = project.actions

output = pathlib.Path('output/identify_neurons')
output.mkdir(parents=True, exist_ok=True)

identify_neurons = project.require_action('identify-neurons')

actions['1833-010719-2'].attributes

{'users': ['Mikkel Lepperød'],
 'tags': ['11hz', 'stim-ms', 'stim i', 'septum', 'open-ephys'],
 'datetime': '2019-07-01T12:54:49',
 'type': 'Recording',
 'registered': '2019-07-02T14:53:28',
 'data': {'main': 'main.exdir'},
 'location': 'IMB',
 'entities': ['1833']}

data_loader = dp.Data()

skip_actions = [
    '1849-270219-1', 
    '1849-260219-2', 
    '1834-250219-1',
    '1834-230219-1'
]

sessions = []
for action in actions.values():
    if action.id in skip_actions:
        continue
    if action.type != 'Recording':
        continue
    action_data_path = pathlib.Path(action.data_path('main'))
    processing = exdir.File(action_data_path)['processing']

    if not 'electrophysiology' in processing:
        continue
    elphys = processing['electrophysiology']
    if 'spikesorting' not in elphys:
        continue
    tags = [t.lower() for t in action.tags]
    
    freq = np.nan
    stimulated = False
    baseline = False
    is_i = False
    is_ii = False
    tag = None
    stim_location = None
    
    stim_times = data_loader.stim_times(action.id)
    if stim_times is not None:
        stimulated = True
        freq = round(1 / np.median(np.diff(stim_times)))
        
    
    
    tag_i = [i for i, t in enumerate(tags) if 'baseline ' in t or 'stim ' in t]
    if len(tag_i) == 1:
        tag = tags[tag_i[0]]
        what, how = tag.split(' ')
        if what == 'stim':
            where = [t for t in tags if 'stim-' in t]
            assert len(where) == 1
            stim_location = where[0].split('-')[-1]
            assert stimulated
        elif what == 'baseline':
            baseline = True
            assert not stimulated
        else:
            raise Exception(f'Found {tag}, what to do?')
        if how == 'i':
            is_i = True
        elif how == 'ii':
            is_ii = True
        else:
            raise Exception(f'Found {tag}, what to do?')
    elif len(tag_i) > 1:
        print(action.id, [tags[i] for i in tag_i])
        
    

    sessions.append({
        'tag': tag,
        'action': action.id,
        'stimulated': stimulated,
        'baseline': baseline,
        'i': is_i,
        'ii': is_ii,
        'frequency': float(freq),
        'session': int(action.id.split('-')[-1]),
        'stim_location': stim_location,
        'entity': int(action.entities[0]),

    })
sessions = pd.DataFrame(sessions)

sessions.query('stimulated and frequency!=30')

sessions.to_csv(output / 'sessions.csv', index=False)

all_non_identified_units = []
for action in sessions.action.values:
    for ch in range(8):
        for unit_name in data_loader.unit_names(action, ch):
            all_non_identified_units.append({
                'unit_name': unit_name, 
                'action': action, 
                'channel_group': ch
            })
all_non_identified_units = pd.DataFrame(all_non_identified_units)

all_non_identified_units.to_csv(output / 'all_non_identified_units.csv', index=False)

Identify unique neurons¶

# save graphs
for entity, values in sessions.groupby('entity'):
    data_path = output / f'{entity}-graphs'
    if data_path.exists():
        continue
    print('Processing', entity)
    unit_matching = TrackMultipleSessions(
        actions, values.action.values.tolist(), 
        progress_bar=tqdm, verbose=False, data_path=data_path
    )
    unit_matching.do_matching()
    unit_matching.make_graphs_from_matches()
    unit_matching.compute_time_delta_edges()
    unit_matching.compute_depth_delta_edges()
    # save graph with all dissimilarities for later use
    unit_matching.save_graphs()

Processing 1833

Processing 1834

Processing 1839

Processing 1849

Plot comparisons¶

unit_comp = TrackMultipleSessions(actions, data_path=f'output/identify_neurons/1833-graphs')

unit_comp.load_graphs()

max_dissimilarity = .05
max_depth_delta = 100

unit_comp.remove_edges_above_threshold('weight', max_dissimilarity)
unit_comp.remove_edges_above_threshold('depth_delta', max_depth_delta)

unit_comp.remove_edges_with_duplicate_actions()
unit_comp.identify_units()
unit_comp.plot_matches('template', chan_group=6, step_color=False)
plt.tight_layout()

Store uniqe unit ids to csv¶

max_dissimilarity = .05
max_depth_delta = 100
for entity in sessions.entity.values:
    unit_matching = TrackMultipleSessions(
        actions, list(sessions.query(f'entity=={entity}').action), 
        progress_bar=tqdm, verbose=False, data_path=output / f'{entity}-graphs'
    )
    unit_matching.load_graphs()
    # cutoff large dissimilarities
    unit_matching.remove_edges_above_threshold('weight', max_dissimilarity)
    unit_matching.remove_edges_above_threshold('depth_delta', max_depth_delta)
    unit_matching.remove_edges_with_duplicate_actions()
    unit_matching.identify_units()
    units = []
    for ch, group in unit_matching.identified_units.items():
        for unit_id, val in group.items():
            for action_id, orig_unit_ids in val['original_unit_ids'].items():
                units.extend([
                    {
                        'unit_name': name, 
                        'unit_id': unit_id, 
                        'action': action_id,
                        'channel_group': ch,
                        'max_dissimilarity': max_dissimilarity,
                        'max_depth_delta': max_depth_delta
                    } 
                    for name in orig_unit_ids])

    pd.DataFrame(units).to_csv(output / f'{entity}-units.csv', index=False)

unique_units = pd.concat([
    pd.read_csv(p) 
    for p in output.iterdir() 
    if p.name.endswith('units.csv')])

unique_units.to_csv(output / 'units.csv', index=False)

Store results in Expipe action¶

identify_neurons.data['sessions'] = 'sessions.csv'
identify_neurons.data['units'] = 'units.csv'

copy_tree(output, str(identify_neurons.data_path()))

store_notebook(
    identify_neurons, "00-identify-neurons.ipynb")

	action	baseline	entity	frequency	i	ii	session	stim_location	stimulated	tag
3	1839-060619-3	False	1839	11.0	True	False	3	ms	True	stim i
7	1849-110319-2	False	1849	11.0	True	False	2	ms	True	stim i
9	1834-220319-2	False	1834	11.0	True	False	2	ms	True	stim i
12	1834-120319-2	False	1834	11.0	True	False	2	ms	True	stim i
19	1833-260619-2	False	1833	11.0	True	False	2	ms	True	stim i
20	1849-010319-4	False	1849	11.0	True	False	4	mecr	True	stim i
23	1849-220319-3	False	1849	11.0	True	False	3	ms	True	stim i
28	1834-150319-2	False	1834	11.0	True	False	2	ms	True	stim i
30	1839-290519-2	False	1839	11.0	True	False	2	ms	True	stim i
37	1849-150319-2	False	1849	11.0	True	False	2	ms	True	stim i
38	1849-280219-2	False	1849	11.0	True	False	2	ms	True	stim i
44	1834-010319-3	False	1834	11.0	True	False	3	ms	True	stim i
45	1833-050619-2	False	1833	11.0	True	False	2	ms	True	stim i
47	1833-120619-2	False	1833	11.0	True	False	2	ms	True	stim i
50	1849-010319-5	False	1849	11.0	True	False	5	mecl	True	stim i
53	1834-060319-2	False	1834	11.0	True	False	2	ms	True	stim i
55	1834-110319-6	False	1834	11.0	True	False	6	mecr	True	stim i
57	1849-060319-2	False	1849	11.0	True	False	2	ms	True	stim i
61	1834-110319-2	False	1834	11.0	True	False	2	ms	True	stim i
62	1833-020719-2	False	1833	11.0	True	False	2	ms	True	stim i
66	1833-200619-2	False	1833	11.0	True	False	2	ms	True	stim i
75	1833-290519-2	False	1833	11.0	True	False	2	ms	True	stim i
77	1839-120619-2	False	1839	11.0	True	False	2	ms	True	stim i
82	1834-110319-5	False	1834	11.0	True	False	5	mecl	True	stim i
83	1839-200619-2	False	1839	11.0	True	False	2	ms	True	stim i
87	1833-010719-2	False	1833	11.0	True	False	2	ms	True	stim i