import os

import numpy as np
import pandas as pd
import xarray as xr

import matplotlib.pyplot as plt
%matplotlib inline

from allensdk.brain_observatory.ecephys.ecephys_project_cache import EcephysProjectCache


# Example cache directory path, it determines where downloaded data will be stored
data_directory = '/local1/ecephys_cache_dir/'

# The manifest file is looked up inside the cache directory
manifest_path = os.path.join(data_directory, "manifest.json")

# Build the project cache object from the manifest path
cache = EcephysProjectCache.from_warehouse(manifest=manifest_path)


# Table of sessions provided by the cache
sessions = cache.get_session_table()

# Number of sessions for each distinct full_genotype value
# (bare expression: shown as the cell output when run in a notebook)
sessions.full_genotype.value_counts()

wt/wt                                              30
Sst-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt      12
Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt     8
Vip-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt       8
Name: full_genotype, dtype: int64


# Keep the sessions whose full_genotype matches the pattern 'Pvalb'
# (pandas str.match anchors the pattern at the start of each string)
pvalb_sessions = sessions[sessions.full_genotype.str.match('Pvalb')]

# Bare expression: shown as the cell output when run in a notebook
pvalb_sessions


# Load the data for the third-from-last row of the Pvalb session table
session = cache.get_session_data(pvalb_sessions.index.values[-3])


# Table of optogenetic stimulation epochs for the loaded session
session.optogenetic_stimulation_epochs


# Columns used to tell one stimulus condition from another
columns = ['stimulus_name', 'duration','level']

# One row per unique (stimulus_name, duration, level) combination, sorted by
# those columns, with the per-epoch start/stop time columns removed
session.optogenetic_stimulation_epochs.drop_duplicates(columns).sort_values(by=columns).drop(columns=['start_time','stop_time'])


# Element-wise comparison of every session-table index value against 789848216.
# NOTE(review): why this particular id is used as the threshold is not stated
# in this file — confirm the intent before relying on it.
sessions.index.values >= 789848216

array([False, False, False, False, False, False, False, False, False,
       False, False, False, False, False, False, False, False, False,
       False, False, False, False, False, False, False, False, False,
       False, False, False, False, False, False, False, False, False,
       False, False, False, False,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True])


# Keep the stimulation epochs whose duration is strictly between 0.009 and 0.02.
# In the epoch table printed in this notebook the durations are 0.005, 0.010
# and 1.000, so this picks the 0.010 pulses.
trials = session.optogenetic_stimulation_epochs[(session.optogenetic_stimulation_epochs.duration > 0.009) & \
                                                (session.optogenetic_stimulation_epochs.duration < 0.02)]

# Keep the units whose structure acronym starts with 'VIS'
units = session.units[session.units.ecephys_structure_acronym.str.match('VIS')]

time_resolution = 0.0005 # 0.5 ms bins

# Bin start times relative to trial onset: from -0.01 up to (not including)
# 0.025 in steps of time_resolution
bin_edges = np.arange(-0.01, 0.025, time_resolution)

def optotagging_spike_counts(bin_edges, trials, units):
    """Count spikes per time bin around the onset of each trial.

    Spike times are read from the module-level ``session`` object
    (``session.spike_times[unit_id]``); ``session`` must therefore be bound
    to the session that ``trials`` and ``units`` were taken from before this
    function is called.

    Parameters
    ----------
    bin_edges : array-like of float
        Bin start times relative to trial onset. The bin width is taken as
        the mean spacing of this array, so the values are assumed to be
        evenly spaced.
    trials : table with a ``start_time`` column
        One row per trial; its index supplies the ``trial_id`` coordinate.
    units : table indexed by unit id
        Its index supplies the ``unit_id`` coordinate and the keys used to
        look up spike times.

    Returns
    -------
    xarray.DataArray
        Array named ``'spike_counts'`` with dims ``('trial_id',
        'time_relative_to_stimulus_onset', 'unit_id')`` and shape
        ``(len(trials), len(bin_edges), len(units))``. Entry ``[t, b, u]`` is
        the number of spikes of unit ``u`` that fell into bin ``b`` on trial
        ``t``. Only spikes strictly between ``bin_edges[0]`` and
        ``bin_edges[-1]`` (relative to onset) are considered, so the final
        time slot is normally left at zero.
    """
    time_resolution = np.mean(np.diff(bin_edges))

    spike_matrix = np.zeros((len(trials), len(bin_edges), len(units)))

    # Loop invariants: window limits relative to onset and the trial onsets
    window_start = bin_edges[0]
    window_stop = bin_edges[-1]
    trial_starts = trials.start_time.values

    for unit_idx, unit_id in enumerate(units.index.values):

        spike_times = session.spike_times[unit_id]

        for trial_idx, trial_start in enumerate(trial_starts):

            in_range = ((spike_times > (trial_start + window_start)) &
                        (spike_times < (trial_start + window_stop)))

            # Index of the bin each in-window spike falls into
            binned_times = ((spike_times[in_range] - (trial_start + window_start)) / time_resolution).astype('int')

            # Plain fancy-index assignment (or ``+=``) touches a repeated
            # index only once, which would collapse several spikes in one
            # bin into a single count. np.add.at is unbuffered and
            # accumulates every occurrence. The basic-index slice is a view,
            # so the update lands in spike_matrix itself.
            np.add.at(spike_matrix[trial_idx, :, unit_idx], binned_times, 1)

    return xr.DataArray(
        name='spike_counts',
        data=spike_matrix,
        coords={
            'trial_id': trials.index.values,
            'time_relative_to_stimulus_onset': bin_edges,
            'unit_id': units.index.values
        },
        dims=['trial_id', 'time_relative_to_stimulus_onset', 'unit_id']
    )

# Trial x time-bin x unit array for the trials and units selected above
da = optotagging_spike_counts(bin_edges, trials, units)


def plot_optotagging_response(da):
    """Plot the trial-averaged firing rate of every unit as a heat map.

    The time axis, bin width and unit count are all taken from ``da`` itself
    rather than from module-level variables, so the figure stays correct even
    if the notebook's ``bin_edges`` / ``units`` / ``time_resolution`` have
    been rebound since ``da`` was computed.

    Parameters
    ----------
    da : xarray.DataArray
        Array with dims ``('trial_id', 'time_relative_to_stimulus_onset',
        'unit_id')``, such as the one returned by
        ``optotagging_spike_counts``.
    """
    time_coords = da.time_relative_to_stimulus_onset.values
    # Bin width, used to turn per-bin averages into rates
    bin_width = np.mean(np.diff(time_coords))
    n_units = da.sizes['unit_id']

    plt.figure(figsize=(5,10))

    # Average over trials, then transpose so that units run along the rows
    plt.imshow(da.mean(dim='trial_id').T / bin_width,
               extent=[np.min(time_coords), np.max(time_coords),
                       0, n_units],
               aspect='auto', vmin=0, vmax=200)

    # White dotted vertical guides at 0.0005 and 0.0095 on the time axis
    for bound in [0.0005, 0.0095]:
        plt.plot([bound, bound],[0, n_units], ':', color='white', linewidth=1.0)

    plt.xlabel('Time (s)')
    plt.ylabel('Unit #')

    cb = plt.colorbar(fraction=0.046, pad=0.04)
    cb.set_label('Mean firing rate (Hz)')
    
# Heat map of the trial-averaged response for the Pvalb session loaded above
plot_optotagging_response(da)


# Label-based slices in xarray include both end points, and the time
# coordinates come from a floating-point np.arange, so the number of bins a
# window picks up can differ by one from the nominal 0.008. Convert counts to
# rates using the duration of the bins that were actually selected.
bin_width = np.mean(np.diff(da.time_relative_to_stimulus_onset.values))

# Window before stimulus onset
baseline = da.sel(time_relative_to_stimulus_onset=slice(-0.01,-0.002))

baseline_duration = baseline.sizes['time_relative_to_stimulus_onset'] * bin_width

# Per-unit rate: sum over the window's bins, average over trials, divide by window length
baseline_rate = baseline.sum(dim='time_relative_to_stimulus_onset').mean(dim='trial_id') / baseline_duration

# Window after stimulus onset
evoked = da.sel(time_relative_to_stimulus_onset=slice(0.001,0.009))

evoked_duration = evoked.sizes['time_relative_to_stimulus_onset'] * bin_width

evoked_rate = evoked.sum(dim='time_relative_to_stimulus_onset').mean(dim='trial_id') / evoked_duration


plt.figure(figsize=(5,5))

# One point per unit: baseline rate on x, evoked rate on y
plt.scatter(baseline_rate, evoked_rate, s=3)

axis_limit = 250
# Black dotted line: evoked rate equal to baseline rate
plt.plot([0,axis_limit],[0,axis_limit], ':k')
# Red dotted line: evoked rate equal to twice the baseline rate
plt.plot([0,axis_limit],[0,axis_limit*2], ':r')
plt.xlim([0,axis_limit])
plt.ylim([0,axis_limit])

plt.xlabel('Baseline rate (Hz)')
# Assigning to _ keeps the returned label object out of the cell output
_ = plt.ylabel('Evoked rate (Hz)')


# Ids of the units whose evoked rate exceeds twice (baseline rate + 1)
cre_pos_units = da.unit_id[(evoked_rate / (baseline_rate + 1)) > 2].values # add 1 to prevent divide-by-zero errors

# Bare expression: shown as the cell output when run in a notebook
cre_pos_units

array([951131472, 951131470, 951131486, 951131478, 951131522, 951131506,
       951131782, 951131534, 951131558, 951131556, 951131564, 951131560,
       951131581, 951131589, 951131583, 951131593, 951131612, 951131643,
       951131689, 951132054, 951132138, 951132140, 951132159, 951132184,
       951132212, 951132205, 951132224, 951132236, 951133681, 951133822,
       951133909, 951134030, 951134026, 951134066, 951134100, 951134199,
       951136071, 951136175, 951136247, 951136394, 951136657, 951136717,
       951136829, 951137028, 951137073, 951137204, 951140485, 951140617,
       951141942, 951140861, 951140832, 951140821, 951141065, 951141978,
       951141097, 951141154, 951141292, 951141373, 951141485, 951141536])


plt.figure(figsize=(5,5))

# Overlay the mean waveform of every selected unit, taken on that unit's peak channel
for unit_id in cre_pos_units:
    
    peak_channel = session.units.loc[unit_id].peak_channel_id
    wv = session.mean_waveforms[unit_id].sel(channel_id = peak_channel)
    
    # Time is scaled by 1000 to match the 'Time (ms)' axis label
    # (assumes wv.time is in seconds — TODO confirm)
    plt.plot(wv.time * 1000, wv, 'k', alpha=0.3)

plt.xlabel('Time (ms)')
plt.ylabel('Amplitude (microvolts)')
# Cyan dotted vertical reference line at x = 1.0, spanning y = -160 to 100
_ =plt.plot([1.0, 1.0],[-160, 100],':c')


# Keep the sessions whose full_genotype matches the pattern 'Sst'
# (pandas str.match anchors the pattern at the start of each string)
sst_sessions = sessions[sessions.full_genotype.str.match('Sst')]

# Load the last row of the Sst session table; this rebinds `session`, which
# optotagging_spike_counts reads as a module-level name
session = cache.get_session_data(sst_sessions.index.values[-1])


# Keep the stimulation epochs whose duration is strictly between 0.009 and 0.02
trials = session.optogenetic_stimulation_epochs[(session.optogenetic_stimulation_epochs.duration > 0.009) & \
                                                (session.optogenetic_stimulation_epochs.duration < 0.02)]

# Keep the units whose structure acronym starts with 'VIS'
units = session.units[session.units.ecephys_structure_acronym.str.match('VIS')]

# Same binning as before: -0.01 up to (not including) 0.025 in steps of 0.0005
bin_edges = np.arange(-0.01, 0.025, 0.0005)

da = optotagging_spike_counts(bin_edges, trials, units)


plot_optotagging_response(da)


# Label-based slices in xarray include both end points, and the time
# coordinates come from a floating-point np.arange, so the number of bins a
# window picks up can differ by one from the nominal 0.008. Convert counts to
# rates using the duration of the bins that were actually selected.
bin_width = np.mean(np.diff(da.time_relative_to_stimulus_onset.values))

# Window before stimulus onset
baseline = da.sel(time_relative_to_stimulus_onset=slice(-0.01,-0.002))

baseline_duration = baseline.sizes['time_relative_to_stimulus_onset'] * bin_width

# Per-unit rate: sum over the window's bins, average over trials, divide by window length
baseline_rate = baseline.sum(dim='time_relative_to_stimulus_onset').mean(dim='trial_id') / baseline_duration

# Window after stimulus onset
evoked = da.sel(time_relative_to_stimulus_onset=slice(0.001,0.009))

evoked_duration = evoked.sizes['time_relative_to_stimulus_onset'] * bin_width

evoked_rate = evoked.sum(dim='time_relative_to_stimulus_onset').mean(dim='trial_id') / evoked_duration


plt.figure(figsize=(5,5))

# One point per unit: baseline rate on x, evoked rate on y
plt.scatter(baseline_rate, evoked_rate, s=3)

axis_limit = 175
# Black dotted line: evoked rate equal to baseline rate
plt.plot([0,axis_limit],[0,axis_limit], ':k')
# Red dotted line: evoked rate equal to twice the baseline rate
plt.plot([0,axis_limit],[0,axis_limit*2], ':r')
plt.xlim([0,axis_limit])
plt.ylim([0,axis_limit])

plt.xlabel('Baseline rate (Hz)')
# Assigning to _ keeps the returned label object out of the cell output
_ = plt.ylabel('Evoked rate (Hz)')


# Ids of the units whose evoked rate exceeds twice (baseline rate + 1);
# the + 1 keeps the denominator away from zero
cre_pos_units = da.unit_id[(evoked_rate / (baseline_rate + 1)) > 2].values

plt.figure(figsize=(5,5))

# Overlay the mean waveform of every selected unit, taken on that unit's peak channel
for unit_id in cre_pos_units:
    
    peak_channel = session.units.loc[unit_id].peak_channel_id
    wv = session.mean_waveforms[unit_id].sel(channel_id = peak_channel)
    
    # Time is scaled by 1000 to match the 'Time (ms)' axis label
    # (assumes wv.time is in seconds — TODO confirm)
    plt.plot(wv.time * 1000, wv, 'k', alpha=0.3)

plt.xlabel('Time (ms)')
plt.ylabel('Amplitude (microvolts)')
# Cyan dotted vertical reference line at x = 1.0, spanning y = -160 to 100
_ =plt.plot([1.0, 1.0],[-160, 100],':c')


# Keep the sessions whose full_genotype matches the pattern 'Vip'
# (pandas str.match anchors the pattern at the start of each string)
vip_sessions = sessions[sessions.full_genotype.str.match('Vip')]

# Load the last row of the Vip session table; this rebinds `session`, which
# optotagging_spike_counts reads as a module-level name
session = cache.get_session_data(vip_sessions.index.values[-1])


# Keep the stimulation epochs whose duration is strictly between 0.009 and 0.02
trials = session.optogenetic_stimulation_epochs[(session.optogenetic_stimulation_epochs.duration > 0.009) & \
                                                (session.optogenetic_stimulation_epochs.duration < 0.02)]

# Keep the units whose structure acronym starts with 'VIS'
units = session.units[session.units.ecephys_structure_acronym.str.match('VIS')]

# Same binning as before: -0.01 up to (not including) 0.025 in steps of 0.0005
bin_edges = np.arange(-0.01, 0.025, 0.0005)

da = optotagging_spike_counts(bin_edges, trials, units)


plot_optotagging_response(da)

	published_at	specimen_id	session_type	age_in_days	sex	full_genotype	unit_count	channel_count	probe_count	ecephys_structure_acronyms
id
721123822	2019-10-03T00:00:00Z	707296982	brain_observatory_1.1	125.0	M	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	444	2229	6	[MB, SCig, PPT, NOT, DG, CA1, VISam, nan, LP, ...
746083955	2019-10-03T00:00:00Z	726170935	brain_observatory_1.1	98.0	F	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	582	2216	6	[VPM, TH, LGd, CA3, CA2, CA1, VISal, nan, grey...
760345702	2019-10-03T00:00:00Z	739783171	brain_observatory_1.1	103.0	M	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	501	1862	5	[MB, TH, PP, PIL, DG, CA3, CA1, VISal, nan, gr...
773418906	2019-10-03T00:00:00Z	757329624	brain_observatory_1.1	124.0	F	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	546	2232	6	[PPT, NOT, SUB, ProS, CA1, VISam, nan, APN, DG...
797828357	2019-10-03T00:00:00Z	776061251	brain_observatory_1.1	107.0	M	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	611	2232	6	[PPT, MB, APN, NOT, HPF, ProS, CA1, VISam, nan...
829720705	2019-10-03T00:00:00Z	811322619	functional_connectivity	112.0	M	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	529	1841	5	[SCig, SCop, SCsg, SCzo, POST, VISp, nan, CA1,...
839557629	2019-10-03T00:00:00Z	821469666	functional_connectivity	115.0	M	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	450	1853	5	[APN, NOT, MB, DG, CA1, VISam, nan, VISpm, LGd...
840012044	2019-10-03T00:00:00Z	820866121	functional_connectivity	116.0	M	Pvalb-IRES-Cre/wt;Ai32(RCL-ChR2(H134R)_EYFP)/wt	758	2298	6	[APN, DG, CA1, VISam, nan, LP, VISpm, VISp, LG...

	start_time	condition	level	stop_time	stimulus_name	duration
id
0	9208.46044	a single square pulse	2.0	9208.46544	pulse	0.005
1	9210.64062	a single square pulse	1.7	9210.65062	pulse	0.010
2	9212.37064	2.5 ms pulses at 10 Hz	1.7	9213.37064	fast_pulses	1.000
3	9214.40076	2.5 ms pulses at 10 Hz	1.3	9215.40076	fast_pulses	1.000
4	9216.55091	2.5 ms pulses at 10 Hz	2.0	9217.55091	fast_pulses	1.000
...	...	...	...	...	...	...
295	9778.77516	2.5 ms pulses at 10 Hz	2.0	9779.77516	fast_pulses	1.000
296	9780.72530	half-period of a cosine wave	2.0	9781.72530	raised_cosine	1.000
297	9782.66528	a single square pulse	1.3	9782.67028	pulse	0.005
298	9784.81538	a single square pulse	1.3	9784.82038	pulse	0.005
299	9786.60547	a single square pulse	1.3	9786.61547	pulse	0.010

	condition	level	stimulus_name	duration
id
3	2.5 ms pulses at 10 Hz	1.3	fast_pulses	1.000
2	2.5 ms pulses at 10 Hz	1.7	fast_pulses	1.000
4	2.5 ms pulses at 10 Hz	2.0	fast_pulses	1.000
17	a single square pulse	1.3	pulse	0.005
7	a single square pulse	1.7	pulse	0.005
0	a single square pulse	2.0	pulse	0.005
13	a single square pulse	1.3	pulse	0.010
1	a single square pulse	1.7	pulse	0.010
8	a single square pulse	2.0	pulse	0.010
5	half-period of a cosine wave	1.3	raised_cosine	1.000
14	half-period of a cosine wave	1.7	raised_cosine	1.000
6	half-period of a cosine wave	2.0	raised_cosine	1.000

Optotagging Analysis

Tutorial overview

Finding datasets of interest

Types of optotagging stimuli

Aligning spikes to light pulses

Identifying Cre+ units

Differences across genotypes