-
Notifications
You must be signed in to change notification settings - Fork 34
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #33 from Julie-Fabre/bleeding_edge
Handle duplicate spikes + a better back-compatibility management system
- Loading branch information
Showing
14 changed files
with
339 additions
and
527 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
function param = bc_qualityParamValues_JF(ephysMetaDir, rawFile, ephysKilosortPath, gain_to_uV) | ||
|
||
param = bc_qualityParamValues(ephysMetaDir, rawFile, ephysKilosortPath, gain_to_uV); | ||
param.removeDuplicateSpikes = 0; | ||
|
||
end |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,34 @@ | ||
function [data, missingFields] = bc_addMissingFieldsWithDefault(data, defaultValues) | ||
% JF, Check input structure has all necessary fields + add them with | ||
% defualt values if not. | ||
% ------ | ||
% Inputs | ||
% ------ | ||
if ~isstruct(data) && ~istable(data) | ||
error('Input must be a structure or table'); | ||
end | ||
|
||
if ~isstruct(defaultValues) | ||
error('Default values must be provided as a structure'); | ||
end | ||
|
||
fieldnames = fields(defaultValues); | ||
|
||
if isstruct(data) | ||
missingFields = fieldnames(~isfield(data, fieldnames)); | ||
|
||
for i = 1:length(missingFields) | ||
fieldName = missingFields{i}; | ||
data.(fieldName) = defaultValues.(fieldName); | ||
end | ||
else % data is a table | ||
existingFields = data.Properties.VariableNames; | ||
missingFields = setdiff(fieldnames, existingFields); | ||
|
||
for i = 1:length(missingFields) | ||
fieldName = missingFields{i}; | ||
data.(fieldName) = repmat(defaultValues.(fieldName), height(data), 1); | ||
end | ||
end | ||
end | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,41 @@ | ||
function param_complete = bc_checkParameterFields(param) | ||
% JF, Check input structure has all necessary fields + add them with | ||
% defualt values if not. This is to ensure backcompatibility when any new | ||
% paramaters are introduced. By default, any parameters not already present | ||
% will be set so that the quality metrics are calculated in the same way as | ||
% they were before these new parameters were introduced. | ||
% ------ | ||
% Inputs | ||
% ------ | ||
|
||
|
||
|
||
%% Default values for fields | ||
% duplicate spikes | ||
defaultValues.removeDuplicateSpikes = 0; | ||
defaultValues.duplicateSpikeWindow_s = 0.0001; | ||
defaultValues.saveSpikes_withoutDuplicates = 1; | ||
defaultValues.recomputeDuplicateSpikes = 0; | ||
|
||
% raw waveforms | ||
defaultValues.detrendWaveforms = 0; | ||
defaultValues.extractRaw = 1; | ||
|
||
% amplitude | ||
defaultValues.gain_to_uV = NaN; | ||
|
||
% phy saving | ||
defaultValues.saveAsTSV = 0; | ||
defaultValues.unitType_for_phy = 0; | ||
|
||
|
||
%% Check for missing fields and add them with default value | ||
[param_complete, missingFields] = bc_addMissingFieldsWithDefault(param, defaultValues); | ||
|
||
%% Display result | ||
if ~isempty(missingFields) | ||
disp('Missing param fields filled in with default values'); | ||
disp(missingFields); | ||
end | ||
|
||
end |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,160 @@ | ||
function [nonEmptyUnits, duplicateSpikes_idx, spikeTimes_samples, spikeTemplates, templateAmplitudes, ... | ||
pcFeatures, rawWaveformsFull, rawWaveformsPeakChan, signalToNoiseRatio, maxChannels] = ... | ||
bc_removeDuplicateSpikes(spikeTimes_samples, spikeTemplates, templateAmplitudes, ... | ||
pcFeatures, rawWaveformsFull, rawWaveformsPeakChan, signalToNoiseRatio, ... | ||
maxChannels, removeDuplicateSpikes_flag, ... | ||
duplicateSpikeWindow_s, ephys_sample_rate, saveSpikes_withoutDuplicates_flag, savePath, recompute) | ||
% JF, Remove any duplicate spikes | ||
% Some spike sorters (including kilosort) can sometimes count spikes twice | ||
% if for instance the residuals are re-fitted. see https://github.com/MouseLand/Kilosort/issues/29 | ||
% ------ | ||
% Inputs | ||
% ------ | ||
% | ||
% ------ | ||
% Outputs | ||
% ------ | ||
% | ||
|
||
if removeDuplicateSpikes_flag | ||
% Check if we need to extract duplicate spikes | ||
if recompute || isempty(dir([savePath, filesep, 'spikes._bc_duplicateSpikes.npy'])) | ||
% Parameters | ||
duplicateSpikeWindow_samples = duplicateSpikeWindow_s * ephys_sample_rate; | ||
batch_size = 10000; | ||
overlap_size = 100; | ||
numSpikes_full = length(spikeTimes_samples); | ||
|
||
% initialize and re-allocate | ||
duplicateSpikes_idx = false(1, numSpikes_full); | ||
|
||
% Rename the spike templates according to the remaining templates | ||
good_templates_idx = unique(spikeTemplates); | ||
new_spike_idx = nan(max(spikeTemplates), 1); | ||
new_spike_idx(good_templates_idx) = 1:length(good_templates_idx); | ||
spikeTemplates_flat = new_spike_idx(spikeTemplates); | ||
|
||
% check for duplicate spikes in batches | ||
for start_idx = 1:batch_size - overlap_size:numSpikes_full | ||
end_idx = min(start_idx+batch_size-1, numSpikes_full); | ||
batch_spikeTimes_samples = spikeTimes_samples(start_idx:end_idx); | ||
batch_spikeTemplates = spikeTemplates(start_idx:end_idx); | ||
batch_templateAmplitudes = templateAmplitudes(start_idx:end_idx); | ||
|
||
[~, ~, batch_removeIdx] = removeDuplicates(batch_spikeTimes_samples, ... | ||
batch_spikeTemplates, batch_templateAmplitudes, duplicateSpikeWindow_samples, ... | ||
maxChannels, spikeTemplates_flat); | ||
|
||
duplicateSpikes_idx(start_idx:end_idx) = batch_removeIdx; | ||
|
||
if end_idx == numSpikes_full | ||
break; | ||
end | ||
end | ||
% save data if required | ||
if saveSpikes_withoutDuplicates_flag | ||
writeNPY(duplicateSpikes_idx, [savePath, filesep, 'spikes._bc_duplicateSpikes.npy']) | ||
end | ||
|
||
else | ||
duplicateSpikes_idx = readNPY([savePath, filesep, 'spikes._bc_duplicateSpikes.npy']); | ||
end | ||
|
||
% check if there are any empty units | ||
unique_templates = unique(spikeTemplates); | ||
nonEmptyUnits = unique(spikeTemplates(~duplicateSpikes_idx)); | ||
emptyUnits_idx = ~ismember(unique_templates, nonEmptyUnits); | ||
|
||
% remove any empty units from ephys data | ||
spikeTimes_samples = spikeTimes_samples(~duplicateSpikes_idx); | ||
spikeTemplates = spikeTemplates(~duplicateSpikes_idx); | ||
templateAmplitudes = templateAmplitudes(~duplicateSpikes_idx); | ||
if ~isempty(pcFeatures) | ||
pcFeatures = pcFeatures(~duplicateSpikes_idx, :, :); | ||
end | ||
if ~isempty(rawWaveformsFull) | ||
rawWaveformsFull = rawWaveformsFull(~emptyUnits_idx, :, :); | ||
rawWaveformsPeakChan = rawWaveformsPeakChan(~emptyUnits_idx); | ||
end | ||
|
||
if ~isempty(signalToNoiseRatio) | ||
signalToNoiseRatio = signalToNoiseRatio(~emptyUnits_idx); | ||
end | ||
|
||
fprintf('\n Removed %.0f spike duplicates out of %.0f. \n', sum(duplicateSpikes_idx), length(duplicateSpikes_idx)) | ||
|
||
else | ||
nonEmptyUnits = unique(spikeTemplates); | ||
duplicateSpikes_idx = zeros(size(spikeTimes_samples, 1), 1); | ||
|
||
end | ||
|
||
|
||
function [spikeTimes_samples, spikeTemplates, removeIdx] = removeDuplicates(spikeTimes_samples, ... | ||
spikeTemplates, templateAmplitudes, duplicateSpikeWindow_samples, maxChannels, spikeTemplates_flat) | ||
numSpikes = length(spikeTimes_samples); | ||
removeIdx = false(1, numSpikes); | ||
|
||
% Intra-unit duplicate removal | ||
for iSpike1 = 1:numSpikes | ||
if removeIdx(iSpike1) | ||
continue; | ||
end | ||
|
||
for iSpike2 = iSpike1 + 1:numSpikes | ||
if removeIdx(iSpike2) | ||
continue; | ||
end | ||
if maxChannels(spikeTemplates_flat(iSpike2)) ~= maxChannels(spikeTemplates_flat(iSpike1)) % spikes are not on same channel | ||
continue; | ||
end | ||
|
||
if spikeTemplates(iSpike1) == spikeTemplates(iSpike2) | ||
if abs(spikeTimes_samples(iSpike1)-spikeTimes_samples(iSpike2)) <= duplicateSpikeWindow_samples | ||
if templateAmplitudes(iSpike1) < templateAmplitudes(iSpike2) | ||
spikeTimes_samples(iSpike1) = NaN; | ||
removeIdx(iSpike1) = true; | ||
break; | ||
else | ||
spikeTimes_samples(iSpike2) = NaN; | ||
removeIdx(iSpike2) = true; | ||
end | ||
end | ||
end | ||
end | ||
end | ||
|
||
|
||
% Inter-unit duplicate removal | ||
unitSpikeCounts = accumarray(spikeTemplates, 1); | ||
for iSpike1 = 1:length(spikeTimes_samples) | ||
if removeIdx(iSpike1) | ||
continue; | ||
end | ||
|
||
for iSpike2 = iSpike1 + 1:length(spikeTimes_samples) | ||
if removeIdx(iSpike2) | ||
continue; | ||
end | ||
if maxChannels(spikeTemplates_flat(iSpike2)) ~= maxChannels(spikeTemplates_flat(iSpike1)) % spikes are not on same channel | ||
continue; | ||
end | ||
|
||
if spikeTemplates(iSpike1) ~= spikeTemplates(iSpike2) | ||
if abs(spikeTimes_samples(iSpike1)-spikeTimes_samples(iSpike2)) <= duplicateSpikeWindow_samples | ||
if unitSpikeCounts(spikeTemplates(iSpike1)) < unitSpikeCounts(spikeTemplates(iSpike2)) | ||
spikeTimes_samples(iSpike1) = NaN; | ||
removeIdx(iSpike1) = true; | ||
break; | ||
else | ||
spikeTimes_samples(iSpike2) = NaN; | ||
removeIdx(iSpike2) = true; | ||
end | ||
end | ||
end | ||
end | ||
end | ||
end | ||
|
||
|
||
end |
Oops, something went wrong.