-
Notifications
You must be signed in to change notification settings - Fork 1
/
crossgen_matrix_subsample_prep2prep_djm.m~
executable file
·226 lines (183 loc) · 9.71 KB
/
crossgen_matrix_subsample_prep2prep_djm.m~
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
%% Cross-validation matrix of preparatory attention. Done separately within each ROI
% written by Tanya Wen
% 2019/01/23
dbstop if error
% addpath(genpath('/imaging/tw05'))
addpath('/imaging/tw05/Preparatory_Attention_Study/Version3-FullExp')
addpath('/imaging/local/software/spm_cbu_svn/releases/spm12_latest/')
%addpath(genpath('/imaging/local/software/spm_toolbox/eeglab13_4_3b'))
% if ~strcmp('EEG',spm_get_defaults('modality'))
spm('defaults', 'eeg');
% end
tempdir='/imaging/dm01/temp/'; % djm, temp location for me to write to
% required software: libSVM & RSAtoolbox
workingdir = '/imaging/tw05/Preparatory_Attention_Study/Version3-FullExp';
addpath(genpath(fullfile('/imaging/tw05/Preparatory_Attention_Study/','software','rsatoolbox')));
addpath(fullfile('/imaging/tw05/Preparatory_Attention_Study/','software','libsvm-mat-2.87-1'));
% control variables
libSVMsettings='-s 1 -t 0'; % nu-SVM, linear
nRandomisations=1000;
nfolds = 5;
nsubsample = 100;
% rmpath('/hpc-software/matlab/r2014a/toolbox/bioinfo/biolearning/'); % to make sure libSVM code is used (not strictly necessary: matlab svmtrain yields exactly same model)
% Define SUBJECT INFORMATION
subs = [1,2,3,4,5,6,7,8,9,10,11,13,15,16,17,18,19,20]; % subject numbers
subjects_dirs = {'meg16_0317/161107','meg16_0319/161110','meg16_0321/161111','meg16_0322/161114','meg16_0325/161115','meg16_0327/161117','meg16_0330/161121','meg16_0332/161122','meg16_0333/161124','meg16_0337/161128','meg16_0339/161129','meg16_0340/161129','meg16_0341/161201','meg16_0343/161202','meg16_0345/161206','meg16_0346/161206','meg16_0348/161208','meg16_0349/161208','meg16_0350/161212','meg16_0352/161213'};
subjnum = [1,2,3,4,5,6,1,2,3,4,5,6,1,2,3,4,5,6,6,2]; % counterbalancing numbers
min_trials_mvpa = [88,98,87,98,67,67,91,89,56,82,59,0,66,0,90,84,45,68,97,93];
%% parallelize
nw=128;
scheduler=cbu_scheduler();
scheduler.SubmitArguments='-q compute -l mem=270gb -l walltime=460800';
if isempty(gcp('nocreate')) || ~exist('pool','var') || pool.NumWorkers ~= nw,
if ~isempty(gcp('nocreate'))
delete(gcp('nocreate'))
end
scheduler.NumWorkers=nw;
pool=parpool(scheduler,nw);
end
%%%%%%% djm, moved first bit of ROI loop outside subject loop
roi_folder = '/imaging/tw05/Preparatory_Attention_Study/Version3-FullExp/ROIs';
roi_list = {'Auditory_Te3.nii','Visual_hOc1.nii','LPFC.nii'};
roinames=roi_list;
roinames = strrep(roinames, '_', '-');
roinames = strrep(roinames, '.nii', '');
coords=cell(1,numel(roi_list));
for rois = 1:numel(roi_list)
Vroi = spm_vol(fullfile(roi_folder,roi_list{rois}));
[Y, XYZ]=spm_read_vols(Vroi);
coords{rois} = XYZ(:,Y>0)';
end
%%%%%%%%
for sub = [1,2,3,4,5,6,7,8,9,10,11,13,15,16,17,18,19,20]
tic
fprintf('\nLoading data from subject %d...',sub)
% go to subject directory
cd(workingdir)
swd = sprintf('sub%02d/%s',sub,subjects_dirs{sub}); % subject working directory
cd(swd)
%% attentional template
% load data
D = spm_eeg_load('caefMspm12_attention_task_block1_raw.mat');
val = 1; %inversion method = MMN
%vertex = D.inv{val}.mesh.tess_mni.vert(D.inv{val}.inverse.Is, :); % find existing vertices
%% define labels
% define subject specific pairings
allperms = perms([1 2 3]);
for i = 1:length(allperms)
if rem(subjnum(sub),6)+1 == i
choosetargets = allperms(i,:);
end
end
fprintf('Took %.1f minutes.',toc/60);
for rois = 1:numel(roi_list)
tic
fprintf('\nExtracting data from ROI %d of subject %d...',rois,sub)
% extract voxel x time x trials matrix of ROI
D.val=val;
D.inv{val}.source.XYZ = coords{rois};
D.inv{val}.source.rad = 0;
D.inv{val}.source.label= roinames(rois);
D.inv{val}.source.fname = strcat(roinames{rois},'_attn1');
D.inv{val}.source.type = 'trials';
try
Dattn=spm_eeg_inv_extract_tw(D); % return header to avoid needing to reload
catch
D.inv{val}.source.fname = fullfile(tempdir,D.inv{val}.source.fname); % djm, in case don't have write permission to original directory
Dattn=spm_eeg_inv_extract_tw(D);
end
data3D = single(Dattn.fttimelock.trial);
cond_values = Dattn.fttimelock.trialinfo;
% define cue1 & cue2 index vectors
cues=cell(1,2);
for i=1:2
cues{i} = find(cond_values==i);
end
fprintf('Took %.1f minutes.',toc/60);
tic
fprintf('\nAnalysing ROI %d of subject %d',rois,sub)
%% smoothing option
smoothing = {'Raw','Smooth'};
for smooth = 1%:numel(smoothing)
%% sliding time window
winsizes = 8;%[8,25,50,125]; %32ms,100ms,200ms,500ms
for winsize = winsizes
% set analysis time windows
twin_train = [1 size(data3D,3)]; % time of interest
stpsize = 1; %step size
trainwins = [twin_train(1):stpsize:(twin_train(2)-winsize)]';
trainwins(:,2) = trainwins(:,1) + winsize;
ntrains = size(trainwins,1);
twin_test = [1 size(data3D,3)]; % time of interest
testwins = [twin_test(1):stpsize:(twin_test(2)-winsize)]'; %#ok<*NBRAK>
testwins(:,2) = testwins(:,1) + winsize;
ntests = size(testwins,1);
%%%%% djm: this bit allows the variable to be 'sliced' in parfor loop;
windatatrain=nan(size(data3D,1),size(data3D,2),winsize+1,ntrains);
% the window seems to be 8+1 samples long
for islide = 1:ntrains
windatatrain(:,:,:,islide)=data3D(:,:,trainwins(islide,1):trainwins(islide,2));
end
windatatest=windatatrain; % making a separate variable stops it needing to be 'broadcast'
%%%%
accuracy_matrix = nan(nsubsample,nfolds,ntrains);
predicted_vals = cell(nsubsample,nfolds,ntrains);
for subsample = 1:nsubsample
if ~mod(subsample,10), fprintf('.'); end
for fold = 1: nfolds
testind = [cues{1}(fold:nfolds:end) cues{2}(fold:nfolds:end)];
labels_test=cond_values(testind)';
trainind = setdiff([cues{:}],testind);
train_cond_values = cond_values(trainind);
c1 = datasample(find(train_cond_values==1),round(min_trials_mvpa(sub)*4/5),'Replace',false);
c2 = datasample(find(train_cond_values==2),round(min_trials_mvpa(sub)*4/5),'Replace',false);
subsetind = [trainind(c1),trainind(c2)];
labels_train=cond_values(subsetind)';
parfor islide = 1:ntrains
patternsTrain=double(windatatrain(subsetind,:,:,islide));
if smooth == 1 % no smoothing
patternsTrain=reshape(patternsTrain,length(subsetind),[]);
elseif smooth == 2 % smoothing
patternsTrain = mean(patternsTrain,3);
end
% classification using linear SVM (train the classifier)
model=svmtrain(labels_train,patternsTrain,libSVMsettings);
patternsTest = double(windatatest(testind,:,:,islide));
if smooth == 1 % no smoothing
patternsTest=reshape(patternsTest,length(testind),[]);
elseif smooth == 2 % smoothing
patternsTest = mean(patternsTest,3);
end
% classification using linear SVM (test the classifier)
[predicted,accuracy,~]=svmpredict(labels_test,patternsTest,model);
accuracy_matrix(subsample,fold,islide)=accuracy(1);
predicted_vals{subsample,fold,islide} = predicted;
end % next slide
end % next fold
end % next subsample
output_dir = 'crossgen_ROIs_subsample_prep-prep';
try
cd(output_dir)
catch
eval(sprintf('!mkdir %s',output_dir)); cd(output_dir);
end
figure(sub)
imagesc(squeeze(mean(accuracy_matrix,1)));
colorbar;
caxis([1,100]);
% djm:
set(gca,'xticklabel',(cellfun(@str2double,get(gca,'xticklabel'))-1)*stpsize*4-100);
set(gca,'yticklabel',(cellfun(@str2double,get(gca,'yticklabel'))-1)*stpsize*4-100);
xlabel('start of test windows (ms)')
ylabel('start of train windows (ms)')
fprintf('\nTook %.1f hours.',toc/60/60);
saveas(gcf,sprintf('CrossGenMatrix%03dms%s_%s_sub%s.png',winsize*4,smoothing{smooth},roinames{rois},num2str(sub)));
save(sprintf('CrossGenMatrix%03dms%s_%s_sub%s.mat',winsize*4,smoothing{smooth},roinames{rois},num2str(sub)));
close;
cd(workingdir)
cd(swd)
end % winsize
end % smooth
end % rois
end
delete(gcp)