-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvm.m
285 lines (258 loc) · 10.4 KB
/
vm.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
function vm(files, stage, options)
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Voxelwise modeling for predefined ROIs or whole brain
% --
% files - names of output, stim, resp and testcc files
% stage - stage of processing
% (1 = Reg. Param Selection)
% (2 = Model Estimation)
% options - analysis parameters
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%-------------------------------------------------------
% Parse inputs
%-------------------------------------------------------
if (nargin < 1)
error('Need to input a filename@ Quitting...');
elseif (nargin < 2)
error('Need to indicate processing stage! Quitting...');
elseif (nargin < 3)
error('Options missing from input! Quitting...');
end
%-------------------------------------------------------
% Ready to load data
%-------------------------------------------------------
% Load preprocessed stimuli
eval(['load ' files.stim]);
% Apply PCA on stimulus matrix
[~, rspca, ~, ~, rexx] = pca(stim(:,2:end));
rnpca = 300; %number of principal components used
rspca = rspca(1:3870,1:rnpca);
sum(rexx(1:rnpca)) % explained by first npca components
stim = [stim(:,1),rspca]; %Append motion energy column
% Load voxel responses
eval(['load ' files.resp]);
%-------------------------------------------------------
% Set default options
%-------------------------------------------------------
if (isfield(options,'regtype'))
regtype = options.regtype;
else
regtype = 'L2';
end
if (isfield(options,'cvfolds'))
cvfolds = options.cvfolds;
else
cvfolds = 1;
end
if (isfield(options,'vholdout'))
vholdout = options.vholdout;
else
vholdout = 5;
end
if (isfield(options,'ctfolds'))
ctfolds = options.ctfolds;
else
ctfolds = 1;
end
if (isfield(options,'tholdout'))
tholdout = options.tholdout;
else
tholdout = 3;
end
if (isfield(options,'ratSamp'))
ratSamp = options.ratSamp;
else
ratSamp = 1;
end
if (isfield(options,'trnSamp'))
trnSamp = options.trnSamp;
else
trnSamp = 1:length(ranges.crange);
end
if (isfield(options,'lag'))
lag = options.lag;
else
lag = 0;
end
if (isfield(options,'as'))
as = options.as;
else
as = 100*(2.^(0:15)); % default reg. parameters
end
%------------------------
% Voxel selection (ROI)
%------------------------
% load mask-voxel information
disp('Running on ROI...');
eval(['load ' files.roi]);
roiloc = strfind(roilist,files.roiname);
roiid = find(not(cellfun('isempty',roiloc)));
targetvoxels = roivox{roiid}; % Indices of the voxels in the specified ROI
numVox = length(targetvoxels);
fprintf('Running on %d voxels...\n',numVox);
%-------------------------------------------------------
% prepare the training stimulus and response with lag
%-------------------------------------------------------
if strcmp(files.model,'sem') && stage==2
stim = stim(:,2:end); % Remove motion-energy feature for model estimation
end
stim = single(stim);
numFeat = size(stim,2); % Number of features
% Clean NaN entries in the response data
resp(find(isnan(resp))) = 0;
resp = single(resp);
% Restrict time frames
numSamples = floor(ratSamp*length(trnSamp));
numTrainingSamples = (1:numSamples);
% Frame skipping
fskip.TR = 2; % TR for acquisition (2 s)
fskip.flag = 0;
fskip.val = 0;
% Stimulus prep and demeaning
fskip.mode = 1;
[stimsh, timeidx, ~] = embed(stim(trnSamp(numTrainingSamples),:).',lag,fskip);
stimsh = stimsh.';
stimsh = stimsh - repmat(mean(stimsh,1),size(stimsh,1),1);
% Response prep and demeaning
respsh = resp;
respsh = respsh(timeidx,:);
respsh = respsh - repmat(mean(respsh,1),size(respsh,1),1);
% For cross-validation, seperate the data into cvfolds chunks
numTrainingSamples = 1:length(timeidx);
if stage == 1
% find the start-end points of the chunks
chunklen = 25; % 1 chunk = 2 s, 25 chunks = 50 s
numchunk = round(length(numTrainingSamples)/chunklen);
mid_frames = [round((0:(numchunk-1))*length(numTrainingSamples)/numchunk)+1 ...
length(numTrainingSamples)+1];
% divide the data into test and training sets given cvfolds
sblock = 1:numchunk;
numvblock = vholdout;
for cvidx = 1:cvfolds
if (length(sblock)<numvblock), sblock = 1:numchunk; end % restart if sblock is done
testblks = randsample(sblock,numvblock);
trnblks{cvidx} = setdiff(1:numchunk,testblks);
sblock = setdiff(sblock,testblks);
tsample = [];
for blkidx = 1:numvblock
tsample = cat(2,tsample,mid_frames(testblks(blkidx)):(mid_frames(testblks(blkidx)+1)-1));
end
testingSamples{cvidx} = tsample;
trainingSamples{cvidx} = setdiff(numTrainingSamples, testingSamples{cvidx});
end
elseif stage == 2
%-------------------------------------------------------
% prepare the validation stimulus and response with lag
%-------------------------------------------------------
fskip.flag = 0; % Turn on frame skipping
fskip.val = 1; % Set to 1 for validation data
[stimshv, timeidx, ~] = embed(stim(ranges.vrange,:).',lag,fskip);
stimshv = stimshv.';
stimshv = stimshv - repmat(mean(stimshv,1),size(stimshv,1),1);
% Prep response matrix
respshv = resp(ranges.vrange,:);
respshv = respshv(timeidx,:);
respshv = respshv - repmat(mean(respshv,1),size(respshv,1),1);
% Extract validation samples
valSamples = 1:length(timeidx);
end
switch stage
%-------------------------------------------------------
% Run cross-validation for determining the reg. param
%-------------------------------------------------------
case {1}
% initialize parameters
tccsall = zeros(cvfolds,ctfolds,length(as),length(targetvoxels));
mccsall = zeros(cvfolds,ctfolds,length(as));
% Generate prediction scores across cross-validation folds
for cvidx = 1:cvfolds
fprintf('iter no %d of %d(cv)\n',cvidx,cvfolds);
%Get the training blocks for that cvfold and resample from them
sblock = trnblks{cvidx};
numtblock = tholdout;
for tidx = 1:ctfolds
fprintf('%d of %d(ct)\n',tidx,ctfolds);
if (length(sblock)<numtblock), sblock = trnblks{cvidx}; end % restart if sblock if done
testblks = randsample(sblock,numtblock);
sblock = setdiff(sblock,testblks);
tsample = [];
for blkidx = 1:numtblock
tsample = cat(2,tsample,mid_frames(testblks(blkidx)):(mid_frames(testblks(blkidx)+1)-1));
end
subtstSamples{tidx} = tsample;
subtrnSamples{tidx} = setdiff(trainingSamples{cvidx}, subtstSamples{tidx});
% Extract testing and training data
Xtest = stimsh(subtstSamples{tidx},:);
Ytest = respsh(subtstSamples{tidx},:);
Xtrain = stimsh(subtrnSamples{tidx},:);
Ytrain = respsh(subtrnSamples{tidx},:);
% Obtain predicted responses
Ytest_pred = vm_solve(Xtrain, cat(2,Ytrain,nanmean(Ytrain,2)), as, Xtest);
Ytest_pred = Ytest_pred(:,1:(end-1),:);
% Calculate prediction scores
for asidx = 1:length(as)
% Calculate corr for all voxels
tccs = mvn_corr_fast(Ytest, Ytest_pred(:,:,asidx));
tccsall(cvidx,tidx,asidx,:) = tccs;
mccs = nanmean(tccs);
% Store all correlation values
mccsall(cvidx,tidx,asidx) = mccs;
end
end
end
% Save the output as single to reduce footprint
tccsall = single(tccsall);
mccsall = single(mccsall);
% save the output
eval(['save -v7.3 ' files.out(1:end-4) '_cv_lambda.mat as tccsall mccsall trainingSamples testingSamples;']);
%-----------------------------------------------------------------
% Plot prediction scores across reg. params to see optimal values
%-----------------------------------------------------------------
mccsall = reshape(mccsall, [cvfolds*ctfolds length(as)]);
[cm, ci] = max(mean(mccsall,1));
fprintf('Best reg. param based on corrs: %d\n', as(ci));
figure;clf;
semilogx(as, mean(mccsall,1));
xlabel('regularization parameter');
ylabel('average correlation coefficient');
title(sprintf('Max mean test cc: %.3f', cm));
case {2}
% Number of time lags
nTau = length(lag);
%tccs_cmb = zeros(numVox,cvfolds);
tccs_ind = zeros(numVox,cvfolds);
% select the indices of the test features used in prediction
sfeats = 1:numFeat;
testfeats = (nTau*(sfeats(1)-1)+1):(nTau*sfeats(end));
% first fit the model to all training data with optimal reg. param
% training data
Xtrain = stimsh;
Ytrain = respsh;
% validation data
Xvalidation = stimshv(valSamples,:);
Yvalidation = respshv(valSamples,:);
clear resp respsh stim stimsh
% Obtain model weights using optimal reg. parameters
ws = vm_solve(Xtrain, Ytrain, as);
% Obtain predicted responses for independent validation data
Yval_pred = Xvalidation(:,testfeats)*ws(testfeats,:);
% lag-averaged voxel strfs
vsrf = reshape(ws, [nTau, numFeat, numVox]);
vsrf = single(squeeze(mean(vsrf,1)));
vsrf = vsrf(:,1:numVox);
% save the model
hdf5write(sprintf('%s_ridge_srfs.hf5',files.out(1:end-4)),'vsrf',vsrf,'ws',ws);
clear vsrf;
% Obtain prediction scores across cross-validation folds
totaldur = length(valSamples);
for cvidx = 1:cvfolds
timeind = randsample(totaldur,round(totaldur*0.8),false); % with replacement
tccs_ind(:,cvidx) = mvn_corr_fast(Yvalidation(timeind,:), Yval_pred(timeind,:));
mccs_ind(cvidx) = nanmean(tccs_ind(:,cvidx));
fprintf('avg. cc for ind: %.5f\n',mccs_ind(cvidx));
end
% Save all correlation values
tccs_ind = single(tccs_ind);
mccs_ind = single(mccs_ind);
hdf5write(sprintf('%scvall_corrs.hf5',files.out(1:end-4)),'tccs_ind',tccs_ind,'mccs_ind',mccs_ind);
end