forked from lawrennd/gpsim
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgpsimLoadEcoliData.m
40 lines (33 loc) · 1.39 KB
/
gpsimLoadEcoliData.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
function [y, gene, times, scale, rawExp] = gpsimLoadEcoliData
% GPSIMLOADECOLIDATA Load in E. coli data for the repression case.
% FORMAT
% DESC loads the cached file './data/ecoliData.mat' when it exists;
% otherwise rebuilds the outputs from './data/ecoliNormalisedData.txt'.
% Both paths are relative to the current working directory.
% RETURN y : the normalised expression levels. When rebuilt from the text
% file this is a one-element cell array; y{1} has one row per time point
% and one column per selected gene.
% RETURN gene : the names of the selected genes.
% RETURN times : the times of the expression measurements.
% RETURN scale : the scaling factor applied to normalise (one per gene).
% RETURN rawExp : the raw gene expression levels, a structure with fields
% 'data' (transposed contents of the text file) and 'genes' (all gene
% names).
%
% SEEALSO : demEcoliMap1
%
% COPYRIGHT : Pei Gao, Neil D. Lawrence and Magnus Rattary, 2008
% SHEFFIELDML

cacheFile = './data/ecoliData.mat';
textFile = './data/ecoliNormalisedData.txt';

if exist(cacheFile, 'file') == 2
  % Load into a structure rather than straight into the workspace, so
  % that only the expected variables are taken from the cache. A variable
  % absent from the cache is left unassigned, exactly as with a bare LOAD.
  cached = load(cacheFile);
  if isfield(cached, 'y'),      y = cached.y;           end
  if isfield(cached, 'gene'),   gene = cached.gene;     end
  if isfield(cached, 'times'),  times = cached.times;   end
  if isfield(cached, 'scale'),  scale = cached.scale;   end
  if isfield(cached, 'rawExp'), rawExp = cached.rawExp; end
else
  expData = importdata(textFile);
  if isstruct(expData)
    % IMPORTDATA returns a structure when the file carries header text;
    % the numeric block is then held in the 'data' field.
    expData = expData.data;
  end

  % Transpose the file contents; the columns of rawExp.data are indexed
  % by gene below.
  rawExp.data = expData';
  rawExp.genes = {'dinF', 'dinI', 'lexA', 'recA', 'recN', 'ruvA', 'ruvB', ...
                  'sbmC', 'sulA', 'umuC', 'umuD', 'uvrB', 'yebG', 'yjiW'};

  % Indices of the genes that are returned.
  targetInd = [2 3 6 7 9 11 12 14];

  % Perform log-normal transformation: the stored values are presumably
  % logs (normally distributed), so exponentiate to return to expression
  % space.
  yFull = exp(rawExp.data(:, targetInd));

  % Rescale so that the standard deviation of each curve is 1.
  scale = sqrt(var(yFull));
  y{1} = yFull ./ repmat(scale, size(yFull, 1), 1);

  times = [0 5 10 20 40 60]';
  gene = rawExp.genes(targetInd);

  % Caching of the rebuilt data is currently disabled:
  % save('./data/ecoliData.mat', 'y', 'gene', 'times', 'scale', 'rawExp');
end