diff rDiff/src/configure_rdiff.m @ 0:0f80a5141704

version 0.3 uploaded
author vipints
date Thu, 14 Feb 2013 23:38:36 -0500
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/rDiff/src/configure_rdiff.m	Thu Feb 14 23:38:36 2013 -0500
@@ -0,0 +1,141 @@
+function CFG = configure_rdiff(CFG)
+% configure_rdiff(CFG)
+
+%%% rDiff parameters %%%
+
+% Give the filenames of the bam-files to be considered
+CFG.BAM_FILES={'condition_A_replicate_1.bam','condition_A_replicate_2.bam','condition_B_replicate_1.bam','condition_B_replicate_2.bam'};
+
+%Name of the experiment. Use the FILENAMES if the entries are empty.
+CFG.NAMES={'A1','A2','B1','B2'};
+
+
+% Give the directory where the bam-files are
+CFG.data_dir = '' ;
+
+% Indicate to which sample the bam-files belong
+CFG.SAMPLES=[1,1,2,2];
+
+% Location of the gene structure
+CFG.genes_path='' ;
+
+% Output directory
+CFG.out_base =  '' ;
+
+% Output directory for temporary files
+CFG.out_base_temp =  '' ;
+
+%Length of the reads
+CFG.sequenced_length=75;
+
+% Prefix for the chromosome name when getting geetting reads from
+% the bam-files
+CFG.chr_prefix='';
+
+%%% Read filters %%%
+
+% Minimal read length
+CFG.min_read_length=30;
+
+
+
+%%% Parameters for gene expression estimation
+%Count the number of reads ( CFG.estimate_gene_expression=1 for yes
+%give the Files for the expresison in CFG.GENE_EXPR_FILES
+CFG.estimate_gene_expression=1;
+
+% Use the following files in CFG.GENE_EXPR_FILES for the
+% gene_expression. Those must be Tab-delimitered files where each
+% line contains the gene name folowed by the expressiob
+CFG.Counts_gene_expression='';
+CFG.Counts_rDiff_parametric='';
+CFG.Counts_rDiff_nonparametric='';
+
+
+
+%%% Parameters for variance function
+
+% Use a parametric form for the variance function for sample 1: sigma= a + bx + cx^2
+% (CFG.predefined_variance_function1=[] if not; CFG.predefined_variance_function1=[a,b,c] otherwise)
+% If CFG.predefined_variance_function1=[a,b,c] is given, the other
+% parameters for the variance function estimations are ignored for
+% sample 1
+CFG.predefined_variance_function1=[];
+
+% Use a parametric form for the variance function for sample 2: sigma= a + bx + cx^2
+% (CFG.predefined_variance_function2=[] if not; CFG.predefined_variance_function2=[a,b,c] otherwise)
+% If CFG.predefined_variance_function2=[a,b,c] is given, the other
+% parameters for the variance function estimations are ignored 
+% for sample 2
+CFG.predefined_variance_function2=[];
+
+% compute variance function for sample 1 ( 1 = yes , 0 = use precomputed
+% variance function saved under CFG.variance_function_1) 
+CFG.compute_variance_function_1=1;
+CFG.variance_function_1='';
+CFG.save_variance_function_1='variance_function_1.mat';
+
+% compute variance function for sample 2 ( 1 = yes , 0 = use precomputed
+% variance function saved under CFG.variance_function2) 
+CFG.compute_variance_function_2=1;
+CFG.variance_function_2='';
+CFG.save_variance_function_2='variance_function_2.mat';
+
+% subsample points for the variance function estimate for rDiff.nonparametric
+CFG.rDiff_nonparametric_subsample_variance_estimation=10000;	
+
+% Subsample the mean-variance pairs to increas the speed of the
+% local regression.CFG.variance_samplebins is the number of bins to
+% use and CFG.variance_samples_per_bin is how many samples should
+% be drwan per bin
+CFG.variance_samplebins=100;
+CFG.variance_samples_per_bin=500;
+
+
+
+%%% Testing parameters %%%
+
+% subsample reads down to rDiff.subsample to increase speed ( If no
+% subsampling shall be done set CFG.rDiff_subsample to 0
+CFG.rDiff_subsample=10000;
+
+% Clib the first CFG.bases_to_clip bases at the end of the reads
+CFG.bases_to_clip=3;
+
+%Number of bootraps for nonparametric test
+CFG.bootstraps=1000;
+
+%Number of bins for variance matching
+CFG.nr_of_slices=10;
+
+% Tests to perform
+CFG.perform_nonparametric=0;
+CFG.perform_parametric=0;
+CFG.perform_mmd=0;
+CFG.perform_poisson=0;
+
+
+%%%%% rproc settings %%%%%
+CFG.use_rproc = 0; % 1: cluster submission or 0: locally
+if CFG.use_rproc,
+    CFG.rproc_num_jobs              = 100;
+    CFG.rproc_memreq                = 8000;
+    CFG.rproc_par.priority          = 55;
+    CFG.rproc_par.resubmit          = 3;
+    CFG.rproc_par.mem_req_resubmit  = [ 24000 40000 60000];
+    CFG.rproc_par.time_req_resubmit = [60*60 100*60 90*60];
+    CFG.rproc_par.express           = 0;
+    CFG.rproc_par.immediately_bg    = 0;
+    CFG.rproc_par.immediately       = 0;
+    CFG.rproc_par.arch              = 64;
+    CFG.rproc_par.identifier        = '';
+    CFG.rproc_par.verbosity         = 0;
+    CFG.rproc_time                  = 15*60; % mins
+else
+    CFG.rproc_num_jobs              = 1;
+end
+
+
+
+
+