@@ -116,12 +116,12 @@ def __init__(self,config_file):
116116 self .CNAs = read_CNAs (df_CNAs ,self .samples )
117117 self .df_breakpoints = add_cna_breakpoints (self .CNAs ,self .df_breakpoints ,self .chr_lengths )
118118 TPM_corrected_file = os .path .join (self .cache_dir ,"TPM_corrected.tsv" )
119- if os .path .exists (TPM_corrected_file ):
120- self .df_TPM = pd .read_csv (TPM_corrected_file ,sep = "\t " ,index_col = 0 )
121- else :
122- print ("Computing gene expression values corrected for copy number..." )
123- self .df_TPM = correct_exp_cn (self .df_TPM ,self .CNAs ,self .genes ,chr_lengths = self .chr_lengths )
124- self .df_TPM .to_csv (TPM_corrected_file ,sep = "\t " )
119+ # if os.path.exists(TPM_corrected_file):
120+ # self.df_TPM = pd.read_csv(TPM_corrected_file,sep="\t",index_col=0)
121+ # else:
122+ print ("Computing gene expression values corrected for copy number..." )
123+ self .df_TPM = correct_exp_cn (self .df_TPM ,self .CNAs ,self .genes ,chr_lengths = self .chr_lengths )
124+ self .df_TPM .to_csv (TPM_corrected_file ,sep = "\t " )
125125
126126 else : self .CNAs = None
127127 self .breakpoints = read_breakpoints (self .df_breakpoints )
@@ -146,17 +146,16 @@ def __init__(self,config_file):
146146 self .ase_dna_dir = None
147147 cache_ase_file = os .path .join (self .cache_dir ,"ase.tsv" )
148148 cache_SNPs_file = os .path .join (self .cache_dir ,"SNPs.tsv" )
149- if os .path .exists (cache_ase_file ) and os .path .exists (cache_SNPs_file ):
150- self .df_ase = pd .read_csv ((cache_ase_file ),sep = "\t " ,index_col = 0 )
151- self .df_n_SNPs = pd .read_csv ((cache_SNPs_file ),sep = "\t " ,index_col = 0 )
152- else :
153- print ("Computing allele-specific expression scores..." )
154- imprinted_genes_file = None
155- if "imprinted_genes_file" in data_yaml :
156- imprinted_genes_file = data_yaml ["imprinted_genes_file" ]
157- self .df_ase , self .df_n_SNPs = compute_ase_matrix (self .samples ,self .ase_dir ,self .genes ,self .genes_index ,imprinted_genes_file = imprinted_genes_file ,CNAs = self .CNAs )
158- self .df_ase .to_csv (cache_ase_file ,sep = "\t " )
159- self .df_n_SNPs .to_csv (cache_SNPs_file ,sep = "\t " )
149+ #if os.path.exists(cache_ase_file) and os.path.exists(cache_SNPs_file):
150+ # self.df_ase = pd.read_csv((cache_ase_file),sep="\t",index_col=0)
151+ # self.df_n_SNPs=pd.read_csv((cache_SNPs_file),sep="\t",index_col=0)
152+ print ("Computing allele-specific expression scores..." )
153+ imprinted_genes_file = None
154+ if "imprinted_genes_file" in data_yaml :
155+ imprinted_genes_file = data_yaml ["imprinted_genes_file" ]
156+ self .df_ase , self .df_n_SNPs = compute_ase_matrix (self .samples ,self .ase_dir ,self .genes ,self .genes_index ,imprinted_genes_file = imprinted_genes_file ,CNAs = self .CNAs )
157+ self .df_ase .to_csv (cache_ase_file ,sep = "\t " )
158+ self .df_n_SNPs .to_csv (cache_SNPs_file ,sep = "\t " )
160159
161160 # Fusion transcripts
162161 if "fusions" in data_yaml :
0 commit comments