AlexsLemonade · jaclyn-taroni · Jan 6, 2021 · Dec 7, 2020 · Dec 7, 2020 · Dec 7, 2020
diff --git a/analyses/collapse-rnaseq/02-analyze-drops.nb.html b/analyses/collapse-rnaseq/02-analyze-drops.nb.html
diff --git a/analyses/collapse-rnaseq/results/pbta-gene-expression-rsem-fpkm-collapsed_table.stranded.rds b/analyses/collapse-rnaseq/results/pbta-gene-expression-rsem-fpkm-collapsed_table.stranded.rds
diff --git a/analyses/collapse-rnaseq/run-collapse-rnaseq.sh b/analyses/collapse-rnaseq/run-collapse-rnaseq.sh
diff --git a/analyses/fusion_filtering/04-project-specific-filtering.Rmd b/analyses/fusion_filtering/04-project-specific-filtering.Rmd
@@ -39,6 +39,14 @@ params:
     label: "results folder for *tsv files"
     value: results
     input: string
+  base_run:
+    label: "1/0 to run with base histology"
+    value: 0
+    input: integer
+  base_histology:
+    label: "Base histology file"
+    value: data/pbta-histologies-base.tsv
+    input: file
 ---
 
 
@@ -88,8 +96,13 @@ fusion_calls<-QCGeneFiltered_filtFusion %>% mutate(FusionName=rm_between(.data$F
 group<-params$group
 
 # get histology file
+if ( params$base_run ==0 ){
 clinical<-read.delim(file.path(root_dir, params$histology), stringsAsFactors = FALSE)
 clinical<-clinical[,c("Kids_First_Biospecimen_ID","Kids_First_Participant_ID",group)]
+} else {
+clinical<-read.delim(file.path(root_dir, params$base_histology), stringsAsFactors = FALSE)
+clinical<-clinical[,c("Kids_First_Biospecimen_ID","Kids_First_Participant_ID",group)]
+}
 
 # Least number of callers
 numCaller<-params$numCaller

diff --git a/analyses/fusion_filtering/04-project-specific-filtering.nb.html b/analyses/fusion_filtering/04-project-specific-filtering.nb.html
diff --git a/analyses/fusion_filtering/05-QC_putative_onco_fusion_dustribution.Rmd b/analyses/fusion_filtering/05-QC_putative_onco_fusion_dustribution.Rmd
@@ -19,6 +19,14 @@ params:
     label: "results folder for pbta-fusion-putative-oncogenic.tsv files"
     value: results
     input: string       
+  base_run:
+    label: "1/0 to run with base histology"
+    value: 0
+    input: integer
+  base_histology:
+    label: "Base histology file"
+    value: data/pbta-histologies-base.tsv
+    input: file
 
 ---
 
@@ -69,8 +77,14 @@ fusion_calls<-read_tsv(file.path(root_dir,params$dataPutativeFusion))
 outputfolder<-params$outputfolder
 
 #### get histology file
+if ( params$base_run ==0 ){
 clinical<-read_tsv(file.path(root_dir, params$histology), guess_max = 10000) %>%
   dplyr::select(Kids_First_Biospecimen_ID, Kids_First_Participant_ID, broad_histology)
+} else {
+clinical<-read_tsv(file.path(root_dir, params$base_histology), guess_max = 10000) %>%
+  dplyr::select(Kids_First_Biospecimen_ID, Kids_First_Participant_ID, broad_histology)
+}
+
 
 # add broad_histology to fusion
 fusion_calls<-fusion_calls %>%

diff --git a/analyses/fusion_filtering/05-QC_putative_onco_fusion_dustribution.nb.html b/analyses/fusion_filtering/05-QC_putative_onco_fusion_dustribution.nb.html
diff --git a/analyses/fusion_filtering/README.md b/analyses/fusion_filtering/README.md
@@ -48,7 +48,16 @@ The code to generate genelistreference.txt and fusionreference.txt is available
 * pbta-fusion-recurrently-fused-genes-bysample.tsv
 
 ### Run script
-`bash run_fusion_merged.sh` 
+Set `BASE_SUBTYPING=1` to run this module with `pbta-histologies-base.tsv` from the data folder, as required when running the molecular-subtyping modules for a release:
+```sh
+BASE_SUBTYPING=1 bash run_fusion_merged.sh
+```
+
+Otherwise, by default, the module uses `pbta-histologies.tsv` from the data folder:
+```sh
+bash run_fusion_merged.sh
+```
+
 
 #### Order of scripts in analysis
 `01-fusion-standardization.R` : Standardizes fusion calls from STARFusion and Arriba

diff --git a/analyses/fusion_filtering/results/FilteredFusion.tsv b/analyses/fusion_filtering/results/FilteredFusion.tsv
diff --git a/analyses/fusion_filtering/results/pbta-fusion-putative-oncogenic.tsv b/analyses/fusion_filtering/results/pbta-fusion-putative-oncogenic.tsv
diff --git a/analyses/fusion_filtering/results/pbta-fusion-recurrent-fusion-byhistology.tsv b/analyses/fusion_filtering/results/pbta-fusion-recurrent-fusion-byhistology.tsv
@@ -1,6 +1,5 @@
 FusionName	broad_histology	count
-KIAA1549--BRAF	Low-grade astrocytic tumor	109
+KIAA1549--BRAF	Low-grade astrocytic tumor	114
 C11orf95--RELA	Ependymal tumor	25
-EWSR1--FLI1	Mesenchymal non-meningothelial tumor	7
-KIAA1549--BRAF	Neuronal and mixed neuronal-glial tumor	6
+EWSR1--FLI1	Mesenchymal non-meningothelial tumor	5
 REV3L--FYN	Diffuse astrocytic and oligodendroglial tumor	5