diff --git a/analyses/gene_match/add_pmtl_ens_hugo.Rmd b/analyses/gene_match/add_pmtl_ens_hugo.Rmd index 7b41740b04..6320dce919 100644 --- a/analyses/gene_match/add_pmtl_ens_hugo.Rmd +++ b/analyses/gene_match/add_pmtl_ens_hugo.Rmd @@ -37,5 +37,6 @@ ens_hugo_pmtl <- ens_map %>% full_join(pmtl) %>% select(ensg_id, gene_symbol, pmtl, version) %>% distinct() %>% + filter(!ensg_id == "Symbol_Not_Found" | !gene_symbol == 'NA') %>% write_tsv("results/ensg-hugo-pmtl-mapping.tsv") ``` diff --git a/analyses/gene_match/add_pmtl_ens_hugo.nb.html b/analyses/gene_match/add_pmtl_ens_hugo.nb.html index 82a9288f7f..5c778dc274 100644 --- a/analyses/gene_match/add_pmtl_ens_hugo.nb.html +++ b/analyses/gene_match/add_pmtl_ens_hugo.nb.html @@ -14,7 +14,7 @@ R Notebook - + @@ -222,17 +222,17 @@

Load merged gene symbol + ENSG mapping file and PMTL file

library(tidyverse)
- -
── Attaching packages ────────────────────────────────────────────────────────────────────────────────────────────────────────────── tidyverse 1.3.1 ──
+ +
── Attaching packages ────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────── tidyverse 1.3.1 ──
- -
✔ ggplot2 3.3.5     ✔ purrr   0.3.4
-✔ tibble  3.1.5     ✔ dplyr   1.0.7
-✔ tidyr   1.1.4     ✔ stringr 1.4.0
-✔ readr   2.0.2     ✔ forcats 0.5.1
+ +
✔ ggplot2 3.3.3     ✔ purrr   0.3.4
+✔ tibble  3.1.2     ✔ dplyr   1.0.6
+✔ tidyr   1.1.3     ✔ stringr 1.4.0
+✔ readr   1.4.0     ✔ forcats 0.5.1
- -
── Conflicts ───────────────────────────────────────────────────────────────────────────────────────────────────────────────── tidyverse_conflicts() ──
+
+
── Conflicts ───────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────── tidyverse_conflicts() ──
 ✖ dplyr::filter() masks stats::filter()
 ✖ dplyr::lag()    masks stats::lag()
@@ -240,35 +240,29 @@

Load merged gene symbol + ENSG mapping file and PMTL file

ens_map <- read_tsv("results/ensembl_gene_symbol_gtf_genode_v28_v38_open_ped_can_v7_merged.tsv") %>%
   rename(ensg_id = ensembl)
- -
Rows: 94841 Columns: 2
- - -
── Column specification ───────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
-Delimiter: "\t"
-chr (2): gene_symbol, ensembl
- - +

-ℹ Use `spec()` to retrieve the full column specification for this data.
-ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
+── Column specification ─────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────── +cols( + gene_symbol = col_character(), + ensembl = col_character() +)
pmtl <- read_tsv("input/PMTL_v1.1.tsv") %>%
   rename(ensg_id = Ensembl_ID, pmtl = FDA_Designation)
- -
Rows: 512 Columns: 6
- - -
── Column specification ───────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
-Delimiter: "\t"
-chr (6): Ensembl_ID, Approved_Symbol, FDA_Designation, FDA_Class, FDA_Target...
- - +

-ℹ Use `spec()` to retrieve the full column specification for this data.
-ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
+── Column specification ─────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────── +cols( + Ensembl_ID = col_character(), + Approved_Symbol = col_character(), + FDA_Designation = col_character(), + FDA_Class = col_character(), + FDA_Target = col_character(), + Mapping_Description = col_character() +)
# add pmtl version
@@ -327,11 +321,12 @@ 

Are there all PMTL ensg ids included in the mapping file?

Keep the gene_symbol as in the RNA-Seq files

- +
ens_hugo_pmtl <- ens_map %>%
   full_join(pmtl) %>%
   select(ensg_id, gene_symbol, pmtl, version) %>%
   distinct() %>%
+  filter(!ensg_id == "Symbol_Not_Found" | !gene_symbol == 'NA') %>%
   write_tsv("results/ensg-hugo-pmtl-mapping.tsv")
@@ -340,7 +335,7 @@

Keep the gene_symbol as in the RNA-Seq files

-
LS0tCnRpdGxlOiAiUiBOb3RlYm9vayIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKIyMgTG9hZCBtZXJnZWQgZ2VuZSBzeW1ib2wgKyBFTlNHIG1hcHBpbmcgZmlsZSBhbmQgUE1UTCBmaWxlCmBgYHtyfQpsaWJyYXJ5KHRpZHl2ZXJzZSkKCmVuc19tYXAgPC0gcmVhZF90c3YoInJlc3VsdHMvZW5zZW1ibF9nZW5lX3N5bWJvbF9ndGZfZ2Vub2RlX3YyOF92Mzhfb3Blbl9wZWRfY2FuX3Y3X21lcmdlZC50c3YiKSAlPiUKICByZW5hbWUoZW5zZ19pZCA9IGVuc2VtYmwpCnBtdGwgPC0gcmVhZF90c3YoImlucHV0L1BNVExfdjEuMS50c3YiKSAlPiUKICByZW5hbWUoZW5zZ19pZCA9IEVuc2VtYmxfSUQsIHBtdGwgPSBGREFfRGVzaWduYXRpb24pCiMgYWRkIHBtdGwgdmVyc2lvbgpwbXRsJHZlcnNpb24gPC0gIlBNVEwgdmVyc2lvbiAxLjEiCmBgYAojIyBBcmUgdGhlcmUgYWxsIFBNVEwgZW5zZyBpZHMgaW5jbHVkZWQgaW4gdGhlIG1hcHBpbmcgZmlsZT8gCmBgYHtyfQpzZXRkaWZmKHBtdGwkZW5zZ19pZCwgZW5zX21hcCRlbnNnX2lkKQojeWVzCmBgYAoKIyNNZXJnZSB0aGUgUE1UTCBmaWxlIHdpdGggRU5TRyBtYXBwaW5nIGZpbGUKYGBge3J9CmVuc19wbXRsX21lciA8LSBtZXJnZShwbXRsLCBlbnNfbWFwLCBhbGwueCA9IFQpCgojIERvIGFueSBnZW5lIElEcyBtaXNtYXRjaD8KZW5zX3BtdGxfbWVyJG1pc21hdGNoZXMgPC0gaWZlbHNlKGVuc19wbXRsX21lciRBcHByb3ZlZF9TeW1ib2wgPT0gZW5zX3BtdGxfbWVyJGdlbmVfc3ltYm9sLCAidHJ1ZSIsICJmYWxzZSIpCnRhYmxlKGVuc19wbXRsX21lciRtaXNtYXRjaGVzKQplbnNfcG10bF9tZXIgJT4lCiAgZmlsdGVyKG1pc21hdGNoZXMgPT0gImZhbHNlIikgJT4lCiAgc2VsZWN0KEFwcHJvdmVkX1N5bWJvbCwgZ2VuZV9zeW1ib2wpCmBgYAojIyBLZWVwIHRoZSBgZ2VuZV9zeW1ib2xgIGFzIGluIHRoZSBSTkEtU2VxIGZpbGVzCmBgYHtyfQplbnNfaHVnb19wbXRsIDwtIGVuc19tYXAgJT4lCiAgZnVsbF9qb2luKHBtdGwpICU+JQogIHNlbGVjdChlbnNnX2lkLCBnZW5lX3N5bWJvbCwgcG10bCwgdmVyc2lvbikgJT4lCiAgZGlzdGluY3QoKSAlPiUKICB3cml0ZV90c3YoInJlc3VsdHMvZW5zZy1odWdvLXBtdGwtbWFwcGluZy50c3YiKQpgYGAK
+
LS0tCnRpdGxlOiAiUiBOb3RlYm9vayIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKIyMgTG9hZCBtZXJnZWQgZ2VuZSBzeW1ib2wgKyBFTlNHIG1hcHBpbmcgZmlsZSBhbmQgUE1UTCBmaWxlCmBgYHtyfQpsaWJyYXJ5KHRpZHl2ZXJzZSkKCmVuc19tYXAgPC0gcmVhZF90c3YoInJlc3VsdHMvZW5zZW1ibF9nZW5lX3N5bWJvbF9ndGZfZ2Vub2RlX3YyOF92Mzhfb3Blbl9wZWRfY2FuX3Y3X21lcmdlZC50c3YiKSAlPiUKICByZW5hbWUoZW5zZ19pZCA9IGVuc2VtYmwpCnBtdGwgPC0gcmVhZF90c3YoImlucHV0L1BNVExfdjEuMS50c3YiKSAlPiUKICByZW5hbWUoZW5zZ19pZCA9IEVuc2VtYmxfSUQsIHBtdGwgPSBGREFfRGVzaWduYXRpb24pCiMgYWRkIHBtdGwgdmVyc2lvbgpwbXRsJHZlcnNpb24gPC0gIlBNVEwgdmVyc2lvbiAxLjEiCmBgYAojIyBBcmUgdGhlcmUgYWxsIFBNVEwgZW5zZyBpZHMgaW5jbHVkZWQgaW4gdGhlIG1hcHBpbmcgZmlsZT8gCmBgYHtyfQpzZXRkaWZmKHBtdGwkZW5zZ19pZCwgZW5zX21hcCRlbnNnX2lkKQojeWVzCmBgYAoKIyNNZXJnZSB0aGUgUE1UTCBmaWxlIHdpdGggRU5TRyBtYXBwaW5nIGZpbGUKYGBge3J9CmVuc19wbXRsX21lciA8LSBtZXJnZShwbXRsLCBlbnNfbWFwLCBhbGwueCA9IFQpCgojIERvIGFueSBnZW5lIElEcyBtaXNtYXRjaD8KZW5zX3BtdGxfbWVyJG1pc21hdGNoZXMgPC0gaWZlbHNlKGVuc19wbXRsX21lciRBcHByb3ZlZF9TeW1ib2wgPT0gZW5zX3BtdGxfbWVyJGdlbmVfc3ltYm9sLCAidHJ1ZSIsICJmYWxzZSIpCnRhYmxlKGVuc19wbXRsX21lciRtaXNtYXRjaGVzKQplbnNfcG10bF9tZXIgJT4lCiAgZmlsdGVyKG1pc21hdGNoZXMgPT0gImZhbHNlIikgJT4lCiAgc2VsZWN0KEFwcHJvdmVkX1N5bWJvbCwgZ2VuZV9zeW1ib2wpCmBgYAojIyBLZWVwIHRoZSBgZ2VuZV9zeW1ib2xgIGFzIGluIHRoZSBSTkEtU2VxIGZpbGVzCmBgYHtyfQplbnNfaHVnb19wbXRsIDwtIGVuc19tYXAgJT4lCiAgZnVsbF9qb2luKHBtdGwpICU+JQogIHNlbGVjdChlbnNnX2lkLCBnZW5lX3N5bWJvbCwgcG10bCwgdmVyc2lvbikgJT4lCiAgZGlzdGluY3QoKSAlPiUKICBmaWx0ZXIoIWVuc2dfaWQgPT0gIlN5bWJvbF9Ob3RfRm91bmQiIHwgIWdlbmVfc3ltYm9sID09ICdOQScpICU+JQogIHdyaXRlX3RzdigicmVzdWx0cy9lbnNnLWh1Z28tcG10bC1tYXBwaW5nLnRzdiIpCmBgYAo=
diff --git a/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.Rmd b/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.Rmd index 4b1a8b3712..8165bece24 100644 --- a/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.Rmd +++ b/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.Rmd @@ -14,7 +14,7 @@ suppressPackageStartupMessages({ ## Read ensg-hugo-pmtl-mapping.tsv and OpenPedCan SNV, CNV, TPM, and fusion data ```{r read_open_ped_can_data} -open_ped_can_data_path <- '~/OpenPedCan-analysis/data/v10' +open_ped_can_data_path <- '../../data' snv <- file.path(open_ped_can_data_path, 'snv-consensus-plus-hotspots.maf.tsv.gz') cnv <- file.path(open_ped_can_data_path, 'consensus_wgs_plus_cnvkit_wxs.tsv.gz') diff --git a/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.nb.html b/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.nb.html index 05c95b3387..f416a725f6 100644 --- a/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.nb.html +++ b/analyses/gene_match/qc_ensg_hugo_pmtl_mapping.nb.html @@ -14,7 +14,7 @@ QC ensg-hugo-pmtl-mapping.tsv - + @@ -231,8 +231,8 @@

Load libraries

Read ensg-hugo-pmtl-mapping.tsv and OpenPedCan SNV, CNV, TPM, and fusion data

- -
open_ped_can_data_path <- '~/OpenPedCan-analysis/data/v10'
+
+
open_ped_can_data_path <- '../../data/v10'
 
 snv <- file.path(open_ped_can_data_path, 'snv-consensus-plus-hotspots.maf.tsv.gz')
 cnv <- file.path(open_ped_can_data_path, 'consensus_wgs_plus_cnvkit_wxs.tsv.gz')
@@ -247,8 +247,16 @@ 

Read ensg-hugo-pmtl-mapping.tsv and OpenPedCan SNV, CNV, TPM, and fusion dat CLIN_SIG = col_character(), PUBMED = col_character()))

- -
Warning: One or more parsing issues, see `problems()` for details
+ +
Warning: 28 parsing failures.
+    row col               expected        actual                                                    file
+ 464671  AF no trailing characters 0.3618,0.0022 '../../data/v10/snv-consensus-plus-hotspots.maf.tsv.gz'
+1869464  AF no trailing characters 0.9868,0.0022 '../../data/v10/snv-consensus-plus-hotspots.maf.tsv.gz'
+1892736  AF no trailing characters 0.5821,0.1985 '../../data/v10/snv-consensus-plus-hotspots.maf.tsv.gz'
+2091025  AF no trailing characters 0.7626,0.0640 '../../data/v10/snv-consensus-plus-hotspots.maf.tsv.gz'
+4407213  AF no trailing characters 0.3618,0.0022 '../../data/v10/snv-consensus-plus-hotspots.maf.tsv.gz'
+....... ... ...................... ............. .......................................................
+See problems(...) for more details.
cnv_file <- readr::read_tsv(cnv, col_types = cols())
@@ -299,7 +307,7 @@ 

Check gene symbol overlap

@@ -409,7 +417,7 @@

Check gene ENSG ID overlap

-
LS0tCnRpdGxlOiAiUUMgZW5zZy1odWdvLXBtdGwtbWFwcGluZy50c3YiCm91dHB1dDogaHRtbF9ub3RlYm9vawotLS0KCiMjIExvYWQgbGlicmFyaWVzCgpgYGB7ciBsb2FkX2xpYnJhcmllc30Kc3VwcHJlc3NQYWNrYWdlU3RhcnR1cE1lc3NhZ2VzKHsKICBsaWJyYXJ5KHRpZHl2ZXJzZSkKfSkKYGBgCgojIyBSZWFkIGVuc2ctaHVnby1wbXRsLW1hcHBpbmcudHN2IGFuZCBPcGVuUGVkQ2FuIFNOViwgQ05WLCBUUE0sIGFuZCBmdXNpb24gZGF0YQoKYGBge3IgcmVhZF9vcGVuX3BlZF9jYW5fZGF0YX0Kb3Blbl9wZWRfY2FuX2RhdGFfcGF0aCA8LSAnfi9PcGVuUGVkQ2FuLWFuYWx5c2lzL2RhdGEvdjEwJwoKc252IDwtIGZpbGUucGF0aChvcGVuX3BlZF9jYW5fZGF0YV9wYXRoLCAnc252LWNvbnNlbnN1cy1wbHVzLWhvdHNwb3RzLm1hZi50c3YuZ3onKQpjbnYgPC0gZmlsZS5wYXRoKG9wZW5fcGVkX2Nhbl9kYXRhX3BhdGgsICdjb25zZW5zdXNfd2dzX3BsdXNfY252a2l0X3d4cy50c3YuZ3onKQp0cG08LSBmaWxlLnBhdGgob3Blbl9wZWRfY2FuX2RhdGFfcGF0aCwgJ2dlbmUtZXhwcmVzc2lvbi1yc2VtLXRwbS1jb2xsYXBzZWQucmRzJykKZnVzaW9uPC0gZmlsZS5wYXRoKG9wZW5fcGVkX2Nhbl9kYXRhX3BhdGgsICdmdXNpb24tcHV0YXRpdmUtb25jb2dlbmljLnRzdicpCgojIFJlYWQgaW4gZmlsZXMgZm9yIFNOViwgQ05WLCBUUE0gYW5kIGZ1c2lvbgpzbnZfZmlsZSA8LSByZWFkcjo6cmVhZF90c3YoCiAgICAgIHNudiwgY29tbWVudCA9ICcjJywKICAgICAgY29sX3R5cGVzID0gY29scygKICAgICAgICAuZGVmYXVsdCA9IGNvbF9ndWVzcygpLAogICAgICAgIENMSU5fU0lHID0gY29sX2NoYXJhY3RlcigpLAogICAgICAgIFBVQk1FRCA9IGNvbF9jaGFyYWN0ZXIoKSkpCmNudl9maWxlIDwtIHJlYWRyOjpyZWFkX3RzdihjbnYsIGNvbF90eXBlcyA9IGNvbHMoKSkKdHBtX2ZpbGUgPC0gcmVhZFJEUyh0cG0pCmZ1c2lvbl9maWxlIDwtIHJlYWRyOjpyZWFkX3RzdihmdXNpb24sIGNvbF90eXBlcyA9IGNvbHMoKSkKCiMgcmVhZCBpbiBwbXRsIGVuc2VtYmxlIGh1Z28gbWFwcGVkIAplaHJfZGYgPC0gcmVhZF90c3YoJ3Jlc3VsdHMvZW5zZy1odWdvLXBtdGwtbWFwcGluZy50c3YnLCBjb2xfdHlwZXMgPSBjb2xzKCkpCgojIG1ha2UgdGhlbSB0byBhIGxpc3QKb3Blbl9wZWRfY2FuX2RhdGFfZGZzIDwtIGxpc3QoCiAgc252PXNudl9maWxlLAogIGNudj1jbnZfZmlsZSwKICB0cG09dHBtX2ZpbGUsCiAgZnVzaW9uPWZ1c2lvbl9maWxlCikKCmBgYAoKIyMgQ2hlY2sgZ2VuZSBzeW1ib2wgb3ZlcmxhcAoKYGBge3IgY2hlY2tfZ2VuZV9zeW1ib2xfb3ZlcmxhcH0KZ2VuZV9zeW1ib2xzX2xpc3QgPC0gbGlzdCgKICBzbnYgPSBvcGVuX3BlZF9jYW5fZGF0YV9kZnMkc252JEh1Z29fU3ltYm9sLAogIGNudiA9IG9wZW5fcGVkX2Nhbl9kYXRhX2RmcyRjbnYkZ2VuZV9zeW1ib2wsCiAgdHBtID0gcm93bmFtZXMob3Blbl9wZWRfY2FuX2RhdGFfZGZzJHRwbSksCiAgZnVzaW9uID0gYyhvcGVuX3BlZF9jYW5fZGF0YV9kZnMkZnVzaW9uJEdlbmUxQSwKICAgICAgICAgICAgIG9wZW5fcGVkX2Nhbl9kYXRhX2RmcyRmdXNpb24kR2VuZTJBLAogICAgICAgICAgICAgb3Blbl9wZWRfY2FuX2RhdGFfZGZzJGZ1c2lvbiRHZW5lMUIsCiAgICAgICAgICAgICBvcGVuX3BlZF9jYW5fZGF0YV9kZnMkZnVzaW9uJEdlbmUyQikKKQoKZ2VuZV9zeW1ib2xzX2xpc3QgPC0gbGFwcGx5KGdlbmVfc3ltYm9sc19saXN0LCBmdW5jdGlvbih4KSB7CiAgeCA8LSB4WyFpcy5uYSh4KV0KICB4IDwtIHVuaXF1ZSh4KQogIHJldHVybih4KQp9KQoKbWFwX2RmcihnZW5lX3N5bWJvbHNfbGlzdCwgZnVuY3Rpb24oeCkgewogIHRpYmJsZSgKICAgIG5fdW5pcV9zeW1ib2xzID0gbGVuZ3RoKHgpLAogICAgbl91bmlxX3N5bWJvbHNfaW5fbWFwcGluZ19maWxlID0gc3VtKHggJWluJSBlaHJfZGYkZ2VuZV9zeW1ib2wpLAogICAgbl91bmlxX3N5bWJvbHNfbm90X2luX21hcHBpbmdfZmlsZSA9IHN1bSgheCAlaW4lIGVocl9kZiRnZW5lX3N5bWJvbCkpCn0sIC5pZCA9ICdEYXRhIHR5cGUnKQpgYGAKCkZvciBnZW5lIHN5bWJvbHMgaW4gZGF0YSBmaWxlcyB0aGF0IGFyZSBub3QgaW4gbWFwcGluZyBmaWxlLCBjaGVjayB3aGV0aGVyIHRoZWlyIEVOU0cgSURzIGFyZSBpbiBtYXBwaW5nIGZpbGUuCgpgYGB7ciBjaGVja19zeW1ib2xfZW5zZ30KZHR5cGVfdmVjIDwtIGMoc252ID0gJ3NudicsIGNudiA9ICdjbnYnKQpzeW1ib2xfbm90X2luX21hcHBpbmdfZmlsZV9saXN0IDwtIGxhcHBseShkdHlwZV92ZWMsIGZ1bmN0aW9uKHgpIHsKICBnc192ZWMgPC0gdW5pcXVlKGdlbmVfc3ltYm9sc19saXN0W1t4XV0pCiAgZ3Nfbm90X2luX21hcHBpbmdfZmlsZV92ZWMgPC0gZ3NfdmVjWyFnc192ZWMgJWluJSBlaHJfZGYkZ2VuZV9zeW1ib2xdCiAgaWYgKHggPT0gJ3NudicpIHsKICAgIGdzX2Vuc2dfbm90X2luX21hcHBpbmdfZmlsZV9kZiA8LSBvcGVuX3BlZF9jYW5fZGF0YV9kZnNbW3hdXSAlPiUKICAgICAgc2VsZWN0KEdlbmUsIEh1Z29fU3ltYm9sKSAlPiUKICAgICAgZmlsdGVyKEh1Z29fU3ltYm9sICVpbiUgZ3Nfbm90X2luX21hcHBpbmdfZmlsZV92ZWMpICU+JQogICAgICByZW5hbWUoZW5zZ19pZCA9IEdlbmUsIGRhdGFfZmlsZV9nZW5lX3N5bWJvbCA9IEh1Z29fU3ltYm9sKQogIH0gZWxzZSB7CiAgICBnc19lbnNnX25vdF9pbl9tYXBwaW5nX2ZpbGVfZGYgPC0gb3Blbl9wZWRfY2FuX2RhdGFfZGZzW1t4XV0gJT4lCiAgICAgIHNlbGVjdChlbnNlbWJsLCBnZW5lX3N5bWJvbCkgJT4lCiAgICAgIGZpbHRlcihnZW5lX3N5bWJvbCAlaW4lIGdzX25vdF9pbl9tYXBwaW5nX2ZpbGVfdmVjKSAlPiUKICAgICAgcmVuYW1lKGVuc2dfaWQgPSBlbnNlbWJsLCBkYXRhX2ZpbGVfZ2VuZV9zeW1ib2wgPSBnZW5lX3N5bWJvbCkKICB9CgogIGdzX2Vuc2dfbm90X2luX21hcHBpbmdfZmlsZV9kZiA8LSBnc19lbnNnX25vdF9pbl9tYXBwaW5nX2ZpbGVfZGYgJT4lCiAgICBmaWx0ZXIoIWlzLm5hKGVuc2dfaWQpKSAlPiUKICAgIGRpc3RpbmN0KCkKCiAgZWhyX2pvaW5fZGYgPC0gZWhyX2RmICU+JQogICAgc2VsZWN0KGVuc2dfaWQsIGdlbmVfc3ltYm9sKSAlPiUKICAgIHJlbmFtZShtYXBwaW5nX2ZpbGVfZ2VuZV9zeW1ib2wgPSBnZW5lX3N5bWJvbCkKCiAgcHJpbnQocGFzdGUoCiAgICB4LCAnZGF0YSBmaWxlIGhhcycsCiAgICBzdW0oIXVuaXF1ZShnc19lbnNnX25vdF9pbl9tYXBwaW5nX2ZpbGVfZGYkZW5zZ19pZCkgJWluJSBlaHJfam9pbl9kZiRlbnNnX2lkKSwKICAgICdnZW5lIHN5bWJvbHMgdGhhdCBhcmUgbm90IGluIG1hcHBpbmcgZmlsZSBhbmQgaGF2ZSBhc3NvY2lhdGVkIEVOU0cgSURzJywKICAgICd0aGF0IGFyZSBhbHNvIG5vdCBpbiBtYXBwaW5nIGZpbGUuJykpCgogIHJlc19kZiA8LSBnc19lbnNnX25vdF9pbl9tYXBwaW5nX2ZpbGVfZGYgJT4lCiAgICBsZWZ0X2pvaW4oZWhyX2pvaW5fZGYsIGJ5ID0gJ2Vuc2dfaWQnKQoKICByZXR1cm4ocmVzX2RmKQp9KQpgYGAKCmBgYHtyIHNudn0Kc3ltYm9sX25vdF9pbl9tYXBwaW5nX2ZpbGVfbGlzdCRzbnYKYGBgCgpgYGB7ciBjbnZ9CnN5bWJvbF9ub3RfaW5fbWFwcGluZ19maWxlX2xpc3QkY252CmBgYAoKCiMjIENoZWNrIGdlbmUgRU5TRyBJRCBvdmVybGFwCgpgYGB7ciBjaGVja19nZW5lX2Vuc2dfb3ZlcmxhcH0KZ2VuZV9lbnNnX2xpc3QgPC0gbGlzdCgKICBzbnYgPSBvcGVuX3BlZF9jYW5fZGF0YV9kZnMkc252JEdlbmUsCiAgY252ID0gb3Blbl9wZWRfY2FuX2RhdGFfZGZzJGNudiRlbnNlbWJsCikKCmdlbmVfZW5zZ19saXN0IDwtIGxhcHBseShnZW5lX2Vuc2dfbGlzdCwgZnVuY3Rpb24oeCkgewogIHggPC0geFshaXMubmEoeCldCiAgeCA8LSB1bmlxdWUoeCkKICByZXR1cm4oeCkKfSkKCm1hcF9kZnIoZ2VuZV9lbnNnX2xpc3QsIGZ1bmN0aW9uKHgpIHsKICB0aWJibGUoCiAgICBuX3VuaXFfZW5zZ3MgPSBsZW5ndGgoeCksCiAgICBuX3VuaXFfZW5zZ3NfaW5fbWFwcGluZ19maWxlID0gc3VtKHggJWluJSBlaHJfZGYkZW5zZ19pZCksCiAgICBuX3VuaXFfZW5zZ3Nfbm90X2luX21hcHBpbmdfZmlsZSA9IHN1bSgheCAlaW4lIGVocl9kZiRlbnNnX2lkKSwKICAgIHVuaXFfZW5zZ3Nfbm90X2luX21hcHBpbmdfZmlsZSA9IHBhc3RlKAogICAgICB4WyF4ICVpbiUgZWhyX2RmJGVuc2dfaWRdLAogICAgICBjb2xsYXBzZSA9ICcsJykpCn0sIC5pZCA9ICdEYXRhIHR5cGUnKQpgYGAK
+
LS0tCnRpdGxlOiAiUUMgZW5zZy1odWdvLXBtdGwtbWFwcGluZy50c3YiCm91dHB1dDogaHRtbF9ub3RlYm9vawotLS0KCiMjIExvYWQgbGlicmFyaWVzCgpgYGB7ciBsb2FkX2xpYnJhcmllc30Kc3VwcHJlc3NQYWNrYWdlU3RhcnR1cE1lc3NhZ2VzKHsKICBsaWJyYXJ5KHRpZHl2ZXJzZSkKfSkKYGBgCgojIyBSZWFkIGVuc2ctaHVnby1wbXRsLW1hcHBpbmcudHN2IGFuZCBPcGVuUGVkQ2FuIFNOViwgQ05WLCBUUE0sIGFuZCBmdXNpb24gZGF0YQoKYGBge3IgcmVhZF9vcGVuX3BlZF9jYW5fZGF0YX0Kb3Blbl9wZWRfY2FuX2RhdGFfcGF0aCA8LSAnLi4vLi4vZGF0YS92MTAnCgpzbnYgPC0gZmlsZS5wYXRoKG9wZW5fcGVkX2Nhbl9kYXRhX3BhdGgsICdzbnYtY29uc2Vuc3VzLXBsdXMtaG90c3BvdHMubWFmLnRzdi5neicpCmNudiA8LSBmaWxlLnBhdGgob3Blbl9wZWRfY2FuX2RhdGFfcGF0aCwgJ2NvbnNlbnN1c193Z3NfcGx1c19jbnZraXRfd3hzLnRzdi5neicpCnRwbTwtIGZpbGUucGF0aChvcGVuX3BlZF9jYW5fZGF0YV9wYXRoLCAnZ2VuZS1leHByZXNzaW9uLXJzZW0tdHBtLWNvbGxhcHNlZC5yZHMnKQpmdXNpb248LSBmaWxlLnBhdGgob3Blbl9wZWRfY2FuX2RhdGFfcGF0aCwgJ2Z1c2lvbi1wdXRhdGl2ZS1vbmNvZ2VuaWMudHN2JykKCiMgUmVhZCBpbiBmaWxlcyBmb3IgU05WLCBDTlYsIFRQTSBhbmQgZnVzaW9uCnNudl9maWxlIDwtIHJlYWRyOjpyZWFkX3RzdigKICAgICAgc252LCBjb21tZW50ID0gJyMnLAogICAgICBjb2xfdHlwZXMgPSBjb2xzKAogICAgICAgIC5kZWZhdWx0ID0gY29sX2d1ZXNzKCksCiAgICAgICAgQ0xJTl9TSUcgPSBjb2xfY2hhcmFjdGVyKCksCiAgICAgICAgUFVCTUVEID0gY29sX2NoYXJhY3RlcigpKSkKY252X2ZpbGUgPC0gcmVhZHI6OnJlYWRfdHN2KGNudiwgY29sX3R5cGVzID0gY29scygpKQp0cG1fZmlsZSA8LSByZWFkUkRTKHRwbSkKZnVzaW9uX2ZpbGUgPC0gcmVhZHI6OnJlYWRfdHN2KGZ1c2lvbiwgY29sX3R5cGVzID0gY29scygpKQoKIyByZWFkIGluIHBtdGwgZW5zZW1ibGUgaHVnbyBtYXBwZWQgCmVocl9kZiA8LSByZWFkX3RzdigncmVzdWx0cy9lbnNnLWh1Z28tcG10bC1tYXBwaW5nLnRzdicsIGNvbF90eXBlcyA9IGNvbHMoKSkKCiMgbWFrZSB0aGVtIHRvIGEgbGlzdApvcGVuX3BlZF9jYW5fZGF0YV9kZnMgPC0gbGlzdCgKICBzbnY9c252X2ZpbGUsCiAgY252PWNudl9maWxlLAogIHRwbT10cG1fZmlsZSwKICBmdXNpb249ZnVzaW9uX2ZpbGUKKQoKYGBgCgojIyBDaGVjayBnZW5lIHN5bWJvbCBvdmVybGFwCgpgYGB7ciBjaGVja19nZW5lX3N5bWJvbF9vdmVybGFwfQpnZW5lX3N5bWJvbHNfbGlzdCA8LSBsaXN0KAogIHNudiA9IG9wZW5fcGVkX2Nhbl9kYXRhX2RmcyRzbnYkSHVnb19TeW1ib2wsCiAgY252ID0gb3Blbl9wZWRfY2FuX2RhdGFfZGZzJGNudiRnZW5lX3N5bWJvbCwKICB0cG0gPSByb3duYW1lcyhvcGVuX3BlZF9jYW5fZGF0YV9kZnMkdHBtKSwKICBmdXNpb24gPSBjKG9wZW5fcGVkX2Nhbl9kYXRhX2RmcyRmdXNpb24kR2VuZTFBLAogICAgICAgICAgICAgb3Blbl9wZWRfY2FuX2RhdGFfZGZzJGZ1c2lvbiRHZW5lMkEsCiAgICAgICAgICAgICBvcGVuX3BlZF9jYW5fZGF0YV9kZnMkZnVzaW9uJEdlbmUxQiwKICAgICAgICAgICAgIG9wZW5fcGVkX2Nhbl9kYXRhX2RmcyRmdXNpb24kR2VuZTJCKQopCgpnZW5lX3N5bWJvbHNfbGlzdCA8LSBsYXBwbHkoZ2VuZV9zeW1ib2xzX2xpc3QsIGZ1bmN0aW9uKHgpIHsKICB4IDwtIHhbIWlzLm5hKHgpXQogIHggPC0gdW5pcXVlKHgpCiAgcmV0dXJuKHgpCn0pCgptYXBfZGZyKGdlbmVfc3ltYm9sc19saXN0LCBmdW5jdGlvbih4KSB7CiAgdGliYmxlKAogICAgbl91bmlxX3N5bWJvbHMgPSBsZW5ndGgoeCksCiAgICBuX3VuaXFfc3ltYm9sc19pbl9tYXBwaW5nX2ZpbGUgPSBzdW0oeCAlaW4lIGVocl9kZiRnZW5lX3N5bWJvbCksCiAgICBuX3VuaXFfc3ltYm9sc19ub3RfaW5fbWFwcGluZ19maWxlID0gc3VtKCF4ICVpbiUgZWhyX2RmJGdlbmVfc3ltYm9sKSkKfSwgLmlkID0gJ0RhdGEgdHlwZScpCmBgYAoKRm9yIGdlbmUgc3ltYm9scyBpbiBkYXRhIGZpbGVzIHRoYXQgYXJlIG5vdCBpbiBtYXBwaW5nIGZpbGUsIGNoZWNrIHdoZXRoZXIgdGhlaXIgRU5TRyBJRHMgYXJlIGluIG1hcHBpbmcgZmlsZS4KCmBgYHtyIGNoZWNrX3N5bWJvbF9lbnNnfQpkdHlwZV92ZWMgPC0gYyhzbnYgPSAnc252JywgY252ID0gJ2NudicpCnN5bWJvbF9ub3RfaW5fbWFwcGluZ19maWxlX2xpc3QgPC0gbGFwcGx5KGR0eXBlX3ZlYywgZnVuY3Rpb24oeCkgewogIGdzX3ZlYyA8LSB1bmlxdWUoZ2VuZV9zeW1ib2xzX2xpc3RbW3hdXSkKICBnc19ub3RfaW5fbWFwcGluZ19maWxlX3ZlYyA8LSBnc192ZWNbIWdzX3ZlYyAlaW4lIGVocl9kZiRnZW5lX3N5bWJvbF0KICBpZiAoeCA9PSAnc252JykgewogICAgZ3NfZW5zZ19ub3RfaW5fbWFwcGluZ19maWxlX2RmIDwtIG9wZW5fcGVkX2Nhbl9kYXRhX2Rmc1tbeF1dICU+JQogICAgICBzZWxlY3QoR2VuZSwgSHVnb19TeW1ib2wpICU+JQogICAgICBmaWx0ZXIoSHVnb19TeW1ib2wgJWluJSBnc19ub3RfaW5fbWFwcGluZ19maWxlX3ZlYykgJT4lCiAgICAgIHJlbmFtZShlbnNnX2lkID0gR2VuZSwgZGF0YV9maWxlX2dlbmVfc3ltYm9sID0gSHVnb19TeW1ib2wpCiAgfSBlbHNlIHsKICAgIGdzX2Vuc2dfbm90X2luX21hcHBpbmdfZmlsZV9kZiA8LSBvcGVuX3BlZF9jYW5fZGF0YV9kZnNbW3hdXSAlPiUKICAgICAgc2VsZWN0KGVuc2VtYmwsIGdlbmVfc3ltYm9sKSAlPiUKICAgICAgZmlsdGVyKGdlbmVfc3ltYm9sICVpbiUgZ3Nfbm90X2luX21hcHBpbmdfZmlsZV92ZWMpICU+JQogICAgICByZW5hbWUoZW5zZ19pZCA9IGVuc2VtYmwsIGRhdGFfZmlsZV9nZW5lX3N5bWJvbCA9IGdlbmVfc3ltYm9sKQogIH0KCiAgZ3NfZW5zZ19ub3RfaW5fbWFwcGluZ19maWxlX2RmIDwtIGdzX2Vuc2dfbm90X2luX21hcHBpbmdfZmlsZV9kZiAlPiUKICAgIGZpbHRlcighaXMubmEoZW5zZ19pZCkpICU+JQogICAgZGlzdGluY3QoKQoKICBlaHJfam9pbl9kZiA8LSBlaHJfZGYgJT4lCiAgICBzZWxlY3QoZW5zZ19pZCwgZ2VuZV9zeW1ib2wpICU+JQogICAgcmVuYW1lKG1hcHBpbmdfZmlsZV9nZW5lX3N5bWJvbCA9IGdlbmVfc3ltYm9sKQoKICBwcmludChwYXN0ZSgKICAgIHgsICdkYXRhIGZpbGUgaGFzJywKICAgIHN1bSghdW5pcXVlKGdzX2Vuc2dfbm90X2luX21hcHBpbmdfZmlsZV9kZiRlbnNnX2lkKSAlaW4lIGVocl9qb2luX2RmJGVuc2dfaWQpLAogICAgJ2dlbmUgc3ltYm9scyB0aGF0IGFyZSBub3QgaW4gbWFwcGluZyBmaWxlIGFuZCBoYXZlIGFzc29jaWF0ZWQgRU5TRyBJRHMnLAogICAgJ3RoYXQgYXJlIGFsc28gbm90IGluIG1hcHBpbmcgZmlsZS4nKSkKCiAgcmVzX2RmIDwtIGdzX2Vuc2dfbm90X2luX21hcHBpbmdfZmlsZV9kZiAlPiUKICAgIGxlZnRfam9pbihlaHJfam9pbl9kZiwgYnkgPSAnZW5zZ19pZCcpCgogIHJldHVybihyZXNfZGYpCn0pCmBgYAoKYGBge3Igc252fQpzeW1ib2xfbm90X2luX21hcHBpbmdfZmlsZV9saXN0JHNudgpgYGAKCmBgYHtyIGNudn0Kc3ltYm9sX25vdF9pbl9tYXBwaW5nX2ZpbGVfbGlzdCRjbnYKYGBgCgoKIyMgQ2hlY2sgZ2VuZSBFTlNHIElEIG92ZXJsYXAKCmBgYHtyIGNoZWNrX2dlbmVfZW5zZ19vdmVybGFwfQpnZW5lX2Vuc2dfbGlzdCA8LSBsaXN0KAogIHNudiA9IG9wZW5fcGVkX2Nhbl9kYXRhX2RmcyRzbnYkR2VuZSwKICBjbnYgPSBvcGVuX3BlZF9jYW5fZGF0YV9kZnMkY252JGVuc2VtYmwKKQoKZ2VuZV9lbnNnX2xpc3QgPC0gbGFwcGx5KGdlbmVfZW5zZ19saXN0LCBmdW5jdGlvbih4KSB7CiAgeCA8LSB4WyFpcy5uYSh4KV0KICB4IDwtIHVuaXF1ZSh4KQogIHJldHVybih4KQp9KQoKbWFwX2RmcihnZW5lX2Vuc2dfbGlzdCwgZnVuY3Rpb24oeCkgewogIHRpYmJsZSgKICAgIG5fdW5pcV9lbnNncyA9IGxlbmd0aCh4KSwKICAgIG5fdW5pcV9lbnNnc19pbl9tYXBwaW5nX2ZpbGUgPSBzdW0oeCAlaW4lIGVocl9kZiRlbnNnX2lkKSwKICAgIG5fdW5pcV9lbnNnc19ub3RfaW5fbWFwcGluZ19maWxlID0gc3VtKCF4ICVpbiUgZWhyX2RmJGVuc2dfaWQpLAogICAgdW5pcV9lbnNnc19ub3RfaW5fbWFwcGluZ19maWxlID0gcGFzdGUoCiAgICAgIHhbIXggJWluJSBlaHJfZGYkZW5zZ19pZF0sCiAgICAgIGNvbGxhcHNlID0gJywnKSkKfSwgLmlkID0gJ0RhdGEgdHlwZScpCmBgYAo=
diff --git a/analyses/gene_match/results/ensg-hugo-pmtl-mapping.tsv b/analyses/gene_match/results/ensg-hugo-pmtl-mapping.tsv index 1b871390f5..65622981e5 100644 --- a/analyses/gene_match/results/ensg-hugo-pmtl-mapping.tsv +++ b/analyses/gene_match/results/ensg-hugo-pmtl-mapping.tsv @@ -94840,4 +94840,3 @@ ENSG00000284745 AL589702.1 NA NA ENSG00000284746 AC068587.10 NA NA ENSG00000284747 AL034417.4 NA NA ENSG00000284748 AL513220.1 NA NA -Symbol_Not_Found NA Relevant Molecular Target PMTL version 1.1