From 0fbb68bcce590e472052d47585ba34a8b33040a3 Mon Sep 17 00:00:00 2001 From: Anh Nguyet Vu <32753274+anngvu@users.noreply.github.com> Date: Thu, 2 Jan 2025 18:48:05 -0700 Subject: [PATCH] New project and package infra upgrades (#207) * Factor out functionality for reuse * Implement new fileview building standards (#192) * More default fileview updates * Implement protocol binding * Update Dockerfile * Export, update pkg reference --- Dockerfile | 4 ++-- NAMESPACE | 1 + R/new_project.R | 56 +++++++++++++++++++++++++++++++--------------- _pkgdown.yml | 1 + man/bind_schema.Rd | 19 ++++++++++++++++ 5 files changed, 61 insertions(+), 20 deletions(-) create mode 100644 man/bind_schema.Rd diff --git a/Dockerfile b/Dockerfile index 7535c753..cfecb5bb 100644 --- a/Dockerfile +++ b/Dockerfile @@ -10,14 +10,14 @@ RUN apt-get update && \ libxt6 -RUN pip install synapseclient==3.0.0 +RUN pip install synapseclient==4.3.1 COPY . /nfportalutils # R components for installation or suggested usage RUN R -e "install.packages(c('remotes', 'rmarkdown', 'DiagrammeR'), repos='http://cran.rstudio.com/')" RUN R -e "remotes::install_local('nfportalutils', dependencies = c('Depends', 'Imports'))" -RUN R -e "remotes::install_version('reticulate', version = '1.28', repos ='http://cran.us.r-project.org')" +RUN R -e "remotes::install_version('reticulate', version = '1.39.0', repos ='http://cran.us.r-project.org')" ENTRYPOINT [ "/bin/bash" ] diff --git a/NAMESPACE b/NAMESPACE index ffb72e7d..74319860 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -28,6 +28,7 @@ export(annotate_with_samtools_stats) export(as_table_schema) export(assign_study_data_types) export(bad_url) +export(bind_schema) export(bipartite_mmd_template) export(byte_budget) export(calculate_related_studies) diff --git a/R/new_project.R b/R/new_project.R index cf614ee5..f47e2a57 100644 --- a/R/new_project.R +++ b/R/new_project.R @@ -96,13 +96,7 @@ new_project <- function(name, # Bind JSON schema so children folders have NF's dataset schemas, see # https://repo-prod.prod.sagebase.org/repo/v1/schema/type/registered/org.synapse.nf-superdataset - # and https://help.synapse.org/docs/JSON-Schemas.3107291536.html - bind_schema_request <- jsonlite::toJSON(list(entityId = data_folder_id, - `schema$id` = "org.synapse.nf-superdataset", - enableDerivedAnnotations = TRUE), - auto_unbox = TRUE) - binding_uri <- glue::glue("https://repo-prod.prod.sagebase.org/repo/v1/entity/{data_folder_id}/schema/binding") - try(.syn$restPUT(binding_uri, bind_schema_request)) + bind_schema(id = data_folder_id, schema_id = "org.synapse.nf-superdataset", derived_annotations = TRUE) # Create data-specific folders in "Raw Data" if(length(datasets)) { @@ -111,9 +105,15 @@ new_project <- function(name, # Create homes for non-data resources alongside "Raw Data" if(length(other_resources)) { - make_folder(parent = project, folders = other_resources) + other_resource_folders <- make_folder(parent = project, folders = other_resources) + if ("Protocols" %in% names(other_resource_folders)) { + bind_schema(id = other_resource_folders$Protocols$properties$id, schema_id = "org.synapse.nf-protocol", derived_annotations = FALSE) + } } + # Aside from dataset schema, currently only have protocols schema + + # Add Project Files and Metadata fileview, add NF schema; currently doesn't add facets fv <- add_default_fileview(project) @@ -156,29 +156,31 @@ add_default_fileview <- function(project) { view <- synapseclient$EntityViewSchema( name = "Project Files and Metadata", columns=list( + synapseclient$Column(name="contentType", columnType="STRING", maximumSize="20"), synapseclient$Column(name="resourceType", columnType="STRING", maximumSize="50"), - synapseclient$Column(name="assay", columnType="STRING", maximumSize="57"), + synapseclient$Column(name="assay", columnType="STRING", maximumSize="100"), synapseclient$Column(name="dataType", columnType="STRING", maximumSize="30"), synapseclient$Column(name="dataSubtype", columnType="STRING", maximumSize="13"), synapseclient$Column(name="fileFormat", columnType="STRING", maximumSize="13"), synapseclient$Column(name="diagnosis", columnType="STRING", maximumSize="39"), synapseclient$Column(name="tumorType", columnType="STRING", maximumSize="90"), - synapseclient$Column(name="individualID", columnType="STRING", maximumSize="213"), - synapseclient$Column(name="specimenID", columnType="STRING", maximumSize="300"), + synapseclient$Column(name="individualID", columnType="STRING_LIST", maximumSize="50", maximumListLength = "50"), + synapseclient$Column(name="specimenID", columnType="STRING_LIST", maximumSize="50", maximumListLength = "50"), synapseclient$Column(name="nf1Genotype", columnType="STRING", maximumSize="8"), - synapseclient$Column(name="nf2Genotype", columnType="STRING", maximumSize="7"), + synapseclient$Column(name="nf2Genotype", columnType="STRING", maximumSize="20"), synapseclient$Column(name="species", columnType="STRING", maximumSize="100"), - synapseclient$Column(name="modelSystemName", columnType="STRING", maximumSize="42"), - synapseclient$Column(name="cellType", columnType="STRING", maximumSize="300"), - synapseclient$Column(name="sex", columnType="STRING", maximumSize="50"), + synapseclient$Column(name="modelSystemName", columnType="STRING", maximumSize="100"), + synapseclient$Column(name="cellType", columnType="STRING_LIST", maximumSize="50", maximumListLength = "50"), + synapseclient$Column(name="sex", columnType="STRING", maximumSize="30"), synapseclient$Column(name="age", columnType="STRING", maximumSize="50"), - synapseclient$Column(name="experimentalCondition", columnType="STRING", maximumSize="58"), + synapseclient$Column(name="experimentalCondition", columnType="STRING", maximumSize="100"), synapseclient$Column(name="progressReportNumber", columnType="INTEGER") ), parent = project, scopes = project, - includeEntityTypes = list(synapseclient$EntityViewType$FILE), - add_default_columns = TRUE) + includeEntityTypes = list(synapseclient$EntityViewType$FILE, synapseclient$EntityViewType$FOLDER), + add_default_columns = TRUE, + addAnnotationColumns = FALSE) view <- .syn$store(view) invisible(view) } @@ -296,3 +298,21 @@ is_valid_team <- function(id) { if(length(status)) return(TRUE) else return(FALSE) } +#' Wrapper for JSON schema binding +#' +#' See https://help.synapse.org/docs/JSON-Schemas.3107291536.html +#' +#' @param id Id of entity to which schema will be bound +#' @param schema_id Schema id as registered on Synapse. +#' @param derived_annotations Whether to enabled derived annotations. +#' Default `FALSE` as this is the API default. +#' @export +bind_schema <- function(id, schema_id, derived_annotations = FALSE) { + + bind_schema_request <- jsonlite::toJSON(list(entityId = id, + `schema$id` = schema_id, + enableDerivedAnnotations = derived_annotations), + auto_unbox = TRUE) + binding_uri <- glue::glue("https://repo-prod.prod.sagebase.org/repo/v1/entity/{id}/schema/binding") + try(.syn$restPUT(binding_uri, bind_schema_request)) +} diff --git a/_pkgdown.yml b/_pkgdown.yml index a1bec94d..8c77e638 100644 --- a/_pkgdown.yml +++ b/_pkgdown.yml @@ -147,6 +147,7 @@ reference: - table_query - as_table_schema - make_folder + - bind_schema - add_to_scope - new_view - list_project_datasets diff --git a/man/bind_schema.Rd b/man/bind_schema.Rd new file mode 100644 index 00000000..c58058f6 --- /dev/null +++ b/man/bind_schema.Rd @@ -0,0 +1,19 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/new_project.R +\name{bind_schema} +\alias{bind_schema} +\title{Wrapper for JSON schema binding} +\usage{ +bind_schema(id, schema_id, derived_annotations = FALSE) +} +\arguments{ +\item{id}{Id of entity to which schema will be bound} + +\item{schema_id}{Schema id as registered on Synapse.} + +\item{derived_annotations}{Whether to enabled derived annotations. +Default \code{FALSE} as this is the API default.} +} +\description{ +See https://help.synapse.org/docs/JSON-Schemas.3107291536.html +}