diff --git a/.Rbuildignore b/.Rbuildignore index fb7695e9..84559d9c 100644 --- a/.Rbuildignore +++ b/.Rbuildignore @@ -7,3 +7,6 @@ ^CHANGELOG\.md$ ^README\.qmd$ ^docs$ +^_pkgdown\.yml$ +^pkgdown$ +^vignettes/*_files$ diff --git a/.github/dependabot.yml b/.github/dependabot.yml new file mode 100644 index 00000000..12301490 --- /dev/null +++ b/.github/dependabot.yml @@ -0,0 +1,6 @@ +version: 2 +updates: + - package-ecosystem: "github-actions" + directory: "/" + schedule: + interval: "daily" diff --git a/.github/workflows/R-CMD-check.yaml b/.github/workflows/R-CMD-check.yaml index 62480786..57a55c00 100644 --- a/.github/workflows/R-CMD-check.yaml +++ b/.github/workflows/R-CMD-check.yaml @@ -20,11 +20,11 @@ jobs: fail-fast: false matrix: config: - - {os: macos-latest, r: 'release'} - - {os: windows-latest, r: 'release'} - - {os: ubuntu-latest, r: 'devel', http-user-agent: 'release'} - - {os: ubuntu-latest, r: 'release'} - - {os: ubuntu-latest, r: 'oldrel-1'} + - { os: macos-latest, r: "release" } + - { os: windows-latest, r: "release" } + - { os: ubuntu-latest, r: "devel", http-user-agent: "release" } + - { os: ubuntu-latest, r: "release" } + - { os: ubuntu-latest, r: "oldrel-1" } env: GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }} @@ -33,8 +33,17 @@ jobs: steps: - uses: actions/checkout@v4 + # - name: Install lamin-cli + # env: + # LAMIN_API_KEY: ${{ secrets.LAMIN_API_KEY }} + # run: | + # pip install lamin-cli + # lamin login + - uses: r-lib/actions/setup-pandoc@v2 + - uses: r-lib/actions/setup-tinytex@v2 + - uses: r-lib/actions/setup-r@v2 with: r-version: ${{ matrix.config.r }} diff --git a/.github/workflows/pkgdown.yaml b/.github/workflows/pkgdown.yaml new file mode 100644 index 00000000..102864d3 --- /dev/null +++ b/.github/workflows/pkgdown.yaml @@ -0,0 +1,57 @@ +# Workflow derived from https://github.com/r-lib/actions/tree/v2/examples +# Need help debugging build failures? Start at https://github.com/r-lib/actions#where-to-find-help +on: + push: + branches: [main, master] + pull_request: + branches: [main, master] + release: + types: [published] + workflow_dispatch: + +name: pkgdown.yaml + +permissions: read-all + +jobs: + pkgdown: + runs-on: ubuntu-latest + # Only restrict concurrency for non-PR jobs + concurrency: + group: pkgdown-${{ github.event_name != 'pull_request' || github.run_id }} + env: + GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }} + permissions: + contents: write + steps: + - uses: actions/checkout@v4 + + - uses: r-lib/actions/setup-pandoc@v2 + + - uses: r-lib/actions/setup-r@v2 + with: + use-public-rspm: true + + - uses: r-lib/actions/setup-r-dependencies@v2 + with: + extra-packages: any::pkgdown, local::. + needs: website + + # - name: Install lamin-cli + # env: + # LAMIN_API_KEY: ${{ secrets.LAMIN_API_KEY }} + # run: | + # pip install lamin-cli + # lamin login + + - name: Build site + run: pkgdown::build_site_github_pages(new_process = FALSE, install = FALSE) + shell: Rscript {0} + + - name: Deploy to GitHub pages 🚀 + if: github.event_name != 'pull_request' + uses: JamesIves/github-pages-deploy-action@v4.5.0 + with: + clean: false + branch: gh-pages + folder: docs diff --git a/.gitignore b/.gitignore index e0795c61..7bd206b7 100644 --- a/.gitignore +++ b/.gitignore @@ -1,2 +1,3 @@ .Rproj.user experiments +docs diff --git a/CHANGELOG.md b/CHANGELOG.md index b833d55e..63b0ba08 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -6,6 +6,8 @@ * Read user settings from env file created by lamin Python package (PR #2, PR #8). +* Render a pkgdown website (PR #13). + ## MAJOR CHANGES * Refactored the internal class data structures for better modularity and extensibility (PR #8). @@ -17,7 +19,15 @@ ## MINOR CHANGES -* Update `README` with new set up instructions and simplify (PR #14) +* Update `README` with new set up instructions and simplify (PR #14). + +* Do not complain when foreign keys are not found in a record, but also do not complain when they are (PR #13). + +* Further simplify the `README`, and move the detailed usage description to a separate vignette (PR #13). + +* Add a `pkgdown` website to the project (PR #13). + +* Generate vignettes using Quarto (PR #13). ## BUG FIXES diff --git a/DESCRIPTION b/DESCRIPTION index c9ea3b7b..b834ce34 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -1,6 +1,6 @@ Package: laminr Title: LaminDB interface in R -Version: 0.0.0.9000 +Version: 0.1.0.9000 Authors@R: c(person("Robrecht", "Cannoodt", role = c("aut", "cre"), @@ -13,7 +13,7 @@ License: Apache License (>= 2) Encoding: UTF-8 Roxygen: list(markdown = TRUE) RoxygenNote: 7.3.2 -URL: https://github.com/laminlabs/laminr +URL: https://laminr.lamin.ai, https://github.com/laminlabs/laminr BugReports: https://github.com/laminlabs/laminr/issues Depends: R (>= 4.0.0) @@ -25,4 +25,6 @@ Imports: R6 Suggests: anndata, + quarto, s3 (>= 1.1.0) +VignetteBuilder: quarto diff --git a/NAMESPACE b/NAMESPACE index 32ba3690..b4e087b5 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -11,6 +11,7 @@ importFrom(httr,add_headers) importFrom(httr,content) importFrom(jsonlite,toJSON) importFrom(purrr,discard) +importFrom(purrr,keep) importFrom(purrr,list_flatten) importFrom(purrr,map) importFrom(purrr,map2) diff --git a/R/Record.R b/R/Record.R index e063bbd2..2deb0c3f 100644 --- a/R/Record.R +++ b/R/Record.R @@ -65,11 +65,12 @@ Record <- R6::R6Class( # nolint object_name_linter private$.api <- api private$.data <- data - column_names <- map(registry$get_fields(), "column_name") |> - unlist() |> + expected_fields <- + registry$get_fields() |> + discard(~ is.null(.x$column_name)) |> + map_chr("column_name") |> unname() - - unexpected_fields <- setdiff(names(data), column_names) + unexpected_fields <- setdiff(names(data), expected_fields) if (length(unexpected_fields) > 0) { cli_warn( paste0( @@ -79,7 +80,12 @@ Record <- R6::R6Class( # nolint object_name_linter ) } - missing_fields <- setdiff(column_names, names(data)) + required_fields <- + registry$get_fields() |> + keep(~ is.null(.x$relation_type)) |> + map_chr("column_name") |> + unname() + missing_fields <- setdiff(required_fields, names(data)) if (length(missing_fields) > 0) { cli_warn( paste0( diff --git a/R/Registry.R b/R/Registry.R index 41f06f9d..b76a8064 100644 --- a/R/Registry.R +++ b/R/Registry.R @@ -49,7 +49,7 @@ Registry <- R6::R6Class( # nolint object_name_linter ) }, #' Get a record by ID or UID. - get = function(id_or_uid, include_foreign_keys = TRUE, verbose = FALSE) { + get = function(id_or_uid, include_foreign_keys = FALSE, verbose = FALSE) { data <- private$.api$get_record( module_name = private$.module$name, registry_name = private$.registry_name, diff --git a/R/connect.R b/R/connect.R index 49ee2920..5b48c573 100644 --- a/R/connect.R +++ b/R/connect.R @@ -3,8 +3,13 @@ #' Connect to instance #' +#' Note that prior to connecting to an instance, you need to authenticate with +#' `lamin login`. If no slug is provided, the default instance is loaded, which is +#' set by running `lamin load `. +#' #' @param slug The instance slug `account_handle/instance_name` or URL. #' If the instance is owned by you, it suffices to pass the instance name. +#' If no slug is provided, the default instance is loaded. #' #' @export #' @@ -14,9 +19,14 @@ #' instance <- connect("laminlabs/cellxgene") #' instance #' } -connect <- function(slug) { +connect <- function(slug = NULL) { user_settings <- .settings_load__load_or_create_user_settings() + if (is.null(slug)) { + current_instance <- .settings_load__load_instance_settings() + slug <- paste0(current_instance$owner, "/", current_instance$name) + } + owner_name <- .connect_get_owner_name_from_identifier(slug) instance_settings <- .connect_get_instance_settings( diff --git a/R/laminr-package.R b/R/laminr-package.R index 03f15635..85e054e2 100644 --- a/R/laminr-package.R +++ b/R/laminr-package.R @@ -5,6 +5,6 @@ #' @importFrom cli cli_abort cli_warn cli_inform #' @importFrom R6 R6Class #' @importFrom httr GET POST content add_headers -#' @importFrom purrr map map_chr map2 pmap set_names list_flatten transpose discard +#' @importFrom purrr map map_chr map2 pmap set_names list_flatten transpose discard keep ## usethis namespace: end NULL diff --git a/README.md b/README.md index 57d277d6..f10ba7be 100644 --- a/README.md +++ b/README.md @@ -1,8 +1,10 @@ # LaminR: Work with LaminDB instances in R - - + [![R-CMD-check](https://github.com/laminlabs/laminr/actions/workflows/R-CMD-check.yaml/badge.svg)](https://github.com/laminlabs/laminr/actions/workflows/R-CMD-check.yaml) @@ -27,254 +29,28 @@ pip install lamin-cli lamin login ``` -## Usage +> [!TIP] +> +> You can get your token from the [LaminDB web +> interface](https://lamin.ai/settings). + +## Quick start -Load the library +Let’s first connect to a LaminDB instance: ``` r library(laminr) -``` -## Database instance - -``` r db <- connect("laminlabs/cellxgene") -db -``` - - - Inherits from: - Public: - Artifact: active binding - bionty: active binding - Collection: active binding - Feature: active binding - FeatureSet: active binding - FeatureValue: active binding - get_module: function (module_name) - get_module_names: function () - get_modules: function () - initialize: function (settings, api, schema) - Param: active binding - ParamValue: active binding - Run: active binding - Storage: active binding - Transform: active binding - ULabel: active binding - User: active binding - Private: - .api: API, R6 - .module_classes: list - .settings: InstanceSettings, R6 - -### Schema module - -``` r -db$get_module("core") -``` - - - Inherits from: - Public: - Artifact: active binding - Collection: active binding - Feature: active binding - FeatureSet: active binding - FeatureValue: active binding - get_registries: function () - get_registry: function (registry_name) - get_registry_names: function () - initialize: function (instance, api, module_name, module_schema) - name: active binding - Param: active binding - ParamValue: active binding - Run: active binding - Storage: active binding - Transform: active binding - ULabel: active binding - User: active binding - Private: - .api: API, R6 - .instance: cellxgene, Instance, R6 - .module_name: core - .registry_classes: list - -``` r -db$bionty -``` - - - Inherits from: - Public: - CellLine: active binding - CellMarker: active binding - CellType: active binding - DevelopmentalStage: active binding - Disease: active binding - Ethnicity: active binding - ExperimentalFactor: active binding - Gene: active binding - get_registries: function () - get_registry: function (registry_name) - get_registry_names: function () - initialize: function (instance, api, module_name, module_schema) - name: active binding - Organism: active binding - Pathway: active binding - Phenotype: active binding - Protein: active binding - Source: active binding - Tissue: active binding - Private: - .api: API, R6 - .instance: cellxgene, Instance, R6 - .module_name: bionty - .registry_classes: list - -### Registry - -``` r -db$Artifact ``` - - Public: - class_name: active binding - get: function (id_or_uid, include_foreign_keys = TRUE, verbose = FALSE) - get_field: function (field_name) - get_field_names: function () - get_fields: function () - get_record_class: function () - initialize: function (instance, module, api, registry_name, registry_schema) - is_link_table: active binding - module: active binding - name: active binding - Private: - .api: API, R6 - .class_name: Artifact - .fields: list - .instance: cellxgene, Instance, R6 - .is_link_table: FALSE - .module: core, Module, R6 - .record_class: R6ClassGenerator - .registry_name: artifact - -``` r -db$bionty$CellLine -``` - - - Public: - class_name: active binding - get: function (id_or_uid, include_foreign_keys = TRUE, verbose = FALSE) - get_field: function (field_name) - get_field_names: function () - get_fields: function () - get_record_class: function () - initialize: function (instance, module, api, registry_name, registry_schema) - is_link_table: active binding - module: active binding - name: active binding - Private: - .api: API, R6 - .class_name: CellLine - .fields: list - .instance: cellxgene, Instance, R6 - .is_link_table: FALSE - .module: bionty, Module, R6 - .record_class: R6ClassGenerator - .registry_name: cellline - -### Record - -#### Get artifact +Get an artifact: ``` r artifact <- db$Artifact$get("KBW89Mf7IGcekja2hADu") -artifact ``` - - Inherits from: - Public: - _accessor: active binding - _action_targets: active binding - _actions: active binding - _environment_of: active binding - _feature_values: active binding - _hash_type: active binding - _key_is_virtual: active binding - _meta_of_collection: active binding - _param_values: active binding - _previous_runs: active binding - _report_of: active binding - _source_artifact_of: active binding - _source_code_of: active binding - _source_dataframe_of: active binding - cache: function () - cell_lines: active binding - cell_markers: active binding - cell_types: active binding - clone: function (deep = FALSE) - collections: active binding - created_at: active binding - created_by: active binding - description: active binding - developmental_stages: active binding - diseases: active binding - ethnicities: active binding - experimental_factors: active binding - feature_sets: active binding - genes: active binding - hash: active binding - id: active binding - initialize: function (data) - input_of_runs: active binding - is_latest: active binding - key: active binding - links_cell_line: active binding - links_cell_marker: active binding - links_cell_type: active binding - links_collection: active binding - links_developmental_stage: active binding - links_disease: active binding - links_ethnicity: active binding - links_experimental_factor: active binding - links_feature_set: active binding - links_gene: active binding - links_organism: active binding - links_pathway: active binding - links_phenotype: active binding - links_protein: active binding - links_tissue: active binding - links_ulabel: active binding - load: function () - n_objects: active binding - n_observations: active binding - organisms: active binding - pathways: active binding - phenotypes: active binding - proteins: active binding - run: active binding - size: active binding - storage: active binding - suffix: active binding - tissues: active binding - transform: active binding - type: active binding - uid: active binding - ulabels: active binding - updated_at: active binding - version: active binding - visibility: active binding - Private: - .api: API, R6 - .data: list - .instance: cellxgene, Instance, R6 - .registry: Registry, R6 - get_value: function (key) - -#### Print simple fields +Access some of its fields: ``` r artifact$id @@ -294,194 +70,27 @@ artifact$key [1] "cell-census/2024-07-01/h5ads/fe52003e-1460-4a65-a213-2bb1a508332f.h5ad" -#### Print related fields +Fetch related fields: ``` r -artifact$storage +artifact$storage$root ``` - Warning: Data is missing expected fields: run_id, created_by_id - - - Inherits from: - Public: - _previous_runs: active binding - artifacts: active binding - created_at: active binding - created_by: active binding - description: active binding - id: active binding - initialize: function (data) - instance_uid: active binding - region: active binding - root: active binding - run: active binding - type: active binding - uid: active binding - updated_at: active binding - Private: - .api: API, R6 - .data: list - .instance: cellxgene, Instance, R6 - .registry: Registry, R6 - get_value: function (key) + [1] "s3://cellxgene-data-public" ``` r -artifact$created_by +artifact$created_by$handle ``` - - Inherits from: - Public: - created_artifacts: active binding - created_at: active binding - created_runs: active binding - created_transforms: active binding - handle: active binding - id: active binding - initialize: function (data) - name: active binding - uid: active binding - updated_at: active binding - Private: - .api: API, R6 - .data: list - .instance: cellxgene, Instance, R6 - .registry: Registry, R6 - get_value: function (key) + [1] "sunnyosun" -``` r -artifact$experimental_factors -``` - - Warning: Data is missing expected fields: run_id, source_id, created_by_id - - Warning: Data is missing expected fields: run_id, source_id, created_by_id - Data is missing expected fields: run_id, source_id, created_by_id - - [[1]] - - Inherits from: - Public: - _previous_runs: active binding - abbr: active binding - artifacts: active binding - children: active binding - created_at: active binding - created_by: active binding - description: active binding - id: active binding - initialize: function (data) - instrument: active binding - links_artifact: active binding - measurement: active binding - molecule: active binding - name: active binding - ontology_id: active binding - parents: active binding - run: active binding - source: active binding - synonyms: active binding - uid: active binding - updated_at: active binding - Private: - .api: API, R6 - .data: list - .instance: cellxgene, Instance, R6 - .registry: Registry, R6 - get_value: function (key) - - [[2]] - - Inherits from: - Public: - _previous_runs: active binding - abbr: active binding - artifacts: active binding - children: active binding - created_at: active binding - created_by: active binding - description: active binding - id: active binding - initialize: function (data) - instrument: active binding - links_artifact: active binding - measurement: active binding - molecule: active binding - name: active binding - ontology_id: active binding - parents: active binding - run: active binding - source: active binding - synonyms: active binding - uid: active binding - updated_at: active binding - Private: - .api: API, R6 - .data: list - .instance: cellxgene, Instance, R6 - .registry: Registry, R6 - get_value: function (key) - - [[3]] - - Inherits from: - Public: - _previous_runs: active binding - abbr: active binding - artifacts: active binding - children: active binding - created_at: active binding - created_by: active binding - description: active binding - id: active binding - initialize: function (data) - instrument: active binding - links_artifact: active binding - measurement: active binding - molecule: active binding - name: active binding - ontology_id: active binding - parents: active binding - run: active binding - source: active binding - synonyms: active binding - uid: active binding - updated_at: active binding - Private: - .api: API, R6 - .data: list - .instance: cellxgene, Instance, R6 - .registry: Registry, R6 - get_value: function (key) - -### Download and cache an artifact - -> [!NOTE] -> -> Only S3 storage is supported at the moment. - -``` r -artifact$cache() -``` - - Warning: Data is missing expected fields: run_id, created_by_id - - ℹ 's3://cellxgene-data-public/cell-census/2024-07-01/h5ads/fe52003e-1460-4a65-a213-2bb1a508332f.h5ad' already exists at '/home/luke/.cache/lamindb/cellxgene-data-public/cell-census/2024-07-01/h5ads/fe52003e-1460-4a65-a213-2bb1a508332f.h5ad' - -### Load an artifact - -> [!NOTE] -> -> Only S3 storage and AnnData accessors are supported at the moment. +Load the artifact: ``` r artifact$load() ``` - Warning: Data is missing expected fields: run_id, created_by_id - - ℹ 's3://cellxgene-data-public/cell-census/2024-07-01/h5ads/fe52003e-1460-4a65-a213-2bb1a508332f.h5ad' already exists at '/home/luke/.cache/lamindb/cellxgene-data-public/cell-census/2024-07-01/h5ads/fe52003e-1460-4a65-a213-2bb1a508332f.h5ad' + ℹ 's3://cellxgene-data-public/cell-census/2024-07-01/h5ads/fe52003e-1460-4a65-a213-2bb1a508332f.h5ad' already exists at '/home/rcannood/.cache/lamindb/cellxgene-data-public/cell-census/2024-07-01/h5ads/fe52003e-1460-4a65-a213-2bb1a508332f.h5ad' AnnData object with n_obs × n_vars = 51552 × 36398 obs: 'donor_id', 'Predicted_labels_CellTypist', 'Majority_voting_CellTypist', 'Manually_curated_celltype', 'assay_ontology_term_id', 'cell_type_ontology_term_id', 'development_stage_ontology_term_id', 'disease_ontology_term_id', 'self_reported_ethnicity_ontology_term_id', 'is_primary_data', 'organism_ontology_term_id', 'sex_ontology_term_id', 'tissue_ontology_term_id', 'suspension_type', 'tissue_type', 'cell_type', 'assay', 'disease', 'organism', 'sex', 'tissue', 'self_reported_ethnicity', 'development_stage', 'observation_joinid' diff --git a/README.qmd b/README.qmd index 3ee72c1a..2cba7d5c 100644 --- a/README.qmd +++ b/README.qmd @@ -3,9 +3,11 @@ title: "LaminR: Work with LaminDB instances in R" format: gfm --- - - + [![R-CMD-check](https://github.com/laminlabs/laminr/actions/workflows/R-CMD-check.yaml/badge.svg)](https://github.com/laminlabs/laminr/actions/workflows/R-CMD-check.yaml) @@ -29,49 +31,27 @@ pip install lamin-cli lamin login ``` -## Usage +:::{.callout-tip} +You can get your token from the [LaminDB web interface](https://lamin.ai/settings). +::: + +## Quick start -Load the library +Let's first connect to a LaminDB instance: ```{r setup} library(laminr) -``` -## Database instance - -```{r connect} db <- connect("laminlabs/cellxgene") -db -``` - -### Schema module - -```{r get_module} -db$get_module("core") - -db$bionty -``` - -### Registry - -```{r get_artifact_registry} -db$Artifact ``` -```{r get_bionty_celline} -db$bionty$CellLine -``` - -### Record - -#### Get artifact +Get an artifact: ```{r get_artifact} artifact <- db$Artifact$get("KBW89Mf7IGcekja2hADu") -artifact ``` -#### Print simple fields +Access some of its fields: ```{r print_simple_fields} artifact$id @@ -81,31 +61,15 @@ artifact$uid artifact$key ``` -#### Print related fields +Fetch related fields: ```{r print_related_fields} -artifact$storage +artifact$storage$root -artifact$created_by - -artifact$experimental_factors +artifact$created_by$handle ``` -### Download and cache an artifact - -:::{.callout-note} -Only S3 storage is supported at the moment. -::: - -```{r cache_artifact} -artifact$cache() -``` - -### Load an artifact - -:::{.callout-note} -Only S3 storage and AnnData accessors are supported at the moment. -::: +Load the artifact: ```{r load_artifact} artifact$load() diff --git a/_pkgdown.yml b/_pkgdown.yml new file mode 100644 index 00000000..dac5a2d7 --- /dev/null +++ b/_pkgdown.yml @@ -0,0 +1,3 @@ +url: https://laminr.lamin.ai/ +template: + bootstrap: 5 diff --git a/docs/class_diagram.md b/docs/class_diagram.md deleted file mode 100644 index d75fab29..00000000 --- a/docs/class_diagram.md +++ /dev/null @@ -1,122 +0,0 @@ -# Class Diagram - - -``` mermaid -classDiagram - laminr --> RichInstance - laminr --> UserSettings - laminr --> InstanceSettings - RichInstance --|> Instance - Instance --> InstanceAPI - Instance --> Module - Core --|> Module - Bionty --|> Module - Module --> Registry - Registry --> Field - Registry --> RichRecord - Artifact --|> Record - RichInstance --> Core - RichInstance --> Bionty - Core --> Artifact - RichRecord --|> Record - - class laminr{ - +connect(String slug): RichInstance - } - - class UserSettings{ - +initialize(...): UserSettings - +email: String - +access_token: String - +uid: String - +uuid: String - +handle: String - +name: String - } - - class InstanceSettings{ - +initialize(...): InstanceSettings - +owner: String - +name: String - +id: String - +schema_id: String - +api_url: String - } - class Instance{ - +initialize(InstanceSettings Instance_settings, API api, Map schema): Instance - +get_modules(): Module[] - +get_module(String module_name): Module - +get_module_names(): String[] - - } - class InstanceAPI{ - +initialize(InstanceSettings Instance_settings) - +get_schema(): Map~String, Any~ - +get_record(...): Map~String, Any~ - } - class RichInstance{ - +initialize(InstanceSettings Instance_settings, API api, Map schema): RichInstance - +Registry Artifact - +Registry Collection - +...registry accessors... - +Registry User - +Bionty bionty - } - class Core{ - +Registry Artifact - +Registry Collection - +...registry accessors... - +Registry User - } - class Bionty{ - +Registry CellLine - +Registry CellMarker - +...registry accessors... - +Registry Tissue - } - class Module{ - +initialize(Instance Instance, API api, String module_name, Map module_schema): Module - +name: String - +get_registries(): Registry[] - +get_registry(String registry_name): Registry - +get_registry_names(): String[] - } - class Registry{ - +initialize(Instance Instance, Module module, API api, String registry_name, Map registry_schema): Registry - +name: String - +class_name: String - +is_link_table: Bool - +get_fields(): Field[] - +get_field(String field_name): Field - +get_field_names(): String[] - +get(String id_or_uid, Bool include_foreign_keys, List~String~ select, Bool verbose): RichRecord - +get_registry_class(): RichRecordClass - } - class Artifact{ - +initialize(...): Artifact - +cache(): String - +load(): Any - } - class Field{ - +initialize(...): Field - +type: String - +through: Map - +field_name: String - +registry_name: String - +column_name: String - +module_name: String - +is_link_table: Bool - +relation_type: String - +related_field_name: String - +related_registry_name: String - +related_module_name: String - - } - class RichRecord{ - +...field value accessors... - } - class Record{ - +initialize(Instance Instance, Registry registry, API api, Map data): Record - +get_value(String field_name): Any - } -``` diff --git a/docs/class_diagram.qmd b/docs/class_diagram.qmd deleted file mode 100644 index 39ceebbd..00000000 --- a/docs/class_diagram.qmd +++ /dev/null @@ -1,124 +0,0 @@ ---- -title: Class Diagram -format: gfm ---- - -```{mermaid} -classDiagram - laminr --> RichInstance - laminr --> UserSettings - laminr --> InstanceSettings - RichInstance --|> Instance - Instance --> InstanceAPI - Instance --> Module - Core --|> Module - Bionty --|> Module - Module --> Registry - Registry --> Field - Registry --> RichRecord - Artifact --|> Record - RichInstance --> Core - RichInstance --> Bionty - Core --> Artifact - RichRecord --|> Record - - class laminr{ - +connect(String slug): RichInstance - } - - class UserSettings{ - +initialize(...): UserSettings - +email: String - +access_token: String - +uid: String - +uuid: String - +handle: String - +name: String - } - - class InstanceSettings{ - +initialize(...): InstanceSettings - +owner: String - +name: String - +id: String - +schema_id: String - +api_url: String - } - class Instance{ - +initialize(InstanceSettings Instance_settings, API api, Map schema): Instance - +get_modules(): Module[] - +get_module(String module_name): Module - +get_module_names(): String[] - - } - class InstanceAPI{ - +initialize(InstanceSettings Instance_settings) - +get_schema(): Map~String, Any~ - +get_record(...): Map~String, Any~ - } - class RichInstance{ - +initialize(InstanceSettings Instance_settings, API api, Map schema): RichInstance - +Registry Artifact - +Registry Collection - +...registry accessors... - +Registry User - +Bionty bionty - } - class Core{ - +Registry Artifact - +Registry Collection - +...registry accessors... - +Registry User - } - class Bionty{ - +Registry CellLine - +Registry CellMarker - +...registry accessors... - +Registry Tissue - } - class Module{ - +initialize(Instance Instance, API api, String module_name, Map module_schema): Module - +name: String - +get_registries(): Registry[] - +get_registry(String registry_name): Registry - +get_registry_names(): String[] - } - class Registry{ - +initialize(Instance Instance, Module module, API api, String registry_name, Map registry_schema): Registry - +name: String - +class_name: String - +is_link_table: Bool - +get_fields(): Field[] - +get_field(String field_name): Field - +get_field_names(): String[] - +get(String id_or_uid, Bool include_foreign_keys, List~String~ select, Bool verbose): RichRecord - +get_registry_class(): RichRecordClass - } - class Artifact{ - +initialize(...): Artifact - +cache(): String - +load(): Any - } - class Field{ - +initialize(...): Field - +type: String - +through: Map - +field_name: String - +registry_name: String - +column_name: String - +module_name: String - +is_link_table: Bool - +relation_type: String - +related_field_name: String - +related_registry_name: String - +related_module_name: String - - } - class RichRecord{ - +...field value accessors... - } - class Record{ - +initialize(Instance Instance, Registry registry, API api, Map data): Record - +get_value(String field_name): Any - } -``` diff --git a/man/connect.Rd b/man/connect.Rd index e8d8126b..bfb645ea 100644 --- a/man/connect.Rd +++ b/man/connect.Rd @@ -4,14 +4,17 @@ \alias{connect} \title{Connect to instance} \usage{ -connect(slug) +connect(slug = NULL) } \arguments{ \item{slug}{The instance slug \code{account_handle/instance_name} or URL. -If the instance is owned by you, it suffices to pass the instance name.} +If the instance is owned by you, it suffices to pass the instance name. +If no slug is provided, the default instance is loaded.} } \description{ -Connect to instance +Note that prior to connecting to an instance, you need to authenticate with +\verb{lamin login}. If no slug is provided, the default instance is loaded, which is +set by running \verb{lamin load }. } \examples{ \dontrun{ diff --git a/man/laminr-package.Rd b/man/laminr-package.Rd index d41d66c0..a6443720 100644 --- a/man/laminr-package.Rd +++ b/man/laminr-package.Rd @@ -11,6 +11,7 @@ The laminr package provides an interface to the LaminDB database. It allows you \seealso{ Useful links: \itemize{ + \item \url{https://laminr.lamin.ai} \item \url{https://github.com/laminlabs/laminr} \item Report bugs at \url{https://github.com/laminlabs/laminr/issues} } diff --git a/vignettes/.gitignore b/vignettes/.gitignore new file mode 100644 index 00000000..4063bdd5 --- /dev/null +++ b/vignettes/.gitignore @@ -0,0 +1,5 @@ +/.quarto/ +*.html +*.R +*_files +_quarto.yaml diff --git a/vignettes/structure.qmd b/vignettes/structure.qmd new file mode 100644 index 00000000..88b8cd58 --- /dev/null +++ b/vignettes/structure.qmd @@ -0,0 +1,251 @@ +--- +title: "Package structure" +vignette: > + %\VignetteIndexEntry{Package structure} + %\VignetteEncoding{UTF-8} + %\VignetteEngine{quarto::html} +knitr: + opts_chunk: + collapse: true + comment: "#>" +--- + +This package is designed to interact with LaminDB instances. + +## Basic structure + +When connecting to a LaminDB instance, laminr will interact with the LaminDB instance API to retrieve the schema of the data structures in that instance. This schema is used to instantiate Modules containing Registries, which in turn contain Fields. A registry can be used to retrieve Records. + +### Class diagram + +```{mermaid} +classDiagram +%% # nolint start + laminr --> Instance + laminr --> UserSettings + laminr --> InstanceSettings + Instance --> InstanceAPI + Instance --> Module + Module --> Registry + Registry --> Field + Registry --> Record + + class laminr{ + +connect(String slug): Instance + } + + class UserSettings{ + +initialize(...): UserSettings + +email: String + +access_token: String + +uid: String + +uuid: String + +handle: String + +name: String + } + + class InstanceSettings{ + +initialize(...): InstanceSettings + +owner: String + +name: String + +id: String + +schema_id: String + +api_url: String + } + class Instance{ + +initialize(InstanceSettings Instance_settings, API api, Map schema): Instance + +get_modules(): Module[] + +get_module(String module_name): Module + +get_module_names(): String[] + } + class InstanceAPI{ + +initialize(InstanceSettings Instance_settings) + +get_schema(): Map + +get_record(...): Map + } + class Module{ + +initialize(Instance Instance, API api, String module_name, Map module_schema): Module + +name: String + +get_registries(): Registry[] + +get_registry(String registry_name): Registry + +get_registry_names(): String[] + } + class Registry{ + +initialize(Instance Instance, Module module, API api, String registry_name, Map registry_schema): Registry + +name: String + +class_name: String + +is_link_table: Bool + +get_fields(): Field[] + +get_field(String field_name): Field + +get_field_names(): String[] + +get(String id_or_uid, Bool include_foreign_keys, List~String~ select, Bool verbose): RichRecord + +get_registry_class(): RichRecordClass + } + class Field{ + +initialize(...): Field + +type: String + +through: Map + +field_name: String + +registry_name: String + +column_name: String + +module_name: String + +is_link_table: Bool + +relation_type: String + +related_field_name: String + +related_registry_name: String + +related_module_name: String + } + class Record{ + +initialize(Instance Instance, Registry registry, API api, Map data): Record + +get_value(String field_name): Any + } +%% # nolint end +``` + +## Sugar syntax + +The `laminr` package adds some sugar syntax to the `Instance` and `Registry` classes. This allows to directly access an instance's registies and a record's fields. + +For instance, instead of writing: + +```r +db <- connect("laminlabs/cellxgene") + +artifact <- db$get_module("core")$get_registry("artifact")$get("KBW89Mf7IGcekja2hADu") + +artifact$get_value("id") +``` + +Using the sugar syntax, you can write: + +```r +db <- connect("laminlabs/cellxgene") + +artifact <- db$core$artifact$get("KBW89Mf7IGcekja2hADu") + +artifact$id +``` + +This sugar syntax is achieved by creating RichInstance and RichRecord classes that inherit from Instance and Record, respectively. + +### Class diagram + +```{mermaid} +classDiagram +%% # nolint start + laminr --> RichInstance + laminr --> UserSettings + laminr --> InstanceSettings + RichInstance --|> Instance + Instance --> InstanceAPI + Instance --> Module + Core --|> Module + Bionty --|> Module + Module --> Registry + Registry --> Field + Registry --> RichRecord + Artifact --|> Record + RichInstance --> Core + RichInstance --> Bionty + Core --> Artifact + RichRecord --|> Record + + class laminr{ + +connect(String slug): RichInstance + } + + class UserSettings{ + +initialize(...): UserSettings + +email: String + +access_token: String + +uid: String + +uuid: String + +handle: String + +name: String + } + + class InstanceSettings{ + +initialize(...): InstanceSettings + +owner: String + +name: String + +id: String + +schema_id: String + +api_url: String + } + class Instance{ + +initialize(InstanceSettings Instance_settings, API api, Map schema): Instance + +get_modules(): Module[] + +get_module(String module_name): Module + +get_module_names(): String[] + } + class InstanceAPI{ + +initialize(InstanceSettings Instance_settings) + +get_schema(): Map + +get_record(...): Map + } + class RichInstance{ + +initialize(InstanceSettings Instance_settings, API api, Map schema): RichInstance + +Registry Artifact + +Registry Collection + +...registry accessors... + +Registry User + +Bionty bionty + } + class Core{ + +Registry Artifact + +Registry Collection + +...registry accessors... + +Registry User + } + class Bionty{ + +Registry CellLine + +Registry CellMarker + +...registry accessors... + +Registry Tissue + } + class Module{ + +initialize(Instance Instance, API api, String module_name, Map module_schema): Module + +name: String + +get_registries(): Registry[] + +get_registry(String registry_name): Registry + +get_registry_names(): String[] + } + class Registry{ + +initialize(Instance Instance, Module module, API api, String registry_name, Map registry_schema): Registry + +name: String + +class_name: String + +is_link_table: Bool + +get_fields(): Field[] + +get_field(String field_name): Field + +get_field_names(): String[] + +get(String id_or_uid, Bool include_foreign_keys, List~String~ select, Bool verbose): RichRecord + +get_registry_class(): RichRecordClass + } + class Artifact{ + +initialize(...): Artifact + +cache(): String + +load(): Any + } + class Field{ + +initialize(...): Field + +type: String + +through: Map + +field_name: String + +registry_name: String + +column_name: String + +module_name: String + +is_link_table: Bool + +relation_type: String + +related_field_name: String + +related_registry_name: String + +related_module_name: String + } + class RichRecord{ + +...field value accessors... + } + class Record{ + +initialize(Instance Instance, Registry registry, API api, Map data): Record + +get_value(String field_name): Any + } +%% # nolint end +```