diff --git a/.Rbuildignore b/.Rbuildignore
index 561a653e..59863e10 100644
--- a/.Rbuildignore
+++ b/.Rbuildignore
@@ -9,4 +9,5 @@
^pkgdown$
^\.circleci$
^\.circleci/config\.yml$
-^\.github$
\ No newline at end of file
+^\.github$
+^cran-comments\.md$
diff --git a/.github/workflows/dsBase_test_suite.yaml b/.github/workflows/dsBase_test_suite.yaml
new file mode 100755
index 00000000..bea80e31
--- /dev/null
+++ b/.github/workflows/dsBase_test_suite.yaml
@@ -0,0 +1,210 @@
+################################################################################
+# DataSHIELD GHA test suite - dsBase
+# Adapted from `azure-pipelines.yml` by Roberto Villegas-Diaz
+#
+# Inside the root directory $(Pipeline.Workspace) will be a file tree like:
+# /dsBase <- Checked out version of datashield/dsBase
+# /dsBase/logs <- Where results of tests and logs are collated
+# /testStatus <- Checked out version of datashield/testStatus
+#
+# As of Jul 2025 this takes ~ 9 mins to run.
+################################################################################
+name: dsBase tests' suite
+
+on:
+ push:
+ schedule:
+ - cron: '0 0 * * 0' # Weekly
+
+jobs:
+ dsBase_test_suite:
+ runs-on: ubuntu-latest
+ timeout-minutes: 120
+ permissions:
+ contents: write
+
+ # These should all be constant, except TEST_FILTER. This can be used to test
+ # subsets of test files in the testthat directory. Options are like:
+ # '*' <- Run all tests.
+ # 'asNumericDS*' <- Run all asNumericDS tests, i.e. all the arg, etc. tests.
+ # '*_smk_*' <- Run all the smoke tests for all functions.
+ env:
+ TEST_FILTER: '*'
+ _r_check_system_clock_: 0
+ WORKFLOW_ID: ${{ github.run_id }}-${{ github.run_attempt }}
+ PROJECT_NAME: dsBase
+ BRANCH_NAME: ${{ github.ref_name }}
+ REPO_OWNER: ${{ github.repository_owner }}
+ R_KEEP_PKG_SOURCE: yes
+ GITHUB_TOKEN: ${{ github.token || 'placeholder-token' }}
+
+ steps:
+ - name: Checkout dsBase
+ uses: actions/checkout@v4
+ with:
+ path: dsBase
+
+ - name: Checkout testStatus
+ if: ${{ github.actor != 'nektos/act' }} # for local deployment only
+ uses: actions/checkout@v4
+ with:
+ repository: ${{ env.REPO_OWNER }}/testStatus
+ ref: master
+ path: testStatus
+ persist-credentials: false
+ token: ${{ env.GITHUB_TOKEN }}
+
+ - uses: r-lib/actions/setup-pandoc@v2
+
+ - uses: r-lib/actions/setup-r@v2
+ with:
+ r-version: release
+ http-user-agent: release
+ use-public-rspm: true
+
+ - name: Install dsBase
+ run: |
+ Rscript -e 'install.packages(c("RANN", "stringr", "lme4", "dplyr", "reshape2", "polycor", "gamlss", "gamlss.dist", "mice", "childsds", "usethis", "devtools"), dependencies = TRUE)'
+ R CMD INSTALL ./dsBase
+
+ - uses: r-lib/actions/setup-r-dependencies@v2
+ with:
+ dependencies: 'c("Imports")'
+ extra-packages: |
+ any::rcmdcheck
+ cran::devtools
+ cran::git2r
+ cran::RCurl
+ cran::readr
+ cran::magrittr
+ cran::xml2
+ cran::purrr
+ cran::dplyr
+ cran::stringr
+ cran::tidyr
+ cran::quarto
+ cran::knitr
+ cran::kableExtra
+ cran::rmarkdown
+ cran::downlit
+ needs: check
+
+ - name: Check man files up-to-date
+ run: |
+ orig_sum=$(find man -type f | sort -u | xargs cat | md5sum)
+ R -e "devtools::document()"
+ new_sum=$(find man -type f | sort -u | xargs cat | md5sum)
+ if [ "$orig_sum" != "$new_sum" ]; then
+ echo "Your committed manual files (man/*.Rd) are out of sync with the R files. Run devtools::document() locally then commit."
+ exit 1
+ else
+ echo "Documentation up-to-date."
+ fi
+ working-directory: dsBase
+ continue-on-error: true
+
+ - name: Run devtools::check
+ run: |
+ R -q -e "library('devtools'); devtools::check(args = c('--no-tests', '--no-examples'))" | tee ../check.Rout
+ grep -q "^0 errors" ../check.Rout && grep -q " 0 warnings" ../check.Rout && grep -q " 0 notes" ../check.Rout
+ working-directory: dsBase
+ continue-on-error: true
+
+ - name: Run tests with coverage & JUnit report
+ run: |
+ mkdir -p logs
+ R -q -e "devtools::reload();"
+ R -q -e '
+ write.csv(
+ covr::coverage_to_list(
+ covr::package_coverage(
+ type = c("none"),
+ code = c('"'"'
+ output_file <- file("test_console_output.txt");
+ sink(output_file);
+ sink(output_file, type = "message");
+ junit_rep <- testthat::JunitReporter$new(file = file.path(getwd(), "test_results.xml"));
+ progress_rep <- testthat::ProgressReporter$new(max_failures = 999999);
+ multi_rep <- testthat::MultiReporter$new(reporters = list(progress_rep, junit_rep));
+ testthat::test_package("${{ env.PROJECT_NAME }}", filter = "${{ env.TEST_FILTER }}", reporter = multi_rep, stop_on_failure = FALSE)'"'"'
+ )
+ )
+ ),
+ "coveragelist.csv"
+ )'
+
+ mv coveragelist.csv logs/
+ mv test_* logs/
+ grep -q " FAIL 0 " logs/test_console_output.txt
+ working-directory: dsBase
+
+ - name: Check for JUnit errors
+ run: |
+ issue_count=$(sed 's/failures="0" errors="0"//' test_results.xml | grep -c errors= || true)
+ echo "Number of testsuites with issues: $issue_count"
+ sed 's/failures="0" errors="0"//' test_results.xml | grep errors= > issues.log || true
+ cat issues.log || true
+ exit $issue_count
+ working-directory: dsBase/logs
+
+ - name: Write versions to file
+ run: |
+ echo "branch:${{ env.BRANCH_NAME }}" > ${{ env.WORKFLOW_ID }}.txt
+ echo "os:$(lsb_release -ds)" >> ${{ env.WORKFLOW_ID }}.txt
+ echo "R:$(R --version | head -n1)" >> ${{ env.WORKFLOW_ID }}.txt
+ Rscript --vanilla -e 'sessionInfo()' >> session_info_${{ env.WORKFLOW_ID }}.txt
+ working-directory: dsBase/logs
+
+ - name: Parse results from testthat and covr
+ run: |
+ Rscript --verbose --vanilla ../testStatus/source/parse_test_report.R logs/ logs/ https://github.com/datashield/${{ env.PROJECT_NAME }}/blob/${{ env.BRANCH_NAME }} '[^-:.]+' '(?<=::)[^:]+(?=::)'
+ working-directory: dsBase
+ env:
+ PROJECT_NAME: ${{ env.PROJECT_NAME }}
+ BRANCH_NAME: ${{ env.BRANCH_NAME }}
+
+ - name: Render report
+ run: |
+ cd testStatus
+
+ mkdir -p new/logs/${{ env.PROJECT_NAME }}/${{ env.BRANCH_NAME }}/${{ env.WORKFLOW_ID }}/
+ mkdir -p new/docs/${{ env.PROJECT_NAME }}/${{ env.BRANCH_NAME }}/latest/
+
+ # Copy logs to new logs directory location
+ cp -rv ../${{ env.PROJECT_NAME }}/logs/* new/logs/${{ env.PROJECT_NAME }}/${{ env.BRANCH_NAME }}/${{ env.WORKFLOW_ID }}/
+ cp -rv ../${{ env.PROJECT_NAME }}/logs/${{ env.WORKFLOW_ID }}.txt new/logs/${{ env.PROJECT_NAME }}/${{ env.BRANCH_NAME }}/${{ env.WORKFLOW_ID }}/
+
+ R -e 'input_dir <- file.path("../new/logs", Sys.getenv("PROJECT_NAME"), Sys.getenv("BRANCH_NAME"), Sys.getenv("WORKFLOW_ID")); quarto::quarto_render("source/test_report.qmd", execute_params = list(input_dir = input_dir))'
+ mv source/test_report.html new/docs/${{ env.PROJECT_NAME }}/${{ env.BRANCH_NAME }}/latest/index.html
+
+ env:
+ PROJECT_NAME: ${{ env.PROJECT_NAME }}
+ BRANCH_NAME: ${{ env.BRANCH_NAME }}
+ WORKFLOW_ID: ${{ env.WORKFLOW_ID }}
+
+ - name: Upload test logs
+ uses: actions/upload-artifact@v4
+ with:
+ name: dsbase-logs
+ path: testStatus/new
+
+ - name: Dump environment info
+ run: |
+ echo -e "\n#############################"
+ echo -e "ls /: ######################"
+ ls -al .
+ echo -e "\n#############################"
+ echo -e "lscpu: ######################"
+ lscpu
+ echo -e "\n#############################"
+ echo -e "memory: #####################"
+ free -m
+ echo -e "\n#############################"
+ echo -e "env: ########################"
+ env
+ echo -e "\n#############################"
+ echo -e "R sessionInfo(): ############"
+ R -e 'sessionInfo()'
+ sudo apt install tree -y
+ tree .
+
diff --git a/.github/workflows/pkgdown.yaml b/.github/workflows/pkgdown.yaml
new file mode 100644
index 00000000..bfc9f4db
--- /dev/null
+++ b/.github/workflows/pkgdown.yaml
@@ -0,0 +1,49 @@
+# Workflow derived from https://github.com/r-lib/actions/tree/v2/examples
+# Need help debugging build failures? Start at https://github.com/r-lib/actions#where-to-find-help
+on:
+ push:
+ branches: [main, master]
+ pull_request:
+ release:
+ types: [published]
+ workflow_dispatch:
+
+name: pkgdown.yaml
+
+permissions: read-all
+
+jobs:
+ pkgdown:
+ runs-on: ubuntu-latest
+ # Only restrict concurrency for non-PR jobs
+ concurrency:
+ group: pkgdown-${{ github.event_name != 'pull_request' || github.run_id }}
+ env:
+ GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }}
+ permissions:
+ contents: write
+ steps:
+ - uses: actions/checkout@v4
+
+ - uses: r-lib/actions/setup-pandoc@v2
+
+ - uses: r-lib/actions/setup-r@v2
+ with:
+ use-public-rspm: true
+
+ - uses: r-lib/actions/setup-r-dependencies@v2
+ with:
+ extra-packages: any::pkgdown, local::.
+ needs: website
+
+ - name: Build site
+ run: pkgdown::build_site_github_pages(new_process = FALSE, install = FALSE)
+ shell: Rscript {0}
+
+ - name: Deploy to GitHub pages 🚀
+ if: github.event_name != 'pull_request'
+ uses: JamesIves/github-pages-deploy-action@v4.5.0
+ with:
+ clean: false
+ branch: gh-pages
+ folder: docs
diff --git a/.github/workflows/test-coverage.yaml b/.github/workflows/test-coverage.yaml
new file mode 100644
index 00000000..0ab748d6
--- /dev/null
+++ b/.github/workflows/test-coverage.yaml
@@ -0,0 +1,62 @@
+# Workflow derived from https://github.com/r-lib/actions/tree/v2/examples
+# Need help debugging build failures? Start at https://github.com/r-lib/actions#where-to-find-help
+on:
+ push:
+ branches: [main, master]
+ pull_request:
+
+name: test-coverage.yaml
+
+permissions: read-all
+
+jobs:
+ test-coverage:
+ runs-on: ubuntu-latest
+ env:
+ GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }}
+
+ steps:
+ - uses: actions/checkout@v4
+
+ - uses: r-lib/actions/setup-r@v2
+ with:
+ use-public-rspm: true
+
+ - uses: r-lib/actions/setup-r-dependencies@v2
+ with:
+ extra-packages: any::covr, any::xml2
+ needs: coverage
+
+ - name: Test coverage
+ run: |
+ cov <- covr::package_coverage(
+ quiet = FALSE,
+ clean = FALSE,
+ install_path = file.path(normalizePath(Sys.getenv("RUNNER_TEMP"), winslash = "/"), "package")
+ )
+ print(cov)
+ covr::to_cobertura(cov)
+ shell: Rscript {0}
+
+ - uses: codecov/codecov-action@v5
+ with:
+ # Fail if error if not on PR, or if on PR and token is given
+ fail_ci_if_error: ${{ github.event_name != 'pull_request' || secrets.CODECOV_TOKEN }}
+ files: ./cobertura.xml
+ plugins: noop
+ disable_search: true
+ token: ${{ secrets.CODECOV_TOKEN }}
+
+ - name: Show testthat output
+ if: always()
+ run: |
+ ## --------------------------------------------------------------------
+ find '${{ runner.temp }}/package' -name 'testthat.Rout*' -exec cat '{}' \; || true
+ shell: bash
+
+ - name: Upload test results
+ if: failure()
+ uses: actions/upload-artifact@v4
+ with:
+ name: coverage-test-failures
+ path: ${{ runner.temp }}/package
diff --git a/DESCRIPTION b/DESCRIPTION
index 31c7e951..f37bbbca 100644
--- a/DESCRIPTION
+++ b/DESCRIPTION
@@ -1,23 +1,27 @@
Package: dsBase
-Title: 'DataSHIELD' Server Site Base Functions
+Title: 'DataSHIELD' Server Side Base Functions
Description: Base 'DataSHIELD' functions for the server side. 'DataSHIELD' is a software package which allows
you to do non-disclosive federated analysis on sensitive data. 'DataSHIELD' analytic functions have
been designed to only share non disclosive summary statistics, with built in automated output
checking based on statistical disclosure control. With data sites setting the threshold values for
- the automated output checks.
-Version: 6.4.0-9000
+ the automated output checks. For more details, see 'citation("dsBase")'.
+Version: 6.4.0.9000
Authors@R: c(person(given = "Paul",
family = "Burton",
- role = c("aut")),
+ role = c("aut"),
+ comment = c(ORCID = "0000-0001-5799-9634")),
person(given = "Rebecca",
family = "Wilson",
- role = c("aut")),
+ role = c("aut"),
+ comment = c(ORCID = "0000-0003-2294-593X")),
person(given = "Olly",
family = "Butters",
- role = c("aut")),
+ role = c("aut"),
+ comment = c(ORCID = "0000-0003-0354-8461")),
person(given = "Patricia",
family = "Ryser-Welch",
- role = c("aut")),
+ role = c("aut"),
+ comment = c(ORCID = "0000-0002-0070-0264")),
person(given = "Alex",
family = "Westerberg",
role = c("aut")),
@@ -37,6 +41,17 @@ Authors@R: c(person(given = "Paul",
role = c("aut"),
email = "yannick.marcon@obiba.org",
comment = c(ORCID = "0000-0003-0138-2023")),
+ person(given = "Tom",
+ family = "Bishop",
+ role = c("aut")),
+ person(given = "Amadou",
+ family = "Gaye",
+ role = c("aut"),
+ comment = c(ORCID = "0000-0002-1180-2792")),
+ person(given = "Xavier",
+ family = "Escribà-Montagut",
+ role = c("aut"),
+ comment = c(ORCID = "0000-0003-2888-8948")),
person(given = "Stuart",
family = "Wheater",
role = c("aut", "cre"),
@@ -59,8 +74,11 @@ Imports:
childsds,
purrr,
tibble,
- tidyselect
+ tidyselect,
+ tidytable
Suggests:
+ spelling,
testthat
-RoxygenNote: 7.3.2
+RoxygenNote: 7.3.3
Encoding: UTF-8
+Language: en-GB
diff --git a/NAMESPACE b/NAMESPACE
index 655cae99..9f7a5fbd 100644
--- a/NAMESPACE
+++ b/NAMESPACE
@@ -88,6 +88,7 @@ export(matrixDimnamesDS)
export(matrixInvertDS)
export(matrixMultDS)
export(matrixTransposeDS)
+export(mdPatternDS)
export(meanDS)
export(meanSdGpDS)
export(mergeDS)
@@ -125,6 +126,8 @@ export(setSeedDS)
export(skewnessDS1)
export(skewnessDS2)
export(sqrtDS)
+export(subsetByClassDS)
+export(subsetDS)
export(table1DDS)
export(table2DDS)
export(tableDS)
diff --git a/R/BooleDS.R b/R/BooleDS.R
index 8d5f5a49..3a905953 100644
--- a/R/BooleDS.R
+++ b/R/BooleDS.R
@@ -28,7 +28,7 @@
BooleDS <- function(V1.name=NULL, V2.name=NULL, Boolean.operator.n=NULL, na.assign.text, numeric.output=TRUE){
# Check Permissive Privacy Control Level.
- dsBase::checkPermissivePrivacyControlLevel(c('permissive', 'banana'))
+ dsBase::checkPermissivePrivacyControlLevel(c('permissive', 'banana', 'carrot'))
V1 <- eval(parse(text=V1.name), envir = parent.frame())
V2 <- eval(parse(text=V2.name), envir = parent.frame())
diff --git a/R/asDataMatrixDS.R b/R/asDataMatrixDS.R
index b8f53f19..2980965d 100644
--- a/R/asDataMatrixDS.R
+++ b/R/asDataMatrixDS.R
@@ -1,7 +1,12 @@
#' @title asDataFrameDS a serverside assign function called by ds.asDataFrame
#' @description Coerces an R object into a matrix maintaining original
#' class for all columns in data.frames.
-#' @details This assign function is based on the native R function \code{data.frame}
+#' @details This assign function is based on the native R function \code{data.matrix}
+#' If applied to a data.frame, the native R function \code{as.matrix}
+#' converts all columns into character class. In contrast, if applied to
+#' a data.frame the native R function \code{data.matrix} converts
+#' the data.frame to a matrix but maintains all data columns in their
+#' original class
#' @param x.name the name of the input object to be coerced to class
#' data.frame. Must be specified in inverted commas. But this argument is
#' usually specified directly by Paul Burton. Author.
+ Rebecca Wilson. Author.
+ Olly Butters. Author.
+ Patricia Ryser-Welch. Author.
+ Tom Bishop. Author.
+ Stuart Wheater. Author, maintainer.
Burton P, Wilson R, Butters O, Ryser-Welch P, Westerberg A, Abarrategui L, Villegas-Diaz R, Avraam D, Marcon Y, Wheater S (2025).
-dsBase: 'DataSHIELD' Server Site Base Functions.
-R package version 6.4.0-9000.
+ Burton P, Wilson R, Butters O, Ryser-Welch P, Westerberg A, Abarrategui L, Villegas-Diaz R, Avraam D, Marcon Y, Bishop T, Gaye A, Escribà-Montagut X, Wheater S (????).
+dsBase: 'DataSHIELD' Server Side Base Functions.
+R package version 6.4.0.9000.
Gaye A, Marcon Y, Isaeva J, LaFlamme P, Turner A, Jones E, Minion J, Boyd A, Newby C, Nuotio M, Wilson R, Butters O, Murtagh B, Demir I, Doiron D, Giepmans L, Wallace S, Budin-Ljøsne I, Schmidt C, Boffetta P, Boniol M, Bota M, Carter K, deKlerk N, Dibben C, Francis R, Hiekkalinna T, Hveem K, Kvaløy K, Millar S, Perry I, Peters A, Phillips C, Popham F, Raab G, Reischl E, Sheehan N, Waldenberger M, Perola M, van den Heuvel E, Macleod J, Knoppers B, Stolk R, Fortier I, Harris J, Woffenbuttel B, Murtagh M, Ferretti V, Burton P (2014).
+“DataSHIELD: taking the analysis to the data, not the data to the analysis.”
+International Journal of Epidemiology, 43(6), 1929–1944.
+doi:10.1093/ije/dyu188.
+ Wilson R, Butters O, Avraam D, Baker J, Tedds J, Turner A, Murtagh M, Burton P (2017).
+“DataSHIELD – New Directions and Dimensions.”
+Data Science Journal, 16(21), 1–21.
+doi:10.5334/dsj-2017-021.
+ Avraam D, Wilson R, Aguirre Chan N, Banerjee S, Bishop T, Butters O, Cadman T, Cederkvist L, Duijts L, Escribà Montagut X, Garner H, Gonçalves G, González J, Haakma S, Hartlev M, Hasenauer J, Huth M, Hyde E, Jaddoe V, Marcon Y, Mayrhofer M, Molnar-Gabor F, Morgan A, Murtagh M, Nestor M, Nybo Andersen A, Parker S, Pinot de Moira A, Schwarz F, Strandberg-Larsen K, Swertz M, Welten M, Wheater S, Burton P (2024).
+“DataSHIELD: mitigating disclosure risk in a multi-site federated analysis platform.”
+Bioinformatics Advances, 5(1), 1–21.
+doi:10.1093/bioadv/vbaf046.
+Page not found (404)
diff --git a/docs/LICENSE.html b/docs/LICENSE.html
index 07b43ee3..f1cadf0d 100644
--- a/docs/LICENSE.html
+++ b/docs/LICENSE.html
@@ -1,5 +1,5 @@
-NA
diff --git a/docs/authors.html b/docs/authors.html
index 6ce542a0..3526a873 100644
--- a/docs/authors.html
+++ b/docs/authors.html
@@ -1,5 +1,5 @@
-Authors and Citation
Authors and Citation
Citation
- @Manual{,
- title = {dsBase: 'DataSHIELD' Server Site Base Functions},
- author = {Paul Burton and Rebecca Wilson and Olly Butters and Patricia Ryser-Welch and Alex Westerberg and Leire Abarrategui and Roberto Villegas-Diaz and Demetris Avraam and Yannick Marcon and Stuart Wheater},
- year = {2025},
- note = {R package version 6.4.0-9000},
+ title = {dsBase: 'DataSHIELD' Server Side Base Functions},
+ author = {Paul Burton and Rebecca Wilson and Olly Butters and Patricia Ryser-Welch and Alex Westerberg and Leire Abarrategui and Roberto Villegas-Diaz and Demetris Avraam and Yannick Marcon and Tom Bishop and Amadou Gaye and Xavier Escribà-Montagut and Stuart Wheater},
+ note = {R package version 6.4.0.9000},
+}
+ @Article{,
+ title = {{DataSHIELD: taking the analysis to the data, not the data to the analysis}},
+ author = {Amadou Gaye and Yannick Marcon and Julia Isaeva and Philippe {LaFlamme} and Andrew Turner and Elinor M Jones and Joel Minion and Andrew W Boyd and Christopher J Newby and Marja-Liisa Nuotio and Rebecca Wilson and Oliver Butters and Barnaby Murtagh and Ipek Demir and Dany Doiron and Lisette Giepmans and Susan E Wallace and Isabelle Budin-Lj{\o}sne and Carsten O. Schmidt and Paolo Boffetta and Mathieu Boniol and Maria Bota and Kim W Carter and Nick {deKlerk} and Chris Dibben and Richard W Francis and Tero Hiekkalinna and Kristian Hveem and Kirsti Kval{\o}y and Sean Millar and Ivan J Perry and Annette Peters and Catherine M Phillips and Frank Popham and Gillian Raab and Eva Reischl and Nuala Sheehan and Melanie Waldenberger and Markus Perola and Edwin {{van den Heuvel}} and John Macleod and Bartha M Knoppers and Ronald P Stolk and Isabel Fortier and Jennifer R Harris and Bruce H R Woffenbuttel and Madeleine J Murtagh and Vincent Ferretti and Paul R Burton},
+ journal = {International Journal of Epidemiology},
+ year = {2014},
+ volume = {43},
+ number = {6},
+ pages = {1929--1944},
+ doi = {10.1093/ije/dyu188},
+}
+ @Article{,
+ title = {{DataSHIELD – New Directions and Dimensions}},
+ author = {Rebecca C. Wilson and Oliver W. Butters and Demetris Avraam and James Baker and Jonathan A. Tedds and Andrew Turner and Madeleine Murtagh and Paul R. Burton},
+ journal = {Data Science Journal},
+ year = {2017},
+ volume = {16},
+ number = {21},
+ pages = {1--21},
+ doi = {10.5334/dsj-2017-021},
+}
+ @Article{,
+ title = {{DataSHIELD: mitigating disclosure risk in a multi-site federated analysis platform}},
+ author = {Demetris Avraam and Rebecca C Wilson and Noemi {{Aguirre Chan}} and Soumya Banerjee and Tom R P Bishop and Olly Butters and Tim Cadman and Luise Cederkvist and Liesbeth Duijts and Xavier {{Escrib{\a`a} Montagut}} and Hugh Garner and Gon{\c c}alo {Gon{\c c}alves} and Juan R Gonz{\a'a}lez and Sido Haakma and Mette Hartlev and Jan Hasenauer and Manuel Huth and Eleanor Hyde and Vincent W V Jaddoe and Yannick Marcon and Michaela Th Mayrhofer and Fruzsina Molnar-Gabor and Andrei Scott Morgan and Madeleine Murtagh and Marc Nestor and Anne-Marie {{Nybo Andersen}} and Simon Parker and Angela {{Pinot de Moira}} and Florian Schwarz and Katrine Strandberg-Larsen and Morris A Swertz and Marieke Welten and Stuart Wheater and Paul R Burton},
+ journal = {Bioinformatics Advances},
+ year = {2024},
+ volume = {5},
+ number = {1},
+ pages = {1--21},
+ doi = {10.1093/bioadv/vbaf046},
+ editor = {Thomas Lengauer},
+ publisher = {Oxford University Press (OUP)},
}
@@ -106,11 +164,11 @@ Citation
diff --git a/docs/index.html b/docs/index.html
index 81e9827b..1d86586f 100644
--- a/docs/index.html
+++ b/docs/index.html
@@ -1,18 +1,18 @@
-
+
-
+install.packages("remotes")
+remotes::install_github("datashield/dsBase", "<BRANCH>")
+
+# Install v6.3.4 with the following
+remotes::install_github("datashield/dsBase", "6.3.4")For a full list of development branches, checkout https://github.com/datashield/dsBase/branches
+ +DataSHIELD is a software package which allows you to do non-disclosive federated analysis on sensitive data. Our website (https://www.datashield.org) has in depth descriptions of what it is, how it works and how to install it. A key point to highlight is that DataSHIELD has a client-server infrastructure, so the dsBase package (https://github.com/datashield/dsBase) needs to be used in conjunction with the dsBaseClient package (https://github.com/datashield/dsBaseClient) - trying to use one without the other makes no sense.
Detailed instructions on how to install DataSHIELD are at https://wiki.datashield.org/. The code here is organised as:
[1] Burton P, Wilson R, Butters O, Ryser-Welch P, Westerberg A, Abarrategui L, Villegas-Diaz R, Avraam D, Marcon Y, Bishop T, Gaye A, Escribà Montagut X, Wheater S (2025). dsBase: ‘DataSHIELD’ Server Side Base Functions. R package version 6.3.4. https://doi.org/10.32614/CRAN.package.dsBase.
+[2] Gaye A, Marcon Y, Isaeva J, LaFlamme P, Turner A, Jones E, Minion J, Boyd A, Newby C, Nuotio M, Wilson R, Butters O, Murtagh B, Demir I, Doiron D, Giepmans L, Wallace S, Budin-Ljøsne I, Oliver Schmidt C, Boffetta P, Boniol M, Bota M, Carter K, deKlerk N, Dibben C, Francis R, Hiekkalinna T, Hveem K, Kvaløy K, Millar S, Perry I, Peters A, Phillips C, Popham F, Raab G, Reischl E, Sheehan N, Waldenberger M, Perola M, van den Heuvel E, Macleod J, Knoppers B, Stolk R, Fortier I, Harris J, Woffenbuttel B, Murtagh M, Ferretti V, Burton P (2014). “DataSHIELD: taking the analysis to the data, not the data to the analysis.” International Journal of Epidemiology, 43(6), 1929-1944. https://doi.org/10.1093/ije/dyu188.
+[3] Wilson R, W. Butters O, Avraam D, Baker J, Tedds J, Turner A, Murtagh M, R. Burton P (2017). “DataSHIELD – New Directions and Dimensions.” Data Science Journal, 16(21), 1-21. https://doi.org/10.5334/dsj-2017-021.
+[4] Avraam D, Wilson R, Aguirre Chan N, Banerjee S, Bishop T, Butters O, Cadman T, Cederkvist L, Duijts L, Escribà Montagut X, Garner H, Gonçalves G, González J, Haakma S, Hartlev M, Hasenauer J, Huth M, Hyde E, Jaddoe V, Marcon Y, Mayrhofer M, Molnar-Gabor F, Morgan A, Murtagh M, Nestor M, Nybo Andersen A, Parker S, Pinot de Moira A, Schwarz F, Strandberg-Larsen K, Swertz M, Welten M, Wheater S, Burton P (2024). “DataSHIELD: mitigating disclosure risk in a multi-site federated analysis platform.” Bioinformatics Advances, 5(1), 1-21. https://doi.org/10.1093/bioadv/vbaf046.
++Note: Apple Mx architecture users, please be aware that there are some numerical limitations on this platform, which leads to unexpected results when using base R packages, like stats.
+x <- c(0, 3, 7)
+1 - cor(x, x)
+The above should result in a value of zero.
+Also See: For more details see https://cran.r-project.org/doc/FAQ/R-FAQ.html#Why-doesn_0027t-R-think-these-numbers-are-equal_003f and the bug report: https://bugs.r-project.org/show_bug.cgi?id=18941
+
if a user sets the parameter 'weights' on the client site function ds.glm this
+
if a user sets the parameter 'weights' on the client side function ds.glm this
server side function is called to verify that the 'weights' vector does not have negative values
because no negative are allowed in weights.