{
  "_id": "6a0f631dacfb0bcc41c5c693",
  "Package": "BERT",
  "Title": "High Performance Data Integration for Large-Scale Analyses of\nIncomplete Omic Profiles Using Batch-Effect Reduction Trees\n(BERT)",
  "Version": "1.9.0",
  "Authors@R": "c(person(\"Yannis\", \"Schumann\", ,\"yannis.schumann@desy.de\", role = c(\"aut\", \"cre\"),\ncomment = c(ORCID = \"0000-0002-2379-200X\")),\nperson(\"Simon\", \"Schlumbohm\", , \"schlumbohm@hsu-hh.de\", role = c(\"aut\"),\ncomment = c(ORCID = \"0000-0002-0083-5142\")))",
  "Description": "Provides efficient batch-effect adjustment of data with\nmissing values. BERT orders all batch effect correction to a\ntree of pairwise computations. BERT allows parallelization over\nsub-trees.",
  "Encoding": "UTF-8",
  "Roxygen": "list(markdown = TRUE)",
  "RoxygenNote": "7.3.2",
  "biocViews": "BatchEffect, Preprocessing, ExperimentalDesign,\nQualityControl",
  "URL": "https://github.com/HSU-HPC/BERT/",
  "BugReports": "https://github.com/HSU-HPC/BERT/issues",
  "License": "GPL-3",
  "Config/testthat/edition": "3",
  "VignetteBuilder": "knitr",
  "Config/pak/sysreqs": "libicu-dev libpng-dev libxml2-dev libssl-dev\nzlib1g-dev",
  "Repository": "https://bioc.r-universe.dev",
  "Date/Publication": "2026-04-28 13:02:01 UTC",
  "RemoteUrl": "https://github.com/bioc/BERT",
  "RemoteRef": "HEAD",
  "RemoteSha": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-21 10:36:04 UTC",
    "User": "root"
  },
  "Author": "Yannis Schumann [aut, cre] (ORCID:\n<https://orcid.org/0000-0002-2379-200X>),\nSimon Schlumbohm [aut] (ORCID: <https://orcid.org/0000-0002-0083-5142>)",
  "Maintainer": "Yannis Schumann <yannis.schumann@desy.de>",
  "MD5sum": "5ad74d6d2d791fa21e1053addd15575b",
  "_user": "bioc",
  "_type": "src",
  "_file": "BERT_1.9.0.tar.gz",
  "_fileid": "cc72e8860661af0d7a961852a3b092c4badf1c96e9de747d7108c021d236afb9",
  "_filesize": 176787,
  "_sha256": "cc72e8860661af0d7a961852a3b092c4badf1c96e9de747d7108c021d236afb9",
  "_created": "2026-05-21T10:36:04.000Z",
  "_published": "2026-05-21T19:55:09.424Z",
  "_jobs": [
    {
      "job": 77256571345,
      "time": 165,
      "config": "bioc-checks",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "7133548283"
    },
    {
      "job": 77256570917,
      "time": 244,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7133563370"
    },
    {
      "job": 77256570918,
      "time": 206,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7133561009"
    },
    {
      "job": 77256571126,
      "time": 135,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7133538463"
    },
    {
      "job": 77256571069,
      "time": 116,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7133533245"
    },
    {
      "job": 77256570406,
      "time": 231,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7133495998"
    },
    {
      "job": 77256570526,
      "time": 136,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7145786904"
    },
    {
      "job": 77256571452,
      "time": 170,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7133549589"
    },
    {
      "job": 77256571407,
      "time": 152,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7133545578"
    },
    {
      "job": 77256571105,
      "time": 147,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7133542900"
    }
  ],
  "_bioccheck": {
    "error": 0,
    "warning": 0,
    "note": 6
  },
  "_buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/bioc/BERT",
  "_commit": {
    "id": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
    "author": "A Wokaty <andres.wokaty@sph.cuny.edu>",
    "committer": "A Wokaty <andres.wokaty@sph.cuny.edu>",
    "message": "bump x.y.z version to odd y following creation of RELEASE_3_23 branch\n",
    "time": 1777381321
  },
  "_maintainer": {
    "name": "Yannis Schumann",
    "email": "yannis.schumann@desy.de",
    "login": "deryannis",
    "description": "",
    "uuid": 81758255,
    "orcid": "0000-0002-2379-200X"
  },
  "_distro": "noble",
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 4.3.0",
      "role": "Depends"
    },
    {
      "package": "cluster",
      "role": "Imports"
    },
    {
      "package": "comprehenr",
      "role": "Imports"
    },
    {
      "package": "foreach",
      "version": ">= 1.5.2",
      "role": "Imports"
    },
    {
      "package": "invgamma",
      "role": "Imports"
    },
    {
      "package": "iterators",
      "version": ">= 1.0.14",
      "role": "Imports"
    },
    {
      "package": "janitor",
      "version": ">= 2.2.0",
      "role": "Imports"
    },
    {
      "package": "limma",
      "version": ">= 3.46.0",
      "role": "Imports"
    },
    {
      "package": "logging",
      "version": ">= 0.10-108",
      "role": "Imports"
    },
    {
      "package": "sva",
      "version": ">= 3.38.0",
      "role": "Imports"
    },
    {
      "package": "SummarizedExperiment",
      "role": "Imports"
    },
    {
      "package": "methods",
      "role": "Imports"
    },
    {
      "package": "BiocParallel",
      "role": "Imports"
    },
    {
      "package": "testthat",
      "version": ">= 3.0.0",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "BiocStyle",
      "role": "Suggests"
    }
  ],
  "_owner": "bioc",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2025-23",
      "n": 4
    },
    {
      "week": "2025-44",
      "n": 2
    },
    {
      "week": "2026-18",
      "n": 2
    }
  ],
  "_tags": [],
  "_bioc": [
    {
      "branch": "devel",
      "version": "1.9.0",
      "bioc": "3.24"
    },
    {
      "branch": "release",
      "version": "1.8.0",
      "bioc": "3.23"
    }
  ],
  "_topics": [
    "batcheffect",
    "preprocessing",
    "experimentaldesign",
    "qualitycontrol",
    "batch-effect",
    "bioconductor-package",
    "bioinformatics",
    "data-integration",
    "data-science",
    "nature-communications"
  ],
  "_stars": 4,
  "_contributors": [
    {
      "user": "deryannis",
      "count": 30,
      "uuid": 81758255
    },
    {
      "user": "simonschlumbohm",
      "count": 12,
      "uuid": 78701285
    },
    {
      "user": "jwokaty",
      "count": 6,
      "uuid": 1744257
    }
  ],
  "_userbio": {
    "uuid": 2286807,
    "type": "organization",
    "name": "Bioconductor",
    "description": "Software for the analysis and comprehension of high-throughput genomic data"
  },
  "_downloads": {
    "count": 241,
    "source": "https://www.bioconductor.org/packages/stats/bioc/BERT"
  },
  "_devurl": "https://github.com/hsu-hpc/bert",
  "_searchresults": 20,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/BERT.html",
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/hsu-hpc/bert",
  "_realowner": "bioc",
  "_cranurl": false,
  "_exports": [
    "BERT",
    "compute_asw",
    "count_existing",
    "generate_data_covariables",
    "generate_dataset"
  ],
  "_help": [
    {
      "page": "adjust_node",
      "title": "Adjust two batches to each other.",
      "topics": [
        "adjust_node"
      ]
    },
    {
      "page": "adjustment_step",
      "title": "Adjust a hierarchy level sequentially.",
      "topics": [
        "adjustment_step"
      ]
    },
    {
      "page": "BERT",
      "title": "Adjust data using the BERT algorithm.",
      "topics": [
        "BERT"
      ]
    },
    {
      "page": "chunk_data",
      "title": "Chunks data into n segments with (close-to) equivalent number of batches and stores them in temporary RDS files",
      "topics": [
        "chunk_data"
      ]
    },
    {
      "page": "compute_asw",
      "title": "Compute the average silhouette width (ASW) for the dataset with respect to both label and batch.",
      "topics": [
        "compute_asw"
      ]
    },
    {
      "page": "count_existing",
      "title": "Count the number of numeric features in this dataset. Columns labeled \"Batch\", \"Sample\" or \"Label\" will be ignored.",
      "topics": [
        "count_existing"
      ]
    },
    {
      "page": "format_DF",
      "title": "Format the data as expected by BERT.",
      "topics": [
        "format_DF"
      ]
    },
    {
      "page": "generate_data_covariables",
      "title": "Generate dataset with batch-effects and 2 classes with a specified imbalance.",
      "topics": [
        "generate_data_covariables"
      ]
    },
    {
      "page": "generate_dataset",
      "title": "Generate dataset with batch-effects and biological labels using a simple LS model",
      "topics": [
        "generate_dataset"
      ]
    },
    {
      "page": "get_adjustable_features",
      "title": "Check, which features contain enough numeric data to be adjusted (at least 2 numeric values)",
      "topics": [
        "get_adjustable_features"
      ]
    },
    {
      "page": "get_adjustable_features_with_mod",
      "title": "Check, which features contain enough numeric data to be adjusted (at least 2 numeric values per batch and covariate level)",
      "topics": [
        "get_adjustable_features_with_mod"
      ]
    },
    {
      "page": "identify_adjustableFeatures_refs",
      "title": "Identifies the adjustable features using only the references. Similar to the function in adjust_features.R but with different arguments",
      "topics": [
        "identify_adjustableFeatures_refs"
      ]
    },
    {
      "page": "identify_references",
      "title": "Identifies the references to use for this specific batch effect adjustment",
      "topics": [
        "identify_references"
      ]
    },
    {
      "page": "ordinal_encode",
      "title": "Ordinal encoding of a vector.",
      "topics": [
        "ordinal_encode"
      ]
    },
    {
      "page": "parallel_bert",
      "title": "Adjusts all chunks of data (in parallel) as far as possible.",
      "topics": [
        "parallel_bert"
      ]
    },
    {
      "page": "removeBatchEffectRefs",
      "title": "A method to remove batch effects estimated from a subset (references) per batch only. Source code is heavily based on limma::removeBatchEffects by Gordon Smyth and Carolyn de Graaf",
      "topics": [
        "removeBatchEffectRefs"
      ]
    },
    {
      "page": "replace_missing",
      "title": "Replaces missing values (NaN) by NA, this appears to be faster",
      "topics": [
        "replace_missing"
      ]
    },
    {
      "page": "strip_Covariable",
      "title": "Strip column labelled Cov_1 from dataframe.",
      "topics": [
        "strip_Covariable"
      ]
    },
    {
      "page": "validate_bert_input",
      "title": "Verifies that the input to BERT is valid.",
      "topics": [
        "validate_bert_input"
      ]
    },
    {
      "page": "validate_input_generate_dataset",
      "title": "Validate the user input to the function generate_dataset. Raises an error if and only if the input is malformatted.",
      "topics": [
        "validate_input_generate_dataset"
      ]
    },
    {
      "page": "verify_references",
      "title": "Verify that the Reference column of the data contains only zeros and ones (if it is present at all)",
      "topics": [
        "verify_references"
      ]
    }
  ],
  "_readme": "https://github.com/bioc/BERT/raw/HEAD/README.md",
  "_rundeps": [
    "abind",
    "annotate",
    "AnnotationDbi",
    "askpass",
    "BH",
    "Biobase",
    "BiocGenerics",
    "BiocParallel",
    "Biostrings",
    "bit",
    "bit64",
    "blob",
    "cachem",
    "cli",
    "cluster",
    "codetools",
    "comprehenr",
    "cpp11",
    "crayon",
    "curl",
    "DBI",
    "DelayedArray",
    "dplyr",
    "edgeR",
    "fastmap",
    "foreach",
    "formatR",
    "futile.logger",
    "futile.options",
    "genefilter",
    "generics",
    "GenomicRanges",
    "glue",
    "hms",
    "httr",
    "invgamma",
    "IRanges",
    "iterators",
    "janitor",
    "jsonlite",
    "KEGGREST",
    "lambda.r",
    "lattice",
    "lifecycle",
    "limma",
    "locfit",
    "logging",
    "lubridate",
    "magrittr",
    "Matrix",
    "MatrixGenerics",
    "matrixStats",
    "memoise",
    "mgcv",
    "mime",
    "nlme",
    "openssl",
    "pillar",
    "pkgconfig",
    "png",
    "purrr",
    "R6",
    "rlang",
    "RSQLite",
    "S4Arrays",
    "S4Vectors",
    "Seqinfo",
    "snakecase",
    "snow",
    "SparseArray",
    "statmod",
    "stringi",
    "stringr",
    "SummarizedExperiment",
    "survival",
    "sva",
    "sys",
    "tibble",
    "tidyr",
    "tidyselect",
    "timechange",
    "utf8",
    "vctrs",
    "withr",
    "XML",
    "xtable",
    "XVector"
  ],
  "_vignettes": [
    {
      "source": "BERT-Vignette.Rmd",
      "filename": "BERT-Vignette.html",
      "title": "BERT-Vignette",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Installation",
        "Data Preparation",
        "Basic Usage",
        "Advanced Options",
        "Parameters",
        "Verbosity",
        "Choosing the Optimal Number of Cores",
        "Examples",
        "Sequential Adjustment with limma",
        "Parallel Batch Effect Correction with ComBat",
        "Batch Effect Correction Using SummarizedExperiment",
        "BERT with Covariables",
        "BERT with references",
        "Issues",
        "License",
        "Reference",
        "Session Info"
      ],
      "created": "2023-05-30 13:46:23",
      "modified": "2025-01-22 07:25:44",
      "commits": 15
    }
  ],
  "_score": 5.380211241711606,
  "_indexed": true,
  "_nocasepkg": "bert",
  "_universes": [
    "bioc",
    "deryannis",
    "hsu-hpc"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.9.0",
      "date": "2026-05-21T10:39:07.000Z",
      "distro": "noble",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "fd0413f438dc81a96d966273e3df87e2be578539f1b9b481ac6192e3c5fda9d6",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "1.9.0",
      "date": "2026-05-21T10:39:03.000Z",
      "distro": "noble",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "434e53a4636a33962cdf498da6d4c58337bac8cf46cbacd97813ed3d2deb9e83",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "1.9.0",
      "date": "2026-05-21T10:37:56.000Z",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "fd4f020e82b40a277586e4653c143681527218dc023be920fc775fdfa46e5f77",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "1.9.0",
      "date": "2026-05-21T10:37:41.000Z",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "b1cfdd4c57ff6ead9120c8ac6fc67398243372e24f181a9454f26ca50d90bb85",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.9.0",
      "date": "2026-05-21T19:54:55.000Z",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "a1b37ff195cffa3b8156706387223f97e57c7d366b75d7311b0c37beb51af73e",
      "status": "success",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "1.9.0",
      "date": "2026-05-21T10:37:46.000Z",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "ad719030219b44a7b510f291650abdf000d0621436248374190d438dee7645a9",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "1.9.0",
      "date": "2026-05-21T10:37:49.000Z",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "5f3390ae96366028045940e7368a089f1c4efd861b4d51424a2b66b4e4777749",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "1.9.0",
      "date": "2026-05-21T10:37:38.000Z",
      "commit": "072dd1e1eb9583b9687f26288ed3c12b6460fdb3",
      "fileid": "98aa74d2455bf05cedccb0b37c416a016d358f210438e47b2ec5447bccd2471c",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/bioc/actions/runs/26220618591"
    }
  ]
}