2020-04-24 23:36:52 +00:00
|
|
|
#!/usr/bin/env Rscript
|
2024-09-19 14:19:46 +00:00
|
|
|
|
|
|
|
# This script can be used to generate the .json file for a given R package set
|
|
|
|
# that is part of the `rPackages` tree
|
|
|
|
#
|
|
|
|
# See R section of the nixpkgs manual for an example of how to use this script
|
|
|
|
|
2020-04-24 23:36:52 +00:00
|
|
|
library(data.table)
|
|
|
|
library(parallel)
|
2021-09-18 10:52:07 +00:00
|
|
|
library(BiocManager)
|
2024-09-19 14:19:46 +00:00
|
|
|
library(jsonlite)
|
|
|
|
|
|
|
|
# Switch every locale category to "C" so that strings are always ordered
# according to POSIX ordering, whatever the caller's environment is.
locale <- Sys.setlocale(category = "LC_ALL", locale = "C")
|
2020-04-24 23:36:52 +00:00
|
|
|
|
2021-09-18 10:52:07 +00:00
|
|
|
# Determine the Bioconductor version that belongs to the running R version.
#
# BiocManager's version map is reduced to the rows whose R column equals the
# major.minor part of the running R version. The row flagged "release" is
# preferred; without one, the highest listed Bioconductor version is used.
# The result is kept as a string such as "3.20".
biocVersion <- BiocManager:::.version_map()
biocVersion <- biocVersion[biocVersion$R == getRversion()[, 1:2], c("Bioc", "BiocStatus")]
if (nrow(biocVersion) == 0L) {
  # Fail here rather than carry a meaningless version into the mirror URLs.
  stop(
    "no Bioconductor version is mapped to R ", as.character(getRversion()),
    call. = FALSE
  )
}
if ("release" %in% biocVersion$BiocStatus) {
  biocVersion <- biocVersion[biocVersion$BiocStatus == "release", "Bioc"]
} else {
  biocVersion <- biocVersion$Bioc
}
# Compare and render as version objects: a detour through as.numeric() would
# turn "3.10" into 3.1 and would rank 3.9 above 3.10.
biocVersion <- as.character(max(package_version(as.character(biocVersion))))
|
2020-04-24 23:36:52 +00:00
|
|
|
|
2024-06-20 14:57:18 +00:00
|
|
|
# Source-package index URL of every supported mirror, keyed by mirror name.
# The three Bioconductor repositories share a base URL that depends on
# biocVersion; CRAN has a fixed URL.
biocSections <- c(
  "bioc" = "/bioc/src/contrib/",
  "bioc-annotation" = "/data/annotation/src/contrib/",
  "bioc-experiment" = "/data/experiment/src/contrib/"
)
mirrorUrls <- c(
  lapply(biocSections, function(path) {
    paste0("http://bioconductor.org/packages/", biocVersion, path)
  }),
  list(cran = "https://cran.r-project.org/src/contrib/")
)
|
|
|
|
|
|
|
|
# The mirror to process is the first command line argument; it has to be one
# of the names of mirrorUrls (a missing argument yields NA and is rejected).
mirrorType <- commandArgs(trailingOnly = TRUE)[1]
stopifnot(mirrorType %in% names(mirrorUrls))

# Load the packages of the previously generated "<mirror>-packages.json",
# read from the current working directory.
packagesFile <- paste0(mirrorType, "-", "packages.json")
prevPkgs <- fromJSON(packagesFile)$packages
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
write("downloading package lists", stderr())

# Fetch the package index of every mirror, not only the requested one.
# `method` belongs to available.packages(): it selects the download method.
# It used to be handed to as.data.table(), which silently ignored it.
pkgTables <- lapply(mirrorUrls, function(url) {
  index <- available.packages(
    url,
    filters = c("R_version", "OS_type", "duplicates"),
    method = "libcurl"
  )
  as.data.table(index)
})

# Names of all packages offered by any mirror; formatPackage keeps only
# dependencies that appear in this set.
knownPackageNames <- unique(do.call("rbind", pkgTables)$Package)

# Index and base URL of the mirror that is being updated.
pkgTable <- pkgTables[[mirrorType]]
mirrorUrl <- mirrorUrls[[mirrorType]]
|
2024-09-19 14:19:46 +00:00
|
|
|
|
|
|
|
# Convert an R package name into the attribute name used in the package set.
#
# "import" and "assert" are renamed to "r_import" and "r_assert"
# (presumably because they clash with Nix keywords -- TODO confirm);
# afterwards every literal "." is replaced by "_".
#
# name: a single package name.
# Returns the escaped name as a character string.
escapeName <- function(name) {
  renamed <- switch(name,
    "import" = "r_import",
    "assert" = "r_assert",
    name
  )
  gsub(".", "_", renamed, fixed = TRUE)
}
|
|
|
|
|
2020-04-24 23:36:52 +00:00
|
|
|
# Return the base32 sha256 hash of the source tarball of `name` at `version`.
#
# When the previous package set (global `prevPkgs`) already lists the package
# at the same version, its recorded hash is reused and nothing is downloaded.
# Otherwise the tarball is fetched with wget from `mirrorUrl` (for the "cran"
# mirror with a fallback to the package's Archive/ directory) and hashed
# with nix-hash.
#
# name:    package name as listed in the mirror's index.
# version: package version as listed in the mirror's index.
# Returns a single character string; signals an error when the tarball could
# not be downloaded or hashed.
nixPrefetch <- function(name, version) {
  prevPkg <- prevPkgs[[escapeName(name)]]
  if (!is.null(prevPkg) && isTRUE(prevPkg$version == version)) {
    return(prevPkg$sha256)
  }

  # avoid nix-prefetch-url because it often fails to fetch/hash large files
  tarball <- paste0(name, "_", version, ".tar.gz")
  tmp <- tempfile(pattern = paste0(name, "_", version), fileext = ".tar.gz")
  quotedTmp <- shQuote(tmp)

  cmd <- paste("wget -q -O", quotedTmp, shQuote(paste0(mirrorUrl, tarball)))
  if (mirrorType == "cran") {
    archiveUrl <- paste0(mirrorUrl, "Archive/", name, "/", tarball)
    cmd <- paste(cmd, "|| wget -q -O", quotedTmp, shQuote(archiveUrl))
  }
  cmd <- paste(cmd, "&& nix-hash --type sha256 --base32 --flat", quotedTmp)
  cmd <- paste(cmd, "&& echo >&2", shQuote(paste0(" added ", name, " v", version)))
  # The temporary file is removed whether or not the steps above succeeded.
  # Because of this trailing command the exit status says nothing about the
  # download, so success is judged from the captured output instead.
  cmd <- paste(cmd, "; rm -rf", quotedTmp)

  hash <- system(cmd, intern = TRUE)
  if (length(hash) != 1L || !nzchar(hash)) {
    stop("failed to download or hash ", name, " ", version, call. = FALSE)
  }
  hash
}
|
|
|
|
|
|
|
|
# Build the record that is written to the JSON file for one package.
#
# name, version, sha256:      scalar values copied into the record.
# depends, imports, linkingTo: the package's Depends, Imports and LinkingTo
#                              fields; each is one string or NA.
#
# The three dependency fields are merged, version constraints are cut off,
# names missing from the global `knownPackageNames` are dropped, and the rest
# is escaped, de-duplicated and sorted.
#
# Returns list(name, version, sha256, depends), the first three unboxed.
formatPackage <- function(name, version, sha256, depends, imports, linkingTo) {
  # Global side effect: R treats warn >= 2 as "turn warnings into errors".
  options(warn=5)

  # An NA field counts as empty; otherwise all whitespace is removed.
  compact <- function(field) {
    if (is.na(field)) "" else gsub("[ \t\n]+", "", field)
  }
  merged <- paste(compact(depends), compact(imports), compact(linkingTo), sep=",")

  entries <- unlist(strsplit(merged, split=",", fixed=TRUE))
  # Keep only the leading package name of entries such as "pkg(>=1.0)".
  depNames <- gsub("([^ \t\n(]+).*", "\\1", entries)
  depNames <- depNames[depNames %in% knownPackageNames]
  depNames <- vapply(depNames, escapeName, character(1), USE.NAMES=FALSE)
  depNames <- sort(unique(depNames))

  list(
    name=unbox(name),
    version=unbox(version),
    sha256=unbox(sha256),
    depends=depNames
  )
}
|
|
|
|
|
2024-09-19 14:19:46 +00:00
|
|
|
# Hash the packages on a pool of 10 worker processes. The functions and
# globals that nixPrefetch relies on are exported to the workers first.
cl <- makeCluster(spec = 10)
clusterExport(
  cl,
  varlist = c(
    "escapeName", "nixPrefetch", "prevPkgs",
    "mirrorUrl", "mirrorType", "knownPackageNames"
  )
)

write(paste("updating", mirrorType, "packages"), stderr())

# Every row of the table is handed to the worker function as a vector; its
# first element is passed on as the package name and its second as the version.
pkgTable$sha256 <- parApply(
  cl = cl,
  X = pkgTable,
  MARGIN = 1,
  FUN = function(p) nixPrefetch(p[1], p[2])
)

stopCluster(cl)
|
|
|
|
|
|
|
|
# Build one record per row of the package table. seq_len() keeps this correct
# for an empty table, where 1:nrow() would iterate over c(1, 0).
pkgs <- lapply(seq_len(nrow(pkgTable)), function(i) {
  with(pkgTable[i, ], formatPackage(Package, Version, sha256, Depends, Imports, LinkingTo))
})

# Key every record by its escaped package name; vapply() guarantees a plain
# character vector of names even when there are no records.
names(pkgs) <- vapply(pkgs, function(p) escapeName(as.character(p$name)), character(1))
|
2020-04-24 23:36:52 +00:00
|
|
|
|
2021-09-28 08:13:01 +00:00
|
|
|
# Mark deleted packages as broken: every package of the previous set that is
# missing from the new one keeps its old record, with `broken` set to true.
removedNames <- setdiff(names(prevPkgs), names(pkgs))
brokenPkgs <- lapply(prevPkgs[removedNames], function(old) {
  list(
    name = unbox(old$name),
    version = unbox(old$version),
    sha256 = unbox(old$sha256),
    depends = old$depends,
    broken = unbox(TRUE)
  )
})
|
|
|
|
|
|
|
|
# sort packages by their non-escaped names
# vapply() always yields a character vector, also for an empty list, whereas
# the return type of sapply() depends on its input.
pkgs <- pkgs[order(vapply(pkgs, function(p) as.character(p$name), character(1)))]
brokenPkgs <- brokenPkgs[order(vapply(brokenPkgs, function(p) as.character(p$name), character(1)))]
|
|
|
|
|
|
|
|
# Extra top-level arguments stored next to the packages: every mirror except
# "cran" records the Bioconductor version as a string. For "cran" this is an
# empty *named* list (presumably so that it is serialised as a JSON object
# rather than an array -- TODO confirm).
extraArgs <- if (mirrorType != "cran") {
  list(biocVersion = unbox(paste(biocVersion)))
} else {
  setNames(list(), character(0))
}
|
2020-04-24 23:36:52 +00:00
|
|
|
|
2024-09-19 14:19:46 +00:00
|
|
|
# Print the package set as pretty-printed JSON on stdout, current packages
# first and broken ones after them, followed by a newline. The completion
# notice goes to stderr and therefore stays out of the JSON.
packageSet <- list(extraArgs = extraArgs, packages = c(pkgs, brokenPkgs))
cat(toJSON(packageSet, pretty = TRUE))
cat("\n")
write("done", stderr())
|
|
|
|
|