diff --git a/README.md b/README.md index 178e12394..598e38871 100644 --- a/README.md +++ b/README.md @@ -217,7 +217,7 @@ To learn more about the docker pull rate limits and the open source software pro | [Mykrobe + Genotyphi + sonneityping](https://hub.docker.com/r/staphb/mykrobe)
[![docker pulls](https://badgen.net/docker/pulls/staphb/mykrobe)](https://hub.docker.com/r/staphb/mykrobe) | | https://github.com/Mykrobe-tools/mykrobe
https://github.com/typhoidgenomics/genotyphi
https://github.com/katholt/sonneityping | | [NanoPlot](https://hub.docker.com/r/staphb/nanoplot)
[![docker pulls](https://badgen.net/docker/pulls/staphb/nanoplot)](https://hub.docker.com/r/staphb/nanoplot) | | https://github.com/wdecoster/NanoPlot | | [ngmaster](https://hub.docker.com/r/staphb/ngmaster)
[![docker pulls](https://badgen.net/docker/pulls/staphb/ngmaster)](https://hub.docker.com/r/staphb/ngmaster) | | https://github.com/MDU-PHL/ngmaster | -| [NCBI Datasets](https://hub.docker.com/r/staphb/ncbi-datasets)
[![docker pulls](https://badgen.net/docker/pulls/staphb/ncbi-datasets)](https://hub.docker.com/r/staphb/ncbi-datasets) |
Click to see all datasets versions **datasets versions** | [https://github.com/ncbi/datasets](https://github.com/ncbi/datasets)
[https://www.ncbi.nlm.nih.gov/datasets/docs/v1/](https://www.ncbi.nlm.nih.gov/datasets/docs/v1/) | +| [NCBI Datasets](https://hub.docker.com/r/staphb/ncbi-datasets)
[![docker pulls](https://badgen.net/docker/pulls/staphb/ncbi-datasets)](https://hub.docker.com/r/staphb/ncbi-datasets) |
Click to see all datasets versions **datasets versions** | [https://github.com/ncbi/datasets](https://github.com/ncbi/datasets)
[https://www.ncbi.nlm.nih.gov/datasets/docs/v1/](https://www.ncbi.nlm.nih.gov/datasets/docs/v1/) | | [NCBI AMRFinderPlus](https://hub.docker.com/r/staphb/ncbi-amrfinderplus)
[![docker pulls](https://badgen.net/docker/pulls/staphb/ncbi-amrfinderplus)](https://hub.docker.com/r/staphb/ncbi-amrfinderplus) | **AMRFinderPlus & database verion**
Click to see AMRFinderplus v3.11.4 and older versions!
  • 3.1.1b
  • 3.8.4
  • 3.8.28
  • 3.9.3
  • 3.9.8
  • 3.10.1
  • 3.10.5
  • 3.10.16
  • 3.10.20
  • 3.10.24
  • 3.10.30
  • 3.10.36
  • 3.10.42
  • 3.11.2 & 2022-12-19.1
  • [3.11.2 & 2023-02-23.1](ncbi-amrfinderplus/3.11.2-2023-02-23.1/)
  • [3.11.4 & 2023-02-23.1](ncbi-amrfinderplus/3.11.4-2023-02-23.1/)
| [https://github.com/ncbi/amr](https://github.com/ncbi/amr) | | [NCBI table2asn](https://hub.docker.com/r/staphb/ncbi-table2asn)
[![docker pulls](https://badgen.net/docker/pulls/staphb/ncbi-table2asn)](https://hub.docker.com/r/staphb/ncbi-table2asn) | | [https://www.ncbi.nlm.nih.gov/genbank/table2asn/](https://www.ncbi.nlm.nih.gov/genbank/table2asn/)
[https://ftp.ncbi.nlm.nih.gov/asn1-converters/versions/2022-06-14/by_program/table2asn/](https://ftp.ncbi.nlm.nih.gov/asn1-converters/versions/2022-06-14/by_program/table2asn/) | | [ONTime](https://hub.docker.com/r/staphb/ontime)
[![docker pulls](https://badgen.net/docker/pulls/staphb/ontime)](https://hub.docker.com/r/staphb/ontime) | | https://github.com/mbhall88/ontime | diff --git a/ncbi-datasets/16.30.0/Dockerfile b/ncbi-datasets/16.30.0/Dockerfile new file mode 100644 index 000000000..1fc28593c --- /dev/null +++ b/ncbi-datasets/16.30.0/Dockerfile @@ -0,0 +1,47 @@ +FROM ubuntu:jammy as app + +ARG DATASETS_VER="16.30.0" + +LABEL base.image="ubuntu:jammy" +LABEL dockerfile.version="1" +LABEL software="NCBI's datasets and dataformat" +LABEL software.version="${DATASETS_VER}" +LABEL description="Downloads biological sequence data from NCBI" +LABEL website="https://github.com/ncbi/datasets" +LABEL documentation="https://www.ncbi.nlm.nih.gov/datasets/docs/v1/" +LABEL license="https://github.com/ncbi/datasets/blob/master/pkgs/ncbi-datasets-cli/LICENSE.md" +LABEL maintainer="Erin Young" +LABEL maintainer.email="eriny@utah.gov" + +# unzip isn't needed for datasets/dataformat, but it is often used after downloading files with datasets +RUN apt-get update && apt-get install -y --no-install-recommends \ + wget \ + ca-certificates \ + unzip && \ + apt-get autoclean && rm -rf /var/lib/apt/lists/* + +WORKDIR /usr/local/bin + +# install ncbi datasets tool (pre-compiled binary) +RUN wget https://github.com/ncbi/datasets/releases/download/v${DATASETS_VER}/linux-amd64.cli.package.zip && \ + unzip linux-amd64.cli.package.zip && \ + rm linux-amd64.cli.package.zip && \ + chmod +x dataformat datasets + +ENV LC_ALL=C + +WORKDIR /data + +# datasets is generally datasets --help, but just typing in 'datasets' should bring up a help menu +CMD [ "datasets", "--help" ] + +FROM app as test + +RUN dataformat --help && datasets --help + +# stolen from Curtis at https://github.com/StaPH-B/docker-builds/blob/master/pangolin/4.1.2/Dockerfile +RUN datasets download virus genome accession ON924087.1 --filename ON924087.1.zip && \ + unzip ON924087.1.zip && \ + rm ON924087.1.zip && \ + cp ncbi_dataset/data/genomic.fna ON924087.1.fna && \ + wc -c ON924087.1.fna diff --git a/ncbi-datasets/16.30.0/README.md b/ncbi-datasets/16.30.0/README.md new file mode 100644 index 000000000..6474b9282 --- /dev/null +++ b/ncbi-datasets/16.30.0/README.md @@ -0,0 +1,20 @@ +# NCBI datasets and dataformat container + +Main tool : [datasets](https://www.ncbi.nlm.nih.gov/datasets/docs/v1/download-and-install/#use-the-datasets-tool-to-download-biological-data) and [dataformat](https://www.ncbi.nlm.nih.gov/datasets/docs/v1/download-and-install/#use-the-dataformat-tool-to-convert-data-reports-to-other-formats) + +Full documentation: [https://www.ncbi.nlm.nih.gov/datasets/docs/v1/how-tos/](https://www.ncbi.nlm.nih.gov/datasets/docs/v1/how-tos/) + +> Use NCBI Datasets to gather metadata, download data packages, view reports and more + +## Example Usage + +```bash +# will download the fasta for ON924087.1 in a zipped directory +datasets download virus genome accession ON924087.1 --filename ON924087.1.zip + +# unzipping the directory and the fasta file will be located at ncbi_dataset/data/genomic.fna +unzip ON924087.1.zip + +# copying the file into something with a better name +cp ncbi_dataset/data/genomic.fna ncbi_dataset/data/ON924087.1.genomic.fna +```