Skip to content

Commit

Permalink
Create datasets.yml
Browse files Browse the repository at this point in the history
  • Loading branch information
erinyoung committed Jul 31, 2023
1 parent 8de2193 commit 765c5b1
Showing 1 changed file with 59 additions and 0 deletions.
59 changes: 59 additions & 0 deletions .github/workflows/datasets.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,59 @@
# Weekly smoke test of the NCBI `datasets` / `dataformat` command-line tools.
# Downloads the CLI release whose version matches the container tag referenced
# in modules/datasets.nf, then queries genome summaries for a fixed list of
# taxa and prints the resulting CSV files.
name: Test datasets

on:
  workflow_dispatch:
  schedule:
    # Every Tuesday at 04:30 UTC.
    - cron: '30 4 * * TUE'

jobs:
  check:
    # ubuntu-20.04 hosted runners have been retired by GitHub; use a
    # currently supported image so the job can actually be scheduled.
    runs-on: ubuntu-latest
    steps:
      - name: Checkout
        uses: actions/checkout@v3

      - name: download datasets
        run: |
          # Take the version from the tag of the first `container` line in
          # the Nextflow module (the text after the ':' with quotes removed).
          DATASETS_VER=$(grep container modules/datasets.nf | sort | uniq | head -n 1 | awk '{print $2}' | sed 's/'\''//g' | cut -f 2 -d ":")
          if [ -z "${DATASETS_VER}" ]; then
            echo "Could not determine the datasets version from modules/datasets.nf" >&2
            exit 1
          fi
          echo "Using datasets version ${DATASETS_VER}"
          # Plain shell here: the Dockerfile-style `RUN` prefix is not a command.
          wget "https://github.com/ncbi/datasets/releases/download/v${DATASETS_VER}/linux-amd64.cli.package.zip" && \
            unzip linux-amd64.cli.package.zip && \
            rm linux-amd64.cli.package.zip && \
            chmod +x dataformat datasets

      - name: get accessions
        run: |
          # Bash array elements are separated by whitespace, not commas.
          taxons=(
            "Acinetobacter baumannii"
            "Burkholderia cenocepacia"
            "Campylobacter jejuni"
            "Citrobacter sp"
            "Elizabethkingia meningoseptica"
            "Escherichia coli"
            "Klebsiella oxytoca"
            "Legionella pneumophila"
            "Pseudomonas sp"
            "Raoultella ornithinolytica"
            "Salmonella enterica"
          )
          # Quote the expansion so each multi-word taxon stays one element.
          for taxon in "${taxons[@]}"
          do
            echo "the taxon is now $taxon"
            # File-name friendly form of the taxon: spaces become underscores.
            organism=${taxon// /_}
            echo "Getting the representative genome"
            # Both binaries were unpacked into the working directory by the
            # previous step, so call them with an explicit ./ prefix.
            ./datasets summary genome taxon "$taxon" --reference --limit 5 --as-json-lines | \
              ./dataformat tsv genome --fields accession,assminfo-refseq-category,assminfo-level,organism-name,assmstats-total-ungapped-len | \
              grep -v Homo | \
              tr '\t' ',' | \
              tee "${organism}_genomes.csv"
            echo "Getting additional genomes"
            # Drop the header row here; it was already written by the first query.
            ./datasets summary genome taxon "$taxon" --limit 5 --as-json-lines | \
              ./dataformat tsv genome --fields accession,assminfo-refseq-category,assminfo-level,organism-name,assmstats-total-ungapped-len | \
              grep -v Homo | \
              grep -v "Assembly Accession" | \
              tr '\t' ',' | \
              tee -a "${organism}_genomes.csv"
          done
          head *genomes.csv

0 comments on commit 765c5b1

Please sign in to comment.