From 2c6181c7eb86c0285928a434a37401d6680f9f79 Mon Sep 17 00:00:00 2001
From: Pjotr Prins
Date: Fri, 1 Jan 2021 12:24:44 +0000
Subject: genbank-fetch-ids

---
 workflows/pull-data/genbank/README.md | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

(limited to 'workflows/pull-data/genbank/README.md')

diff --git a/workflows/pull-data/genbank/README.md b/workflows/pull-data/genbank/README.md
index c235be7..f442b5d 100644
--- a/workflows/pull-data/genbank/README.md
+++ b/workflows/pull-data/genbank/README.md
@@ -3,8 +3,10 @@
 ```sh
 # --- get list of IDs already in PubSeq
 sparql-fetch-ids > pubseq_ids.txt
+# --- get list of missing genbank IDs
+genbank-fetch-ids --skip pubseq_ids.txt > genbank_ids.txt
 # --- fetch XML
-update-from-genbank.py --skip pubseq_ids.txt --outdir ~/tmp/genbank
+update-from-genbank.py --ids genbank_ids.txt --outdir ~/tmp/genbank
 # --- Transform to YAML and FASTA
 transform-genbank-xml2yamlfa --dir ~/tmp/genbank id --outdir ~/tmp/pubseq
 ```
-- 
cgit v1.2.3