From 3541089aa8af5d229e669eb38d3735cd2b0b8a05 Mon Sep 17 00:00:00 2001
From: Pjotr Prins
Date: Thu, 31 Dec 2020 14:17:42 +0000
Subject: genbank: sparql-fetch-ids

---
 workflows/pull-data/genbank/README.md | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

(limited to 'workflows/pull-data/genbank/README.md')

diff --git a/workflows/pull-data/genbank/README.md b/workflows/pull-data/genbank/README.md
index ee67e70..0204dd0 100644
--- a/workflows/pull-data/genbank/README.md
+++ b/workflows/pull-data/genbank/README.md
@@ -1,4 +1,4 @@
-Pipeline:
+# pipeline
 
 ```sh
 # --- get list of IDs already in PubSeq
@@ -11,3 +11,7 @@ genbank-fetch-ids --dir ~/tmp/pubseq > genbank_ids.txt
 for id in genbank_ids.txt:
     transform-genbank-xml2yamlfa --dir ~/tmp/genbank id --outdir ~/tmp/pubseq
 ```
+
+# TODO
+
+- [ ] Add id for GenBank accession - i.e. how can we tell a record is from GenBank
-- 
cgit v1.2.3