<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en" xml:lang="en">
<head>
<!-- 2020-07-21 Tue 05:38 -->
<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
<meta name="viewport" content="width=device-width, initial-scale=1" />
<title>PubSeq REST API</title>
<meta name="generator" content="Org mode" />
<meta name="author" content="Pjotr Prins" />
<style type="text/css">
 <!--/*--><![CDATA[/*><!--*/
  .title  { text-align: center;
             margin-bottom: .2em; }
  .subtitle { text-align: center;
              font-size: medium;
              font-weight: bold;
              margin-top:0; }
  .todo   { font-family: monospace; color: red; }
  .done   { font-family: monospace; color: green; }
  .priority { font-family: monospace; color: orange; }
  .tag    { background-color: #eee; font-family: monospace;
            padding: 2px; font-size: 80%; font-weight: normal; }
  .timestamp { color: #bebebe; }
  .timestamp-kwd { color: #5f9ea0; }
  .org-right  { margin-left: auto; margin-right: 0px;  text-align: right; }
  .org-left   { margin-left: 0px;  margin-right: auto; text-align: left; }
  .org-center { margin-left: auto; margin-right: auto; text-align: center; }
  .underline { text-decoration: underline; }
  #postamble p, #preamble p { font-size: 90%; margin: .2em; }
  p.verse { margin-left: 3%; }
  pre {
    border: 1px solid #ccc;
    box-shadow: 3px 3px 3px #eee;
    padding: 8pt;
    font-family: monospace;
    overflow: auto;
    margin: 1.2em;
  }
  pre.src {
    position: relative;
    overflow: visible;
    padding-top: 1.2em;
  }
  pre.src:before {
    display: none;
    position: absolute;
    background-color: white;
    top: -10px;
    right: 10px;
    padding: 3px;
    border: 1px solid black;
  }
  pre.src:hover:before { display: inline;}
  /* Languages per Org manual */
  pre.src-asymptote:before { content: 'Asymptote'; }
  pre.src-awk:before { content: 'Awk'; }
  pre.src-C:before { content: 'C'; }
  /* pre.src-C++ doesn't work in CSS */
  pre.src-clojure:before { content: 'Clojure'; }
  pre.src-css:before { content: 'CSS'; }
  pre.src-D:before { content: 'D'; }
  pre.src-ditaa:before { content: 'ditaa'; }
  pre.src-dot:before { content: 'Graphviz'; }
  pre.src-calc:before { content: 'Emacs Calc'; }
  pre.src-emacs-lisp:before { content: 'Emacs Lisp'; }
  /* 'elisp' alias: this page marks its Emacs Lisp block as src-elisp, which
     would otherwise get no hover label */
  pre.src-elisp:before { content: 'Emacs Lisp'; }
  pre.src-fortran:before { content: 'Fortran'; }
  pre.src-gnuplot:before { content: 'gnuplot'; }
  pre.src-haskell:before { content: 'Haskell'; }
  pre.src-hledger:before { content: 'hledger'; }
  pre.src-java:before { content: 'Java'; }
  pre.src-js:before { content: 'Javascript'; }
  pre.src-latex:before { content: 'LaTeX'; }
  pre.src-ledger:before { content: 'Ledger'; }
  pre.src-lisp:before { content: 'Lisp'; }
  pre.src-lilypond:before { content: 'Lilypond'; }
  pre.src-lua:before { content: 'Lua'; }
  pre.src-matlab:before { content: 'MATLAB'; }
  pre.src-mscgen:before { content: 'Mscgen'; }
  pre.src-ocaml:before { content: 'Objective Caml'; }
  pre.src-octave:before { content: 'Octave'; }
  pre.src-org:before { content: 'Org mode'; }
  pre.src-oz:before { content: 'OZ'; }
  pre.src-plantuml:before { content: 'Plantuml'; }
  pre.src-processing:before { content: 'Processing.js'; }
  pre.src-python:before { content: 'Python'; }
  pre.src-R:before { content: 'R'; }
  pre.src-ruby:before { content: 'Ruby'; }
  pre.src-sass:before { content: 'Sass'; }
  pre.src-scheme:before { content: 'Scheme'; }
  pre.src-screen:before { content: 'Gnu Screen'; }
  pre.src-sed:before { content: 'Sed'; }
  pre.src-sh:before { content: 'shell'; }
  pre.src-sql:before { content: 'SQL'; }
  pre.src-sqlite:before { content: 'SQLite'; }
  /* additional languages in org.el's org-babel-load-languages alist */
  pre.src-forth:before { content: 'Forth'; }
  pre.src-io:before { content: 'IO'; }
  pre.src-J:before { content: 'J'; }
  pre.src-makefile:before { content: 'Makefile'; }
  pre.src-maxima:before { content: 'Maxima'; }
  pre.src-perl:before { content: 'Perl'; }
  pre.src-picolisp:before { content: 'Pico Lisp'; }
  pre.src-scala:before { content: 'Scala'; }
  pre.src-shell:before { content: 'Shell Script'; }
  /* hover label for ebnf2ps blocks (label text previously misspelled) */
  pre.src-ebnf2ps:before { content: 'ebnf2ps'; }
  /* additional language identifiers per "defun org-babel-execute"
       in ob-*.el */
  pre.src-cpp:before  { content: 'C++'; }
  pre.src-abc:before  { content: 'ABC'; }
  pre.src-coq:before  { content: 'Coq'; }
  pre.src-groovy:before  { content: 'Groovy'; }
  /* additional language identifiers from org-babel-shell-names in
     ob-shell.el: ob-shell is the only babel language using a lambda to put
     the execution function name together. */
  pre.src-bash:before  { content: 'bash'; }
  pre.src-csh:before  { content: 'csh'; }
  pre.src-ash:before  { content: 'ash'; }
  pre.src-dash:before  { content: 'dash'; }
  pre.src-ksh:before  { content: 'ksh'; }
  pre.src-mksh:before  { content: 'mksh'; }
  pre.src-posh:before  { content: 'posh'; }
  /* Additional Emacs modes also supported by the LaTeX listings package */
  pre.src-ada:before { content: 'Ada'; }
  pre.src-asm:before { content: 'Assembler'; }
  pre.src-caml:before { content: 'Caml'; }
  pre.src-delphi:before { content: 'Delphi'; }
  pre.src-html:before { content: 'HTML'; }
  pre.src-idl:before { content: 'IDL'; }
  pre.src-mercury:before { content: 'Mercury'; }
  pre.src-metapost:before { content: 'MetaPost'; }
  pre.src-modula-2:before { content: 'Modula-2'; }
  pre.src-pascal:before { content: 'Pascal'; }
  pre.src-ps:before { content: 'PostScript'; }
  pre.src-prolog:before { content: 'Prolog'; }
  pre.src-simula:before { content: 'Simula'; }
  pre.src-tcl:before { content: 'tcl'; }
  pre.src-tex:before { content: 'TeX'; }
  pre.src-plain-tex:before { content: 'Plain TeX'; }
  pre.src-verilog:before { content: 'Verilog'; }
  pre.src-vhdl:before { content: 'VHDL'; }
  pre.src-xml:before { content: 'XML'; }
  pre.src-nxml:before { content: 'XML'; }
  /* add a generic configuration mode; LaTeX export needs an additional
     (add-to-list 'org-latex-listings-langs '(conf " ")) in .emacs */
  pre.src-conf:before { content: 'Configuration File'; }

  table { border-collapse:collapse; }
  caption.t-above { caption-side: top; }
  caption.t-bottom { caption-side: bottom; }
  td, th { vertical-align:top;  }
  th.org-right  { text-align: center;  }
  th.org-left   { text-align: center;   }
  th.org-center { text-align: center; }
  td.org-right  { text-align: right;  }
  td.org-left   { text-align: left;   }
  td.org-center { text-align: center; }
  dt { font-weight: bold; }
  .footpara { display: inline; }
  .footdef  { margin-bottom: 1em; }
  .figure { padding: 1em; }
  .figure p { text-align: center; }
  .equation-container {
    display: table;
    text-align: center;
    width: 100%;
  }
  .equation {
    vertical-align: middle;
  }
  .equation-label {
    display: table-cell;
    text-align: right;
    vertical-align: middle;
  }
  .inlinetask {
    padding: 10px;
    border: 2px solid gray;
    margin: 10px;
    background: #ffffcc;
  }
  #org-div-home-and-up
   { text-align: right; font-size: 70%; white-space: nowrap; }
  textarea { overflow-x: auto; }
  .linenr { font-size: smaller }
  .code-highlighted { background-color: #ffff00; }
  .org-info-js_info-navigation { border-style: none; }
  #org-info-js_console-label
    { font-size: 10px; font-weight: bold; white-space: nowrap; }
  .org-info-js_search-highlight
    { background-color: #ffff00; color: #000000; font-weight: bold; }
  .org-svg { width: 90%; }
  /*]]>*/-->
</style>
<link rel="Blog stylesheet" type="text/css" href="blog.css" />
<script type="text/javascript">
/*
@licstart  The following is the entire license notice for the
JavaScript code in this tag.

Copyright (C) 2012-2020 Free Software Foundation, Inc.

The JavaScript code in this tag is free software: you can
redistribute it and/or modify it under the terms of the GNU
General Public License (GNU GPL) as published by the Free Software
Foundation, either version 3 of the License, or (at your option)
any later version.  The code is distributed WITHOUT ANY WARRANTY;
without even the implied warranty of MERCHANTABILITY or FITNESS
FOR A PARTICULAR PURPOSE.  See the GNU GPL for more details.

As additional permission under GNU GPL version 3 section 7, you
may distribute non-source (e.g., minimized or compacted) forms of
that code without the copy of the GNU GPL normally required by
section 4, provided you include this license notice and a URL
through which recipients can access the Corresponding Source.


@licend  The above is the entire license notice
for the JavaScript code in this tag.
*/
<!--/*--><![CDATA[/*><!--*/
 /**
  * Highlight elem together with the element whose id is given.
  *
  * The current class names of both nodes are stored on elem (as
  * cacheClassElem and cacheClassTarget) so that CodeHighlightOff can put
  * them back; both nodes then get the "code-highlighted" class.
  * Nothing happens when no element with that id exists.
  *
  * @param {Element} elem  element that triggers the highlight
  * @param {string}  id    id of the element to highlight alongside elem
  */
 function CodeHighlightOn(elem, id)
 {
   var highlighted = "code-highlighted";
   var target = document.getElementById(id);
   if(null == target)
     return;
   // Never cache the highlight class itself: a repeated call before
   // CodeHighlightOff would otherwise overwrite the saved original class
   // and leave both nodes permanently highlighted.
   if(elem.className !== highlighted)
     elem.cacheClassElem = elem.className;
   if(target.className !== highlighted)
     elem.cacheClassTarget = target.className;
   target.className = highlighted;
   elem.className   = highlighted;
 }
 /**
  * Undo CodeHighlightOn: restore the class names cached on elem.
  *
  * elem gets back the value stored in elem.cacheClassElem, and the element
  * with the given id gets back elem.cacheClassTarget. A node is left
  * untouched when no class name was cached for it, and the target is
  * skipped when it cannot be found in the document.
  *
  * @param {Element} elem  element that carries the cached class names
  * @param {string}  id    id of the element highlighted alongside elem
  */
 function CodeHighlightOff(elem, id)
 {
   var target = document.getElementById(id);
   // Test the type, not truthiness: a node that had no class caches "",
   // and that empty value still has to be restored.
   if(typeof elem.cacheClassElem === "string")
     elem.className = elem.cacheClassElem;
   // The target may no longer exist; skip it instead of throwing.
   if(null != target && typeof elem.cacheClassTarget === "string")
     target.className = elem.cacheClassTarget;
 }
/*]]>*///-->
</script>
</head>
<body>
<div id="org-div-home-and-up">
 <a accesskey="h" href=""> UP </a>
 |
 <a accesskey="H" href="http://covid19.genenetwork.org/apidoc"> HOME </a>
</div><div id="content">
<h1 class="title">PubSeq REST API</h1>
<div id="table-of-contents">
<h2>Table of Contents</h2>
<div id="text-table-of-contents">
<ul>
<li><a href="#orgc76638c">1. PubSeq REST API</a>
<ul>
<li><a href="#org247cf63">1.1. Introduction</a></li>
<li><a href="#orgcc2b1b0">1.2. Search for an entry</a></li>
<li><a href="#org0ef2d2f">1.3. Fetch metadata</a></li>
<li><a href="#org82c693c">1.4. Fetch EBI XML</a></li>
</ul>
</li>
<li><a href="#org49153e2">2. Configure emacs to run tests</a></li>
</ul>
</div>
</div>

<div id="outline-container-orgc76638c" class="outline-2">
<h2 id="orgc76638c"><span class="section-number-2">1</span> PubSeq REST API</h2>
<div class="outline-text-2" id="text-1">
<p>
Here we document the public REST API that comes with PubSeq. The tests
run in the amazing emacs <a href="https://orgmode.org/worg/org-contrib/babel/languages/ob-doc-python.html">org-babel</a>.  See the bottom of this document
for running the tests inside emacs.
</p>
</div>

<div id="outline-container-org247cf63" class="outline-3">
<h3 id="org247cf63"><span class="section-number-3">1.1</span> Introduction</h3>
<div class="outline-text-3" id="text-1-1">
<p>
We built a REST API for COVID-19 PubSeq. The API source code can be
found in <a href="https://github.com/arvados/bh20-seq-resource/tree/master/bh20simplewebuploader/api.py">api.py</a>. To see if the service is up try
</p>

<div class="org-src-container">
<pre class="src src-sh">curl http://covid19.genenetwork.org/api/version
</pre>
</div>

<div class="org-src-container">
<pre class="src src-js">{
  "service": "PubSeq",
  "version": 0.1
}
</pre>
</div>

<p>
The Python3 version is
</p>

<div class="org-src-container">
<pre class="src src-python">import requests
baseURL="http://localhost:5000" # for development
# baseURL="http://covid19.genenetwork.org"
response = requests.get(baseURL+"/api/version")
response_body = response.json()
assert response_body["service"] == "PubSeq", "PubSeq API not found"
response_body
</pre>
</div>

<table border="2" cellspacing="0" cellpadding="6" rules="groups" frame="hsides">


<colgroup>
<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-right" />
</colgroup>
<tbody>
<tr>
<td class="org-left">service</td>
<td class="org-left">:</td>
<td class="org-left">PubSeq</td>
<td class="org-left">version</td>
<td class="org-left">:</td>
<td class="org-right">0.1</td>
</tr>
</tbody>
</table>
</div>
</div>

<div id="outline-container-orgcc2b1b0" class="outline-3">
<h3 id="orgcc2b1b0"><span class="section-number-3">1.2</span> Search for an entry</h3>
<div class="outline-text-3" id="text-1-2">
<p>
When you use the search box on PubSeq it queries the REST end point
for information on the search items. For example
</p>

<div class="org-src-container">
<pre class="src src-python">requests.get(baseURL+"/api/search?s=MT533203.1").json()
</pre>
</div>

<table border="2" cellspacing="0" cellpadding="6" rules="groups" frame="hsides">


<colgroup>
<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />
</colgroup>
<tbody>
<tr>
<td class="org-left">collection</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126">http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126</a></td>
<td class="org-left">fasta</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126/sequence.fasta">http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126/sequence.fasta</a></td>
<td class="org-left">id</td>
<td class="org-left">:</td>
<td class="org-left">MT533203.1</td>
<td class="org-left">info</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://identifiers.org/insdc/MT533203.1#sequence">http://identifiers.org/insdc/MT533203.1#sequence</a></td>
</tr>
</tbody>
</table>

<p>
where collection is the raw uploaded data. The hash value in <code>c=</code> is
computed on the contents of the Arvados keep <a href="https://doc.arvados.org/v2.0/user/tutorials/tutorial-keep-mount-gnu-linux.html">collection</a> and effectively
acts as a deduplication uuid.
</p>
</div>
</div>

<div id="outline-container-org0ef2d2f" class="outline-3">
<h3 id="org0ef2d2f"><span class="section-number-3">1.3</span> Fetch metadata</h3>
<div class="outline-text-3" id="text-1-3">
<p>
Using the collection link above you can fetch the metadata in JSON as it
was originally uploaded from the ShEx expression, e.g. using
<a href="https://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126/">https://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126/</a>
</p>

<p>
It is better, however, to use the more advanced sample metadata fetcher
because it does a bit more in terms of expansion
</p>

<div class="org-src-container">
<pre class="src src-python">requests.get(baseURL+"/api/sample/MT533203.1.json").json()
</pre>
</div>

<table border="2" cellspacing="0" cellpadding="6" rules="groups" frame="hsides">


<colgroup>
<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-right" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />

<col  class="org-left" />
</colgroup>
<tbody>
<tr>
<td class="org-left">collection</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126">http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126</a></td>
<td class="org-left">date</td>
<td class="org-left">:</td>
<td class="org-right">2020-04-27</td>
<td class="org-left">fasta</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126/sequence.fasta">http://collections.lugli.arvadosapi.com/c=0015b0d65dfd2e82bb3cee4436bf2893+126/sequence.fasta</a></td>
<td class="org-left">id</td>
<td class="org-left">:</td>
<td class="org-left">MT533203.1</td>
<td class="org-left">info</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://identifiers.org/insdc/MT533203.1#sequence">http://identifiers.org/insdc/MT533203.1#sequence</a></td>
<td class="org-left">mapper</td>
<td class="org-left">:</td>
<td class="org-left">minimap v. 2.17</td>
<td class="org-left">sequencer</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://www.ebi.ac.uk/efo/EFO_0008632">http://www.ebi.ac.uk/efo/EFO_0008632</a></td>
<td class="org-left">specimen</td>
<td class="org-left">:</td>
<td class="org-left"><a href="http://purl.obolibrary.org/obo/NCIT_C155831">http://purl.obolibrary.org/obo/NCIT_C155831</a></td>
</tr>
</tbody>
</table>
</div>
</div>



<div id="outline-container-org82c693c" class="outline-3">
<h3 id="org82c693c"><span class="section-number-3">1.4</span> Fetch EBI XML</h3>
<div class="outline-text-3" id="text-1-4">
<p>
PubSeq provides an API that is used to export formats that are
suitable for uploading data to EBI/ENA from our <a href="http://covid19.genenetwork.org/export">EXPORT</a> menu. This is
documented <a href="http://covid19.genenetwork.org/blog?id=using-covid-19-pubseq-part6">here</a>.
</p>

<div class="org-src-container">
<pre class="src src-python">requests.get(baseURL+"/api/ebi/sample-MT326090.1.xml").text
</pre>
</div>

<pre class="example">
&lt;?xml version="1.0" encoding="UTF-8"?&gt;
&lt;SAMPLE_SET&gt;
  &lt;SAMPLE alias="MT326090.1" center_name="COVID-19 PubSeq"&gt;
    &lt;TITLE&gt;COVID-19 PubSeq Sample&lt;/TITLE&gt;
    &lt;SAMPLE_NAME&gt;
      &lt;TAXON_ID&gt;2697049&lt;/TAXON_ID&gt;
      &lt;SCIENTIFIC_NAME&gt;Severe acute respiratory syndrome coronavirus 2&lt;/SCIENTIFIC_NAME&gt;
      &lt;COMMON_NAME&gt;SARS-CoV-2&lt;/COMMON_NAME&gt;
    &lt;/SAMPLE_NAME&gt;
    &lt;SAMPLE_ATTRIBUTES&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;investigation type&lt;/TAG&gt;
        &lt;VALUE&gt;&lt;/VALUE&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;sequencing method&lt;/TAG&gt;
        &lt;VALUE&gt;http://purl.obolibrary.org/obo/OBI_0000759&lt;/VALUE&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;collection date&lt;/TAG&gt;
        &lt;VALUE&gt;2020-03-21&lt;/VALUE&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;geographic location (latitude)&lt;/TAG&gt;
        &lt;VALUE&gt;&lt;/VALUE&gt;
     &lt;UNITS&gt;DD&lt;/UNITS&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;geographic location (longitude)&lt;/TAG&gt;
        &lt;VALUE&gt;&lt;/VALUE&gt;
     &lt;UNITS&gt;DD&lt;/UNITS&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
     &lt;TAG&gt;geographic location (country and/or sea)&lt;/TAG&gt;
     &lt;VALUE&gt;&lt;/VALUE&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;geographic location (region and locality)&lt;/TAG&gt;
        &lt;VALUE&gt;&lt;/VALUE&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;environment (material)&lt;/TAG&gt;
        &lt;VALUE&gt;http://purl.obolibrary.org/obo/NCIT_C155831&lt;/VALUE&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
      &lt;SAMPLE_ATTRIBUTE&gt;
        &lt;TAG&gt;ENA-CHECKLIST&lt;/TAG&gt;
        &lt;VALUE&gt;ERC000011&lt;/VALUE&gt;
      &lt;/SAMPLE_ATTRIBUTE&gt;
    &lt;/SAMPLE_ATTRIBUTES&gt;
  &lt;/SAMPLE&gt;
&lt;/SAMPLE_SET&gt;
</pre>
</div>
</div>
</div>

<div id="outline-container-org49153e2" class="outline-2">
<h2 id="org49153e2"><span class="section-number-2">2</span> Configure emacs to run tests</h2>
<div class="outline-text-2" id="text-2">
<p>
Execute a code
block with C-c C-c. You may need to set
</p>

<div class="org-src-container">
<pre class="src src-elisp">(org-babel-do-load-languages
 'org-babel-load-languages
 '((python . t)))
(setq org-babel-python-command "python3")
(setq org-babel-eval-verbose t)
</pre>
</div>

<p>
To skip confirmations you may also want to set
</p>

<pre class="example">
(setq org-confirm-babel-evaluate nil)
</pre>


<p>
To see the output of the interpreter, open the <code>*Python*</code> buffer.
</p>
</div>
</div>
</div>
<div id="postamble" class="status">
<hr /><small>Created by <a href="http://thebird.nl/">Pjotr Prins</a> (pjotr.public768 at thebird 'dot' nl) using Emacs org-mode and a healthy dose of Lisp!<br />Modified 2020-07-21 Tue 05:38</small>.
</div>
</body>
</html>