1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
|
PREFIX : <https://raw.githubusercontent.com/arvados/bh20-seq-resource/master/bh20sequploader/bh20seq-shex.rdf#>
PREFIX MainSchema: <http://biohackathon.org/bh20-seq-schema#MainSchema/>
PREFIX hostSchema: <http://biohackathon.org/bh20-seq-schema#hostSchema/>
PREFIX cc: <https://creativecommons.org/ns#>
PREFIX cclicenses: <https://creativecommons.org/licenses/>
PREFIX dc: <http://purl.org/metadata/dublin_core_elements#>
PREFIX xsd: <http://www.w3.org/2001/XMLSchema#>
PREFIX obo: <http://purl.obolibrary.org/obo/>
PREFIX sio: <http://semanticscience.org/resource/>
PREFIX efo: <http://www.ebi.ac.uk/efo/>
PREFIX evs: <http://ncicb.nci.nih.gov/xml/owl/EVS/Thesaurus.owl#>
PREFIX edam: <http://edamontology.org/>
PREFIX wikidata: <http://www.wikidata.org/entity/>
# Top-level shape of a submission: each MainSchema predicate points at the
# shape that validates that section of the metadata. A constraint without
# an explicit cardinality must occur exactly once.
:submissionShape {
    MainSchema:host       @:hostShape ;        # mandatory
    MainSchema:sample     @:sampleShape ;      # mandatory
    MainSchema:submitter  @:submitterShape ;   # mandatory
    MainSchema:technology @:technologyShape ;  # mandatory
    MainSchema:virus      @:virusShape ;       # mandatory
    MainSchema:license    @:licenseShape ? ;   # optional
}
## Documentation format for each constraint: #(name of the option in the YAML metadata), ontology label, mandatory|optional, type
## Entries marked with ?????? still need review.
# Metadata about the host. The comment above each constraint gives:
# (name of the option in the YAML metadata), ontology label, mandatory|optional, type.
:hostShape {
    # (host_species), host, mandatory, IRI from namespace obo:NCBITaxon_
    efo:EFO_0000532 [ obo:NCBITaxon_~ ] ;

    # (host_id), identifier, optional, string
    sio:SIO_000115 xsd:string ? ;

    # (host_sex), biological sex, optional, one of the listed values
    obo:PATO_0000047 [
        obo:PATO_0000384
        obo:PATO_0000383
        obo:PATO_0001340
    ] ? ;

    # (host_age), age, optional, integer
    obo:PATO_0000011 xsd:integer ? ;

    # (host_age_unit), optional, IRI from namespace obo:UO_
    obo:NCIT_C42574 [ obo:UO_~ ] ? ;

    # (host_health_status), status, optional, one of the listed values
    obo:NCIT_C25688 [
        obo:NCIT_C115935
        obo:NCIT_C3833
        obo:NCIT_C25269
        obo:GENEPIO_0002020
        obo:GENEPIO_0001849
        obo:NCIT_C28554
        obo:NCIT_C37987
    ] ? ;

    # (host_treatment), treatment, optional, string
    efo:EFO_0000727 xsd:string ? ;

    # (host_vaccination), vaccination, optional, list of 0-10 strings
    obo:VO_0000002 xsd:string {0,10} ;

    # (ethnicity), ethnicity, optional, IRI from namespace obo:HANCESTRO_
    sio:SIO_001014 [ obo:HANCESTRO_~ ] ? ;

    # (additional_host_information), comment, optional, string
    sio:SIO_001167 xsd:string ? ;
}
# Metadata about the collected sample. The comment above each constraint gives:
# (name of the option in the YAML metadata), ontology label, mandatory|optional, type.
:sampleShape {
    # (sampleId), identifier, mandatory, string
    sio:SIO_000115 xsd:string ;

    # (collection_date), date, mandatory, string
    # NOTE(review): validated only as a string, although the value is meant to be a date.
    evs:C25164 xsd:string ;

    # (collection_location), geographic location, mandatory, IRI from the wikidata: namespace
    obo:GAZ_00000448 [ wikidata:~ ] ;

    # (collector_name), specimen collector, optional, string
    obo:OBI_0001895 xsd:string ? ;

    # (collecting_institution), Institute, optional, string
    obo:NCIT_C41206 xsd:string ? ;

    # (specimen_source), specimen from organism, optional, IRI from namespace obo:NCIT_
    obo:OBI_0001479 [ obo:NCIT_~ ] ? ;

    # (sample_storage_conditions), specimen with known storage state, optional, string
    obo:OBI_0001472 xsd:string ? ;

    # (additional_collection_information), comment, optional, string
    sio:SIO_001167 xsd:string ? ;

    # (source_database_accession), Accession, optional, 0-3 IRIs
    edam:data_2091 IRI {0,3} ;
}
# Metadata about the submitter. The comment above each constraint gives:
# (name of the option in the YAML metadata), ontology label, mandatory|optional, type.
:submitterShape {
    # (authors), Author, mandatory, list of 1-* strings
    obo:NCIT_C42781 xsd:string + ;

    # (submitter_name), name, optional, list of 0-* strings
    sio:SIO_000116 xsd:string * ;

    # (submitter_address), address, optional, string
    sio:SIO_000172 xsd:string ? ;

    # (originating_lab), Laboratory, optional, string
    obo:NCIT_C37984 xsd:string ? ;

    # (lab address), Provider, optional, string
    obo:NCIT_C37900 xsd:string ? ;

    # (provider_sample_id), submitter, optional, string ?????? needs review
    efo:EFO_0001741 xsd:string ? ;

    # (submitter_sample_id), Author, optional, string ?????? needs review
    # NOTE(review): this reuses obo:NCIT_C42781, the same predicate as (authors)
    # above, so sample ids and authors cannot be told apart in the data.
    # Kept as-is until the correct ontology term is chosen.
    obo:NCIT_C42781 xsd:string ? ;

    # (publication), Scientific Publication, optional, string
    obo:NCIT_C19026 xsd:string ? ;

    # (submitter_orcid), identifier, optional, 0-10 ORCID iD URLs.
    # ShEx patterns match anywhere in the value unless anchored, so the
    # expression is wrapped in ^...$; the dot in "orcid.org" is written as [.]
    # so it only matches a literal dot; each group is four digits, and the
    # final character may be a digit or the checksum letter X.
    # Slashes stay written as \u002F because "/" delimits the pattern.
    sio:SIO_000115 /^https:\u002F\u002Forcid[.]org\u002F[0-9]{4}-[0-9]{4}-[0-9]{4}-[0-9]{3}[0-9X]$/ {0,10} ;

    # (additional_submitter_information), comment, optional, string
    sio:SIO_001167 xsd:string ? ;
}
# Metadata about the sequencing technology. The comment above each constraint gives:
# (name of the option in the YAML metadata), ontology label, mandatory|optional, type.
:technologyShape {
    # (sample_sequencing_technology), sequencing assay, optional, 0-3 IRIs ?????? needs review
    obo:OBI_0600047 IRI {0,3} ;

    # (sequence_assembly_method), high throughput sequencer, optional, string ?????? needs review
    efo:EFO_0002699 xsd:string ? ;

    # (sequence coverage), sequence coverage, optional, 0-3 values, each a double or an integer
    obo:FLU_0000848 xsd:double OR xsd:integer {0,3} ;

    # (additional_technology_information), comment, optional, string
    sio:SIO_001167 xsd:string ? ;
}
# Metadata about the virus. The comment above each constraint gives:
# (name of the option in the YAML metadata), ontology label, mandatory|optional, type.
:virusShape {
    # (virus_species), NCBI taxon, mandatory, IRI from namespace obo:NCBITaxon_
    edam:data_1875 [ obo:NCBITaxon_~ ] ;

    # (virus_strain), strain, optional, string
    sio:SIO_010055 xsd:string ? ;
}
# License information for a submission (referenced from MainSchema:license).
:licenseShape {
    # mandatory, IRI from the cclicenses: namespace
    cc:License [ cclicenses:~ ] ;

    # optional, string
    dc:Title xsd:string ? ;

    # optional, string
    cc:attributionName xsd:string ? ;

    # mandatory, value must start with "http"
    # NOTE(review): this is the only attribution field without "?", so it is
    # required whenever a license is given - confirm that this is intended.
    cc:attributionURL /^http/ ;

    # optional, string
    cc:attributionSource xsd:string ? ;
}
|