# path: root/bh20sequploader/bh20seq-schema.yml
# blob: a072bd78e60c8cefe5978468385dfe8a476d96d0
# Base URI of this schema document.
$base: http://biohackathon.org/bh20-seq-schema
# Prefix -> IRI declarations.
# NOTE(review): the jsonldPredicate IRIs in the records visible below are all
# written out in full rather than through these prefixes, and no visible
# predicate uses the `sch` (schema.org) IRI at all -- confirm whether these
# declarations are still needed.
$namespaces:
  sch: https://schema.org/
  efo: http://www.ebi.ac.uk/efo/
  obo: http://purl.obolibrary.org/obo/
  sio: http://semanticscience.org/resource/
  edam: http://edamontology.org/
  evs: http://ncicb.nci.nih.gov/xml/owl/EVS/Thesaurus.owl#

# Record definitions. MainSchema is the one flagged `documentRoot: true`; the
# other records are referenced from its fields.
$graph:

# hostSchema: the host_* fields, each bound to an ontology term IRI through
# jsonldPredicate. A type ending in `?` is optional (Schema Salad shorthand
# for a union with null); host_species, host_id and host_sex are required.
- name: hostSchema
  type: record
  fields:
    host_species:
      type: string
      jsonldPredicate:
        _id: http://www.ebi.ac.uk/efo/EFO_0000532
    host_id:
      type: string
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_000115
    host_common_name:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/NOMEN_0000037
    host_sex:
      type: string
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/PATO_0000047
    # The age is an optional integer; nothing in this record ties it to
    # host_age_unit, so a value may arrive without a unit.
    host_age:
      type: int?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/PATO_0000011
    host_age_unit:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/UO_0000036
    host_health_status:
      type: string?
      # Spelled in the explicit `_id` mapping form so that every field in this
      # record declares its predicate the same way; the IRI is unchanged.
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/NCIT_C25688
    host_treatment:
      type: string?
      jsonldPredicate:
        _id: http://www.ebi.ac.uk/efo/EFO_0000727
    host_vaccination:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/VO_0000001
    additional_host_information:
      type: string?
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_001167

# sampleSchema: fields describing how a sample was collected and identified.
# Required: collector_name, collecting_institution, sample_id. Every other
# field carries a `?` type and may be omitted.
- name: sampleSchema
  type: record
  fields:
    collector_name:
      type: string
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/OBI_0001895
    # NOTE(review): this field uses the same predicate IRI (SIO_001167) as
    # additional_collection_information further down -- confirm that is
    # intended, since the two values would share one predicate.
    collecting_institution:
      type: string
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_001167
    specimen_source:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/OBI_0001479
    # Typed as a plain string: this schema does not constrain the date format.
    collection_date:
      type: string?
      jsonldPredicate:
        _id: http://ncicb.nci.nih.gov/xml/owl/EVS/Thesaurus.owl#C25164
    collection_location:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/GAZ_00000448
    sample_storage_conditions:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/OBI_0001472
    additional_collection_information:
      type: string?
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_001167
    sample_id:
      type: string
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_000115
    source_database_accession:
      type: string?
      jsonldPredicate:
        _id: http://edamontology.org/data_2091

# virusSchema: two string fields, both optional (`?` type), each bound to an
# ontology term IRI through jsonldPredicate.
- name: virusSchema
  type: record
  fields:
    virus_species:
      type: string?
      jsonldPredicate:
        _id: http://edamontology.org/data_1875
    virus_strain:
      type: string?
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_010055

# technologySchema: sequencing and assembly fields. Only
# sample_sequencing_technology is required; the other two carry a `?` type.
- name: technologySchema
  type: record
  fields:
    # NOTE(review): OBI_0600047 is also the predicate of lab_address in
    # submitterSchema -- confirm which of the two uses is the intended one.
    sample_sequencing_technology:
      type: string
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/OBI_0600047
    sequence_assembly_method:
      type: string?
      jsonldPredicate:
        _id: http://www.ebi.ac.uk/efo/EFO_0002699
    # Coverage is typed as a string, not a number.
    sequencing_coverage:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/FLU_0000848

# submitterSchema: fields identifying who submitted the record and where it
# originated. Required: submitter_name, submitter_date, originating_lab.
# Every other field carries a `?` type and may be omitted.
- name: submitterSchema
  type: record
  fields:
    submitter_name:
      type: string
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_000116
    # Typed as a plain string: this schema does not constrain the date format.
    submitter_date:
      type: string
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/NCIT_C94162
    submitter_address:
      type: string?
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_000172
    originating_lab:
      type: string
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/NCIT_C37984
    # NOTE(review): OBI_0600047 is also the predicate of
    # sample_sequencing_technology in technologySchema -- confirm this IRI is
    # the intended one for an address field.
    lab_address:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/OBI_0600047
    provider_sample_id:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/NCIT_C37900
    submitter_sample_id:
      type: string?
      jsonldPredicate:
        _id: http://www.ebi.ac.uk/efo/EFO_0001741
    authors:
      type: string?
      jsonldPredicate:
        _id: http://purl.obolibrary.org/obo/NCIT_C42781
    submitter_id:
      type: string?
      jsonldPredicate:
        _id: http://semanticscience.org/resource/SIO_000115

# MainSchema: the document root (`documentRoot: true`). It nests one record of
# each of the other schemas; only `virus` is optional (`virusSchema?`).
- name: MainSchema
  type: record
  documentRoot: true
  fields:
    host: hostSchema
    sample: sampleSchema
    virus: virusSchema?
    technology: technologySchema
    submitter: submitterSchema
    # NOTE(review): `submission` (required) and `id` (optional) both declare
    # `_id: "@id"`; only `id` also sets `_type: "@id"`, which is commented out
    # here. Confirm that having two fields mapped to "@id" is intended.
    submission:
      type: string
      jsonldPredicate:
        _id: "@id"
        #_type: "@id"
    id:
      doc: The subject (eg the fasta/fastq file) that the metadata describes
      type: string?
      jsonldPredicate:
        _id: "@id"
        _type: "@id"