-
Notifications
You must be signed in to change notification settings - Fork 3
/
genome_annotation.yaml
155 lines (136 loc) · 3.81 KB
/
genome_annotation.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
# Schema identity and human-readable metadata.
id: https://identifiers.org/brain-bican/genome-annotation-schema
name: genome-annotation-schema
title: Genome Annotation Schema
description: |-
  The Genome Annotation schema is designed to represent types and relationships of an organism's annotated genome.

# Prefix map: each key is a CURIE prefix, each value the URI it expands to.
# Prefixed names used elsewhere in this schema (e.g. `schema:url`,
# `spdx:checksumAlgorithm_sha1`) rely on these entries.
prefixes:
  linkml: https://w3id.org/linkml/
  bican: https://identifiers.org/brain-bican/vocab/
  spdx: http://spdx.org/rdf/terms#
  schema: http://schema.org/
  ncbi: https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?mode=Info&id=
  NCBIAssembly: https://www.ncbi.nlm.nih.gov/assembly/
  prov: http://www.w3.org/ns/prov#

# Schemas pulled in by this one. `bican_biolink` is not defined in this file;
# it presumably supplies the parent classes and slots referenced but not
# declared here (gene, genome, named thing, entity, version) -- confirm.
imports:
  - linkml:types
  - bican_biolink

# Range used for any slot or attribute that does not declare one.
default_range: string
# Prefix used for elements of this schema that do not set their own URI.
default_prefix: bican
# Class definitions. Parent classes named in `is_a` / `mixins` (gene, genome,
# named thing, thing with taxon, entity) are not declared in this file and are
# expected to come from an imported schema.
classes:
  # A single gene record, tied to the genome annotation it was taken from.
  gene annotation:
    is_a: gene
    description: >-
      An annotation describing the location, boundaries, and functions of
      individual genes within a genome annotation.
    slots:
      - molecular type
      - source id
    attributes:
      referenced in:
        description: The genome annotation that this gene annotation was referenced from.
        required: true
        inlined: true
        # Accepts either a nested genome annotation object or a plain string.
        any_of:
          - range: genome annotation
          - range: string
    # NOTE(review): nesting was reconstructed; id_prefixes is placed at class
    # level (not under `referenced in`) -- confirm against the upstream file.
    id_prefixes:
      - ENSEMBL
      - MGI
      - NCBIGene

  # A versioned, published annotation of a genome assembly.
  genome annotation:
    is_a: genome
    description: >-
      Location and nomenclature of genes and all of the coding regions in a genome assembly
      and the classification of genes and transcripts into types.
    slots:
      - version
      - digest
      - content_url
      - authority
    attributes:
      reference assembly:
        description: The reference genome assembly that this genome annotation was created from.
        required: true
        inlined: true
        # Accepts either a nested genome assembly object or a plain string.
        any_of:
          - range: genome assembly
          - range: string

  # The assembly a genome annotation is built on.
  genome assembly:
    is_a: named thing
    mixins:
      - thing with taxon
    description: >-
      Genome assembly to contain version and label information
    slots:
      - version
      - strain

  # A checksum: the algorithm (slot) plus the resulting value (attribute).
  checksum:
    is_a: entity
    description: >-
      Checksum values associated with digital entities.
    slots:
      - checksum algorithm
    attributes:
      value:
        description: The checksum value obtained from a specific cryptographic hash function.

  # Root container: holds lists of the three main record types.
  annotation collection:
    tree_root: true
    attributes:
      annotations:
        multivalued: true
        inlined_as_list: true
        range: gene annotation
      genome_annotations:
        multivalued: true
        inlined_as_list: true
        range: genome annotation
      genome_assemblies:
        multivalued: true
        inlined_as_list: true
        range: genome assembly
# Slot definitions referenced from the `slots:` lists of the classes in this
# schema. Slots without an explicit `range` fall back to the schema-level
# default_range.
slots:
  # Either a BioType enum value or a free-form string.
  molecular type:
    any_of:
      - range: BioType
      - range: string

  # Zero or more checksums, each a checksum object or a plain string.
  digest:
    description: Stores checksum information.
    multivalued: true
    inlined_as_list: true
    any_of:
      - range: checksum
      - range: string

  # Mapped to schema.org `url`; may hold several values.
  content_url:
    slot_uri: schema:url
    multivalued: true

  authority:
    description: The organization responsible for publishing the data.
    range: AuthorityType

  checksum algorithm:
    description: The type of cryptographic hash function used to calculate the checksum value.
    range: DigestType

  # Mapped to schema.org `identifier`.
  source id:
    description: The authority specific identifier.
    slot_uri: schema:identifier

  strain:
    description: The genetic variant or subtype of a species or organism.
# Enumerations used as slot ranges in this schema.
enums:
  # Checksum algorithms. Each value is keyed by, and maps via `meaning` to,
  # the corresponding SPDX term.
  DigestType:
    permissible_values:
      spdx:checksumAlgorithm_sha1:
        title: SHA1
        meaning: spdx:checksumAlgorithm_sha1
      spdx:checksumAlgorithm_md5:
        title: MD5
        meaning: spdx:checksumAlgorithm_md5
      spdx:checksumAlgorithm_sha256:
        title: SHA256
        meaning: spdx:checksumAlgorithm_sha256

  # Gene biotypes. Values carry no extra metadata, so they are bare keys.
  BioType:
    permissible_values:
      protein_coding:
      noncoding:

  # Publishing authorities. Values carry no extra metadata.
  AuthorityType:
    permissible_values:
      ENSEMBL:
      NCBI: