introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
25 rows where transcript_id = 25387421
This data as json, CSV (advanced)
Suggested facets: score, length, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 140016206 | GT-AG | 0 | 1.000000099473604e-05 | 1050 | rna-XM_040243925.1 25387421 | 1 | 73815738 | 73816787 | Oryx dammah 59534 | GAG|GTGGGCGAGC...ATGTCTGTGATG/CTCCCTCTCATT...TACAG|GTG | 0 | 1 | 1.569 |
| 140016207 | GT-AG | 0 | 1.0400255106308554e-05 | 87 | rna-XM_040243925.1 25387421 | 2 | 73815444 | 73815530 | Oryx dammah 59534 | CAG|GTACTGTTGG...CTCTCCTGCACC/CTGAGGCTGAAG...TACAG|GTA | 0 | 1 | 7.585 |
| 140016208 | GT-AG | 0 | 1.000000099473604e-05 | 1613 | rna-XM_040243925.1 25387421 | 3 | 73813714 | 73815326 | Oryx dammah 59534 | GAG|GTAAGTCAAG...CTGTCTCTGTCC/ATATGTGTCACT...TGCAG|CTG | 0 | 1 | 10.985 |
| 140016209 | GT-AG | 0 | 1.000000099473604e-05 | 325 | rna-XM_040243925.1 25387421 | 4 | 73813209 | 73813533 | Oryx dammah 59534 | AGG|GTAAGATCCA...CTTCTCCTGACC/CTTCTCCTGACC...TCCAG|GAG | 0 | 1 | 16.216 |
| 140016210 | GT-AG | 0 | 1.000000099473604e-05 | 242 | rna-XM_040243925.1 25387421 | 5 | 73812798 | 73813039 | Oryx dammah 59534 | ACG|GTGGGAGGCA...AGGGTCTTAGCA/CTTAGCATCACC...CCCAG|GGA | 1 | 1 | 21.128 |
| 140016211 | GT-AG | 0 | 1.000000099473604e-05 | 87 | rna-XM_040243925.1 25387421 | 6 | 73812576 | 73812662 | Oryx dammah 59534 | ATG|GTGAGTAGAC...TTTCTCTTTCCT/TCTCCTCTCACG...CACAG|GTA | 1 | 1 | 25.051 |
| 140016212 | GT-AG | 0 | 1.000000099473604e-05 | 88 | rna-XM_040243925.1 25387421 | 7 | 73812324 | 73812411 | Oryx dammah 59534 | AAG|GTGAGCTGGA...TGGCTCTGAACT/CTGGCTCTGAAC...CTCAG|GGC | 0 | 1 | 29.817 |
| 140016213 | GT-AG | 0 | 1.000000099473604e-05 | 205 | rna-XM_040243925.1 25387421 | 8 | 73811998 | 73812202 | Oryx dammah 59534 | TGG|GTGAGGCAGC...TTCCTTCTGACA/TTCCTTCTGACA...TTCAG|CCA | 1 | 1 | 33.333 |
| 140016214 | GT-AG | 0 | 1.000000099473604e-05 | 311 | rna-XM_040243925.1 25387421 | 9 | 73811628 | 73811938 | Oryx dammah 59534 | CTG|GTGAGTAGGG...CCAGCCCTGACT/CCAGCCCTGACT...CCCAG|CCG | 0 | 1 | 35.048 |
| 140016215 | GT-AG | 0 | 0.0010534879831941 | 192 | rna-XM_040243925.1 25387421 | 10 | 73811334 | 73811525 | Oryx dammah 59534 | CAG|GTACCAGTTG...GGTTCCTTGCTT/GGTGGTCTCACA...CCCAG|GTG | 0 | 1 | 38.012 |
| 140016216 | GT-AG | 0 | 1.000000099473604e-05 | 172 | rna-XM_040243925.1 25387421 | 11 | 73811046 | 73811217 | Oryx dammah 59534 | GCA|GTGAGTTTCA...CAGTACTTGATG/CAGTACTTGATG...CCCAG|CAT | 2 | 1 | 41.383 |
| 140016217 | GT-AG | 0 | 1.000000099473604e-05 | 157 | rna-XM_040243925.1 25387421 | 12 | 73810711 | 73810867 | Oryx dammah 59534 | GAG|GTGAGGTGGG...GGCACTTGGACT/CTTGGACTGAGC...TGCAG|TGG | 0 | 1 | 46.556 |
| 140016218 | GT-AG | 0 | 1.000000099473604e-05 | 169 | rna-XM_040243925.1 25387421 | 13 | 73810419 | 73810587 | Oryx dammah 59534 | GAG|GTGAGCAGCT...CCTTCCTTGTTG/TCCTTGTTGATC...CCTAG|GCC | 0 | 1 | 50.131 |
| 140016219 | GT-AG | 0 | 1.000000099473604e-05 | 150 | rna-XM_040243925.1 25387421 | 14 | 73810120 | 73810269 | Oryx dammah 59534 | ACT|GTGAGTGTTA...TGCCCCATACTC/CAGTGCCCCATA...TCTAG|CCA | 2 | 1 | 54.461 |
| 140016220 | GT-AG | 0 | 1.000000099473604e-05 | 247 | rna-XM_040243925.1 25387421 | 15 | 73809797 | 73810043 | Oryx dammah 59534 | GAG|GTGAGGGCCC...GCCCTCCTGATT/GCCCTCCTGATT...CTCAG|ACC | 0 | 1 | 56.67 |
| 140016221 | GT-AG | 0 | 1.000000099473604e-05 | 110 | rna-XM_040243925.1 25387421 | 16 | 73809546 | 73809655 | Oryx dammah 59534 | GAG|GTCAGGAGCA...TCCTCCTCAGCC/CTCCTCCTCAGC...CACAG|GTG | 0 | 1 | 60.767 |
| 140016222 | GT-AG | 0 | 1.000000099473604e-05 | 82 | rna-XM_040243925.1 25387421 | 17 | 73809346 | 73809427 | Oryx dammah 59534 | CTG|GTGAGGGAGC...CGCTCTATACCC/TGTAGACTGAGG...CACAG|TGG | 1 | 1 | 64.196 |
| 140016223 | GT-AG | 0 | 1.000000099473604e-05 | 90 | rna-XM_040243925.1 25387421 | 18 | 73809101 | 73809190 | Oryx dammah 59534 | AAG|GTTAGGCGGG...GGTGCCCCATCT/CCATCTCCCATC...AACAG|GAT | 0 | 1 | 68.701 |
| 140016224 | GT-AG | 0 | 1.000000099473604e-05 | 409 | rna-XM_040243925.1 25387421 | 19 | 73808528 | 73808936 | Oryx dammah 59534 | TGG|GTAGGGCCAC...TGCGCCTCACCG/CTGCGCCTCACC...CACAG|GCT | 2 | 1 | 73.467 |
| 140016225 | GT-AG | 0 | 1.000000099473604e-05 | 225 | rna-XM_040243925.1 25387421 | 20 | 73808150 | 73808374 | Oryx dammah 59534 | CAG|GTGATGCCCT...GGGCCCCTGACA/ACTTTGCTCACT...CTCAG|CTC | 2 | 1 | 77.913 |
| 140016226 | GT-AG | 0 | 1.000000099473604e-05 | 749 | rna-XM_040243925.1 25387421 | 21 | 73807303 | 73808051 | Oryx dammah 59534 | CTG|GTAAGTGGTA...CCCCTTCTAATT/CCCCTTCTAATT...CACAG|CGG | 1 | 1 | 80.761 |
| 140016227 | GT-AG | 0 | 0.001595118689476 | 123 | rna-XM_040243925.1 25387421 | 22 | 73807055 | 73807177 | Oryx dammah 59534 | CAG|GTTTCATTGC...CAGGTCTGACCT/TCAGGTCTGACC...CTTAG|ATC | 0 | 1 | 84.394 |
| 140016228 | GT-AG | 0 | 1.000000099473604e-05 | 376 | rna-XM_040243925.1 25387421 | 23 | 73806589 | 73806964 | Oryx dammah 59534 | AGG|GTAAGCCCCT...GTTTCCATCTCC/CCAGTTTCCATC...TTCAG|ACC | 0 | 1 | 87.01 |
| 140016229 | GT-AG | 0 | 1.000000099473604e-05 | 115 | rna-XM_040243925.1 25387421 | 24 | 73806279 | 73806393 | Oryx dammah 59534 | AGG|GTAGGTCCTT...AAGTCTTTTTCC/TTGGCTCTCAGG...CCTAG|GAG | 0 | 1 | 92.677 |
| 140016230 | GT-AG | 0 | 1.000000099473604e-05 | 177 | rna-XM_040243925.1 25387421 | 25 | 73806000 | 73806176 | Oryx dammah 59534 | AAG|GTGAGCTGGC...ATGTCTTTGGCT/ATGCCTTTCATG...CCCAG|GCC | 0 | 1 | 95.641 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, linked to its parent transcript and to the
-- genome (species) it belongs to.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron (primary key)
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron, e.g. GT-AG
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- length of the intron in base pairs
    "transcript_id"     INTEGER,  -- parent transcript; references transcripts(id)
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier; references genomes(taxonomy_id)
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; null for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 if not (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on introns, one per indexed column.
-- The two foreign-key columns come first, then the remaining indexed columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");