introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
22 rows where transcript_id = 5981961
This data as json, CSV (advanced)
Suggested facets: dinucleotide_pair, score, phase, in_cds
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 30724593 | GT-AG | 0 | 1.000000099473604e-05 | 27306 | rna-XM_025882227.1 5981961 | 2 | 19523969 | 19551274 | Callorhinus ursinus 34884 | AAA|GTAAGTTAGT...TGAAATTTAATT/ATTAAACTGACT...AAAAG|GTT | 0 | 1 | 5.746 |
| 30724594 | GT-AG | 0 | 1.000000099473604e-05 | 723 | rna-XM_025882227.1 5981961 | 3 | 19522756 | 19523478 | Callorhinus ursinus 34884 | AAG|GTAATATATC...CTCTTTTTATTA/TCTCTTTTTATT...ACTAG|TTT | 1 | 1 | 16.29 |
| 30724595 | GT-AG | 0 | 1.000000099473604e-05 | 8688 | rna-XM_025882227.1 5981961 | 4 | 19513342 | 19522029 | Callorhinus ursinus 34884 | CAG|GTAATTATCA...AATACCTCAAAT/GAATACCTCAAA...ACCAG|ATA | 1 | 1 | 31.913 |
| 30724596 | GT-AG | 0 | 1.000000099473604e-05 | 2995 | rna-XM_025882227.1 5981961 | 5 | 19510143 | 19513137 | Callorhinus ursinus 34884 | AAG|GTAAGACACT...TTTTTCTTATCA/GTTTTTCTTATC...TCTAG|GAA | 1 | 1 | 36.303 |
| 30724597 | GT-AG | 0 | 0.0002213786532684 | 4273 | rna-XM_025882227.1 5981961 | 6 | 19505706 | 19509978 | Callorhinus ursinus 34884 | GTT|GTAAGTAATC...GATTTCTTAATA/AGATTTCTTAAT...AACAG|GTG | 0 | 1 | 39.832 |
| 30724598 | GT-AG | 0 | 1.000000099473604e-05 | 2084 | rna-XM_025882227.1 5981961 | 7 | 19503460 | 19505543 | Callorhinus ursinus 34884 | GAA|GTAAGTGGTA...ATATTTTTATAT/TGTTTTCTCATG...CTTAG|AGC | 0 | 1 | 43.318 |
| 30724599 | GT-AG | 0 | 0.0008795072441871 | 383 | rna-XM_025882227.1 5981961 | 8 | 19503000 | 19503382 | Callorhinus ursinus 34884 | ACA|GTAAGTTCTT...GAACTTTTAACC/CAGCTACTTACC...ATAAG|GTG | 2 | 1 | 44.975 |
| 30724600 | GC-AG | 0 | 1.000000099473604e-05 | 1208 | rna-XM_025882227.1 5981961 | 9 | 19501566 | 19502773 | Callorhinus ursinus 34884 | CAG|GCAAGTGAAA...CATTTTTTAAAA/TTAAAACTAATT...TACAG|TTT | 0 | 1 | 49.839 |
| 30724601 | GT-AG | 0 | 1.000000099473604e-05 | 1142 | rna-XM_025882227.1 5981961 | 10 | 19500190 | 19501331 | Callorhinus ursinus 34884 | AAG|GTAAAGTAAG...TCTTCCTTAGCA/TTTGTTTTAATT...TATAG|GGC | 0 | 1 | 54.874 |
| 30724602 | GT-AG | 0 | 0.022875126257637 | 1907 | rna-XM_025882227.1 5981961 | 11 | 19498191 | 19500097 | Callorhinus ursinus 34884 | AAG|GTATTTATTT...TTTATTTTAACT/TTTATTTTAACT...TCCAG|TGA | 2 | 1 | 56.854 |
| 30724603 | GT-AG | 0 | 0.0004995947567907 | 1050 | rna-XM_025882227.1 5981961 | 12 | 19497013 | 19498062 | Callorhinus ursinus 34884 | CAG|GTATAGTCTT...CTGTCTTTACTC/TCTGTCTTTACT...TACAG|GGG | 1 | 1 | 59.608 |
| 30724604 | GT-AG | 0 | 0.0011487090859558 | 213 | rna-XM_025882227.1 5981961 | 13 | 19496645 | 19496857 | Callorhinus ursinus 34884 | AAG|GTAACTTAAT...GAGACTTTGATA/TTATTGTTAATA...TCTAG|GCT | 0 | 1 | 62.944 |
| 30724605 | GT-AG | 0 | 1.000000099473604e-05 | 9086 | rna-XM_025882227.1 5981961 | 14 | 19487424 | 19496509 | Callorhinus ursinus 34884 | CCT|GTAAGTGACT...TTTGTTTTATAC/TTTTGTTTTATA...TAAAG|GGA | 0 | 1 | 65.849 |
| 30724606 | GT-AG | 0 | 1.000000099473604e-05 | 1068 | rna-XM_025882227.1 5981961 | 15 | 19486161 | 19487228 | Callorhinus ursinus 34884 | AAG|GTAAGATAGT...TGTATTTTAATT/TGTATTTTAATT...TACAG|GTG | 0 | 1 | 70.045 |
| 30724607 | GT-AG | 0 | 2.746892040083628e-05 | 2200 | rna-XM_025882227.1 5981961 | 16 | 19483778 | 19485977 | Callorhinus ursinus 34884 | CAG|GTACAATTTT...TGACCTTGGATT/TCTGTTTCTATT...GTTAG|GAG | 0 | 1 | 73.983 |
| 30724608 | GT-AG | 0 | 4.640692336840628e-05 | 4778 | rna-XM_025882227.1 5981961 | 17 | 19478783 | 19483560 | Callorhinus ursinus 34884 | CAA|GTAAGCTAAT...CTTTCTGTACTT/AACGATCTCACT...TTCAG|ATG | 1 | 1 | 78.653 |
| 30724609 | GT-AG | 0 | 1.122930494788249e-05 | 2723 | rna-XM_025882227.1 5981961 | 18 | 19475913 | 19478635 | Callorhinus ursinus 34884 | ATG|GTAAGGTTTT...ACTCTCTTATTT/TATTTTCTGATA...ATTAG|ATG | 1 | 1 | 81.816 |
| 30724610 | GT-AG | 0 | 1.000000099473604e-05 | 7519 | rna-XM_025882227.1 5981961 | 19 | 19468251 | 19475769 | Callorhinus ursinus 34884 | CAG|GTAATTGGTT...TATTTCTTGAAA/ATTGAGTTTATC...TGTAG|GTT | 0 | 1 | 84.893 |
| 30724611 | GT-AG | 0 | 1.000000099473604e-05 | 523 | rna-XM_025882227.1 5981961 | 20 | 19467524 | 19468046 | Callorhinus ursinus 34884 | AGG|GTAAGTACTG...TACTTGTTAAGT/GTTAGAGTCACT...CTCAG|AAT | 0 | 1 | 89.283 |
| 30724612 | GT-AG | 0 | 5.30483114516856e-05 | 2319 | rna-XM_025882227.1 5981961 | 21 | 19465087 | 19467405 | Callorhinus ursinus 34884 | CTG|GTATGTGACT...TCTGCTCTAACT/ATCTGTTTCATA...CCTAG|GAG | 1 | 1 | 91.823 |
| 30724613 | GT-AG | 0 | 1.000000099473604e-05 | 363 | rna-XM_025882227.1 5981961 | 22 | 19464621 | 19464983 | Callorhinus ursinus 34884 | ACT|GTGAGTATGA...ATTTGCTTATTT/CATTTGCTTATT...TTCAG|TTA | 2 | 1 | 94.039 |
| 30725068 | GT-AG | 0 | 1.000000099473604e-05 | 63063 | rna-XM_025882227.1 5981961 | 1 | 19551416 | 19614478 | Callorhinus ursinus 34884 | CAG|GTAAGTCCTA...ATTTCCATGGCT/AATGAGTTCATT...AATAG|GAA |  | 0 | 3.163 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, including its minor-intron classification,
-- genomic coordinates and position within the parent transcript.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences, e.g. 'GT-AG'
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100 %) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript (transcripts.id)
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier (genomes.taxonomy_id)
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Index on introns.transcript_id, the foreign key to transcripts.id.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
-- Index on introns.taxonomy_id, the foreign key to genomes.taxonomy_id.
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
-- Index on introns.phase (0, 1, 2 or NULL).
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
-- Index on the introns.is_minor flag (1 = minor intron, 0 = not).
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
-- Index on introns.dinucleotide_pair (terminal dinucleotides, e.g. 'GT-AG').
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
-- Index on introns.score (minor-intron probability).
CREATE INDEX "idx_introns_score" ON "introns" ("score");
-- Index on the introns.in_cds flag (1 = within coding sequence, 0 = not).
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");