introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
22 rows where transcript_id = 25387408
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 140015922 | GT-AG | 0 | 0.0001926482507446 | 148389 | rna-XM_040241685.1 25387408 | 1 | 104625625 | 104774013 | Oryx dammah 59534 | TGG|GTAAGCCTTG...AGTGCCTTGCCT/CCACCGTTCACC...TGCAG|AGA | 1 | 1 | 9.987 |
| 140015923 | GT-AG | 0 | 1.000000099473604e-05 | 79986 | rna-XM_040241685.1 25387408 | 2 | 104545451 | 104625436 | Oryx dammah 59534 | ATG|GTGAGTGAGC...GTGTCCTTCTTC/CAGCGGTCCACG...TCCAG|GGT | 0 | 1 | 14.717 |
| 140015924 | GT-AG | 0 | 1.000000099473604e-05 | 76560 | rna-XM_040241685.1 25387408 | 3 | 104468506 | 104545065 | Oryx dammah 59534 | AAG|GTGAGTCTTC...CTAACTTTAGCC/CAAGCCCTAACT...TGTAG|CGG | 1 | 1 | 24.403 |
| 140015925 | GT-AG | 0 | 1.000000099473604e-05 | 49596 | rna-XM_040241685.1 25387408 | 4 | 104418757 | 104468352 | Oryx dammah 59534 | GAG|GTAGGTCCCC...CCTGCAGTGACT/CAGTGACTGATG...CACAG|GGG | 1 | 1 | 28.252 |
| 140015926 | GT-AG | 0 | 1.000000099473604e-05 | 58815 | rna-XM_040241685.1 25387408 | 5 | 104359834 | 104418648 | Oryx dammah 59534 | AAG|GTAACAGAAT...GTTTCCTCACCT/TGTTTCCTCACC...TACAG|GTT | 1 | 1 | 30.969 |
| 140015927 | GT-AG | 0 | 1.000000099473604e-05 | 36500 | rna-XM_040241685.1 25387408 | 6 | 104323187 | 104359686 | Oryx dammah 59534 | ACG|GTAAGAGCTG...CTGTCTTTCTCT/CTGAGTCTGAAA...TACAG|GGA | 1 | 1 | 34.667 |
| 140015928 | GT-AG | 0 | 1.000000099473604e-05 | 35977 | rna-XM_040241685.1 25387408 | 7 | 104287042 | 104323018 | Oryx dammah 59534 | CCG|GTGAGCCATG...AGATCCTTTCCT/CAGTATTTCACA...TACAG|GAG | 1 | 1 | 38.893 |
| 140015929 | GT-AG | 0 | 1.000000099473604e-05 | 473 | rna-XM_040241685.1 25387408 | 8 | 104286484 | 104286956 | Oryx dammah 59534 | AGG|GTGAGTAGCA...CATCTCTTATCC/TTCTGACTAATA...CACAG|TCC | 2 | 1 | 41.031 |
| 140015930 | GT-AG | 0 | 1.000000099473604e-05 | 723 | rna-XM_040241685.1 25387408 | 9 | 104285686 | 104286408 | Oryx dammah 59534 | CAG|GTGAGTTGAC...AAACTCTTACAT/GAAACTCTTACA...TGCAG|GTC | 2 | 1 | 42.918 |
| 140015931 | GT-AG | 0 | 1.000000099473604e-05 | 124277 | rna-XM_040241685.1 25387408 | 10 | 104161271 | 104285547 | Oryx dammah 59534 | CAG|GTAGGGAAGT...TGAGATTTAACA/TGAGATTTAACA...CCAAG|GGA | 2 | 1 | 46.39 |
| 140015932 | GT-AG | 0 | 1.000000099473604e-05 | 44627 | rna-XM_040241685.1 25387408 | 11 | 104116493 | 104161119 | Oryx dammah 59534 | GTG|GTAAGTGCCC...CCAGCCGTAACC/CCAGCCGTAACC...AGCAG|TGC | 0 | 1 | 50.189 |
| 140015933 | GT-AG | 0 | 1.000000099473604e-05 | 16963 | rna-XM_040241685.1 25387408 | 12 | 104099363 | 104116325 | Oryx dammah 59534 | CGG|GTGAGTCTCT...CCTATTTTATCA/CCCTATTTTATC...TGCAG|CTG | 2 | 1 | 54.39 |
| 140015934 | GT-AG | 0 | 1.000000099473604e-05 | 68582 | rna-XM_040241685.1 25387408 | 13 | 104030592 | 104099173 | Oryx dammah 59534 | TAG|GTATGGGGGG...GCTTCCTCGACC/GCTTCCTCGACC...CACAG|GGA | 2 | 1 | 59.145 |
| 140015935 | GT-AG | 0 | 1.000000099473604e-05 | 3897 | rna-XM_040241685.1 25387408 | 14 | 104026570 | 104030466 | Oryx dammah 59534 | CTG|GTAAGACAGA...GTGACCTTCTTC/GTGGGGCTCACG...CCCAG|GAG | 1 | 1 | 62.289 |
| 140015936 | GT-AG | 0 | 1.000000099473604e-05 | 2900 | rna-XM_040241685.1 25387408 | 15 | 104023565 | 104026464 | Oryx dammah 59534 | CAG|GTGAGCCCCA...CCAACTCTGACC/CCAACTCTGACC...TCCAG|GCT | 1 | 1 | 64.931 |
| 140015937 | GT-AG | 0 | 5.1007705842136206e-05 | 68722 | rna-XM_040241685.1 25387408 | 16 | 103954663 | 104023384 | Oryx dammah 59534 | AAG|GTAAGCCTGC...GACCTTTTGACC/CCTTTACTGAAC...TCCAG|AGA | 1 | 1 | 69.459 |
| 140015938 | GT-AG | 0 | 1.000000099473604e-05 | 30233 | rna-XM_040241685.1 25387408 | 17 | 103924164 | 103954396 | Oryx dammah 59534 | GAG|GTGAGCTCCC...ACTCTCTTCTCT/ACCGTTGTCATC...TCCAG|GCC | 0 | 1 | 76.151 |
| 140015939 | GT-AG | 0 | 0.0004192498553096 | 1486 | rna-XM_040241685.1 25387408 | 18 | 103922544 | 103924029 | Oryx dammah 59534 | GGT|GTACGTATGT...CCCACCTTCCCT/TTCCCTGTCATC...CCCAG|GCT | 2 | 1 | 79.522 |
| 140015940 | GT-AG | 0 | 1.000000099473604e-05 | 113694 | rna-XM_040241685.1 25387408 | 19 | 103808701 | 103922394 | Oryx dammah 59534 | CGG|GTAAGTAGAA...CTTTCTTTGTCT/TGTCTGCTCACC...TCCAG|GAG | 1 | 1 | 83.27 |
| 140015941 | GT-AG | 0 | 1.000000099473604e-05 | 41134 | rna-XM_040241685.1 25387408 | 20 | 103767425 | 103808558 | Oryx dammah 59534 | CAA|GTAAGACATA...CTTTTCTTGTTG/TTTGCTCTGAAG...CACAG|GTT | 2 | 1 | 86.843 |
| 140015942 | GT-AG | 0 | 1.000000099473604e-05 | 1768 | rna-XM_040241685.1 25387408 | 21 | 103765556 | 103767323 | Oryx dammah 59534 | AAG|GTAGGTGACC...CGTCCCGTGATC/CCTTTTCCTACC...CCCAG|AGA | 1 | 1 | 89.384 |
| 140015943 | GT-AG | 0 | 6.311099669034081e-05 | 14786 | rna-XM_040241685.1 25387408 | 22 | 103750586 | 103765371 | Oryx dammah 59534 | CAG|GTACGCGGGC...GACCCTTTGACC/TCCAGCTTCATC...TCCAG|GAA | 2 | 1 | 94.013 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per annotated intron.
-- Boolean-like flags (is_minor, in_cds) are stored as INTEGER 1/0.
-- "start" and "end" stay quoted: END is an SQL keyword.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron (e.g. GT-AG)
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1, or 2; NULL for introns outside of the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns": the two foreign-key columns
-- first, then the remaining indexed attribute columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");