introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
28 rows where transcript_id = 25387379
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 140015305 | GT-AG | 0 | 1.000000099473604e-05 | 50454 | rna-XM_040238476.1 25387379 | 1 | 25181520 | 25231973 | Oryx dammah 59534 | CTG|GTAAATGCCT...GGACTCATACTG/CTCATACTGATC...CACAG|AGC | 0 | 1 | 1.191 |
| 140015306 | GT-AG | 0 | 1.000000099473604e-05 | 27351 | rna-XM_040238476.1 25387379 | 2 | 25154041 | 25181391 | Oryx dammah 59534 | CAA|GTAAGTCCTG...TGTTTTTTCTCC/TTGGTGGTAATG...CCCAG|GAG | 2 | 1 | 3.611 |
| 140015307 | GT-AG | 0 | 0.0004128722644111 | 47285 | rna-XM_040238476.1 25387379 | 3 | 25106710 | 25153994 | Oryx dammah 59534 | GTG|GTAAGCATTA...TTTCTTTTAACC/TTTCTTTTAACC...TCCAG|GAC | 0 | 1 | 4.481 |
| 140015308 | GT-AG | 0 | 1.000000099473604e-05 | 60802 | rna-XM_040238476.1 25387379 | 4 | 25045671 | 25106472 | Oryx dammah 59534 | CAA|GTAAGTGCCA...ATCCCTTTAGCA/AAATTACACATC...GTTAG|ATT | 0 | 1 | 8.962 |
| 140015309 | GT-AG | 0 | 1.000000099473604e-05 | 15595 | rna-XM_040238476.1 25387379 | 5 | 25029949 | 25045543 | Oryx dammah 59534 | AAT|GTAAGACACT...TGTGCTTTAAGA/TTTTGTATCAAA...TCTAG|TGG | 1 | 1 | 11.363 |
| 140015310 | GT-AG | 0 | 1.000000099473604e-05 | 4954 | rna-XM_040238476.1 25387379 | 6 | 25024920 | 25029873 | Oryx dammah 59534 | TGT|GTAAGTAAAC...CTGTGTTTGATT/CTGTGTTTGATT...TGTAG|ATC | 1 | 1 | 12.781 |
| 140015311 | GT-AG | 0 | 1.000000099473604e-05 | 9843 | rna-XM_040238476.1 25387379 | 7 | 25014919 | 25024761 | Oryx dammah 59534 | AAG|GTGAGCCCAT...TTTCCGTTGTCT/CTCCGTCTCACT...TGCAG|ATC | 0 | 1 | 15.769 |
| 140015312 | GT-AG | 0 | 1.000000099473604e-05 | 3707 | rna-XM_040238476.1 25387379 | 8 | 25011100 | 25014806 | Oryx dammah 59534 | GAG|GTAATGGTGT...ATTGCATTGATG/ATTGCATTGATG...CACAG|GTT | 1 | 1 | 17.886 |
| 140015313 | GT-AG | 0 | 1.000000099473604e-05 | 13358 | rna-XM_040238476.1 25387379 | 9 | 24997603 | 25010960 | Oryx dammah 59534 | CAG|GTCAGTTACA...TTGGCATTATTG/CTTCTACTCAGA...AACAG|TGA | 2 | 1 | 20.514 |
| 140015314 | GT-AG | 0 | 1.000000099473604e-05 | 4903 | rna-XM_040238476.1 25387379 | 10 | 24992649 | 24997551 | Oryx dammah 59534 | TCG|GTACGTAAAT...TCTGCCCTGATG/TGATGACTCACC...TGTAG|GTG | 2 | 1 | 21.479 |
| 140015315 | GT-AG | 0 | 0.001070472101085 | 1304 | rna-XM_040238476.1 25387379 | 11 | 24991140 | 24992443 | Oryx dammah 59534 | CCG|GTAACTGTGA...GTCTCCTTTCTT/TTGCCTATGAGT...TCCAG|TGT | 0 | 1 | 25.355 |
| 140015316 | GT-AG | 0 | 0.0007043738848701 | 2064 | rna-XM_040238476.1 25387379 | 12 | 24988928 | 24990991 | Oryx dammah 59534 | AAG|GTAACTTGAT...TCTTTTTTGTCT/CTGGTTCTAACC...CTTAG|AAA | 1 | 1 | 28.153 |
| 140015317 | GT-AG | 0 | 0.0003057712281285 | 20190 | rna-XM_040238476.1 25387379 | 13 | 24968653 | 24988842 | Oryx dammah 59534 | CTC|GTAAGTTTTC...GTCCTCTTGTTT/GGGCTTCTCATC...TGCAG|GTT | 2 | 1 | 29.76 |
| 140015318 | GT-AG | 0 | 1.000000099473604e-05 | 7274 | rna-XM_040238476.1 25387379 | 14 | 24961077 | 24968350 | Oryx dammah 59534 | GAG|GTAAGAAGGG...CTGGCCTTGATG/ATGGGTGTCATC...CACAG|GTG | 1 | 1 | 35.47 |
| 140015319 | GT-AG | 0 | 1.000000099473604e-05 | 42013 | rna-XM_040238476.1 25387379 | 15 | 24918934 | 24960946 | Oryx dammah 59534 | AAG|GTAAGGGGTG...CTTCCTCTGATT/CTTCCTCTGATT...CACAG|GTG | 2 | 1 | 37.928 |
| 140015320 | GT-AG | 0 | 1.000000099473604e-05 | 15131 | rna-XM_040238476.1 25387379 | 16 | 24903592 | 24918722 | Oryx dammah 59534 | CCG|GTGAGTTCTA...TTTCTCTTCCTC/TACTCTCTTATG...CCCAG|TGT | 0 | 1 | 41.917 |
| 140015321 | GT-AG | 0 | 0.0002430622222946 | 6025 | rna-XM_040238476.1 25387379 | 17 | 24897387 | 24903411 | Oryx dammah 59534 | GAG|GTATGTGTGC...TTGGCCTTTCTT/TCTGCATTTACA...ACCAG|TGT | 0 | 1 | 45.32 |
| 140015322 | GT-AG | 0 | 1.000000099473604e-05 | 1360 | rna-XM_040238476.1 25387379 | 18 | 24895873 | 24897232 | Oryx dammah 59534 | CAA|GTGAGTACGT...TTCTCTTTCTCC/TCTTTCTCCATC...TCCAG|GGC | 1 | 1 | 48.232 |
| 140015323 | GT-AG | 0 | 1.000000099473604e-05 | 21690 | rna-XM_040238476.1 25387379 | 19 | 24873057 | 24894746 | Oryx dammah 59534 | CAG|GTGAGTTTTG...CATTTCTTCTCT/ACTGACCTGACC...TCCAG|GAT | 2 | 1 | 69.522 |
| 140015324 | GT-AG | 0 | 1.000000099473604e-05 | 22226 | rna-XM_040238476.1 25387379 | 20 | 24850703 | 24872928 | Oryx dammah 59534 | CAG|GTAATGTGAA...GTGCCCAAAGCC/CCCCATCTAATA...CTCAG|GAA | 1 | 1 | 71.942 |
| 140015325 | GT-AG | 0 | 1.000000099473604e-05 | 9326 | rna-XM_040238476.1 25387379 | 21 | 24841248 | 24850573 | Oryx dammah 59534 | CAG|GTAAGAAATG...GTCACCTGAATG/TGGTGGCTGATG...CCTAG|GTG | 1 | 1 | 74.381 |
| 140015326 | GT-AG | 0 | 0.000204292839152 | 4062 | rna-XM_040238476.1 25387379 | 22 | 24837006 | 24841067 | Oryx dammah 59534 | TAG|GTAAACACCA...TATGCTTTAACC/TATGCTTTAACC...CACAG|AGC | 1 | 1 | 77.784 |
| 140015327 | GT-AG | 0 | 1.000000099473604e-05 | 48017 | rna-XM_040238476.1 25387379 | 23 | 24788854 | 24836870 | Oryx dammah 59534 | TTG|GTGAGTCCAA...GTGTCCTTTTTG/GCTGTATTCATG...TCTAG|GCT | 1 | 1 | 80.337 |
| 140015328 | GT-AG | 0 | 1.000000099473604e-05 | 2057 | rna-XM_040238476.1 25387379 | 24 | 24786584 | 24788640 | Oryx dammah 59534 | AAG|GTAAGAAACC...ACCTTCTTGTCA/CTTCTTGTCACC...GACAG|ATT | 1 | 1 | 84.364 |
| 140015329 | GT-AG | 0 | 1.000000099473604e-05 | 3162 | rna-XM_040238476.1 25387379 | 25 | 24783241 | 24786402 | Oryx dammah 59534 | CCG|GTGAGTGCAC...CAAGGCTTGACC/TTTGCACTAATC...CCCAG|GTG | 2 | 1 | 87.786 |
| 140015330 | GT-AG | 0 | 1.000000099473604e-05 | 34448 | rna-XM_040238476.1 25387379 | 26 | 24748585 | 24783032 | Oryx dammah 59534 | CAG|GTAAGACAGC...GTCACCTTTTTC/ATGTATGTCACC...CCCAG|TGC | 0 | 1 | 91.719 |
| 140015331 | GT-AG | 0 | 1.000000099473604e-05 | 781 | rna-XM_040238476.1 25387379 | 27 | 24747694 | 24748474 | Oryx dammah 59534 | GAG|GTAAGAGAAA...CAGACCCTAACC/CAGACCCTAACC...CACAG|GCC | 2 | 1 | 93.798 |
| 140015332 | GT-AG | 0 | 0.0304206362330483 | 1612 | rna-XM_040238476.1 25387379 | 28 | 24745861 | 24747472 | Oryx dammah 59534 | ACA|GTATGTTCCA...ATCTCCTTTCTG/CTGTTTCGCATC...CCCAG|CGG | 1 | 1 | 97.977 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron: its classification as minor or not, its length and
-- genomic coordinates, and its placement within the parent transcript.
CREATE TABLE "introns" (
    "id"                 INTEGER,  -- unique identifier for the intron (primary key)
    "dinucleotide_pair"  TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"           INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"              REAL,     -- probability (0-100%) of the intron being minor
    "length"             INTEGER,  -- intron length in base pairs
    "transcript_id"      INTEGER,  -- parent transcript
    "ordinal_index"      INTEGER,  -- ordinal position of the intron within the transcript
    "start"              INTEGER,  -- start position of the intron in the genome
    "end"                INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"        INTEGER,  -- NCBI taxonomy identifier of the species
    "scored_motifs"      TEXT,     -- motifs scored for the intron
    "phase"              INTEGER,  -- 0, 1, or 2; NULL for introns outside the coding sequence
    "in_cds"             INTEGER,  -- 1 if within the coding sequence, 0 otherwise
    "relative_position"  REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column indexes on "introns".

-- Columns that reference other tables (transcripts, genomes).
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");

-- Attribute columns of the intron itself.
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");