introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron in the coding sequence (0, 1, or 2; NULL for introns outside the coding sequence)
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
36 rows where transcript_id = 25387382
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 140015399 | GT-AG | 0 | 7.231706337680873e-05 | 1222 | rna-XM_040226774.1 25387382 | 3 | 61388208 | 61389429 | Oryx dammah 59534 | GAG|GTAGGCCTGT...GCTGCCTTCACC/GCTGCCTTCACC...TTCAG|GTG | 0 | 1 | 6.959 |
| 140015400 | GT-AG | 0 | 1.000000099473604e-05 | 2980 | rna-XM_040226774.1 25387382 | 4 | 61389621 | 61392600 | Oryx dammah 59534 | CAG|GTAGGTCCTG...TTTTCCTCTGCT/GTAGGGGTCAGT...CTCAG|GGA | 2 | 1 | 10.661 |
| 140015401 | GT-AG | 0 | 1.000000099473604e-05 | 1245 | rna-XM_040226774.1 25387382 | 5 | 61392690 | 61393934 | Oryx dammah 59534 | TTG|GTGAGCCTGT...CTCACCTTGACT/TCTGACCTCACC...TCTAG|TTC | 1 | 1 | 12.386 |
| 140015402 | GT-AG | 0 | 1.000000099473604e-05 | 1011 | rna-XM_040226774.1 25387382 | 6 | 61394045 | 61395055 | Oryx dammah 59534 | ATG|GTGAGAATTT...GATACCATAGCC/GGGGTGTTGATA...TTTAG|GAA | 0 | 1 | 14.518 |
| 140015403 | GT-AG | 0 | 2.4459090351450707e-05 | 107 | rna-XM_040226774.1 25387382 | 7 | 61395185 | 61395291 | Oryx dammah 59534 | CAA|GTAGGCGTCC...TCGTTCTCACAG/CTCGTTCTCACA...CACAG|ACC | 0 | 1 | 17.019 |
| 140015404 | GT-AG | 0 | 1.000000099473604e-05 | 119 | rna-XM_040226774.1 25387382 | 8 | 61395403 | 61395521 | Oryx dammah 59534 | AAA|GTGAGCTTGC...GGTGCCTTGTCA/GAGTCGCTCACT...TCTAG|CTA | 0 | 1 | 19.17 |
| 140015405 | GT-AG | 0 | 1.000000099473604e-05 | 1917 | rna-XM_040226774.1 25387382 | 9 | 61395618 | 61397534 | Oryx dammah 59534 | ATG|GTGAGTGGTT...CTGACCTTGGAG/CCCTGCTCCATC...CGCAG|ATC | 0 | 1 | 21.031 |
| 140015406 | GT-AG | 0 | 1.000000099473604e-05 | 1743 | rna-XM_040226774.1 25387382 | 10 | 61397699 | 61399441 | Oryx dammah 59534 | CAG|GTCAGTGGCT...TGTGTCTGGACA/CATGGTCCAATG...CCCAG|TGA | 2 | 1 | 24.21 |
| 140015407 | GT-AG | 0 | 1.000000099473604e-05 | 4849 | rna-XM_040226774.1 25387382 | 11 | 61399562 | 61404410 | Oryx dammah 59534 | CTG|GTACAGCAGG...TGAATTTTACTC/ATTTTACTCAAG...CCCAG|TGA | 2 | 1 | 26.536 |
| 140015408 | GT-AG | 0 | 1.000000099473604e-05 | 2228 | rna-XM_040226774.1 25387382 | 12 | 61404491 | 61406718 | Oryx dammah 59534 | TCG|GTGAGTGAGG...TTTTCCCTACCC/GAGCTGCTGATG...CGGAG|ACA | 1 | 1 | 28.087 |
| 140015409 | GT-AG | 0 | 1.000000099473604e-05 | 1683 | rna-XM_040226774.1 25387382 | 13 | 61406808 | 61408490 | Oryx dammah 59534 | AGG|GTGGGTGTCC...TCAGCCTAAGCC/ATCAGCCTAAGC...TCCAG|AAG | 0 | 1 | 29.812 |
| 140015410 | GT-AG | 0 | 1.000000099473604e-05 | 1100 | rna-XM_040226774.1 25387382 | 14 | 61408614 | 61409713 | Oryx dammah 59534 | GAC|GTGCGTAACT...TGACACTTAAAG/TTGACACTTAAA...CACAG|AAA | 0 | 1 | 32.196 |
| 140015411 | GT-AG | 0 | 1.000000099473604e-05 | 813 | rna-XM_040226774.1 25387382 | 15 | 61409888 | 61410700 | Oryx dammah 59534 | CAG|GTGTGGCCCC...CTGCTTCTATCC/TGGTGACTCACA...GCCAG|GCC | 0 | 1 | 35.569 |
| 140015412 | GT-AG | 0 | 1.000000099473604e-05 | 1058 | rna-XM_040226774.1 25387382 | 16 | 61410817 | 61411874 | Oryx dammah 59534 | CAG|GTAGGCAGAC...CTCCCATTGACA/AGTACTTTCATC...TCCAG|GTA | 2 | 1 | 37.817 |
| 140015413 | GT-AG | 0 | 1.000000099473604e-05 | 1626 | rna-XM_040226774.1 25387382 | 17 | 61412002 | 61413627 | Oryx dammah 59534 | CAG|GTATGGAAAG...GTGTTTTTGCCT/TGCATATTCAGT...CGTAG|AAC | 0 | 1 | 40.279 |
| 140015414 | GT-AG | 0 | 0.0002417603885484 | 128 | rna-XM_040226774.1 25387382 | 18 | 61413668 | 61413795 | Oryx dammah 59534 | CAG|GTAACATTTT...TGTCTCTTCCTG/TTGGGGCTGATC...AACAG|AAC | 1 | 1 | 41.054 |
| 140015415 | GT-AG | 0 | 1.000000099473604e-05 | 1237 | rna-XM_040226774.1 25387382 | 19 | 61414245 | 61415481 | Oryx dammah 59534 | GAG|GTAGGCCAGC...AAAGTCTTGTTT/AGTCTGTTCAAT...CTTAG|GTC | 0 | 1 | 49.758 |
| 140015416 | GT-AG | 0 | 1.000000099473604e-05 | 2595 | rna-XM_040226774.1 25387382 | 20 | 61415709 | 61418303 | Oryx dammah 59534 | ACA|GTGAGTGAAA...TGACCCTCACTG/CTGACCCTCACT...CTCAG|GCT | 2 | 1 | 54.158 |
| 140015417 | GT-AG | 0 | 1.000000099473604e-05 | 1368 | rna-XM_040226774.1 25387382 | 21 | 61418480 | 61419847 | Oryx dammah 59534 | CAG|GTACTGTGGC...AGGACCTCAGCC/GAGGACCTCAGC...TTCAG|CTG | 1 | 1 | 57.569 |
| 140015418 | GT-AG | 0 | 1.000000099473604e-05 | 901 | rna-XM_040226774.1 25387382 | 22 | 61420029 | 61420929 | Oryx dammah 59534 | GAA|GTAAGGGTCT...ACCACCCTGCCC/GCCCAGGTCACC...CCCAG|GCT | 2 | 1 | 61.078 |
| 140015419 | GT-AG | 0 | 1.000000099473604e-05 | 625 | rna-XM_040226774.1 25387382 | 23 | 61421077 | 61421701 | Oryx dammah 59534 | CAG|GTGGGAGCCA...TGGCTTTTATTT/ATGGCTTTTATT...TTCAG|ATT | 2 | 1 | 63.927 |
| 140015420 | GT-AG | 0 | 1.000000099473604e-05 | 190 | rna-XM_040226774.1 25387382 | 24 | 61421847 | 61422036 | Oryx dammah 59534 | CAG|GTAAGTAGGC...CACTCCTTTACT/CACTCCTTTACT...TTAAG|GCT | 0 | 1 | 66.738 |
| 140015421 | GT-AG | 0 | 1.000000099473604e-05 | 1204 | rna-XM_040226774.1 25387382 | 25 | 61422154 | 61423357 | Oryx dammah 59534 | GAG|GTAGGACAGA...AATCTCTGAACC/AAATCTCTGAAC...TCTAG|GTG | 0 | 1 | 69.006 |
| 140015422 | GT-AG | 0 | 1.000000099473604e-05 | 1188 | rna-XM_040226774.1 25387382 | 26 | 61423457 | 61424644 | Oryx dammah 59534 | CAA|GTAAGTGTTC...TTTTCCTCCATG/TTTTCCTCCATG...ACTAG|GTA | 0 | 1 | 70.925 |
| 140015423 | GT-AG | 0 | 1.000000099473604e-05 | 1608 | rna-XM_040226774.1 25387382 | 27 | 61424765 | 61426372 | Oryx dammah 59534 | CCC|GTAAGGAATG...GCCTCCCTGACA/GCCTCCCTGACA...TGCAG|GAC | 0 | 1 | 73.251 |
| 140015424 | GT-AG | 0 | 1.000000099473604e-05 | 255 | rna-XM_040226774.1 25387382 | 28 | 61426546 | 61426800 | Oryx dammah 59534 | GCA|GTGAGTGGCC...ACATCCTTTCCT/CTCTTGGTCATT...TTCAG|GTT | 2 | 1 | 76.604 |
| 140015425 | GT-AG | 0 | 1.000000099473604e-05 | 116 | rna-XM_040226774.1 25387382 | 29 | 61426857 | 61426972 | Oryx dammah 59534 | CAG|GTAGGGGCAG...TCACCTTGGATT/TGCCTGCTCACC...CAAAG|CCT | 1 | 1 | 77.689 |
| 140015426 | GT-AG | 0 | 1.000000099473604e-05 | 1710 | rna-XM_040226774.1 25387382 | 30 | 61427052 | 61428761 | Oryx dammah 59534 | AAG|GTAGAGAGGC...CCACCTTTGCCC/AGAGCACTAACC...CACAG|CAT | 2 | 1 | 79.221 |
| 140015427 | GT-AG | 0 | 1.000000099473604e-05 | 3949 | rna-XM_040226774.1 25387382 | 31 | 61428840 | 61432788 | Oryx dammah 59534 | AGA|GTAAGTGTCA...TGTGATTAGACA/ATTAGTGTGATT...TGCAG|GGA | 2 | 1 | 80.733 |
| 140015428 | GT-AG | 0 | 1.000000099473604e-05 | 658 | rna-XM_040226774.1 25387382 | 32 | 61432856 | 61433513 | Oryx dammah 59534 | GAG|GTGAGGACCC...GCCCCCTGGAGA/CACACTGTCAAC...CGTAG|GAG | 0 | 1 | 82.031 |
| 140015429 | GT-AG | 0 | 1.000000099473604e-05 | 3094 | rna-XM_040226774.1 25387382 | 33 | 61433656 | 61436749 | Oryx dammah 59534 | TAG|GTAGGTGTGC...TCTCCCCTGGCC/GCTCTGCTCAGT...TACAG|AAC | 1 | 1 | 84.784 |
| 140015430 | GT-AG | 0 | 1.000000099473604e-05 | 537 | rna-XM_040226774.1 25387382 | 34 | 61436911 | 61437447 | Oryx dammah 59534 | AAG|GTGAGGCCCC...GATTTCTGGATT/TTAGTCCTCAAG...TGAAG|GAT | 0 | 1 | 87.905 |
| 140015431 | GT-AG | 0 | 1.000000099473604e-05 | 496 | rna-XM_040226774.1 25387382 | 35 | 61437586 | 61438081 | Oryx dammah 59534 | GAG|GTCAGTAGTG...CTCTCCTTATAG/CCTCTCCTTATA...TCCAG|GAA | 0 | 1 | 90.58 |
| 140015432 | GT-AG | 0 | 0.1118507424932607 | 2435 | rna-XM_040226774.1 25387382 | 36 | 61438194 | 61440628 | Oryx dammah 59534 | CAA|GTATGCTCCC...CCATCTTTTGCT/CCATCAGTAACC...GTCAG|AGA | 1 | 1 | 92.751 |
| 140015433 | GT-AG | 0 | 1.000000099473604e-05 | 812 | rna-XM_040226774.1 25387382 | 37 | 61440735 | 61441546 | Oryx dammah 59534 | CAG|GTGAGAGCTG...GGACTTTTCATG/TGCATGTTTATT...TGTAG|AAA | 2 | 1 | 94.805 |
| 140015434 | GT-AG | 0 | 1.000000099473604e-05 | 1177 | rna-XM_040226774.1 25387382 | 38 | 61441683 | 61442859 | Oryx dammah 59534 | CTG|GTGAGTGAAG...AAGTCCTTCCTC/TCCTTCCTCATG...CCCAG|AAA | 0 | 1 | 97.441 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, linked to its parent transcript and to the
-- genome (by NCBI taxonomy id) it belongs to.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for the intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, otherwise 0
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position in the genome; END is an SQL keyword, keep it quoted
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on introns, one statement per indexed column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");