introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
60 rows where transcript_id = 25387375
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 140015149 | GT-AG | 0 | 1.000000099473604e-05 | 6520 | rna-XM_040239871.1 25387375 | 1 | 101491769 | 101498288 | Oryx dammah 59534 | GGG|GTGAGTACGG...GATGCCGTATCT/TGGAAGCTGATG...TCTAG|GGG | 2 | 1 | 1.283 |
| 140015150 | GT-AG | 0 | 0.0007517633193863 | 4825 | rna-XM_040239871.1 25387375 | 2 | 101498360 | 101503184 | Oryx dammah 59534 | AAG|GTAACTGTCT...CAGGCCCTGACT/CAGGCCCTGACT...TCCAG|ATG | 1 | 1 | 2.565 |
| 140015151 | GT-AG | 0 | 1.000000099473604e-05 | 8227 | rna-XM_040239871.1 25387375 | 3 | 101504903 | 101513129 | Oryx dammah 59534 | CCG|GTAAGAGTTG...ATCTTCTTGCTT/GTGGTACTGATG...TTCAG|GGT | 0 | 1 | 33.604 |
| 140015152 | GT-AG | 0 | 1.000000099473604e-05 | 4117 | rna-XM_040239871.1 25387375 | 4 | 101513184 | 101517300 | Oryx dammah 59534 | CGG|GTAAGTGATC...TTCCCCTCATCT/TTTCCCCTCATC...TTCAG|GGT | 0 | 1 | 34.58 |
| 140015153 | GT-AG | 0 | 1.000000099473604e-05 | 10249 | rna-XM_040239871.1 25387375 | 5 | 101517355 | 101527603 | Oryx dammah 59534 | AAA|GTGAGTATAT...CCCTCTTTAGAA/ACCCTCTTTAGA...TTCAG|GGA | 0 | 1 | 35.556 |
| 140015154 | GT-AG | 0 | 1.000000099473604e-05 | 1448 | rna-XM_040239871.1 25387375 | 6 | 101527658 | 101529105 | Oryx dammah 59534 | AAG|GTAGGTTTCC...TTTTCTGTGTTT/CCCCATCTCACC...TTCAG|GGC | 0 | 1 | 36.531 |
| 140015155 | GT-AG | 0 | 0.0015378074783428 | 9618 | rna-XM_040239871.1 25387375 | 7 | 101529160 | 101538777 | Oryx dammah 59534 | AAG|GTACACCTTG...GTTTCTTTCCCT/CCTAGGCTCAAG...CACAG|GGA | 0 | 1 | 37.507 |
| 140015156 | GT-AG | 0 | 1.000000099473604e-05 | 640 | rna-XM_040239871.1 25387375 | 8 | 101538823 | 101539462 | Oryx dammah 59534 | CAG|GTGAGGGCTG...CTTTCCTTACAT/CCTTTCCTTACA...TGCAG|GGG | 0 | 1 | 38.32 |
| 140015157 | GT-AG | 0 | 1.000000099473604e-05 | 422 | rna-XM_040239871.1 25387375 | 9 | 101539517 | 101539938 | Oryx dammah 59534 | CAG|GTGCAGTATA...ATGTCCTTGCCC/GACGTCTCCATA...TTCAG|GGG | 0 | 1 | 39.295 |
| 140015158 | GT-AG | 0 | 1.000000099473604e-05 | 3466 | rna-XM_040239871.1 25387375 | 10 | 101539984 | 101543449 | Oryx dammah 59534 | CGG|GTAAGTGTGA...CCCTTCTGACCT/GCCCTTCTGACC...CCTAG|GGC | 0 | 1 | 40.108 |
| 140015159 | GT-AG | 0 | 1.000000099473604e-05 | 883 | rna-XM_040239871.1 25387375 | 11 | 101543504 | 101544386 | Oryx dammah 59534 | CGA|GTGAGTATGC...CTGTCCTGAATC/CCTGTCCTGAAT...TACAG|GGT | 0 | 1 | 41.084 |
| 140015160 | GT-AG | 0 | 1.000000099473604e-05 | 8804 | rna-XM_040239871.1 25387375 | 12 | 101544432 | 101553235 | Oryx dammah 59534 | CCG|GTAAAGATTT...TACACACTAATC/TGCTCTCTCATG...CTCAG|GGG | 0 | 1 | 41.897 |
| 140015161 | GT-AG | 0 | 6.525716098269168e-05 | 2268 | rna-XM_040239871.1 25387375 | 13 | 101553290 | 101555557 | Oryx dammah 59534 | CCT|GTAAGTATTT...ACCACCTTGGTC/GAGCAAGTAACC...TGCAG|GGA | 0 | 1 | 42.873 |
| 140015162 | GT-AG | 0 | 1.000000099473604e-05 | 9264 | rna-XM_040239871.1 25387375 | 14 | 101555603 | 101564866 | Oryx dammah 59534 | ATT|GTAAGTACAC...TTCTCTTTCTCT/GCCTTTCTCATT...CCCAG|GGC | 0 | 1 | 43.686 |
| 140015163 | GT-AG | 0 | 1.000000099473604e-05 | 707 | rna-XM_040239871.1 25387375 | 15 | 101564921 | 101565627 | Oryx dammah 59534 | AAG|GTAAACAGAA...GGGGCTTTCACC/TTCACCCTCACA...TGCAG|GGA | 0 | 1 | 44.661 |
| 140015164 | GT-AG | 0 | 1.000000099473604e-05 | 3270 | rna-XM_040239871.1 25387375 | 16 | 101565673 | 101568942 | Oryx dammah 59534 | AAG|GTGATCTGAA...GTAACCTTCTCT/ATGGTTTCCATC...TTTAG|GGT | 0 | 1 | 45.474 |
| 140015165 | GT-AG | 0 | 0.0004557163492352 | 1243 | rna-XM_040239871.1 25387375 | 17 | 101568997 | 101570239 | Oryx dammah 59534 | AAG|GTAACCCCTG...GCGTCGCTAACC/GCGTCGCTAACC...TTCAG|GGG | 0 | 1 | 46.45 |
| 140015166 | GT-AG | 0 | 1.000000099473604e-05 | 829 | rna-XM_040239871.1 25387375 | 18 | 101570294 | 101571122 | Oryx dammah 59534 | GTG|GTGAGTACCT...AATCTCTTCTCT/CCCTCGTTTACC...CACAG|GGC | 0 | 1 | 47.425 |
| 140015167 | GT-AG | 0 | 0.0001339252473382 | 2807 | rna-XM_040239871.1 25387375 | 19 | 101571177 | 101573983 | Oryx dammah 59534 | GAG|GTATTTAATG...ATTTCCCTACGT/CTCTGGGTGACC...TTCAG|GGA | 0 | 1 | 48.401 |
| 140015168 | GT-AG | 0 | 1.000000099473604e-05 | 149 | rna-XM_040239871.1 25387375 | 20 | 101574038 | 101574186 | Oryx dammah 59534 | AAG|GTGAGTCCCT...CGCCTCTGAGCC/CCGCCTCTGAGC...ATCAG|GGT | 0 | 1 | 49.377 |
| 140015169 | GT-AG | 0 | 1.000000099473604e-05 | 2159 | rna-XM_040239871.1 25387375 | 21 | 101574241 | 101576399 | Oryx dammah 59534 | GAG|GTGAGACCAT...TTCTCCTTTTTC/ACTGAATTAACT...CCTAG|GGA | 0 | 1 | 50.352 |
| 140015170 | GT-AG | 0 | 1.000000099473604e-05 | 1355 | rna-XM_040239871.1 25387375 | 22 | 101576445 | 101577799 | Oryx dammah 59534 | GAG|GTGAGTGTTG...CTTCTCTCACTC/GCTTCTCTCACT...TACAG|GGT | 0 | 1 | 51.165 |
| 140015171 | GT-AG | 0 | 1.000000099473604e-05 | 1818 | rna-XM_040239871.1 25387375 | 23 | 101577854 | 101579671 | Oryx dammah 59534 | AAG|GTGAGGGGAC...CAGGCCTGGACT/TCCCGAGTGACC...TGCAG|GGC | 0 | 1 | 52.141 |
| 140015172 | GT-AG | 0 | 1.000000099473604e-05 | 5477 | rna-XM_040239871.1 25387375 | 24 | 101579717 | 101585193 | Oryx dammah 59534 | CAG|GTGAGTCACC...TTTCTCTTGCTT/CCTGAATTCATG...TCTAG|GGA | 0 | 1 | 52.954 |
| 140015173 | GT-AG | 0 | 1.000000099473604e-05 | 597 | rna-XM_040239871.1 25387375 | 25 | 101585248 | 101585844 | Oryx dammah 59534 | AAG|GTAAGTCACA...ACAGCCGTGACC/ACAGCCGTGACC...CACAG|GGT | 0 | 1 | 53.93 |
| 140015174 | GT-AG | 0 | 1.000000099473604e-05 | 236 | rna-XM_040239871.1 25387375 | 26 | 101585899 | 101586134 | Oryx dammah 59534 | ATG|GTAAGGAGCA...TCCTCCTTGTTC/TCCTTGTTCATC...GGTAG|GGC | 0 | 1 | 54.905 |
| 140015175 | GT-AG | 0 | 1.000000099473604e-05 | 3847 | rna-XM_040239871.1 25387375 | 27 | 101586189 | 101590035 | Oryx dammah 59534 | CTG|GTAAGCAAAG...GATTCTTTCTCC/CTTCTCCAGATT...CACAG|GGT | 0 | 1 | 55.881 |
| 140015176 | GT-AG | 0 | 1.000000099473604e-05 | 5438 | rna-XM_040239871.1 25387375 | 28 | 101590090 | 101595527 | Oryx dammah 59534 | CGG|GTAAGTGGGG...AGCCCCTTTTTC/CTGCTGTCCACT...TCCAG|GGA | 0 | 1 | 56.856 |
| 140015177 | GT-AG | 0 | 1.000000099473604e-05 | 556 | rna-XM_040239871.1 25387375 | 29 | 101595582 | 101596137 | Oryx dammah 59534 | AAG|GTACTGACCC...TCATGCTTGGCT/CCCCCCCTCATG...TGCAG|GGC | 0 | 1 | 57.832 |
| 140015178 | GT-AG | 0 | 1.1393559472830429e-05 | 83 | rna-XM_040239871.1 25387375 | 30 | 101596183 | 101596265 | Oryx dammah 59534 | CAG|GTATGTGAGG...TGTTCTGTGATA/GTGCTTCTAACA...TCCAG|GGC | 0 | 1 | 58.645 |
| 140015179 | GT-AG | 0 | 1.000000099473604e-05 | 285 | rna-XM_040239871.1 25387375 | 31 | 101596311 | 101596595 | Oryx dammah 59534 | CCT|GTAAGTAGCA...CTTACTTTGTCC/GGTCAGCTTACT...TGCAG|GGC | 0 | 1 | 59.458 |
| 140015180 | GT-AG | 0 | 1.000000099473604e-05 | 1091 | rna-XM_040239871.1 25387375 | 32 | 101596650 | 101597740 | Oryx dammah 59534 | CCG|GTAAGTGCCC...CTTCTCCCGACT/CTTCTCCCGACT...TCCAG|GGC | 0 | 1 | 60.434 |
| 140015181 | GT-AG | 0 | 1.000000099473604e-05 | 894 | rna-XM_040239871.1 25387375 | 33 | 101597795 | 101598688 | Oryx dammah 59534 | AAG|GTGAGTGCCG...CAGCCCTTGCTC/CTAGGATGGACC...TGCAG|GGA | 0 | 1 | 61.409 |
| 140015182 | GT-AG | 0 | 1.000000099473604e-05 | 1405 | rna-XM_040239871.1 25387375 | 34 | 101598743 | 101600147 | Oryx dammah 59534 | AAG|GTAAGAGGGG...TTGTTTTTGGCT/GCTGGTCCTATC...CCTAG|GGT | 0 | 1 | 62.385 |
| 140015183 | GT-AG | 0 | 1.000000099473604e-05 | 1889 | rna-XM_040239871.1 25387375 | 35 | 101600202 | 101602090 | Oryx dammah 59534 | CGG|GTAAGTCAAA...GTCTCCTCATCT/TGTCTCCTCATC...TCCAG|GGA | 0 | 1 | 63.36 |
| 140015184 | GT-AG | 0 | 1.000000099473604e-05 | 3974 | rna-XM_040239871.1 25387375 | 36 | 101602145 | 101606118 | Oryx dammah 59534 | AAG|GTAAGTGTCC...TCTTCCTTCCTC/TGGTGACTAATT...CCCAG|GGG | 0 | 1 | 64.336 |
| 140015185 | GT-AG | 0 | 1.000000099473604e-05 | 2189 | rna-XM_040239871.1 25387375 | 37 | 101606227 | 101608415 | Oryx dammah 59534 | CGG|GTGAGTGTGC...TCATCTTTTTCT/TTTTCTCTCACT...TTCAG|GGT | 0 | 1 | 66.287 |
| 140015186 | GT-AG | 0 | 1.000000099473604e-05 | 109 | rna-XM_040239871.1 25387375 | 38 | 101608470 | 101608578 | Oryx dammah 59534 | AAG|GTAGGGCCCC...GATGCCCTGTCT/TACCTGGTGATG...TGCAG|GGT | 0 | 1 | 67.263 |
| 140015187 | GT-AG | 0 | 1.000000099473604e-05 | 1176 | rna-XM_040239871.1 25387375 | 39 | 101608687 | 101609862 | Oryx dammah 59534 | ACG|GTGAGCACTC...CCTGCTGTGACA/CCTGCTGTGACA...CACAG|GGT | 0 | 1 | 69.214 |
| 140015188 | GT-AG | 0 | 1.000000099473604e-05 | 952 | rna-XM_040239871.1 25387375 | 40 | 101609917 | 101610868 | Oryx dammah 59534 | GAC|GTAAGGAGCT...GCCATCTTACCT/CGTGCTCTCACC...TGCAG|GGA | 0 | 1 | 70.19 |
| 140015189 | GT-AG | 0 | 1.000000099473604e-05 | 4577 | rna-XM_040239871.1 25387375 | 41 | 101610923 | 101615499 | Oryx dammah 59534 | AAG|GTGGGTGTCT...TTTGTCTTAATG/TTTGTCTTAATG...CACAG|GGG | 0 | 1 | 71.165 |
| 140015190 | GT-AG | 0 | 1.000000099473604e-05 | 168 | rna-XM_040239871.1 25387375 | 42 | 101615557 | 101615724 | Oryx dammah 59534 | CGG|GTAAGGGCCC...CTGTCCTTTTCA/CAGTCTTCTATT...TTTAG|GGC | 0 | 1 | 72.195 |
| 140015191 | GT-AG | 0 | 0.0001930520738783 | 756 | rna-XM_040239871.1 25387375 | 43 | 101615779 | 101616534 | Oryx dammah 59534 | CCT|GTAAGTATTC...CTCTGCTTGACT/CTCTGCTTGACT...TCCAG|GGA | 0 | 1 | 73.171 |
| 140015192 | GT-AG | 0 | 1.000000099473604e-05 | 284 | rna-XM_040239871.1 25387375 | 44 | 101616589 | 101616872 | Oryx dammah 59534 | CCC|GTGAGTGGTG...CTCACCTTGGTT/CGTCATCTCACC...TGCAG|GGG | 0 | 1 | 74.146 |
| 140015193 | GT-AG | 0 | 1.000000099473604e-05 | 850 | rna-XM_040239871.1 25387375 | 45 | 101616927 | 101617776 | Oryx dammah 59534 | GAG|GTAAGAGGCC...TGCCCCTTGATT/TGCCCCTTGATT...TTCAG|GGA | 0 | 1 | 75.122 |
| 140015194 | GT-AG | 0 | 1.000000099473604e-05 | 82 | rna-XM_040239871.1 25387375 | 46 | 101617831 | 101617912 | Oryx dammah 59534 | CAG|GTGAGTGCCT...GGCTTCTTGTTT/TTCTTGTTTACT...CCCAG|GGC | 0 | 1 | 76.098 |
| 140015195 | GT-AG | 0 | 1.3997017461361784e-05 | 467 | rna-XM_040239871.1 25387375 | 47 | 101618021 | 101618487 | Oryx dammah 59534 | CAG|GTAAGCTGGA...ATTTCCTGAAAC/TATTTCCTGAAA...CACAG|GGG | 0 | 1 | 78.049 |
| 140015196 | GT-AG | 0 | 1.000000099473604e-05 | 1122 | rna-XM_040239871.1 25387375 | 48 | 101618596 | 101619717 | Oryx dammah 59534 | AAG|GTCAGACACT...CTCCCTTTGACT/CTCCCTTTGACT...TTAAG|GGT | 0 | 1 | 80.0 |
| 140015197 | GT-AG | 0 | 1.000000099473604e-05 | 1738 | rna-XM_040239871.1 25387375 | 49 | 101619826 | 101621563 | Oryx dammah 59534 | CCG|GTGAGTGAGC...CTTGTCTTGGCC/CTTGGCCTCACT...CATAG|GGT | 0 | 1 | 81.951 |
| 140015198 | GT-AG | 0 | 0.0075039543755582 | 507 | rna-XM_040239871.1 25387375 | 50 | 101621618 | 101622124 | Oryx dammah 59534 | AAG|GTACCGTTCT...CAGCCCTTCTCT/GGAGCCCTCATC...CGCAG|GGC | 0 | 1 | 82.927 |
| 140015199 | GT-AG | 0 | 1.000000099473604e-05 | 524 | rna-XM_040239871.1 25387375 | 51 | 101622188 | 101622711 | Oryx dammah 59534 | GTG|GTGAGTCCTC...AAGCCTTTCTCT/CAAGGACACACA...TTTAG|GGA | 0 | 1 | 84.065 |
| 140015200 | GT-AG | 0 | 1.000000099473604e-05 | 142 | rna-XM_040239871.1 25387375 | 52 | 101622766 | 101622907 | Oryx dammah 59534 | CAG|GTATGTGCAG...CTCCCCTGAGCC/CCCCCTCTCACT...TGCAG|GGT | 0 | 1 | 85.041 |
| 140015201 | GT-AG | 0 | 1.000000099473604e-05 | 105 | rna-XM_040239871.1 25387375 | 53 | 101622944 | 101623048 | Oryx dammah 59534 | TTG|GTGAGTAGAC...GCTCCTCTAACT/GCTCCTCTAACT...TCCAG|GGA | 0 | 1 | 85.691 |
| 140015202 | GT-AG | 0 | 1.000000099473604e-05 | 206 | rna-XM_040239871.1 25387375 | 54 | 101623067 | 101623272 | Oryx dammah 59534 | AGG|GTGAGTGGGC...AGGACTTTGAGT/TGGGGCCTCACT...TCCAG|GGT | 0 | 1 | 86.016 |
| 140015203 | GT-AG | 0 | 1.000000099473604e-05 | 254 | rna-XM_040239871.1 25387375 | 55 | 101623309 | 101623562 | Oryx dammah 59534 | CCG|GTAGGTAGTA...AGCCTCTTCTTT/GCAGTCCCCATC...TGCAG|GGT | 0 | 1 | 86.667 |
| 140015204 | GT-AG | 0 | 0.0001503788495229 | 3161 | rna-XM_040239871.1 25387375 | 56 | 101623590 | 101626750 | Oryx dammah 59534 | TTT|GTAAGTTGGA...CCTGTCTTCTCT/AGGAGGCACACC...CACAG|CAA | 0 | 1 | 87.154 |
| 140015205 | GT-AG | 0 | 0.0002635148898321 | 848 | rna-XM_040239871.1 25387375 | 57 | 101626817 | 101627664 | Oryx dammah 59534 | GAG|GTACCACCCA...ACCCTCTTTTCT/AAGGGCCTGACG...AACAG|GGT | 0 | 1 | 88.347 |
| 140015206 | GT-AG | 0 | 1.000000099473604e-05 | 1290 | rna-XM_040239871.1 25387375 | 58 | 101627834 | 101629123 | Oryx dammah 59534 | ATG|GTATGAGGGC...GGTTCCTCCCCA/CATACATACACT...TGCAG|GTA | 1 | 1 | 91.4 |
| 140015207 | GT-AG | 0 | 0.0645743666679163 | 9605 | rna-XM_040239871.1 25387375 | 59 | 101629234 | 101638838 | Oryx dammah 59534 | AAG|GTACCCATCT...CCTGCCTGACCG/CCCTGCCTGACC...CACAG|GTG | 0 | 1 | 93.388 |
| 140015208 | GT-AG | 0 | 0.0026698818131376 | 1205 | rna-XM_040239871.1 25387375 | 60 | 101639058 | 101640262 | Oryx dammah 59534 | AAG|GTAACTCTTG...TACCCCTTTCCC/TGTGTGTGTACC...CTCAG|ATC | 0 | 1 | 97.344 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each intron belongs to a parent transcript and to a
-- genome identified by its NCBI taxonomy id.
CREATE TABLE "introns" (
    -- Globally unique identifier for each intron.
    "id"                INTEGER,
    -- Terminal dinucleotide sequences of the intron (e.g. GT-AG).
    "dinucleotide_pair" TEXT,
    -- 1 if the intron is a minor intron, 0 otherwise.
    "is_minor"          INTEGER,
    -- Probability (0-100%) of the intron being minor.
    "score"             REAL,
    -- Length of the intron in base pairs.
    "length"            INTEGER,
    -- Parent transcript; references transcripts(id).
    "transcript_id"     INTEGER,
    -- Ordinal position of the intron within the transcript (3 = third intron).
    "ordinal_index"     INTEGER,
    -- Start position of the intron in the genome.
    "start"             INTEGER,
    -- End position of the intron in the genome. END is an SQLite keyword,
    -- so this column name must stay quoted.
    "end"               INTEGER,
    -- NCBI taxonomy identifier for the species; references genomes(taxonomy_id).
    "taxonomy_id"       INTEGER,
    -- Motifs scored for the intron.
    "scored_motifs"     TEXT,
    -- Phase in the coding sequence (0, 1 or 2); NULL outside the coding sequence.
    "phase"             INTEGER,
    -- 1 if the intron lies within the coding sequence, 0 otherwise (e.g. UTR introns).
    "in_cds"            INTEGER,
    -- Relative position within the transcript, as a percentage of coding length.
    "relative_position" REAL,
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Secondary single-column indexes on introns.
-- Indexes on the two foreign-key columns:
CREATE INDEX idx_introns_transcript_id ON introns (transcript_id);
CREATE INDEX idx_introns_taxonomy_id ON introns (taxonomy_id);
-- Indexes on classification and score columns:
CREATE INDEX idx_introns_phase ON introns (phase);
CREATE INDEX idx_introns_is_minor ON introns (is_minor);
CREATE INDEX idx_introns_dinucleotide_pair ON introns (dinucleotide_pair);
CREATE INDEX idx_introns_score ON introns (score);
CREATE INDEX idx_introns_in_cds ON introns (in_cds);