introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
33 rows where transcript_id = 19905836
This data as json, CSV (advanced)
Suggested facets: score, phase, in_cds
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 106496346 | GT-AG | 0 | 1.000000099473604e-05 | 6475 | rna-XM_031506025.1 19905836 | 2 | 110370705 | 110377179 | Lonchura striata 40157 | GAG|GTAAGGGGGG...CAGTGCTTGCTC/TGGGAAGTGAGG...CACAG|CAT | 2 | 1 | 17.542 | 
| 106496347 | GT-AG | 0 | 1.000000099473604e-05 | 1504 | rna-XM_031506025.1 19905836 | 3 | 110369055 | 110370558 | Lonchura striata 40157 | TTG|GTGAGTACAA...GACCCCTTGCTC/CCCCAGCTGATT...GTCAG|ATG | 1 | 1 | 20.62 | 
| 106496348 | GT-AG | 0 | 1.000000099473604e-05 | 864 | rna-XM_031506025.1 19905836 | 4 | 110368123 | 110368986 | Lonchura striata 40157 | AAG|GTTGGTCCCA...CAGGTGTCACCA/CCAGGTGTCACC...TGCAG|GAG | 0 | 1 | 22.054 | 
| 106496349 | GT-AG | 0 | 2.5650760356189825e-05 | 901 | rna-XM_031506025.1 19905836 | 5 | 110367118 | 110368018 | Lonchura striata 40157 | CAG|GTATGAGCGT...CAGCTCTTAACC/CGGCTCCTCATC...CCCAG|TGG | 2 | 1 | 24.246 | 
| 106496350 | GT-AG | 0 | 1.000000099473604e-05 | 1494 | rna-XM_031506025.1 19905836 | 6 | 110365453 | 110366946 | Lonchura striata 40157 | GGG|GTGAGTGATG...GCATCCTGAGTT/AGCATCCTGAGT...CCCAG|GTC | 2 | 1 | 27.852 | 
| 106496351 | GT-AG | 0 | 1.000000099473604e-05 | 278 | rna-XM_031506025.1 19905836 | 7 | 110365105 | 110365382 | Lonchura striata 40157 | AAG|GTGGGTGGAG...ATTTCCCTGAGG/ATTTCCCTGAGG...CCCAG|GAT | 0 | 1 | 29.327 | 
| 106496352 | GT-AG | 0 | 1.000000099473604e-05 | 115 | rna-XM_031506025.1 19905836 | 8 | 110364869 | 110364983 | Lonchura striata 40157 | ATG|GTGAGTGACA...TGTTCCTGACCT/CTGTTCCTGACC...CGCAG|CAG | 1 | 1 | 31.879 | 
| 106496353 | GT-AG | 0 | 1.000000099473604e-05 | 373 | rna-XM_031506025.1 19905836 | 9 | 110364290 | 110364662 | Lonchura striata 40157 | GAG|GTGGGTTGCT...CATTCCTTGCCC/CCCCCCCTCATT...ACCAG|GAC | 0 | 1 | 36.222 | 
| 106496354 | GT-AG | 0 | 1.000000099473604e-05 | 82 | rna-XM_031506025.1 19905836 | 10 | 110364101 | 110364182 | Lonchura striata 40157 | CAG|GTGAGCCCAG...CCACCCTGAGCC/GTATAGCTCACC...GGCAG|CTT | 2 | 1 | 38.478 | 
| 106496355 | GT-AG | 0 | 0.0275453546485942 | 85 | rna-XM_031506025.1 19905836 | 11 | 110363816 | 110363900 | Lonchura striata 40157 | CAG|GTACCCATAA...GGTCCCTTACGG/TTACGGCTCATC...GGCAG|GGG | 1 | 1 | 42.694 | 
| 106496356 | GT-AG | 0 | 1.000000099473604e-05 | 1083 | rna-XM_031506025.1 19905836 | 12 | 110362647 | 110363729 | Lonchura striata 40157 | GAG|GTAGTGGCAC...ATCTCCTTGTCA/CTCCTTGTCACT...CACAG|CTC | 0 | 1 | 44.508 | 
| 106496357 | GT-AG | 0 | 1.000000099473604e-05 | 980 | rna-XM_031506025.1 19905836 | 13 | 110361484 | 110362463 | Lonchura striata 40157 | AGG|GTCAGTAGCC...TCAGCTTCACCA/ATCAGCTTCACC...TGCAG|GCT | 0 | 1 | 48.366 | 
| 106496358 | GT-AG | 0 | 1.000000099473604e-05 | 1398 | rna-XM_031506025.1 19905836 | 14 | 110359911 | 110361308 | Lonchura striata 40157 | CAG|GTAAGGGCTG...CTCCCCATGACA/GACAGTCTGATC...TGCAG|AGC | 1 | 1 | 52.056 | 
| 106496359 | GT-AG | 0 | 0.0002159038010154 | 226 | rna-XM_031506025.1 19905836 | 15 | 110359550 | 110359775 | Lonchura striata 40157 | AAG|GTACATTTGT...CTGTCCTGTGCT/AGGCTGCTCAGT...TACAG|AGT | 1 | 1 | 54.902 | 
| 106496360 | GT-AG | 0 | 1.000000099473604e-05 | 490 | rna-XM_031506025.1 19905836 | 16 | 110358924 | 110359413 | Lonchura striata 40157 | TGG|GTAAGGCTGC...CTCCCCTTTTCC/CTCTATCTCACC...TGAAG|GAT | 2 | 1 | 57.769 | 
| 106496361 | GT-AG | 0 | 1.000000099473604e-05 | 87 | rna-XM_031506025.1 19905836 | 17 | 110358734 | 110358820 | Lonchura striata 40157 | AAG|GTGGGATGCA...GATTCCTCTCCT/GTGGTGCTGATG...CTCAG|TCC | 0 | 1 | 59.941 | 
| 106496362 | GT-AG | 0 | 1.000000099473604e-05 | 326 | rna-XM_031506025.1 19905836 | 18 | 110358212 | 110358537 | Lonchura striata 40157 | TCT|GTGAGTACCT...CCTGCCTTCCTT/CCGTAGGTGATG...TCCAG|CCA | 1 | 1 | 64.073 | 
| 106496363 | GT-AG | 0 | 1.000000099473604e-05 | 207 | rna-XM_031506025.1 19905836 | 19 | 110357959 | 110358165 | Lonchura striata 40157 | GAG|GTAAGAAGGT...TGAGCCTAGGCA/AGAGAACTGAGC...GGCAG|GAC | 2 | 1 | 65.043 | 
| 106496364 | GT-AG | 0 | 1.000000099473604e-05 | 298 | rna-XM_031506025.1 19905836 | 20 | 110357497 | 110357794 | Lonchura striata 40157 | GTG|GTATGGGCCA...GGGCTCTCATTC/GGGGCTCTCATT...CACAG|GGC | 1 | 1 | 68.501 | 
| 106496365 | GT-AG | 0 | 1.000000099473604e-05 | 905 | rna-XM_031506025.1 19905836 | 21 | 110356379 | 110357283 | Lonchura striata 40157 | CGG|GTGAGCCCTG...TGAATCTTAATG/TCCATGTTCATT...GGCAG|CGC | 1 | 1 | 72.992 | 
| 106496366 | GT-AG | 0 | 0.0001233289004683 | 223 | rna-XM_031506025.1 19905836 | 22 | 110356050 | 110356272 | Lonchura striata 40157 | CCG|GTATGGCATC...GGAATCTTGACA/GGAATCTTGACA...CACAG|GGT | 2 | 1 | 75.227 | 
| 106496367 | GT-AG | 0 | 4.252740344345891e-05 | 211 | rna-XM_031506025.1 19905836 | 23 | 110355691 | 110355901 | Lonchura striata 40157 | AAC|GTAGGTTCAC...CTTCTCTTTTCT/TCGGCCCTGATG...GGTAG|GTC | 0 | 1 | 78.347 | 
| 106496368 | GT-AG | 0 | 1.000000099473604e-05 | 158 | rna-XM_031506025.1 19905836 | 24 | 110355449 | 110355606 | Lonchura striata 40157 | CAG|GTGGGTCCTG...AGCACTTTACTG/AAGCACTTTACT...TCCAG|CAA | 0 | 1 | 80.118 | 
| 106496369 | GT-AG | 0 | 1.000000099473604e-05 | 158 | rna-XM_031506025.1 19905836 | 25 | 110355222 | 110355379 | Lonchura striata 40157 | AAG|GTGAGTAGTT...GGGGCCTGGACA/TGGACACTGACT...CTCAG|ATC | 0 | 1 | 81.573 | 
| 106496370 | GT-AG | 0 | 1.000000099473604e-05 | 850 | rna-XM_031506025.1 19905836 | 26 | 110354254 | 110355103 | Lonchura striata 40157 | CAG|GTTGGTGCAG...TGTCCCCTGACT/CACTTTCTGAGA...TACAG|AGC | 1 | 1 | 84.061 | 
| 106496371 | GT-AG | 0 | 1.000000099473604e-05 | 391 | rna-XM_031506025.1 19905836 | 27 | 110353749 | 110354139 | Lonchura striata 40157 | TTG|GTGAGAGGCA...GGGGCCAGAGCC/GGGGGCCTGATG...TCCAG|CTA | 1 | 1 | 86.464 | 
| 106496372 | GT-AG | 0 | 1.000000099473604e-05 | 1694 | rna-XM_031506025.1 19905836 | 28 | 110351912 | 110353605 | Lonchura striata 40157 | CGG|GTGAGCCCTT...GGTTCCCTGTTC/CAGCCACCAACC...CCCAG|AGT | 0 | 1 | 89.479 | 
| 106496373 | GT-AG | 0 | 1.000000099473604e-05 | 457 | rna-XM_031506025.1 19905836 | 29 | 110351372 | 110351828 | Lonchura striata 40157 | GTG|GTGAGCAGCA...CATGCTTTCTCC/TTGGGATTCATG...TCCAG|CTG | 2 | 1 | 91.229 | 
| 106496374 | GT-AG | 0 | 1.000000099473604e-05 | 384 | rna-XM_031506025.1 19905836 | 30 | 110350937 | 110351320 | Lonchura striata 40157 | ATG|GTGAGGGAAG...CTTGCCTCCACC/TGGCTGCTGACA...CACAG|GTA | 2 | 1 | 92.304 | 
| 106496375 | GT-AG | 0 | 1.000000099473604e-05 | 176 | rna-XM_031506025.1 19905836 | 31 | 110350697 | 110350872 | Lonchura striata 40157 | CAG|GTAGATCACT...GTCTCCATCACC/GGGTGGCTGAGT...TGCAG|AAC | 0 | 1 | 93.654 | 
| 106496376 | GT-AG | 0 | 1.000000099473604e-05 | 877 | rna-XM_031506025.1 19905836 | 32 | 110349664 | 110350540 | Lonchura striata 40157 | ACT|GTGAGTCATC...CTGCCCTTTGTC/TGAAAGGTGATC...CCCAG|CTT | 0 | 1 | 96.943 | 
| 106505121 | GT-AG | 0 | 0.0001778710573693 | 7144 | rna-XM_031506025.1 19905836 | 1 | 110377926 | 110385069 | Lonchura striata 40157 | GAG|GTACCGGGTG...TGATCCTGATCC/CTGATCCTGATC...CCCAG|GTC |  | 0 | 3.458 | 
| 106505122 | GT-AG | 0 | 1.000000099473604e-05 | 181 | rna-XM_031506025.1 19905836 | 33 | 110349445 | 110349625 | Lonchura striata 40157 | CCA|GTGAGTTTCC...GACACTTTGCTC/CATTTGCTGACA...CACAG|GTT |  | 0 | 97.744 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each intron belongs to a parent transcript and to the
-- genome (species) identified by its NCBI taxonomy id.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for the intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences, e.g. GT-AG
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier of the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column:
-- the two foreign keys first, then phase, is_minor, dinucleotide_pair,
-- score and in_cds.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");