introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
33 rows where transcript_id = 19905808
This data as json, CSV (advanced)
Suggested facets: score, phase, in_cds
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 106495589 | GT-AG | 0 | 1.000000099473604e-05 | 395 | rna-XM_021538757.1 19905808 | 3 | 373257 | 373651 | Lonchura striata 40157 | AAA|GTAAGTGAAA...CGGGGCTCACCG/GCGGGGCTCACC...TGCAG|ATG | 1 | 1 | 5.309 | 
| 106495590 | GT-AG | 0 | 1.000000099473604e-05 | 172 | rna-XM_021538757.1 19905808 | 4 | 372983 | 373154 | Lonchura striata 40157 | CAG|GTACTGCCCG...GGAGGATTAACA/GGAGGATTAACA...TGCAG|GAG | 1 | 1 | 7.126 | 
| 106495591 | GT-AG | 0 | 1.000000099473604e-05 | 707 | rna-XM_021538757.1 19905808 | 5 | 372096 | 372802 | Lonchura striata 40157 | GAA|GTGAGTGAAG...TTTGTTTTAATA/TTTGTTTTAATA...TTCAG|ACT | 1 | 1 | 10.333 | 
| 106495592 | GT-AG | 0 | 0.0002766592969526 | 1481 | rna-XM_021538757.1 19905808 | 6 | 370475 | 371955 | Lonchura striata 40157 | AAT|GTAAGTTCTG...TGGATTTTAACG/TGGATTTTAACG...GGCAG|CCC | 0 | 1 | 12.827 | 
| 106495593 | GT-AG | 0 | 1.000000099473604e-05 | 575 | rna-XM_021538757.1 19905808 | 7 | 369792 | 370366 | Lonchura striata 40157 | GAG|GTCAGTGCAG...CTGCCCTTATCC/CCTGCCCTTATC...TCTAG|GAA | 0 | 1 | 14.751 | 
| 106495594 | GT-AG | 0 | 1.988076672181948e-05 | 839 | rna-XM_021538757.1 19905808 | 8 | 368769 | 369607 | Lonchura striata 40157 | CCA|GTAAGTACTG...GGGTCTCTAACT/GGGTCTCTAACT...CCCAG|GTA | 1 | 1 | 18.03 | 
| 106495595 | GT-AG | 0 | 1.000000099473604e-05 | 693 | rna-XM_021538757.1 19905808 | 9 | 367912 | 368604 | Lonchura striata 40157 | ATG|GTAAGAGGGG...ATTACCTTAACC/ATTACCTTAACC...TGTAG|GGT | 0 | 1 | 20.951 | 
| 106495596 | GT-AG | 0 | 0.0008186931255979 | 565 | rna-XM_021538757.1 19905808 | 10 | 367209 | 367773 | Lonchura striata 40157 | TCG|GTATGTCTCT...GGTTTCCAAATT/TGTGGTATCAGC...TTCAG|ACC | 0 | 1 | 23.41 | 
| 106495597 | GT-AG | 0 | 1.000000099473604e-05 | 2444 | rna-XM_021538757.1 19905808 | 11 | 364677 | 367120 | Lonchura striata 40157 | TCG|GTAAGAAACC...TCATCTCTAATG/ATGGTTTTCATT...TGAAG|GTT | 1 | 1 | 24.978 | 
| 106495598 | GT-AG | 0 | 1.000000099473604e-05 | 355 | rna-XM_021538757.1 19905808 | 12 | 364229 | 364583 | Lonchura striata 40157 | CAG|GTAAGCAGTT...GTGACCTTGTCA/TAGTAACTGACA...CACAG|CTC | 1 | 1 | 26.635 | 
| 106495599 | GT-AG | 0 | 1.000000099473604e-05 | 899 | rna-XM_021538757.1 19905808 | 13 | 363189 | 364087 | Lonchura striata 40157 | TAG|GTGAGTGCCC...GAGCTCTAAAAC/CTAAAACTGAAA...TGTAG|CTC | 1 | 1 | 29.147 | 
| 106495600 | GT-AG | 0 | 1.000000099473604e-05 | 691 | rna-XM_021538757.1 19905808 | 14 | 362364 | 363054 | Lonchura striata 40157 | GAG|GTAAGTGCCC...CGTGCCTGAGAT/CCGTGCCTGAGA...TCCAG|AGG | 0 | 1 | 31.534 | 
| 106495601 | GT-AG | 0 | 1.000000099473604e-05 | 860 | rna-XM_021538757.1 19905808 | 15 | 361316 | 362175 | Lonchura striata 40157 | AAA|GTGAGCATCT...CCTTCCTTGCTG/TAGATCCAAATT...TTTAG|GAA | 2 | 1 | 34.883 | 
| 106495602 | GT-AG | 0 | 1.000000099473604e-05 | 1015 | rna-XM_021538757.1 19905808 | 16 | 360184 | 361198 | Lonchura striata 40157 | CAG|GTGAGCGAGT...CAGTCCTTCCTC/AAGTAATTCACA...CGCAG|GTT | 2 | 1 | 36.968 | 
| 106495603 | GT-AG | 0 | 1.000000099473604e-05 | 748 | rna-XM_021538757.1 19905808 | 17 | 359131 | 359878 | Lonchura striata 40157 | CAG|GTGAGCCATT...CTGTTCTCAGGG/CCTGTTCTCAGG...TGCAG|GGA | 1 | 1 | 42.402 | 
| 106495604 | GT-AG | 0 | 1.000000099473604e-05 | 740 | rna-XM_021538757.1 19905808 | 18 | 358277 | 359016 | Lonchura striata 40157 | CGG|GTGAGACCCC...GACAATTTAATT/TGACTTTTCACA...TGCAG|GTT | 1 | 1 | 44.433 | 
| 106495605 | GT-AG | 0 | 1.000000099473604e-05 | 205 | rna-XM_021538757.1 19905808 | 19 | 357933 | 358137 | Lonchura striata 40157 | TAG|GTAAGTTAGA...GCTGCCCTGCCC/AGGTTGCCCAGC...TGCAG|GCG | 2 | 1 | 46.909 | 
| 106495606 | GT-AG | 0 | 1.000000099473604e-05 | 1000 | rna-XM_021538757.1 19905808 | 20 | 356755 | 357754 | Lonchura striata 40157 | AAG|GTGAGCCCCG...TTGTCCTTCTTA/CTAGCTGTGACA...CACAG|GTA | 0 | 1 | 50.08 | 
| 106495607 | GT-AG | 0 | 1.000000099473604e-05 | 2855 | rna-XM_021538757.1 19905808 | 21 | 353735 | 356589 | Lonchura striata 40157 | CAG|GTAGAAGGAG...CTGTCCTGGCTG/TGTGGTGTGACC...TGCAG|CCC | 0 | 1 | 53.02 | 
| 106495608 | GT-AG | 0 | 1.000000099473604e-05 | 993 | rna-XM_021538757.1 19905808 | 22 | 352565 | 353557 | Lonchura striata 40157 | CAG|GTCAGTGTCC...TCTGGCTTGGCT/GGGTTGCTGATG...CTCAG|ATC | 0 | 1 | 56.173 | 
| 106495609 | GT-AG | 0 | 1.714558978999625e-05 | 870 | rna-XM_021538757.1 19905808 | 23 | 351544 | 352413 | Lonchura striata 40157 | CAG|GTATGGTGAG...GTGCCCTTGCAC/CTTGCACTGACA...GTCAG|CTG | 1 | 1 | 58.863 | 
| 106495610 | GT-AG | 0 | 1.000000099473604e-05 | 787 | rna-XM_021538757.1 19905808 | 24 | 350336 | 351122 | Lonchura striata 40157 | ATC|GTGAGTAGTG...GCTACCTGATCT/TGCTACCTGATC...TCCAG|ACT | 2 | 1 | 66.364 | 
| 106495611 | GT-AG | 0 | 1.000000099473604e-05 | 281 | rna-XM_021538757.1 19905808 | 25 | 349825 | 350105 | Lonchura striata 40157 | AGA|GTGAGTACAG...CCACTCCTGACG/CCACTCCTGACG...CGCAG|CCA | 1 | 1 | 70.461 | 
| 106495612 | GT-AG | 0 | 1.000000099473604e-05 | 829 | rna-XM_021538757.1 19905808 | 26 | 348726 | 349554 | Lonchura striata 40157 | CAG|GTGAGCACCC...AAGGCCTGAGGG/CAAGGCCTGAGG...TGCAG|GTG | 1 | 1 | 75.272 | 
| 106495613 | GT-AG | 0 | 1.000000099473604e-05 | 865 | rna-XM_021538757.1 19905808 | 27 | 347703 | 348567 | Lonchura striata 40157 | CCG|GTAAGGACAG...TGTGGCTGAGCA/GTGTGGCTGAGC...ACCAG|GTG | 0 | 1 | 78.087 | 
| 106495614 | GT-AG | 0 | 1.000000099473604e-05 | 1232 | rna-XM_021538757.1 19905808 | 28 | 346327 | 347558 | Lonchura striata 40157 | CAG|GTGGGTCACT...CTATCTTCAAAC/TTCAAACTTACT...CCTAG|AAC | 0 | 1 | 80.652 | 
| 106495615 | GT-AG | 0 | 1.000000099473604e-05 | 511 | rna-XM_021538757.1 19905808 | 29 | 345673 | 346183 | Lonchura striata 40157 | CAG|GTAAGTGGGC...TTTGACTTTGTG/CTCCCAGTTACC...TGCAG|GTC | 2 | 1 | 83.2 | 
| 106495616 | GT-AG | 0 | 1.000000099473604e-05 | 630 | rna-XM_021538757.1 19905808 | 30 | 344821 | 345450 | Lonchura striata 40157 | GCA|GTGAGTGACC...AGAGCTGTGACA/AGAGCTGTGACA...CCCAG|TGT | 2 | 1 | 87.155 | 
| 106495617 | GT-AG | 0 | 1.000000099473604e-05 | 523 | rna-XM_021538757.1 19905808 | 31 | 344056 | 344578 | Lonchura striata 40157 | CAG|GTGGGTCTGG...TGTTCCTCTCCT/CTGTGGGAGACG...TCCAG|ATG | 1 | 1 | 91.466 | 
| 106495618 | GT-AG | 0 | 1.000000099473604e-05 | 381 | rna-XM_021538757.1 19905808 | 32 | 343520 | 343900 | Lonchura striata 40157 | CAG|GTAGGAGCAG...GCTGCCTTGGAG/TTGGAGCTGACT...TCCAG|CTG | 0 | 1 | 94.228 | 
| 106495619 | GT-AG | 0 | 1.000000099473604e-05 | 567 | rna-XM_021538757.1 19905808 | 33 | 342841 | 343407 | Lonchura striata 40157 | CAG|GTATGGTGAC...CTGTCCCCGCTC/CCGGGGCGGAGC...TGCAG|ACA | 1 | 1 | 96.223 | 
| 106505099 | GT-AG | 0 | 1.000000099473604e-05 | 1359 | rna-XM_021538757.1 19905808 | 1 | 375903 | 377261 | Lonchura striata 40157 | GCG|GTGAGCACCA...TTTTTCTTAGAA/CTTTTTCTTAGA...TTTAG|TTC | | 0 | 1.39 | 
| 106505100 | GT-AG | 0 | 1.000000099473604e-05 | 2000 | rna-XM_021538757.1 19905808 | 2 | 373756 | 375755 | Lonchura striata 40157 | CAG|GTGATTTTTA...AAAACCTGAATT/TGAGCTTTCAAT...TCCAG|ATC | | 0 | 4.009 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each intron belongs to a parent transcript and to a
-- genome identified by its NCBI taxonomy id.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique intron identifier (primary key, see below)
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences, e.g. 'GT-AG'
    "is_minor"          INTEGER,  -- flag: 1 = minor intron, 0 = not
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- position of the intron within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position in the genome
    "end"               INTEGER,  -- end position in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier of the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- flag: 1 = within the coding sequence, 0 = not (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Index on the transcript foreign key, for filters such as transcript_id = ?.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
-- Index on the genome foreign key (NCBI taxonomy identifier).
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
-- Index on intron phase (0, 1, 2 or NULL).
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
-- Index on the minor-intron flag (1 = minor, 0 = not).
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
-- Index on the terminal dinucleotide pair (e.g. 'GT-AG').
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
-- Index on the minor-intron probability score.
CREATE INDEX "idx_introns_score" ON "introns" ("score");
-- Index on the in-coding-sequence flag (1 = within CDS, 0 = not).
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");