introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron within the coding sequence (0, 1, or 2; NULL for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
17 rows where transcript_id = 24215978
This data as json, CSV (advanced)
Suggested facets: dinucleotide_pair, score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 132129693 | GT-AG | 0 | 1.000000099473604e-05 | 997 | rna-XM_031638199.1 24215978 | 1 | 34429555 | 34430551 | Nymphaea colorata 210225 | TCG|GTTAAGTGAC...AATTTCCTGATA/TAATATCTAACT...TTCAG|GTT | 0 | 1 | 13.893 | 
| 132129694 | GT-AG | 0 | 1.000000099473604e-05 | 113 | rna-XM_031638199.1 24215978 | 2 | 34429294 | 34429406 | Nymphaea colorata 210225 | CTG|GTAAAGCTTC...TCTGTCTTGGTT/TTGGTTATCATC...TGCAG|TAG | 1 | 1 | 17.558 | 
| 132129695 | GT-AG | 0 | 1.000000099473604e-05 | 107 | rna-XM_031638199.1 24215978 | 3 | 34429108 | 34429214 | Nymphaea colorata 210225 | GAG|GTCATAAAGG...ATTTCTTTTTCA/TTCTTTTTCATC...GACAG|GGC | 2 | 1 | 19.515 | 
| 132129696 | GT-AG | 0 | 1.000000099473604e-05 | 87 | rna-XM_031638199.1 24215978 | 4 | 34428867 | 34428953 | Nymphaea colorata 210225 | GAG|GTGAAAGAAA...TTTGTCCTATTA/TAGGCATTTACA...TGCAG|ATG | 0 | 1 | 23.328 | 
| 132129697 | GT-AG | 0 | 0.0001982974578938 | 95 | rna-XM_031638199.1 24215978 | 5 | 34428562 | 34428656 | Nymphaea colorata 210225 | GTG|GTATGTAATC...TTATACTTACAT/GTTATACTTACA...GGAAG|GTG | 0 | 1 | 28.529 | 
| 132129698 | GT-AG | 0 | 0.0574047301984927 | 242 | rna-XM_031638199.1 24215978 | 6 | 34428074 | 34428315 | Nymphaea colorata 210225 | GAG|GTACTCTTTT...AATGTTTTAATA/AATGTTTTAATA...TGCAG|GTA | 0 | 1 | 34.621 | 
| 132129699 | GT-AG | 0 | 1.000000099473604e-05 | 82 | rna-XM_031638199.1 24215978 | 7 | 34427829 | 34427910 | Nymphaea colorata 210225 | TTG|GTTAGTACTT...TTGACTTTAATG/TAATGTTTCACA...CTTAG|GGG | 1 | 1 | 38.658 | 
| 132129700 | GT-AG | 0 | 1.000000099473604e-05 | 77 | rna-XM_031638199.1 24215978 | 8 | 34427491 | 34427567 | Nymphaea colorata 210225 | TAG|GTGGGAACTT...CTGTCATTGATT/TGGTTATTCACT...GTCAG|GAA | 1 | 1 | 45.121 | 
| 132129701 | GT-AG | 0 | 1.000000099473604e-05 | 81 | rna-XM_031638199.1 24215978 | 9 | 34427288 | 34427368 | Nymphaea colorata 210225 | AAG|GTTTGATAAA...TTTTTCTTACAA/GTTTTTCTTACA...TTCAG|CAT | 0 | 1 | 48.143 | 
| 132129702 | GT-AG | 0 | 8.752040537093878e-05 | 1055 | rna-XM_031638199.1 24215978 | 10 | 34426071 | 34427125 | Nymphaea colorata 210225 | CAG|GTATTATCAT...AACTTCTTTTTT/TTTTTTCCCATC...AACAG|TAT | 0 | 1 | 52.155 | 
| 132129703 | GT-AG | 0 | 1.000000099473604e-05 | 124 | rna-XM_031638199.1 24215978 | 11 | 34425745 | 34425868 | Nymphaea colorata 210225 | ATG|GTAGGAGAAA...TTCCTCTGAACG/TGTAGACTGACA...TCTAG|ATG | 1 | 1 | 57.157 | 
| 132129704 | GC-AG | 0 | 1.000000099473604e-05 | 93 | rna-XM_031638199.1 24215978 | 12 | 34425515 | 34425607 | Nymphaea colorata 210225 | AAG|GCGAGCATAG...AAAATTTTGATT/AAAATTTTGATT...TATAG|ACT | 0 | 1 | 60.55 | 
| 132129705 | GT-AG | 0 | 1.000000099473604e-05 | 114 | rna-XM_031638199.1 24215978 | 13 | 34425259 | 34425372 | Nymphaea colorata 210225 | CAG|GTAAAGCCAT...GGCCTTTTGATT/GATTTTCTCATA...GCTAG|TTG | 1 | 1 | 64.066 | 
| 132129706 | GT-AG | 0 | 0.000749860720617 | 571 | rna-XM_031638199.1 24215978 | 14 | 34424487 | 34425057 | Nymphaea colorata 210225 | CAG|GTTCCCCCAT...CTGCACTTAAAG/GTTGCTTTCAAA...TGCAG|TGG | 1 | 1 | 69.044 | 
| 132129707 | GT-AG | 0 | 1.000000099473604e-05 | 88 | rna-XM_031638199.1 24215978 | 15 | 34423909 | 34423996 | Nymphaea colorata 210225 | AAG|GTCAGATGCT...TATTTCTTGATT/CTTCTTTTCATC...TTCAG|TTG | 2 | 1 | 81.179 | 
| 132129708 | GT-AG | 0 | 6.194546553779725e-05 | 86 | rna-XM_031638199.1 24215978 | 16 | 34423606 | 34423691 | Nymphaea colorata 210225 | CAG|GTACTTGTTC...TCTGTTTTGAAG/TTGCTATTCAAT...TGAAG|GTT | 0 | 1 | 86.553 | 
| 132129709 | GT-AG | 0 | 1.000000099473604e-05 | 366 | rna-XM_031638199.1 24215978 | 17 | 34423150 | 34423515 | Nymphaea colorata 210225 | ATG|GTGCGTCATA...TTGTGTTTGACA/TTAATTCTGACT...TGCAG|GTT | 0 | 1 | 88.782 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each row points at its parent transcript and at the
-- genome (by NCBI taxonomy id) it was annotated in.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- unique identifier of the intron (primary key, see below)
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript, references transcripts(id)
    "ordinal_index"     INTEGER,  -- ordinal position of the intron within the transcript
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier, references genomes(taxonomy_id)
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if the intron lies within the coding sequence, 0 otherwise
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on introns: one for each of the two
-- foreign-key columns, followed by one for each of five other columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");