introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
25 rows where transcript_id = 32739502
This data as json, CSV (advanced)
Suggested facets: score, length, phase, in_cds
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 183117105 | GT-AG | 0 | 1.000000099473604e-05 | 2048 | rna-XM_011085037.2 32739502 | 3 | 13303153 | 13305200 | Sesamum indicum 4182 | CAG|GTTAATTTAT...TTTACTTTATTT/CTTTATTTTACA...TGTAG|GTG | 0 | 1 | 31.601 | 
| 183117106 | GT-AG | 0 | 1.000000099473604e-05 | 206 | rna-XM_011085037.2 32739502 | 4 | 13302737 | 13302942 | Sesamum indicum 4182 | CCG|GTGAGCAATA...TTTCTCTTATTT/TTTTCTCTTATT...GCAAG|CCT | 0 | 1 | 37.564 | 
| 183117107 | GT-AG | 0 | 1.000000099473604e-05 | 179 | rna-XM_011085037.2 32739502 | 5 | 13302483 | 13302661 | Sesamum indicum 4182 | CAG|GTTAAGTATC...AGGTTCTAATTG/GAGGTTCTAATT...ATTAG|ATT | 0 | 1 | 39.693 | 
| 183117108 | GT-AG | 0 | 1.000000099473604e-05 | 299 | rna-XM_011085037.2 32739502 | 6 | 13302085 | 13302383 | Sesamum indicum 4182 | CAT|GTAATGTGAA...GCTGCTTTAGTG/AATTTCGTAATT...GGTAG|GTT | 0 | 1 | 42.504 | 
| 183117109 | GT-AG | 0 | 1.000000099473604e-05 | 440 | rna-XM_011085037.2 32739502 | 7 | 13301533 | 13301972 | Sesamum indicum 4182 | GTG|GTAAGAACAA...TTGTCCTTTATA/TTGTCCTTTATA...TGCAG|GAT | 1 | 1 | 45.684 | 
| 183117110 | GT-AG | 0 | 1.000000099473604e-05 | 2330 | rna-XM_011085037.2 32739502 | 8 | 13299075 | 13301404 | Sesamum indicum 4182 | ATG|GTTAGTGCTA...TCATTCTTACAC/GTACTTTTCATT...TTCAG|GTC | 0 | 1 | 49.319 | 
| 183117111 | GT-AG | 0 | 1.000000099473604e-05 | 367 | rna-XM_011085037.2 32739502 | 9 | 13298588 | 13298954 | Sesamum indicum 4182 | CCT|GTGAGTTCAT...TTACGGTTGATG/TACTGACTGATC...TGCAG|GAG | 0 | 1 | 52.726 | 
| 183117112 | GT-AG | 0 | 1.000000099473604e-05 | 272 | rna-XM_011085037.2 32739502 | 10 | 13298235 | 13298506 | Sesamum indicum 4182 | CAG|GTTGGGGAGG...ATGTTCTTGTTC/CAGACTCTAATG...TTCAG|CCA | 0 | 1 | 55.026 | 
| 183117113 | GT-AG | 0 | 1.000000099473604e-05 | 239 | rna-XM_011085037.2 32739502 | 11 | 13297918 | 13298156 | Sesamum indicum 4182 | GAG|GTTGGTTAAT...CATATGTTAAAT/AATATTTTCAAA...TGCAG|TGC | 0 | 1 | 57.24 | 
| 183117114 | GT-AG | 0 | 1.000000099473604e-05 | 447 | rna-XM_011085037.2 32739502 | 12 | 13297378 | 13297824 | Sesamum indicum 4182 | AAG|GTATGAGCAT...CATGTCTCAGTA/TATAGGCTCACT...TTTAG|GCT | 0 | 1 | 59.881 | 
| 183117115 | GT-AG | 0 | 0.0005721643524237 | 215 | rna-XM_011085037.2 32739502 | 13 | 13297108 | 13297322 | Sesamum indicum 4182 | CTG|GTAAACTGAC...CTTGTCTTGATA/TAGAATTTTACT...TGCAG|TAT | 1 | 1 | 61.442 | 
| 183117116 | GT-AG | 0 | 1.000000099473604e-05 | 936 | rna-XM_011085037.2 32739502 | 14 | 13296095 | 13297030 | Sesamum indicum 4182 | AAG|GTATGAACAC...GATCTATTAATT/GATCTATTAATT...TGCAG|GAG | 0 | 1 | 63.629 | 
| 183117117 | GT-AG | 0 | 0.00161446856709 | 122 | rna-XM_011085037.2 32739502 | 15 | 13295901 | 13296022 | Sesamum indicum 4182 | CAG|GTAACATTAA...TATTTCTTATCG/TTATTTCTTATC...CACAG|GTC | 0 | 1 | 65.673 | 
| 183117118 | GT-AG | 0 | 1.000000099473604e-05 | 118 | rna-XM_011085037.2 32739502 | 16 | 13295699 | 13295816 | Sesamum indicum 4182 | CAG|GTAATTAAGA...TTATTTTTAAGT/TTATTTTTAAGT...TCCAG|GTG | 0 | 1 | 68.058 | 
| 183117119 | GT-AG | 0 | 1.000000099473604e-05 | 114 | rna-XM_011085037.2 32739502 | 17 | 13295465 | 13295578 | Sesamum indicum 4182 | CAG|GTTAGCTTCT...TATGTGTTCTTC/TAGGGTATTATG...AATAG|GGT | 0 | 1 | 71.465 | 
| 183117120 | GT-AG | 0 | 0.0391034024059908 | 1015 | rna-XM_011085037.2 32739502 | 18 | 13294381 | 13295395 | Sesamum indicum 4182 | GCA|GTATGTCTCT...TCATCTTCAATT/TCCGTACTCACT...CCCAG|ATT | 0 | 1 | 73.424 | 
| 183117121 | GT-AG | 0 | 1.737259651516825e-05 | 165 | rna-XM_011085037.2 32739502 | 19 | 13294138 | 13294302 | Sesamum indicum 4182 | CAG|GTATAGCGTC...TCACCTGTGATT/TCGTTGGTCATC...TTTAG|TGT | 0 | 1 | 75.639 | 
| 183117122 | GT-AG | 0 | 0.0008945176688041 | 296 | rna-XM_011085037.2 32739502 | 20 | 13293703 | 13293998 | Sesamum indicum 4182 | AAG|GTACTTTGCC...CCTTCTTTAGCT/ATTTTTCTCATC...TGCAG|TGG | 1 | 1 | 79.585 | 
| 183117123 | GT-AG | 0 | 0.0055164633978622 | 824 | rna-XM_011085037.2 32739502 | 21 | 13292714 | 13293537 | Sesamum indicum 4182 | TTG|GTACATTCTA...TCATTTTTAGTT/TAGTTTCTAACA...TTAAG|CTT | 1 | 1 | 84.27 | 
| 183117124 | GT-AG | 0 | 1.000000099473604e-05 | 79 | rna-XM_011085037.2 32739502 | 22 | 13292489 | 13292567 | Sesamum indicum 4182 | AAG|GTAGGGAGTT...TTGGTTTTAACT/TTGGTTTTAACT...GTCAG|GAG | 0 | 1 | 88.416 | 
| 183117125 | GT-AG | 0 | 0.0383042843251151 | 419 | rna-XM_011085037.2 32739502 | 23 | 13291890 | 13292308 | Sesamum indicum 4182 | CAG|GTATTCTTTC...ATTTGTTCAATT/AATTTGTTCAAT...ATCAG|TTT | 0 | 1 | 93.526 | 
| 183117126 | GT-AG | 0 | 2.4041829056730835e-05 | 112 | rna-XM_011085037.2 32739502 | 24 | 13291689 | 13291800 | Sesamum indicum 4182 | ACG|GTACGAATAT...TTTCTCTTATTC/CACTTTCTCACT...TGCAG|CTT | 2 | 1 | 96.053 | 
| 183117127 | GT-AG | 0 | 1.000000099473604e-05 | 152 | rna-XM_011085037.2 32739502 | 25 | 13291505 | 13291656 | Sesamum indicum 4182 | CAG|GTTAGTGTAT...ATTTTCTTTCTT/TTCTCTTTCAAG...CACAG|GGA | 1 | 1 | 96.962 | 
| 183125175 | GT-AG | 0 | 1.000000099473604e-05 | 116 | rna-XM_011085037.2 32739502 | 1 | 13306318 | 13306433 | Sesamum indicum 4182 | GAG|GTAAGTTCAA...GTCTCTTTGTTT/TGGATCCAAATT...GTCAG|ATC |  | 0 | 6.104 | 
| 183125176 | GT-AG | 0 | 8.627522168232467e-05 | 116 | rna-XM_011085037.2 32739502 | 2 | 13306135 | 13306250 | Sesamum indicum 4182 | CAG|GTTCCAAATA...TGCGTCTTGATT/GGTTTTTTTATA...TGTAG|ATT |  | 0 | 8.007 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, linked to its parent transcript and to the
-- genome (species) it was annotated in.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for the intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences, e.g. GT-AG
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on introns: the two foreign-key columns
-- first, then the columns used for filtering (phase, is_minor,
-- dinucleotide_pair, score, in_cds).
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");