introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
20 rows where transcript_id = 32739457
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 183116428 | GT-AG | 0 | 1.21729201215511e-05 | 102 | rna-XM_020696274.1 32739457 | 1 | 9126878 | 9126979 | Sesamum indicum 4182 | GGC|GTGCGTATAA...ATTTCCTTTGTT/TTATGATTCATT...GGCAG|AGG | 0 | 1 | 3.442 | 
| 183116429 | GT-AG | 0 | 4.652449465268437e-05 | 1048 | rna-XM_020696274.1 32739457 | 2 | 9127024 | 9128071 | Sesamum indicum 4182 | CCC|GTAAGTTATA...ATTCTTCTGATA/ATTCTTCTGATA...TACAG|GAA | 2 | 1 | 4.343 | 
| 183116430 | GT-AG | 0 | 0.0004455983049459 | 105 | rna-XM_020696274.1 32739457 | 3 | 9128172 | 9128276 | Sesamum indicum 4182 | CCT|GTAAGTTTTT...GAATTGTTGATT/GAATTGTTGATT...TACAG|GAC | 0 | 1 | 6.392 | 
| 183116431 | GT-AG | 0 | 1.000000099473604e-05 | 712 | rna-XM_020696274.1 32739457 | 4 | 9129258 | 9129969 | Sesamum indicum 4182 | GAG|GTAATGTCTT...ACAGTTTTAATT/GCTTTATTCATT...GGTAG|GAG | 0 | 1 | 26.49 | 
| 183116432 | GT-AG | 0 | 1.000000099473604e-05 | 952 | rna-XM_020696274.1 32739457 | 5 | 9130205 | 9131156 | Sesamum indicum 4182 | CAG|GTAAGAATTC...AAATTCTTAACC/TTATTATTTACT...TGCAG|AAA | 1 | 1 | 31.305 | 
| 183116433 | GT-AG | 0 | 1.000000099473604e-05 | 234 | rna-XM_020696274.1 32739457 | 6 | 9131375 | 9131608 | Sesamum indicum 4182 | AAG|GTAGAGTCTC...TTCATTTTGACT/GACTTTTTCATT...GGTAG|GTG | 0 | 1 | 35.771 | 
| 183116434 | GT-AG | 0 | 5.414007053932296e-05 | 591 | rna-XM_020696274.1 32739457 | 7 | 9131817 | 9132407 | Sesamum indicum 4182 | AAG|GTACTTACTC...CTTTTCTGATCT/GCTTTTCTGATC...CCAAG|TAT | 1 | 1 | 40.033 | 
| 183116435 | GT-AG | 0 | 0.0001056809103515 | 271 | rna-XM_020696274.1 32739457 | 8 | 9132695 | 9132965 | Sesamum indicum 4182 | CAG|GTATGACTGC...CTTATTTTGACT/CTTATTTTGACT...AACAG|GTT | 0 | 1 | 45.913 | 
| 183116436 | GT-AG | 0 | 0.0050574784159339 | 3102 | rna-XM_020696274.1 32739457 | 9 | 9133050 | 9136151 | Sesamum indicum 4182 | GCG|GTATTTGTTT...TGTTTCCTATTG/TTTGTTTTCAAA...TGCAG|CTA | 0 | 1 | 47.634 | 
| 183116437 | GT-AG | 0 | 1.000000099473604e-05 | 831 | rna-XM_020696274.1 32739457 | 10 | 9136247 | 9137077 | Sesamum indicum 4182 | CAG|GTGAAAACTC...AAATTCTTTTCT/TCTATGCTTACG...TCTAG|GTA | 2 | 1 | 49.58 | 
| 183116438 | GT-AG | 0 | 1.000000099473604e-05 | 79 | rna-XM_020696274.1 32739457 | 11 | 9137241 | 9137319 | Sesamum indicum 4182 | AAG|GTTGAGGATG...ATTGCTTTGGCG/TTATTTTGCACT...TTCAG|GGT | 0 | 1 | 52.919 | 
| 183116439 | GT-AG | 0 | 1.000000099473604e-05 | 1050 | rna-XM_020696274.1 32739457 | 12 | 9137566 | 9138615 | Sesamum indicum 4182 | CAG|GTACTTGATA...AAATTTATGACA/GTTTAGTTGATA...GGCAG|GCA | 0 | 1 | 57.959 | 
| 183116440 | GT-AG | 0 | 0.0002310863812038 | 150 | rna-XM_020696274.1 32739457 | 13 | 9138787 | 9138936 | Sesamum indicum 4182 | CTT|GTAAGTTTCA...CTCTTCTCATCT/TCTCTTCTCATC...TACAG|GGT | 0 | 1 | 61.463 | 
| 183116441 | GT-AG | 0 | 8.033063130604661e-05 | 117 | rna-XM_020696274.1 32739457 | 14 | 9139051 | 9139167 | Sesamum indicum 4182 | CAG|GTGTATTCTC...TGCTTTTTATTG/TTTTTATTGATG...ATCAG|GAT | 0 | 1 | 63.798 | 
| 183116442 | GT-AG | 0 | 0.0311989998281456 | 1284 | rna-XM_020696274.1 32739457 | 15 | 9139294 | 9140577 | Sesamum indicum 4182 | GTG|GTATGTTTGT...TTTTCCTTTTCA/TAGTTATTTATT...GATAG|ATA | 0 | 1 | 66.38 | 
| 183116443 | GT-AG | 0 | 1.1656831504406192e-05 | 1330 | rna-XM_020696274.1 32739457 | 16 | 9140727 | 9142056 | Sesamum indicum 4182 | TAG|GTAATATATT...TTTATCTTGACA/TTTATCTTGACA...ACCAG|GTA | 2 | 1 | 69.432 | 
| 183116444 | GT-AG | 0 | 1.000000099473604e-05 | 84 | rna-XM_020696274.1 32739457 | 17 | 9142298 | 9142381 | Sesamum indicum 4182 | AAG|GTGCTGATGA...TCTTTCTTATTA/ATCTTTCTTATT...CTCAG|ATT | 0 | 1 | 74.37 | 
| 183116445 | GT-AG | 0 | 0.0705495475806634 | 393 | rna-XM_020696274.1 32739457 | 18 | 9143145 | 9143537 | Sesamum indicum 4182 | TTG|GTATGCTCCT...CAATCCTTGTCC/CTTGAGCTCAAT...TACAG|GTA | 1 | 1 | 90.002 | 
| 183116446 | GT-AG | 0 | 5.089020400293939e-05 | 1084 | rna-XM_020696274.1 32739457 | 19 | 9143720 | 9144803 | Sesamum indicum 4182 | AAG|GTATGGATGT...TATATTTTGAAA/TGATTTCTAATA...GCCAG|ATA | 0 | 1 | 93.731 | 
| 183116447 | GT-AG | 0 | 0.0039766058865183 | 86 | rna-XM_020696274.1 32739457 | 20 | 9144908 | 9144993 | Sesamum indicum 4182 | CCT|GTAAGCTTAT...CTACCATTAGCT/TAATTACTAATT...TTCAG|GCA | 2 | 1 | 95.862 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each intron belongs to a parent transcript and to a
-- genome identified by its NCBI taxonomy id.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron (e.g. GT-AG)
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- length of the intron in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1, or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on introns, one per indexed column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");