introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; NULL for introns outside of the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
13 rows where transcript_id = 29402353
This data as json, CSV (advanced)
Suggested facets: score, phase, in_cds
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 163707257 | GT-AG | 0 | 1.000000099473604e-05 | 1140 | rna-XM_020562916.1 29402353 | 1 | 10877052 | 10878191 | Prunus persica 3760 | ATT|GTAAGGGCAT...TATTTCTGATCT/ATATTTCTGATC...GCAAG|GAT | 0 | 1 | 1.781 | 
| 163707258 | GT-AG | 0 | 1.000000099473604e-05 | 119 | rna-XM_020562916.1 29402353 | 2 | 10876860 | 10876978 | Prunus persica 3760 | TGG|GTAAGTGACG...TTGACTTTATTG/GGTATATTGACT...GTCAG|GGC | 1 | 1 | 2.953 | 
| 163707259 | GT-AG | 0 | 0.0047267112760132 | 109 | rna-XM_020562916.1 29402353 | 3 | 10876626 | 10876734 | Prunus persica 3760 | GAG|GTATATTGAA...TATATTTTAGTT/TTATATTTTAGT...TGCAG|GGT | 0 | 1 | 4.959 | 
| 163707260 | GT-AG | 0 | 1.000000099473604e-05 | 106 | rna-XM_020562916.1 29402353 | 4 | 10876127 | 10876232 | Prunus persica 3760 | CAG|GTAAGGTCAG...TTTGTCTTTTTT/GTTGCATTCATG...AACAG|GTT | 0 | 1 | 11.266 | 
| 163707261 | GT-AG | 0 | 0.0044613752269734 | 275 | rna-XM_020562916.1 29402353 | 5 | 10874581 | 10874855 | Prunus persica 3760 | GCT|GTAAGCTTCC...TGAGTATTGACA/TGAGTATTGACA...TGTAG|GCC | 2 | 1 | 31.664 | 
| 163707262 | GT-AG | 0 | 7.554359502655562e-05 | 108 | rna-XM_020562916.1 29402353 | 6 | 10874039 | 10874146 | Prunus persica 3760 | GAG|GTATGTAATT...ATTTATTTATTT/TATTTATTTATT...TGCAG|GTG | 1 | 1 | 38.629 | 
| 163707263 | GT-AG | 0 | 0.2522401424188724 | 95 | rna-XM_020562916.1 29402353 | 7 | 10871941 | 10872035 | Prunus persica 3760 | AAG|GTTTCTTCTT...GTTCTCTTAATC/GTTCTCTTAATC...TGTAG|GAC | 0 | 1 | 70.775 | 
| 163707264 | GT-AG | 0 | 4.063590506680229e-05 | 1594 | rna-XM_020562916.1 29402353 | 8 | 10870189 | 10871782 | Prunus persica 3760 | CGA|GTAAGTTAAA...AACCTTTTGAAT/TCTGTGCTGAAC...CACAG|ATT | 2 | 1 | 73.311 | 
| 163707265 | GT-AG | 0 | 1.000000099473604e-05 | 248 | rna-XM_020562916.1 29402353 | 9 | 10869780 | 10870027 | Prunus persica 3760 | CAG|GTAATGGAGC...AAACCCTTTACT/AAGCAACTCACA...TTTAG|GTG | 1 | 1 | 75.895 | 
| 163707266 | GT-AG | 0 | 0.0001478495178296 | 584 | rna-XM_020562916.1 29402353 | 10 | 10869038 | 10869621 | Prunus persica 3760 | TTT|GTAAGTTGAT...ATGGTTTTACCA/CATGGTTTTACC...TGCAG|ACA | 0 | 1 | 78.43 | 
| 163729423 | GT-AG | 0 | 1.000000099473604e-05 | 111 | rna-XM_020562916.1 29402353 | 11 | 10868110 | 10868220 | Prunus persica 3760 | CAG|GTACGTAATC...GATTTTTTATGT/GGATTTTTTATG...TGTAG|GTG | | 0 | 91.542 | 
| 163729424 | GT-AG | 0 | 1.000000099473604e-05 | 401 | rna-XM_020562916.1 29402353 | 12 | 10867597 | 10867997 | Prunus persica 3760 | CAT|GTGAGTTCAA...GCTGCTTTACAT/TGGTAACTCATA...TTCAG|TGC | | 0 | 93.34 | 
| 163729425 | GT-AG | 0 | 1.000000099473604e-05 | 298 | rna-XM_020562916.1 29402353 | 13 | 10867202 | 10867499 | Prunus persica 3760 | ATG|GTGGTGCTCT...GTTCTTTTATCA/TGTTCTTTTATC...AGCAG|GAT | | 0 | 94.896 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per annotated intron, linked to its parent transcript and source genome.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- primary key (declared below): unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron, e.g. 'GT-AG'
    "is_minor"          INTEGER,  -- flag: 1 = minor intron, 0 = not
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript; references transcripts(id)
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position in the genome; END is an SQL keyword, so keep it quoted
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier; references genomes(taxonomy_id)
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- flag: 1 = within the coding sequence, 0 = not (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column.
-- Foreign-key columns:
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
-- Classification and scoring columns:
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");