introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
17 rows where transcript_id = 10378473
This data as json, CSV (advanced)
Suggested facets: score, phase, in_cds
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 57023163 | GT-AG | 0 | 2.410917882605894e-05 | 1243 | rna-XM_025121868.1 10378473 | 2 | 43692217 | 43693459 | Cynara cardunculus 4265 | AAG|GTAATTTCGC...TTTCCCTTGCCG/CTTCCCCTGACG...TCCAG|CGA | 2 | 1 | 9.82 | 
| 57023164 | GT-AG | 0 | 0.0043846036931666 | 2168 | rna-XM_025121868.1 10378473 | 3 | 43689944 | 43692111 | Cynara cardunculus 4265 | CAT|GTATGGATTC...AAGGTCTTAATT/TCTTAATTTATT...TACAG|AGA | 2 | 1 | 12.925 | 
| 57023165 | GT-AG | 0 | 1.000000099473604e-05 | 127 | rna-XM_025121868.1 10378473 | 4 | 43689687 | 43689813 | Cynara cardunculus 4265 | AAG|GTAAAATAGA...CTGGCTTTGGCT/AGAATGCTCACT...TGCAG|GAC | 0 | 1 | 16.77 | 
| 57023166 | GT-AG | 0 | 1.000000099473604e-05 | 278 | rna-XM_025121868.1 10378473 | 5 | 43689371 | 43689648 | Cynara cardunculus 4265 | GAG|GTCCGTAATC...ATTATCTTATTA/CATTTATTCATA...TGCAG|CAA | 2 | 1 | 17.894 | 
| 57023167 | GT-AG | 0 | 0.0001504312802516 | 1259 | rna-XM_025121868.1 10378473 | 6 | 43688018 | 43689276 | Cynara cardunculus 4265 | GAG|GTATTGCTTG...CTATACTTAAAG/TAAAGTTTGACT...CTCAG|GAC | 0 | 1 | 20.674 | 
| 57023168 | GT-AG | 0 | 3.526902310654045e-05 | 589 | rna-XM_025121868.1 10378473 | 7 | 43687345 | 43687933 | Cynara cardunculus 4265 | CAG|GTCTTTTGAA...GTTCATTTAATA/TCTATGTTCATT...TCCAG|TTC | 0 | 1 | 23.159 | 
| 57023169 | GT-AG | 0 | 1.000000099473604e-05 | 73 | rna-XM_025121868.1 10378473 | 8 | 43685950 | 43686022 | Cynara cardunculus 4265 | AGT|GTGAGATTTC...TCTTCTTTAGTT/TAGTTGTTCATA...TACAG|GTG | 2 | 1 | 62.26 | 
| 57023170 | GT-AG | 0 | 0.0001031352490942 | 351 | rna-XM_025121868.1 10378473 | 9 | 43685467 | 43685817 | Cynara cardunculus 4265 | AAG|GTAATATTTT...TTTTTCTTGACC/TTTTTCTTGACC...TACAG|CAT | 2 | 1 | 66.164 | 
| 57023171 | GT-AG | 0 | 1.2747701720554483e-05 | 290 | rna-XM_025121868.1 10378473 | 10 | 43685104 | 43685393 | Cynara cardunculus 4265 | GTG|GTAATTTTAG...TAGCTATTGAAG/TTCTTGTTCACA...TCTAG|GTT | 0 | 1 | 68.323 | 
| 57023172 | GT-AG | 0 | 0.0042426265735843 | 233 | rna-XM_025121868.1 10378473 | 11 | 43684831 | 43685063 | Cynara cardunculus 4265 | AAG|GTACTCATGC...TATCTTTTGATT/TATCTTTTGATT...TGCAG|ATA | 1 | 1 | 69.506 | 
| 57023173 | GT-AG | 0 | 1.000000099473604e-05 | 925 | rna-XM_025121868.1 10378473 | 12 | 43683833 | 43684757 | Cynara cardunculus 4265 | AAG|GTCAGTCATT...TGGTTTTTAGTT/TTTTTGTTGATA...TGCAG|CGA | 2 | 1 | 71.665 | 
| 57023174 | GT-AG | 0 | 1.000000099473604e-05 | 550 | rna-XM_025121868.1 10378473 | 13 | 43683217 | 43683766 | Cynara cardunculus 4265 | ACG|GTAAGGATAT...TATATCTTGACA/TATATCTTGACA...TGTAG|TGA | 2 | 1 | 73.617 | 
| 57023175 | GT-AG | 0 | 0.3080620158550602 | 80 | rna-XM_025121868.1 10378473 | 14 | 43683059 | 43683138 | Cynara cardunculus 4265 | AAG|GTATCATATG...TTCGTTTTAACT/TTTTAACTCATA...TATAG|ATG | 2 | 1 | 75.924 | 
| 57023176 | GT-AG | 0 | 1.000000099473604e-05 | 186 | rna-XM_025121868.1 10378473 | 15 | 43682700 | 43682885 | Cynara cardunculus 4265 | CAG|GTGAGTTCCC...TATTTCGTAATT/GTTTGATTGACA...CTTAG|GCA | 1 | 1 | 81.041 | 
| 57023177 | GT-AG | 0 | 8.380334257345671e-05 | 374 | rna-XM_025121868.1 10378473 | 16 | 43682279 | 43682652 | Cynara cardunculus 4265 | CAG|GTCTGTTTCT...ATGAGTTTGATC/ATGAGTTTGATC...TTCAG|CTT | 0 | 1 | 82.431 | 
| 57023178 | GT-AG | 0 | 0.0008184674941544 | 78 | rna-XM_025121868.1 10378473 | 17 | 43681954 | 43682031 | Cynara cardunculus 4265 | TAG|GTTTGTTTCA...TTGTTTTTATTC/TTTGTTTTTATT...GGTAG|CTG | 1 | 1 | 89.737 | 
| 57033684 | GT-AG | 0 | 1.000000099473604e-05 | 238 | rna-XM_025121868.1 10378473 | 1 | 43693693 | 43693930 | Cynara cardunculus 4265 | TAG|GTACTTGTAT...GATTGCGTAATA/TTATATATGATT...TACAG|GCA |  | 0 | 3.194 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each row points at its parent transcript and at the
-- genome (by NCBI taxonomy id) it was annotated in.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for the intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) that the intron is minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier of the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; null for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Secondary indexes on "introns": each statement below builds one
-- single-column index, named idx_introns_<column>.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");