introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
25 rows where transcript_id = 15495844
This data as json, CSV (advanced)
Suggested facets: dinucleotide_pair, score, length, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 83763276 | GT-AG | 0 | 1.000000099473604e-05 | 83 | rna-XM_003516526.5 15495844 | 1 | 52406949 | 52407031 | Glycine max 3847 | AAG|GTCATTCTTC...TCCTTCTCAATT/ATCCTTCTCAAT...CGCAG|GTA | 0 | 1 | 5.019 | 
| 83763277 | GT-AG | 0 | 2.801496157187723e-05 | 142 | rna-XM_003516526.5 15495844 | 2 | 52406645 | 52406786 | Glycine max 3847 | AAG|GTACTATCAT...GATCTTTTAACG/CCTGTTTTCATG...GTTAG|GAA | 0 | 1 | 10.133 | 
| 83763278 | GT-AG | 0 | 4.4165423228889816e-05 | 84 | rna-XM_003516526.5 15495844 | 3 | 52406395 | 52406478 | Glycine max 3847 | CAG|GTTTTTACTC...ATGCCTTTGAAA/GTGATGCTAACA...TGCAG|CTG | 1 | 1 | 15.372 | 
| 83763279 | GT-AG | 0 | 1.63929033686092e-05 | 95 | rna-XM_003516526.5 15495844 | 4 | 52406183 | 52406277 | Glycine max 3847 | ATG|GTCTGTGCCT...CTTCTTTTGATA/CTTCTTTTGATA...TGAAG|GGA | 1 | 1 | 19.066 | 
| 83763280 | GT-AG | 0 | 1.000000099473604e-05 | 101 | rna-XM_003516526.5 15495844 | 5 | 52405951 | 52406051 | Glycine max 3847 | AAG|GTTTGATATA...CTTGTCTTCATT/CTTGTCTTCATT...TTTAG|GTT | 0 | 1 | 23.201 | 
| 83763281 | GT-AG | 0 | 0.0005337762891612 | 521 | rna-XM_003516526.5 15495844 | 6 | 52405279 | 52405799 | Glycine max 3847 | TTG|GTATGTGTAT...TATTTATTAATG/TAAGTATTTATT...TGCAG|CCA | 1 | 1 | 27.967 | 
| 83763282 | GT-AG | 0 | 1.000000099473604e-05 | 326 | rna-XM_003516526.5 15495844 | 7 | 52404885 | 52405210 | Glycine max 3847 | GAG|GTCCTGATCT...TATTTTTTATTC/TTATTTTTTATT...TGCAG|CAA | 0 | 1 | 30.114 | 
| 83763283 | GT-AG | 0 | 0.0021326153382737 | 98 | rna-XM_003516526.5 15495844 | 8 | 52404688 | 52404785 | Glycine max 3847 | CAG|GTACTCATGG...CTCATTTTGATT/TATATATTTATT...TTCAG|CTT | 0 | 1 | 33.239 | 
| 83763284 | GT-AG | 0 | 1.000000099473604e-05 | 1294 | rna-XM_003516526.5 15495844 | 9 | 52403278 | 52404571 | Glycine max 3847 | GAG|GTAATGCTTC...TTTATATTATCT/TATTATCTGATG...TATAG|AAT | 2 | 1 | 36.9 | 
| 83763285 | GT-AG | 0 | 0.0036164990457647 | 94 | rna-XM_003516526.5 15495844 | 10 | 52403009 | 52403102 | Glycine max 3847 | GAT|GTATGATTTT...TGTTTCTAATTG/CTGTTTCTAATT...TTCAG|GGC | 0 | 1 | 42.424 | 
| 83763286 | GT-AG | 0 | 0.0099217268280659 | 90 | rna-XM_003516526.5 15495844 | 11 | 52402808 | 52402897 | Glycine max 3847 | GAG|GTATATTCTA...TTACCCATGATT/ATGATTTTCACT...AGCAG|GCT | 0 | 1 | 45.928 | 
| 83763287 | GT-AG | 0 | 1.000000099473604e-05 | 132 | rna-XM_003516526.5 15495844 | 12 | 52402597 | 52402728 | Glycine max 3847 | CAG|GTAAGGCATA...AGTATCTTGATG/AGTATCTTGATG...TCCAG|TAT | 1 | 1 | 48.422 | 
| 83763288 | GT-AG | 0 | 0.0003116644360428 | 95 | rna-XM_003516526.5 15495844 | 13 | 52402358 | 52402452 | Glycine max 3847 | GAG|GTAACAATCT...CTTATCTTATTA/ATCTTATTAACT...TACAG|ATC | 1 | 1 | 52.967 | 
| 83763289 | GT-AG | 0 | 0.0046644755885139 | 248 | rna-XM_003516526.5 15495844 | 14 | 52401996 | 52402243 | Glycine max 3847 | CTG|GTATTTTACC...CTCTGCTTATTG/CTTATTGTCATT...TACAG|CTT | 1 | 1 | 56.566 | 
| 83763290 | GT-AG | 0 | 4.110822486980553e-05 | 70 | rna-XM_003516526.5 15495844 | 15 | 52401804 | 52401873 | Glycine max 3847 | CAG|GTATGGCTTC...GTGTTTTTACAG/GGTGTTTTTACA...TACAG|CTG | 0 | 1 | 60.417 | 
| 83763291 | GT-AG | 0 | 1.000000099473604e-05 | 82 | rna-XM_003516526.5 15495844 | 16 | 52401639 | 52401720 | Glycine max 3847 | GAG|GTAGGGGTAT...AGGATCTTATTC/TTCTTTTTCAAT...GGCAG|TCT | 2 | 1 | 63.037 | 
| 83763292 | GT-AG | 0 | 0.0053955629974608 | 95 | rna-XM_003516526.5 15495844 | 17 | 52401419 | 52401513 | Glycine max 3847 | AAA|GTATGTACTT...ACCATTTTAACA/ATTTCACTCATC...TGCAG|TTG | 1 | 1 | 66.982 | 
| 83763293 | GT-AG | 0 | 1.962093529605792e-05 | 78 | rna-XM_003516526.5 15495844 | 18 | 52401220 | 52401297 | Glycine max 3847 | TAG|GTAAATATTT...GACCTTTTATAT/CAATTTGTAAAT...TCTAG|ACT | 2 | 1 | 70.802 | 
| 83763294 | GT-AG | 0 | 1.000000099473604e-05 | 696 | rna-XM_003516526.5 15495844 | 19 | 52400386 | 52401081 | Glycine max 3847 | GAG|GTGAGTTTCC...GTCTTCTTAAAA/ATTGATTTCATT...GACAG|GTT | 2 | 1 | 75.158 | 
| 83763295 | GT-AG | 0 | 3.939484944784615e-05 | 87 | rna-XM_003516526.5 15495844 | 20 | 52400202 | 52400288 | Glycine max 3847 | AAT|GTAAGTTGTG...TTTTGTTTGATT/TTTTGTTTGATT...TTCAG|GAC | 0 | 1 | 78.22 | 
| 83763296 | GT-AG | 0 | 1.000000099473604e-05 | 421 | rna-XM_003516526.5 15495844 | 21 | 52399655 | 52400075 | Glycine max 3847 | ATG|GTTAGTTGCC...GACTTGTTAATT/TGATTATTTATC...ACCAG|GAA | 0 | 1 | 82.197 | 
| 83763297 | GT-AG | 0 | 1.000000099473604e-05 | 101 | rna-XM_003516526.5 15495844 | 22 | 52399461 | 52399561 | Glycine max 3847 | GAG|GTGAGTGGAG...TATCTTTTGAGA/TATCTTTTGAGA...TGCAG|TGC | 0 | 1 | 85.133 | 
| 83763298 | GT-AG | 0 | 0.0027085736260404 | 368 | rna-XM_003516526.5 15495844 | 23 | 52398987 | 52399354 | Glycine max 3847 | ACG|GTATAATTAG...TTATGCTTAATT/CATATTCTCATT...GGCAG|GAA | 1 | 1 | 88.479 | 
| 83763299 | GC-AG | 0 | 1.000000099473604e-05 | 99 | rna-XM_003516526.5 15495844 | 24 | 52398745 | 52398843 | Glycine max 3847 | AAG|GCACGTACAG...TATCACTTATCA/TCTTTGCTAATT...TGCAG|CAA | 0 | 1 | 92.992 | 
| 83763300 | GT-AG | 0 | 3.6428773645433446e-05 | 113 | rna-XM_003516526.5 15495844 | 25 | 52398542 | 52398654 | Glycine max 3847 | AAG|GTATAAAATT...TTTTTCTTTCTT/GATCTGCTGATC...AAAAG|AAG | 0 | 1 | 95.833 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, linked to its parent transcript and to the
-- genome (by NCBI taxonomy identifier) it was annotated in.
CREATE TABLE "introns" (
    -- Globally unique identifier for each intron.
    "id" INTEGER,
    -- Terminal dinucleotide sequences of the intron (e.g. GT-AG, GC-AG).
    "dinucleotide_pair" TEXT,
    -- 1 if the intron is a minor intron, 0 otherwise.
    "is_minor" INTEGER,
    -- Probability (0-100%) of the intron being minor.
    "score" REAL,
    -- Length of the intron in base pairs.
    "length" INTEGER,
    -- Parent transcript; references transcripts(id).
    "transcript_id" INTEGER,
    -- Ordinal position of the intron within the transcript (3 = third intron).
    "ordinal_index" INTEGER,
    -- Start position of the intron in the genome.
    "start" INTEGER,
    -- End position of the intron in the genome.
    "end" INTEGER,
    -- NCBI taxonomy identifier for the species; references genomes(taxonomy_id).
    "taxonomy_id" INTEGER,
    -- Motifs scored for the intron.
    "scored_motifs" TEXT,
    -- Phase within the coding sequence (0, 1, or 2); null outside the coding sequence.
    "phase" INTEGER,
    -- 1 if the intron lies within the coding sequence, 0 otherwise (e.g. UTR introns).
    "in_cds" INTEGER,
    -- Relative position within the transcript, as a percentage of coding length.
    "relative_position" REAL,
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Secondary single-column indexes on introns.

-- Index on the parent-transcript foreign key column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");

-- Index on the taxonomy foreign key column.
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");

-- Index on the intron phase column.
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");

-- Index on the minor-intron flag column.
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");

-- Index on the terminal dinucleotide pair column.
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");

-- Index on the score column.
CREATE INDEX "idx_introns_score" ON "introns" ("score");

-- Index on the in-coding-sequence flag column.
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");