introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
15 rows where transcript_id = 10378434
This data as json, CSV (advanced)
Suggested facets: dinucleotide_pair, score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 57022710 | GT-AG | 0 | 0.0011868697032791 | 4101 | rna-XM_025113679.1 10378434 | 1 | 7480960 | 7485060 | Cynara cardunculus 4265 | TAG\|GTAATCATTT...CACTTCTTAATT/AATTGCTTCACT...GACAG\|ACT | 1 | 1 | 3.352 | 
| 57022711 | GT-AG | 0 | 1.000000099473604e-05 | 329 | rna-XM_025113679.1 10378434 | 2 | 7485323 | 7485651 | Cynara cardunculus 4265 | GGG\|GTTAGTTTGT...TACTTTTTGCCA/TTTGGACTGATT...TGCAG\|TAA | 2 | 1 | 10.435 | 
| 57022712 | GT-AG | 0 | 1.000000099473604e-05 | 98 | rna-XM_025113679.1 10378434 | 3 | 7485750 | 7485847 | Cynara cardunculus 4265 | ATG\|GTTGGTATCG...TGATTCTTATCC/TTTCTTCTGATT...TATAG\|AGA | 1 | 1 | 13.085 | 
| 57022713 | GT-AG | 0 | 1.000000099473604e-05 | 1122 | rna-XM_025113679.1 10378434 | 4 | 7485892 | 7487013 | Cynara cardunculus 4265 | GAG\|GTAAATAAGT...ATGAGTTTATCT/CATGAGTTTATC...AGCAG\|GAA | 0 | 1 | 14.274 | 
| 57022714 | GT-AG | 0 | 0.031759729919883 | 198 | rna-XM_025113679.1 10378434 | 5 | 7487073 | 7487270 | Cynara cardunculus 4265 | AGA\|GTACGCTCTC...ACATCCTTCAAT/AAGGTTCTAACA...CTCAG\|TTT | 2 | 1 | 15.869 | 
| 57022715 | GT-AG | 0 | 1.000000099473604e-05 | 97 | rna-XM_025113679.1 10378434 | 6 | 7487380 | 7487476 | Cynara cardunculus 4265 | CAG\|GTCCATACAA...TGCTTCTTTTCT/TGTGGCCTCACA...ACCAG\|CAA | 0 | 1 | 18.816 | 
| 57022716 | GC-AG | 0 | 1.978068886942361e-05 | 96 | rna-XM_025113679.1 10378434 | 7 | 7487970 | 7488065 | Cynara cardunculus 4265 | AAG\|GCATGTTGAA...TTTCTCTTAATG/TGGATATTCATT...CGCAG\|GTA | 1 | 1 | 32.144 | 
| 57022717 | GT-AG | 0 | 1.000000099473604e-05 | 91 | rna-XM_025113679.1 10378434 | 8 | 7488393 | 7488483 | Cynara cardunculus 4265 | AAG\|GTTTGTCAAA...GTGTTCTCAATT/AAATGTCTGATT...TCCAG\|GGG | 1 | 1 | 40.984 | 
| 57022718 | GT-AG | 0 | 3.872015479801716e-05 | 144 | rna-XM_025113679.1 10378434 | 9 | 7488931 | 7489074 | Cynara cardunculus 4265 | TAG\|GTATGAGACT...TAGTTCTTAATG/TTAGTTCTTAAT...TGCAG\|TTG | 1 | 1 | 53.068 | 
| 57022719 | GT-AG | 0 | 0.0507695478395126 | 377 | rna-XM_025113679.1 10378434 | 10 | 7489217 | 7489593 | Cynara cardunculus 4265 | CGA\|GTATGTTCCA...TTTTTCTTTTCA/TCTGTTATCACT...AAAAG\|CAC | 2 | 1 | 56.907 | 
| 57022720 | GT-AG | 0 | 1.000000099473604e-05 | 689 | rna-XM_025113679.1 10378434 | 11 | 7489731 | 7490419 | Cynara cardunculus 4265 | CTG\|GTGAGTTGTT...ATTCTCTTGCTG/GCTGGACTAACA...TACAG\|GGG | 1 | 1 | 60.611 | 
| 57022721 | GT-AG | 0 | 0.0003127011712296 | 204 | rna-XM_025113679.1 10378434 | 12 | 7491496 | 7491699 | Cynara cardunculus 4265 | AAT\|GTAAGTTATT...TAATTCTTATTT/ATAATTCTTATT...TGCAG\|GAG | 0 | 1 | 89.7 | 
| 57022722 | GT-AG | 0 | 0.0002387040578416 | 767 | rna-XM_025113679.1 10378434 | 13 | 7491734 | 7492500 | Cynara cardunculus 4265 | CAG\|GTTTGCATCC...ATTTACTTACCG/AATTTACTTACC...TTCAG\|ATT | 1 | 1 | 90.619 | 
| 57022723 | GT-AG | 0 | 0.0009227063650564 | 2066 | rna-XM_025113679.1 10378434 | 14 | 7492619 | 7494684 | Cynara cardunculus 4265 | AAA\|GTATGTATAT...TTCTGCTTATAC/AGGGTACTGATT...GGCAG\|GGC | 2 | 1 | 93.809 | 
| 57022724 | GT-AG | 0 | 0.0151457407759411 | 711 | rna-XM_025113679.1 10378434 | 15 | 7494815 | 7495525 | Cynara cardunculus 4265 | CTG\|GTATGCTCAT...CCTCCATTAACA/CCTCCATTAACA...TACAG\|GTT | 0 | 1 | 97.324 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, keyed by "id" and linked to its parent
-- transcript and to the genome (by NCBI taxonomy id) it belongs to.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript; see foreign key below
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position in the genome; END is an SQL keyword, so keep it quoted
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier; see foreign key below
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1, or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length

    -- Kept as a table-level constraint, exactly as in the original definition.
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on introns, one statement per indexed column.

-- Foreign-key columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");

-- Remaining indexed attribute columns.
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");