introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
14 rows where transcript_id = 16613737
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 88330709 | GT-AG | 0 | 1.000000099473604e-05 | 12752 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 1 | 39280 | 52031 | Grallaria varia 117165 | TGG|GTAAGTGCTA...TTTTTCTTTGTG/TCTTTGTGCATG...TGCAG|GTA | 1 | 1 | 3.622 | 
| 88330710 | GT-AG | 0 | 1.000000099473604e-05 | 1510 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 2 | 53098 | 54607 | Grallaria varia 117165 | AAG|GTGAGGTGGT...ATAGTCTAAACA/TTCTGGTTAATT...TTCAG|GAT | 2 | 1 | 39.05 | 
| 88330711 | GT-AG | 0 | 1.000000099473604e-05 | 12549 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 3 | 54989 | 67537 | Grallaria varia 117165 | AAG|GTAAAAGCAG...GTTATCTTATTT/ATTCTTTTCATC...CATAG|CAA | 2 | 1 | 51.712 | 
| 88330712 | GT-AG | 0 | 0.0023914993136298 | 104 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 4 | 67748 | 67851 | Grallaria varia 117165 | AAA|GTATGTGCTG...TAACCTTTATTT/CCTTTATTTATT...TATAG|CAA | 2 | 1 | 58.691 | 
| 88330713 | GT-AG | 0 | 1.000000099473604e-05 | 8919 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 5 | 67933 | 76851 | Grallaria varia 117165 | CAG|GTACAAGCCC...ATTACTTTAATT/CTTTTTTTTATT...TATAG|GAG | 2 | 1 | 61.383 | 
| 88330714 | GT-AG | 0 | 0.0374688093020425 | 2141 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 6 | 76965 | 79105 | Grallaria varia 117165 | AAG|GTAACTTTGT...CTGTTCTTAAAG/CTCATTTTCAGC...TGCAG|ATG | 1 | 1 | 65.138 | 
| 88330715 | GT-AG | 0 | 1.000000099473604e-05 | 3600 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 7 | 79165 | 82764 | Grallaria varia 117165 | CAT|GTGAGTACGC...GCTTCTCTGACA/GCTTCTCTGACA...TCCAG|AAC | 0 | 1 | 67.099 | 
| 88330716 | GT-AG | 0 | 1.000000099473604e-05 | 22750 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 8 | 82855 | 105604 | Grallaria varia 117165 | AAG|GTAAGGAATT...TCCATCTCATTT/TTCCATCTCATT...TGCAG|GCC | 0 | 1 | 70.09 | 
| 88330717 | GT-AG | 0 | 0.0001080068177589 | 7909 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 9 | 105649 | 113557 | Grallaria varia 117165 | AGT|GTAAGTATAC...TATGCTTTATTT/ACTTTGCTGATC...TTAAG|GGA | 2 | 1 | 71.552 | 
| 88330718 | GT-AG | 0 | 1.000000099473604e-05 | 2423 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 10 | 113752 | 116174 | Grallaria varia 117165 | AAA|GTGAGTATTT...TGGATCTGAGTT/TGGGTTTTCATT...TGCAG|CTC | 1 | 1 | 77.999 | 
| 88330719 | GT-AG | 0 | 1.000000099473604e-05 | 5856 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 11 | 116246 | 122101 | Grallaria varia 117165 | AAG|GTAGGGGAAA...CCACTGTTAACT/CCACTGTTAACT...TGCAG|GAT | 0 | 1 | 80.359 | 
| 88330720 | GT-AG | 0 | 1.000000099473604e-05 | 827 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 12 | 122260 | 123086 | Grallaria varia 117165 | CCA|GTAAGTGCTT...ACGTGCTTAATA/ACGTGCTTAATA...CCCAG|GAG | 2 | 1 | 85.61 | 
| 88330721 | GT-AG | 0 | 1.000000099473604e-05 | 3171 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 13 | 123232 | 126402 | Grallaria varia 117165 | CAG|GTGAGACCTT...GATATTTTAGAT/GATTCTGTCACT...TGAAG|GAT | 0 | 1 | 90.429 | 
| 88330722 | GT-AG | 0 | 0.0026938279902883 | 6279 | rna-gnl|WGS:VWZG|GRAVAR_R11349_mrna 16613737 | 14 | 126547 | 132825 | Grallaria varia 117165 | GAG|GTATTTATGG...TTCTTCCTGACT/TTTCTTCTCATT...CTCAG|AAA | 0 | 1 | 95.214 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, keyed by "id" and linked to its parent
-- transcript and to the genome (species) it belongs to.
CREATE TABLE "introns" (
    "id"                 INTEGER,  -- globally unique identifier for the intron
    "dinucleotide_pair"  TEXT,     -- terminal dinucleotide sequences, e.g. GT-AG
    "is_minor"           INTEGER,  -- 1 = minor intron, 0 = not minor
    "score"              REAL,     -- probability (0-100%) of the intron being minor
    "length"             INTEGER,  -- intron length in base pairs
    "transcript_id"      INTEGER,  -- parent transcript
    "ordinal_index"      INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"              INTEGER,  -- start position in the genome
    "end"                INTEGER,  -- end position in the genome
    "taxonomy_id"        INTEGER,  -- NCBI taxonomy identifier of the species
    "scored_motifs"      TEXT,     -- motifs scored for the intron
    "phase"              INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"             INTEGER,  -- 1 = within the coding sequence, 0 = not (e.g. UTR introns)
    "relative_position"  REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Secondary indexes on "introns": one single-column index per listed column.
CREATE INDEX "idx_introns_transcript_id"     ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id"       ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase"             ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor"          ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score"             ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds"            ON "introns" ("in_cds");