introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
13 rows where transcript_id = 2637809
This data as json, CSV (advanced)
Suggested facets: dinucleotide_pair, score, length, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 14302996 | GT-AG | 0 | 0.0361333447545425 | 311 | Araha.0038s0003.1.v1.1 2637809 | 1 | 10934 | 11244 | Arabidopsis halleri 81970 | ATG\|GTATGTTCTT...TGATCTTTGATG/AGTTTGCTGATC...TACAG\|TGT | 1 | 1 | 3.293 | 
| 14302997 | GT-AG | 0 | 1.000000099473604e-05 | 98 | Araha.0038s0003.1.v1.1 2637809 | 2 | 11946 | 12043 | Arabidopsis halleri 81970 | CAG\|GTGATACCAA...ATAGTCCTAACT/ATAGTCCTAACT...TGCAG\|GCA | 0 | 1 | 34.912 | 
| 14302998 | GT-AG | 0 | 1.284995363146566e-05 | 348 | Araha.0038s0003.1.v1.1 2637809 | 3 | 12266 | 12613 | Arabidopsis halleri 81970 | GAG\|GTGACTATTT...ATTGTCTTTCCA/AAAGGAGTAACA...TTCAG\|GTT | 0 | 1 | 44.926 | 
| 14302999 | GT-AG | 0 | 0.030543243011491 | 136 | Araha.0038s0003.1.v1.1 2637809 | 5 | 14573 | 14708 | Arabidopsis halleri 81970 | AAG\|GTATTTTTAT...GTTTTCTTACTT/GGTTTTCTTACT...TGTAG\|GGC | 0 | 1 | 63.058 | 
| 14303000 | GT-AG | 0 | 1.000000099473604e-05 | 334 | Araha.0038s0003.1.v1.1 2637809 | 6 | 14751 | 15084 | Arabidopsis halleri 81970 | CAG\|GTTAGTCGAG...TTTATTTTATTT/TTTTATTTTATT...GATAG\|TTC | 0 | 1 | 64.953 | 
| 14303001 | GT-AG | 0 | 1.000000099473604e-05 | 93 | Araha.0038s0003.1.v1.1 2637809 | 7 | 15166 | 15258 | Arabidopsis halleri 81970 | CAG\|GTAGGAGAAT...TGGATCTTATAT/TAGTTTCTAATA...TTCAG\|GTT | 0 | 1 | 68.606 | 
| 14303002 | GC-AG | 0 | 1.000000099473604e-05 | 93 | Araha.0038s0003.1.v1.1 2637809 | 8 | 15310 | 15402 | Arabidopsis halleri 81970 | GAG\|GCAAGTCGAT...TGATTTTCAATT/TCAATTCTGACT...TCTAG\|GTT | 0 | 1 | 70.907 | 
| 14303003 | GT-AG | 0 | 1.000000099473604e-05 | 105 | Araha.0038s0003.1.v1.1 2637809 | 9 | 15485 | 15589 | Arabidopsis halleri 81970 | GGG\|GTGAGCATAT...GTTTTTTTATAT/TGTTTTTTTATA...GACAG\|GCT | 1 | 1 | 74.605 | 
| 14303004 | GT-AG | 0 | 1.000000099473604e-05 | 169 | Araha.0038s0003.1.v1.1 2637809 | 10 | 15685 | 15853 | Arabidopsis halleri 81970 | AAG\|GTATGAGATA...GGTTTCTTCTCA/TTTCTTCTCACA...TTCAG\|GTG | 0 | 1 | 78.89 | 
| 14303005 | GT-AG | 0 | 0.1621442629886691 | 97 | Araha.0038s0003.1.v1.1 2637809 | 11 | 15926 | 16022 | Arabidopsis halleri 81970 | AAG\|GTACCTTTTT...GTGCCTTTGGTG/TTGGTGATAATC...GATAG\|ATT | 0 | 1 | 82.138 | 
| 14303006 | GT-AG | 0 | 1.1569877318119894e-05 | 90 | Araha.0038s0003.1.v1.1 2637809 | 12 | 16140 | 16229 | Arabidopsis halleri 81970 | ATG\|GTAAGCTAAA...ATCTGCTTACAC/TCGTGTTTCATC...TGCAG\|AAC | 0 | 1 | 87.415 | 
| 14303007 | GT-AG | 0 | 1.000000099473604e-05 | 120 | Araha.0038s0003.1.v1.1 2637809 | 13 | 16299 | 16418 | Arabidopsis halleri 81970 | GTG\|GTAAGAATTC...GATTCTTTGGCG/TGTTTTCTCATG...ATTAG\|GGT | 0 | 1 | 90.528 | 
| 14303008 | GT-AG | 0 | 0.1037237073945271 | 121 | Araha.0038s0003.1.v1.1 2637809 | 14 | 16486 | 16606 | Arabidopsis halleri 81970 | AAG\|GTTTCTTCTC...CTGTCCCTGACC/TTGCGTTTGATT...TGCAG\|TTG | 1 | 1 | 93.55 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron; each row points at its parent transcript and at the
-- genome (by NCBI taxonomy identifier) it was annotated in.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- unique identifier for the intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 = minor intron, 0 = not
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position of the intron within the transcript
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 = within the coding sequence, 0 = not
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on introns, one per column below:
-- the two foreign-key columns first, then the classification/score columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");