introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
16 rows where transcript_id = 19905860
This data as json, CSV (advanced)
Suggested facets: score, phase, in_cds
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 106496981 | GT-AG | 0 | 1.000000099473604e-05 | 1044 | rna-XM_021525711.2 19905860 | 2 | 45577376 | 45578419 | Lonchura striata 40157 | CAG|GTAATAAATA...ATTTATTTATTT/TATTTATTTATT...AAAAG|CTG | 0 | 1 | 10.343 | 
| 106496982 | GT-AG | 0 | 1.000000099473604e-05 | 772 | rna-XM_021525711.2 19905860 | 3 | 45576480 | 45577251 | Lonchura striata 40157 | TTG|GTAAGTGGAG...TATTCCTTCTCC/AGTTTTGTGATA...TCAAG|GTT | 1 | 1 | 13.426 | 
| 106496983 | GT-AG | 0 | 1.000000099473604e-05 | 650 | rna-XM_021525711.2 19905860 | 4 | 45575599 | 45576248 | Lonchura striata 40157 | AAG|GTCTGTGTGT...GATTTGTTGTTG/TGAAAACTGATT...CACAG|GAA | 1 | 1 | 19.17 | 
| 106496984 | GT-AG | 0 | 1.000000099473604e-05 | 1132 | rna-XM_021525711.2 19905860 | 5 | 45574322 | 45575453 | Lonchura striata 40157 | AAG|GTAATTCAGA...GTTATTTTATAC/AGTTATTTTATA...TCTAG|ACC | 2 | 1 | 22.775 | 
| 106496985 | GT-AG | 0 | 1.000000099473604e-05 | 288 | rna-XM_021525711.2 19905860 | 6 | 45573928 | 45574215 | Lonchura striata 40157 | CAG|GTTATTTATT...AGCTTTTTAACA/AGCTTTTTAACA...CTCAG|GAG | 0 | 1 | 25.41 | 
| 106496986 | GT-AG | 0 | 1.000000099473604e-05 | 3247 | rna-XM_021525711.2 19905860 | 7 | 45569057 | 45572303 | Lonchura striata 40157 | GAG|GTGAGAGAAG...TCAGTCTTATGA/TTCAGTCTTATG...GACAG|GAA | 1 | 1 | 65.788 | 
| 106496987 | GT-AG | 0 | 1.000000099473604e-05 | 826 | rna-XM_021525711.2 19905860 | 8 | 45568098 | 45568923 | Lonchura striata 40157 | CAG|GTAATTTTTA...AAATCCTGATAT/CTTTGTTTCATA...TATAG|GAA | 2 | 1 | 69.095 | 
| 106496988 | GT-AG | 0 | 1.000000099473604e-05 | 1041 | rna-XM_021525711.2 19905860 | 9 | 45566891 | 45567931 | Lonchura striata 40157 | CAG|GTATAAAAAT...ATATATTTGATT/ATATATTTGATT...CTAAG|GCT | 0 | 1 | 73.222 | 
| 106496989 | GT-AG | 0 | 1.000000099473604e-05 | 598 | rna-XM_021525711.2 19905860 | 10 | 45566053 | 45566650 | Lonchura striata 40157 | TCG|GTAAGTTATA...ACAGTTATGATT/ACAGTTATGATT...TTTAG|TGT | 0 | 1 | 79.189 | 
| 106496990 | GT-AG | 0 | 1.000000099473604e-05 | 1167 | rna-XM_021525711.2 19905860 | 11 | 45564786 | 45565952 | Lonchura striata 40157 | AAG|GTAAAAATAT...ATTTACTTATTA/AATTTACTTATT...CTCAG|TAG | 1 | 1 | 81.676 | 
| 106496991 | GT-AG | 0 | 1.0020508161476364e-05 | 674 | rna-XM_021525711.2 19905860 | 12 | 45564011 | 45564684 | Lonchura striata 40157 | GTA|GTAAGTCCTG...CAAAGCTTGATT/CTTGATTTGAGT...CTCAG|GAC | 0 | 1 | 84.187 | 
| 106496992 | GT-AG | 0 | 1.000000099473604e-05 | 104 | rna-XM_021525711.2 19905860 | 13 | 45563811 | 45563914 | Lonchura striata 40157 | AAG|GTGAGATCTT...GAGGGCTTAATA/ACTGATCTCACT...ATTAG|GTT | 0 | 1 | 86.574 | 
| 106496993 | GT-AG | 0 | 0.0008887407126984 | 106 | rna-XM_021525711.2 19905860 | 14 | 45563564 | 45563669 | Lonchura striata 40157 | GTT|GTAGGTATCC...CACTCTTTAAAA/AAACTTCTCATT...TGCAG|ATT | 0 | 1 | 90.08 | 
| 106496994 | GT-AG | 0 | 1.000000099473604e-05 | 89 | rna-XM_021525711.2 19905860 | 15 | 45563390 | 45563478 | Lonchura striata 40157 | TAG|GTAAAGAAAT...ATTGTCTCAAAA/TATTGTCTCAAA...TTCAG|AGA | 1 | 1 | 92.193 | 
| 106496995 | GT-AG | 0 | 1.6451591886390545e-05 | 588 | rna-XM_021525711.2 19905860 | 16 | 45562681 | 45563268 | Lonchura striata 40157 | GCG|GTGAGCTTTT...CTAATCTTACAC/ACTAATCTTACA...TACAG|AGA | 2 | 1 | 95.201 | 
| 106505138 | GT-AG | 0 | 1.000000099473604e-05 | 1439 | rna-XM_021525711.2 19905860 | 1 | 45578931 | 45580369 | Lonchura striata 40157 | CAG|GTTTGTAATA...CTGATTTTATCT/AAATTTCTGATT...TCTAG|GTG |  | 0 | 0.945 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each intron points at its parent transcript and at the
-- genome (by NCBI taxonomy id) it was annotated in.
CREATE TABLE "introns" (
    -- Globally unique identifier for the intron.
    "id" INTEGER PRIMARY KEY,
    -- Terminal dinucleotide sequences of the intron (e.g. GT-AG).
    "dinucleotide_pair" TEXT,
    -- 1 if the intron is a minor intron, 0 otherwise.
    "is_minor" INTEGER,
    -- Probability (0-100%) of the intron being minor.
    "score" REAL,
    -- Intron length in base pairs.
    "length" INTEGER,
    -- Parent transcript.
    "transcript_id" INTEGER REFERENCES "transcripts" ("id"),
    -- Ordinal position of the intron within the transcript (3 = third intron).
    "ordinal_index" INTEGER,
    -- Start / end position of the intron in the genome.
    "start" INTEGER,
    "end" INTEGER,
    -- NCBI taxonomy identifier of the species.
    "taxonomy_id" INTEGER REFERENCES "genomes" ("taxonomy_id"),
    -- Motifs scored for the intron.
    "scored_motifs" TEXT,
    -- Phase within the coding sequence (0, 1 or 2); NULL outside the coding sequence.
    "phase" INTEGER,
    -- 1 if the intron lies within the coding sequence, 0 otherwise (e.g. UTR introns).
    "in_cds" INTEGER,
    -- Relative position within the transcript, as a percentage of coding length.
    "relative_position" REAL
);
-- Single-column secondary indexes on "introns".

-- Foreign-key columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");

-- Classification and scoring columns.
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");