introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
24 rows where transcript_id = 1668809
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 9478937 | GT-AG | 0 | 3.6809979402917646e-05 | 216 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 1 | 861771 | 861986 | Anhinga anhinga 56067 | GCA|GTAAGTACCA...TTCCCCTTGGCA/AAAGTATTTATA...TTTAG|AGA | 2 | 1 | 2.404 | 
| 9478938 | GT-AG | 0 | 1.000000099473604e-05 | 1429 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 2 | 862090 | 863518 | Anhinga anhinga 56067 | ATT|GTAAGTGAAT...CTAGCATTACAC/CAGAGGCTGATA...TGTAG|ACT | 0 | 1 | 4.385 | 
| 9478939 | GT-AG | 0 | 4.616309157664299e-05 | 589 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 3 | 863799 | 864387 | Anhinga anhinga 56067 | AAG|GTAATTTGTA...TTTCTTTTATTC/TTTTCTTTTATT...TAAAG|AGT | 1 | 1 | 9.771 | 
| 9478940 | GT-AG | 0 | 1.000000099473604e-05 | 748 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 4 | 864492 | 865239 | Anhinga anhinga 56067 | AAG|GTAAGGTAAA...CTTCTCTTATTT/TCTTCTCTTATT...TCCAG|ATA | 0 | 1 | 11.771 | 
| 9478941 | GT-AG | 0 | 1.000000099473604e-05 | 363 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 5 | 865409 | 865771 | Anhinga anhinga 56067 | ATG|GTGAGTATAA...ACCATTTTAATT/ACCATTTTAATT...AACAG|ACA | 1 | 1 | 15.022 | 
| 9478942 | GT-AG | 0 | 1.000000099473604e-05 | 7212 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 6 | 865917 | 873128 | Anhinga anhinga 56067 | CAG|GTGATGGCAG...ATCTTTTTTTCT/AAATTCTATATG...TATAG|TCT | 2 | 1 | 17.811 | 
| 9478943 | GT-AG | 0 | 1.000000099473604e-05 | 2538 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 7 | 873266 | 875803 | Anhinga anhinga 56067 | CAG|GTAAAAACCT...TCATCTTTAAAT/AATCTTCTGATA...AATAG|AAC | 1 | 1 | 20.446 | 
| 9478944 | GT-AG | 0 | 1.000000099473604e-05 | 844 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 8 | 875910 | 876753 | Anhinga anhinga 56067 | TAG|GTAATGTGAT...ATTTTCTAAATC/TATTTTCTAAAT...TCTAG|GCC | 2 | 1 | 22.485 | 
| 9478945 | GT-AG | 0 | 6.575518121628575e-05 | 553 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 9 | 876905 | 877457 | Anhinga anhinga 56067 | AGG|GTATGTCAGA...GATTACTTCACT/GATTACTTCACT...ACCAG|GTA | 0 | 1 | 25.389 | 
| 9478946 | GT-AG | 0 | 1.000000099473604e-05 | 624 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 10 | 877567 | 878190 | Anhinga anhinga 56067 | ATG|GTAAATATTT...TTGTACTTACAT/CTTGTACTTACA...TTCAG|TTT | 1 | 1 | 27.486 | 
| 9478947 | GT-AG | 0 | 0.0001325246308916 | 415 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 11 | 878411 | 878825 | Anhinga anhinga 56067 | CAG|GTACGATCTT...ACTTCCTTGATA/CAGAAGCTGACT...CTTAG|AGC | 2 | 1 | 31.718 | 
| 9478948 | GT-AG | 0 | 1.2442417967536856e-05 | 116 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 12 | 879011 | 879126 | Anhinga anhinga 56067 | AAG|GTATGGCCTT...TTTCTTTTAAGC/TTTATTATGACC...TCTAG|CTG | 1 | 1 | 35.276 | 
| 9478949 | GT-AG | 0 | 0.008311527926804 | 442 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 13 | 879223 | 879664 | Anhinga anhinga 56067 | CAA|GTATGTATGA...GATTTTTTACTG/AGATTTTTTACT...ACCAG|AAA | 1 | 1 | 37.123 | 
| 9478950 | GT-AG | 0 | 0.0001297792682475 | 1052 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 14 | 879748 | 880799 | Anhinga anhinga 56067 | AGA|GTAAGTCTTT...CTTTTTTTATCA/TCTTTTTTTATC...AACAG|GAC | 0 | 1 | 38.719 | 
| 9478951 | GT-AG | 0 | 1.000000099473604e-05 | 419 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 15 | 881011 | 881429 | Anhinga anhinga 56067 | CAA|GTAAGTAATT...AAATCCTAAGTT/GTTAAACTAACT...TCTAG|CTA | 1 | 1 | 42.777 | 
| 9478952 | GT-AG | 0 | 1.000000099473604e-05 | 1178 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 16 | 881531 | 882708 | Anhinga anhinga 56067 | AAG|GTAAGAAATA...TGTTCTTTAGAA/TATACTCTAATT...CACAG|GCA | 0 | 1 | 44.72 | 
| 9478953 | GT-AG | 0 | 1.000000099473604e-05 | 416 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 17 | 883063 | 883478 | Anhinga anhinga 56067 | CCG|GTAAGAAAGT...AATATTTTAAAC/AATATTTTAAAC...CACAG|AAA | 0 | 1 | 51.529 | 
| 9478954 | GT-AG | 0 | 0.0328082880642264 | 797 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 18 | 883731 | 884527 | Anhinga anhinga 56067 | AAG|GTACCTGTGC...TTCATTTTAACT/TTTCTCTTCATT...AACAG|GTA | 0 | 1 | 56.376 | 
| 9478955 | GT-AG | 0 | 1.000000099473604e-05 | 334 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 19 | 885428 | 885761 | Anhinga anhinga 56067 | AAG|GTAAGTAATT...ATCTTTTTAAAT/ATCTTTTTAAAT...TACAG|CCT | 0 | 1 | 73.687 | 
| 9478956 | GT-AG | 0 | 1.000000099473604e-05 | 510 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 20 | 885857 | 886366 | Anhinga anhinga 56067 | CAG|GTAGATGCAC...ATGTTGTTATTC/TATGTTGTTATT...GTTAG|GGC | 2 | 1 | 75.515 | 
| 9478957 | GT-AG | 0 | 0.0001169709135078 | 5132 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 21 | 886592 | 891723 | Anhinga anhinga 56067 | TAA|GTAAGTTTGG...GGTTTTTTGTCT/AGAGCAGTCAAA...AACAG|GGG | 2 | 1 | 79.842 | 
| 9478958 | GT-AG | 0 | 1.000000099473604e-05 | 699 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 22 | 891907 | 892605 | Anhinga anhinga 56067 | GCA|GTTGGAATGT...TTTCTATTGATT/TTTCTATTGATT...ATGAG|TTC | 2 | 1 | 83.362 | 
| 9478959 | GT-AG | 0 | 4.190081830802384e-05 | 2630 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 23 | 893074 | 895703 | Anhinga anhinga 56067 | AAG|GTAAGCTGCT...TTCATTTTGAAA/TCCTATTTCATT...CTGAG|TGC | 2 | 1 | 92.364 | 
| 9478960 | GT-AG | 0 | 0.0172604497780941 | 3255 | rna-gnl|WGS:WBMU|ANHANH_R05888_mrna 1668809 | 25 | 896011 | 899265 | Anhinga anhinga 56067 | CGG|GTATGCTGTC...CACTGTTTGACA/CACTGTTTGACA...CACAG|GTG | 1 | 1 | 98.23 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- introns: one row per intron, identified by "id".
-- Every intron points at its parent transcript and at the genome (species)
-- it belongs to. "end" is an SQL keyword, so identifiers are quoted throughout.
CREATE TABLE "introns" (
    "id"                INTEGER PRIMARY KEY,                               -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,                                              -- terminal dinucleotide sequences, e.g. GT-AG
    "is_minor"          INTEGER,                                           -- 1 = minor intron, 0 = not minor
    "score"             REAL,                                              -- probability (0-100%) of the intron being minor
    "length"            INTEGER,                                           -- intron length in base pairs
    "transcript_id"     INTEGER REFERENCES "transcripts" ("id"),           -- parent transcript
    "ordinal_index"     INTEGER,                                           -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,                                           -- start position of the intron in the genome
    "end"               INTEGER,                                           -- end position of the intron in the genome
    "taxonomy_id"       INTEGER REFERENCES "genomes" ("taxonomy_id"),      -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,                                              -- motifs scored for the intron
    "phase"             INTEGER,                                           -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,                                           -- 1 = within the coding sequence, 0 = not (e.g. UTR introns)
    "relative_position" REAL                                               -- position within the transcript, as a percentage of coding length
);
-- Single-column secondary indexes on "introns", one per indexed column.
-- The two foreign-key columns come first, then the remaining indexed attributes.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");