introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
30 rows where transcript_id = 1668763
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 9478561 | GT-AG | 0 | 0.0058360765778829 | 2279 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 1 | 1151289 | 1153567 | Anhinga anhinga 56067 | CAG|GTAACTTGAG...GATTTCTTATTT/AGATTTCTTATT...CCAAG|GGA | 2 | 1 | 21.233 | 
| 9478562 | GT-AG | 0 | 1.000000099473604e-05 | 944 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 2 | 1150252 | 1151195 | Anhinga anhinga 56067 | AAG|GTAAGGAAGG...TTTGCTTTCTCC/TCAGTGTTAAAA...CTAAG|CCG | 2 | 1 | 23.553 | 
| 9478563 | GT-AG | 0 | 0.0719736952437041 | 826 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 3 | 1149194 | 1150019 | Anhinga anhinga 56067 | GTG|GTATGTTTCT...TGTTTTTTAATT/TGTTTTTTAATT...AACAG|GGG | 0 | 1 | 29.341 | 
| 9478564 | GT-AG | 0 | 1.000000099473604e-05 | 3672 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 4 | 1145380 | 1149051 | Anhinga anhinga 56067 | TAG|GTAGGCAGAA...GTGTTTTTCACC/GTGTTTTTCACC...ATCAG|AGA | 1 | 1 | 32.884 | 
| 9478565 | GT-AG | 0 | 1.000000099473604e-05 | 3065 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 5 | 1142160 | 1145224 | Anhinga anhinga 56067 | CAG|GTAAGGTGTG...CATTTTTCAATA/CCATTTTTCAAT...GACAG|ATG | 0 | 1 | 36.751 | 
| 9478566 | GT-AG | 0 | 1.3211855989496318e-05 | 1663 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 6 | 1140416 | 1142078 | Anhinga anhinga 56067 | GAG|GTAAGTAATT...TTTGCCTTGACT/ATTCTACTTATC...TTAAG|CCC | 0 | 1 | 38.772 | 
| 9478567 | GT-AG | 0 | 2.112072245760226e-05 | 109 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 7 | 1140220 | 1140328 | Anhinga anhinga 56067 | TTA|GTAAGTACTT...TACTTCTTGCTT/TTCTTGCTTACT...TTTAG|ACA | 0 | 1 | 40.943 | 
| 9478568 | GT-AG | 0 | 3.392088375064855e-05 | 3044 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 8 | 1137089 | 1140132 | Anhinga anhinga 56067 | AAC|GTAAGTATTT...TAGTTCTTCATG/TAGTTCTTCATG...TCTAG|ATT | 0 | 1 | 43.114 | 
| 9478569 | GT-AG | 0 | 1.000000099473604e-05 | 1564 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 9 | 1135453 | 1137016 | Anhinga anhinga 56067 | GAG|GTAAGAAGGA...TATTTTTTTTCT/TTCTCGTTTATT...CCCAG|AAT | 0 | 1 | 44.91 | 
| 9478570 | GT-AG | 0 | 0.1634756490817675 | 1300 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 10 | 1134071 | 1135370 | Anhinga anhinga 56067 | AAG|GTAACTTTTA...TTTTCCTTATTT/TATTTTTTCATA...TTAAG|GTC | 1 | 1 | 46.956 | 
| 9478571 | GT-AG | 0 | 1.000000099473604e-05 | 3359 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 11 | 1130637 | 1133995 | Anhinga anhinga 56067 | CAG|GTAATGTTTG...TGTGTTTTATTT/TATTTATTTATT...TTAAG|ATG | 1 | 1 | 48.827 | 
| 9478572 | GT-AG | 0 | 1.000000099473604e-05 | 5868 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 12 | 1124599 | 1130466 | Anhinga anhinga 56067 | ATG|GTAGGGCAAA...CTGTTGTCAATT/GCTGTTGTCAAT...CCTAG|AAA | 0 | 1 | 53.069 | 
| 9478573 | GT-AG | 0 | 1.8557062977105903e-05 | 3144 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 13 | 1121330 | 1124473 | Anhinga anhinga 56067 | TCA|GTAAGATGCT...GTTTTTTTGTTT/GTGGTATCGACC...TTCAG|ATA | 2 | 1 | 56.188 | 
| 9478574 | GT-AG | 0 | 0.009609776272526 | 2978 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 14 | 1118252 | 1121229 | Anhinga anhinga 56067 | GAG|GTATGCTGGG...AAGTTCTTCACA/AAGTTCTTCACA...TCTAG|GAA | 0 | 1 | 58.683 | 
| 9478575 | GT-AG | 0 | 1.000000099473604e-05 | 4636 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 15 | 1113508 | 1118143 | Anhinga anhinga 56067 | CAG|GTGACTAAAC...TTTTCCTTATTG/CTTTTCCTTATT...TTTAG|CAC | 0 | 1 | 61.377 | 
| 9478576 | GT-AG | 0 | 1.000000099473604e-05 | 2412 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 16 | 1110988 | 1113399 | Anhinga anhinga 56067 | CAG|GTAAGATATG...TTTTCCTGTATG/ATACATCTAAGA...TATAG|CTG | 0 | 1 | 64.072 | 
| 9478577 | GT-AG | 0 | 0.012362672071541 | 662 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 17 | 1110187 | 1110848 | Anhinga anhinga 56067 | AAG|GTATGCTGTT...GTTTATTTAATA/TGGTTGTTTATT...TCTAG|GGA | 1 | 1 | 67.54 | 
| 9478578 | GT-AG | 0 | 1.000000099473604e-05 | 1957 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 18 | 1108169 | 1110125 | Anhinga anhinga 56067 | CAG|GTAATGAAAA...TAAACCTTAAAT/ACTTAGCTGATA...TTCAG|GAT | 2 | 1 | 69.062 | 
| 9478579 | GT-AG | 0 | 1.000000099473604e-05 | 1980 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 19 | 1106129 | 1108108 | Anhinga anhinga 56067 | AAG|GTAAATGGGG...TCATCTTTAACC/TTAATTTTTATT...GCCAG|TGT | 2 | 1 | 70.559 | 
| 9478580 | GT-AG | 0 | 0.000377732519857 | 2731 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 20 | 1103298 | 1106028 | Anhinga anhinga 56067 | AAG|GTACAGTTTT...ATGGTTTTAACT/ATGGTTTTAACT...TGCAG|AAG | 0 | 1 | 73.054 | 
| 9478581 | GT-AG | 0 | 1.000000099473604e-05 | 2468 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 21 | 1100727 | 1103194 | Anhinga anhinga 56067 | TAG|GTAAAGAATG...AATGCCTTATTG/TAATGCCTTATT...TGCAG|GAG | 1 | 1 | 75.624 | 
| 9478582 | GT-AG | 0 | 5.222309871746941e-05 | 1329 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 22 | 1099327 | 1100655 | Anhinga anhinga 56067 | AAG|GTACTTATGT...ACTCCCTTGAGC/AATTTGTTAAAT...TGCAG|GAC | 0 | 1 | 77.395 | 
| 9478583 | GT-AG | 0 | 1.000000099473604e-05 | 3012 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 23 | 1096270 | 1099281 | Anhinga anhinga 56067 | CAA|GTAAGTGTAT...TCATTCTTTGCA/CAGTTTATCATT...TACAG|CTG | 0 | 1 | 78.518 | 
| 9478584 | GT-AG | 0 | 1.000000099473604e-05 | 1452 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 24 | 1094660 | 1096111 | Anhinga anhinga 56067 | TCT|GTGAGTACAC...TGCTTATTGATT/TGATGTCTCATT...TTCAG|AGG | 2 | 1 | 82.46 | 
| 9478585 | GT-AG | 0 | 1.000000099473604e-05 | 3693 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 25 | 1090861 | 1094553 | Anhinga anhinga 56067 | ACG|GTGAGACTGC...GAACTCCTATCT/GCATTGCTAATT...TGCAG|CTG | 0 | 1 | 85.105 | 
| 9478586 | GT-AG | 0 | 1.000000099473604e-05 | 981 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 26 | 1089738 | 1090718 | Anhinga anhinga 56067 | AAT|GTGAGTTAAT...TTCTCCTTGGAT/AACCTATTAACG...CTCAG|CCT | 1 | 1 | 88.648 | 
| 9478587 | GT-AG | 0 | 1.000000099473604e-05 | 113 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 27 | 1089542 | 1089654 | Anhinga anhinga 56067 | AAG|GTAAGACCAG...GGACTCCTACCA/CACAGTCTCACA...TGCAG|GAG | 0 | 1 | 90.719 | 
| 9478588 | GT-AG | 0 | 1.000000099473604e-05 | 2031 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 28 | 1087407 | 1089437 | Anhinga anhinga 56067 | CAA|GTAAGAACTG...TGGTTTTTAATA/TGGTTTTTAATA...TTCAG|GAC | 2 | 1 | 93.313 | 
| 9478589 | GT-AG | 0 | 9.058536232236412e-05 | 803 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 29 | 1086511 | 1087313 | Anhinga anhinga 56067 | AAG|GTATAGTGAA...ATGTTTTTGTCT/TTGGATATCATG...CACAG|TAT | 2 | 1 | 95.634 | 
| 9478590 | GT-AG | 0 | 1.000000099473604e-05 | 3000 | rna-gnl|WGS:WBMU|ANHANH_R05231_mrna 1668763 | 30 | 1083464 | 1086463 | Anhinga anhinga 56067 | AAT|GTAAGATATT...TGTTTATTAATG/AGTTTGTTTATT...GTCAG|ATA | 1 | 1 | 96.806 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each intron points at its parent transcript and at
-- the genome (by NCBI taxonomy identifier) it belongs to.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for the intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column indexes on "introns": the two foreign-key columns first,
-- then the remaining indexed attribute columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");