introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
  - INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
  - TEXT, terminal dinucleotide sequences of the intron
- is_minor
  - INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
  - REAL, score representing the probability (0-100%) of the intron being minor
- length
  - INTEGER, length of the intron in base pairs
- transcript_id
  - INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
  - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
  - INTEGER, start position of the intron in the genome
- end
  - INTEGER, end position of the intron in the genome
- taxonomy_id
  - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
  - TEXT, motifs scored for the intron
- phase
  - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
- in_cds
  - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
  - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
50 rows where transcript_id = 1668784
This data as json, CSV (advanced)
Suggested facets: is_minor, score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 9478708 | GT-AG | 0 | 1.000000099473604e-05 | 3023 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 1 | 1100468 | 1103490 | Anhinga anhinga 56067 | AAG|GTAAGTCAGC...TGCACTTTTTCT/GTCATACTAAGT...TTTAG|ATT | 1 | 1 | 1.554 | 
| 9478709 | GT-AG | 0 | 1.000000099473604e-05 | 2586 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 2 | 1097841 | 1100426 | Anhinga anhinga 56067 | GAG|GTAAGACCAC...TGTTCTTGGATA/TCTTGGATAATA...AACAG|GGA | 0 | 1 | 2.304 | 
| 9478710 | GT-AG | 0 | 7.369579017980495e-05 | 160 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 3 | 1097625 | 1097784 | Anhinga anhinga 56067 | GAG|GTATTGAATT...ATTTTCTTCTCT/CTCTTTTTCATT...CCTAG|ACA | 2 | 1 | 3.328 | 
| 9478711 | GT-AG | 0 | 3.711813185668666e-05 | 1621 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 4 | 1095907 | 1097527 | Anhinga anhinga 56067 | GTG|GTATGACGTT...TTCACTTCAACT/TCGTGTTTCACT...CTTAG|ACA | 0 | 1 | 5.101 | 
| 9478712 | GT-AG | 0 | 1.000000099473604e-05 | 2034 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 5 | 1093724 | 1095757 | Anhinga anhinga 56067 | CAG|GTAAGTGGCC...TTATTTTTATAG/TTTATTTTTATA...CACAG|GAT | 2 | 1 | 7.826 | 
| 9478713 | GT-AG | 0 | 1.000000099473604e-05 | 2188 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 6 | 1091400 | 1093587 | Anhinga anhinga 56067 | ATG|GTAGGAATGA...ACCATTTTAATT/TTTTAATTCATG...AGTAG|TCA | 0 | 1 | 10.313 | 
| 9478714 | GT-AG | 0 | 0.000306576624225 | 636 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 7 | 1090609 | 1091244 | Anhinga anhinga 56067 | AAG|GTAAGCTTTC...AGAATTTTAAAA/AAGATATTTATC...AACAG|TGA | 2 | 1 | 13.147 | 
| 9478715 | GT-AG | 0 | 1.4921219055204018e-05 | 465 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 8 | 1090062 | 1090526 | Anhinga anhinga 56067 | ACA|GTAAGTGTTT...AATTCTTTGTTT/TAATATTTCAAT...CTTAG|GAT | 0 | 1 | 14.646 | 
| 9478716 | GT-AG | 0 | 0.0002815827132664 | 574 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 9 | 1089352 | 1089925 | Anhinga anhinga 56067 | CAG|GTAACTGATG...TTTTCTTTTACT/TTTTCTTTTACT...TCTAG|TTA | 1 | 1 | 17.133 | 
| 9478717 | GT-AG | 0 | 1.100196929144721e-05 | 999 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 10 | 1088277 | 1089275 | Anhinga anhinga 56067 | CCC|GTAAGATAGT...TGTTTTTTATCC/CTGTTTTTTATC...TGCAG|GGT | 2 | 1 | 18.523 | 
| 9478718 | GT-AG | 0 | 1.000000099473604e-05 | 381 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 11 | 1087819 | 1088199 | Anhinga anhinga 56067 | AAG|GTAAAATAGG...TTTTCTTTACCC/TTTTTCTTTACC...AATAG|GTC | 1 | 1 | 19.931 | 
| 9478719 | GT-AG | 0 | 1.000000099473604e-05 | 875 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 12 | 1086818 | 1087692 | Anhinga anhinga 56067 | CAG|GTAGGAGGCA...TTTTTTTTAACC/TTTTTTTTAACC...TTTAG|GAG | 1 | 1 | 22.234 | 
| 9478720 | GT-AG | 0 | 2.512265682693271e-05 | 2790 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 13 | 1083903 | 1086692 | Anhinga anhinga 56067 | CCA|GTAAGTGTAT...CTTTCCTTTTTT/CAGAAATTAACG...TTAAG|AAT | 0 | 1 | 24.52 | 
| 9478721 | GT-AG | 0 | 3.9789759199036416e-05 | 1466 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 14 | 1082338 | 1083803 | Anhinga anhinga 56067 | AAG|GTATGGCGGA...TATTTTTTGATT/TATTTTTTGATT...AAAAG|GTA | 0 | 1 | 26.33 | 
| 9478722 | GT-AG | 0 | 1.9513489557225492e-05 | 75 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 15 | 1082190 | 1082264 | Anhinga anhinga 56067 | AGT|GTAAGTAGGG...TGAATTTTAATT/TTTTAATTCATT...TGCAG|CTA | 1 | 1 | 27.665 | 
| 9478723 | GT-AG | 0 | 1.8702094118283007e-05 | 3405 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 16 | 1078681 | 1082085 | Anhinga anhinga 56067 | AAG|GTATTGGATC...CTATTTTTAAAT/CTATTTTTAAAT...TTCAG|GGG | 0 | 1 | 29.567 | 
| 9478724 | GT-AG | 0 | 0.0032699446152972 | 95 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 17 | 1078402 | 1078496 | Anhinga anhinga 56067 | ATG|GTATGTATCT...TACATTTTAATG/TACATTTTAATG...ATTAG|TGG | 1 | 1 | 32.931 | 
| 9478725 | GT-AG | 0 | 0.0046971816125874 | 1352 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 18 | 1076952 | 1078303 | Anhinga anhinga 56067 | AAG|GTATATCTTT...AATTGCTTATCA/CAATTTGTCATT...TGTAG|TTT | 0 | 1 | 34.723 | 
| 9478726 | GT-AG | 0 | 1.000000099473604e-05 | 254 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 19 | 1076608 | 1076861 | Anhinga anhinga 56067 | CTG|GTAAGAATCG...GTGACTTTAGAA/TTAAATTTAAAA...TTTAG|ATA | 0 | 1 | 36.369 | 
| 9478727 | GT-AG | 0 | 0.0004573855236534 | 2706 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 20 | 1073801 | 1076506 | Anhinga anhinga 56067 | CAA|GTAAGTTTTG...TATTTTTTAAAA/TATTTTTTAAAA...TTCAG|GAA | 2 | 1 | 38.215 | 
| 9478728 | GT-AG | 0 | 1.6757275966034752e-05 | 3936 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 21 | 1069730 | 1073665 | Anhinga anhinga 56067 | ACA|GTAAGTACCC...CTGATTTTGAAA/AACTTTCTGATT...AACAG|ATT | 2 | 1 | 40.684 | 
| 9478729 | GT-AG | 0 | 1.000000099473604e-05 | 9559 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 22 | 1060062 | 1069620 | Anhinga anhinga 56067 | CAG|GTTGGTGTGT...ATTAACTCAATC/AATTAACTCAAT...TGCAG|GTT | 0 | 1 | 42.677 | 
| 9478730 | GT-AG | 0 | 1.000000099473604e-05 | 623 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 23 | 1059368 | 1059990 | Anhinga anhinga 56067 | GAG|GTGGGCTGCT...CTGTCTTTATTA/TCTTTATTAACA...TGCAG|CCA | 2 | 1 | 43.975 | 
| 9478731 | GT-AG | 0 | 1.000000099473604e-05 | 18027 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 24 | 1041234 | 1059260 | Anhinga anhinga 56067 | AAG|GTAAATATAA...TTGTTCTTAAGA/TAGTATTTGATT...TTCAG|AAT | 1 | 1 | 45.932 | 
| 9478732 | GT-AG | 0 | 2.487128529979065e-05 | 12165 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 25 | 1028920 | 1041084 | Anhinga anhinga 56067 | CCT|GTAAGTGTTG...TTTTTTTTTTTT/ATGGATTTAATA...TACAG|GCA | 0 | 1 | 48.656 | 
| 9478733 | GT-AG | 0 | 1.000000099473604e-05 | 49645 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 26 | 979179 | 1028823 | Anhinga anhinga 56067 | ATT|GTGAGTAATA...GATATCTTAAAT/CATGTATTAATT...TTCAG|AGT | 0 | 1 | 50.411 | 
| 9478734 | GT-AG | 0 | 1.000000099473604e-05 | 1717 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 27 | 977363 | 979079 | Anhinga anhinga 56067 | GTG|GTGAGTACAA...TGTATTTTATTG/TTGTATTTTATT...TCTAG|GAC | 0 | 1 | 52.222 | 
| 9478735 | GT-AG | 0 | 1.000000099473604e-05 | 14229 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 28 | 963039 | 977267 | Anhinga anhinga 56067 | CAG|GTAAAGTGGT...TTATCTATATCA/ATTACATTCATT...TTTAG|GGT | 2 | 1 | 53.959 | 
| 9478736 | GT-AG | 0 | 5.061065875424587e-05 | 13996 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 29 | 948964 | 962959 | Anhinga anhinga 56067 | CAA|GTAAGTGTTT...ATTTCCTTATAT/CTTATATTTATT...TACAG|CTG | 0 | 1 | 55.403 | 
| 9478737 | GT-AG | 0 | 1.4156131972204804e-05 | 94 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 30 | 948769 | 948862 | Anhinga anhinga 56067 | CAA|GTAAGCAAAA...ATATCTTTCATA/ATATCTTTCATA...TCTAG|ATA | 2 | 1 | 57.25 | 
| 9478738 | GT-AG | 0 | 1.000000099473604e-05 | 1901 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 31 | 946809 | 948709 | Anhinga anhinga 56067 | TTG|GTGAGTAGGC...TTTTTTTTCTCT/TCTCCTCTCAAA...TTCAG|GCC | 1 | 1 | 58.329 | 
| 9478739 | GT-AG | 0 | 1.000000099473604e-05 | 7593 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 32 | 939067 | 946659 | Anhinga anhinga 56067 | AAG|GTAATTAAAA...AGTGTTTTGATT/AGTGTTTTGATT...ATTAG|TTT | 0 | 1 | 61.053 | 
| 9478740 | GT-AG | 0 | 1.000000099473604e-05 | 5985 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 33 | 932996 | 938980 | Anhinga anhinga 56067 | CAT|GTAAGTACTG...CTGATTTTCACA/CTGATTTTCACA...TGCAG|TCT | 2 | 1 | 62.626 | 
| 9478741 | GT-AG | 0 | 0.0140941309339456 | 1156 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 34 | 931683 | 932838 | Anhinga anhinga 56067 | CTG|GTATGTTCTC...TAACTTTTAAAT/TGTGATTTAATA...CCTAG|AAT | 0 | 1 | 65.496 | 
| 9478742 | GT-AG | 0 | 1.000000099473604e-05 | 1483 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 35 | 930159 | 931641 | Anhinga anhinga 56067 | CAG|GTACGGCAGT...TAATTCTTGTTC/CCTACTCTAATT...AACAG|ATA | 2 | 1 | 66.246 | 
| 9478743 | GT-AG | 0 | 1.000000099473604e-05 | 1089 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 36 | 928979 | 930067 | Anhinga anhinga 56067 | AAG|GTTAGATTTT...GGTTTTTTAATG/TGTGGTTTTATT...CTCAG|TGG | 0 | 1 | 67.91 | 
| 9478744 | GT-AG | 0 | 1.000000099473604e-05 | 1823 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 37 | 927036 | 928858 | Anhinga anhinga 56067 | AAG|GTAGGTCTGT...ACTTTTTCAATA/TACTTTTTCAAT...TGCAG|ATG | 0 | 1 | 70.104 | 
| 9478745 | GT-AG | 0 | 1.000000099473604e-05 | 1345 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 38 | 925601 | 926945 | Anhinga anhinga 56067 | CTG|GTAAGATGAT...GTTGCTTTTGCT/ACAGAAGTAATT...TTCAG|ATT | 0 | 1 | 71.75 | 
| 9478746 | GT-AG | 0 | 5.899018252044201e-05 | 2033 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 39 | 923463 | 925495 | Anhinga anhinga 56067 | AGG|GTAAACCTGT...TCTGCCTCAGCA/AAGCTATTTATT...TGCAG|AAC | 0 | 1 | 73.67 | 
| 9478747 | GT-AG | 1 | 99.19992812903745 | 1690 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 40 | 921631 | 923320 | Anhinga anhinga 56067 | AAT|GTATCCTTGA...ATGCCCTTAACT/CAGTATTTCATA...TTCAG|ATA | 1 | 1 | 76.266 | 
| 9478748 | GT-AG | 0 | 1.000000099473604e-05 | 2982 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 41 | 918567 | 921548 | Anhinga anhinga 56067 | AAA|GTAAGTGAAT...TCCTTTTTAAAT/CTGTGTTTTACC...TTCAG|TTT | 2 | 1 | 77.766 | 
| 9478749 | GT-AG | 0 | 1.000000099473604e-05 | 1525 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 42 | 916957 | 918481 | Anhinga anhinga 56067 | GCC|GTAAGTAAAT...TAAAGTTTAAAT/TAAAGTTTAAAT...AATAG|TCT | 0 | 1 | 79.32 | 
| 9478750 | GT-AG | 0 | 1.000000099473604e-05 | 325 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 43 | 916545 | 916869 | Anhinga anhinga 56067 | CAG|GTGCGTATTA...TAAGCCTTAAAA/CTTTTTATCACT...TATAG|ACT | 0 | 1 | 80.911 | 
| 9478751 | GT-AG | 0 | 1.000000099473604e-05 | 1341 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 44 | 915027 | 916367 | Anhinga anhinga 56067 | AAG|GTAAGAGCTT...ATTTCTTTACCT/GATAGACTGATA...CTAAG|GCT | 0 | 1 | 84.147 | 
| 9478752 | GT-AG | 0 | 0.0060214780895041 | 4295 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 45 | 910648 | 914942 | Anhinga anhinga 56067 | CAG|GTAACTTCTT...TTTTTCTTCTTT/AATAGTCTCACT...TCAAG|ATA | 0 | 1 | 85.683 | 
| 9478753 | GT-AG | 0 | 0.000332432196777 | 2228 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 46 | 908282 | 910509 | Anhinga anhinga 56067 | TTG|GTATTGCTCT...AGTTGTTTGATA/AGTTGTTTGATA...TGTAG|CCA | 0 | 1 | 88.206 | 
| 9478754 | GT-AG | 0 | 1.000000099473604e-05 | 1710 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 47 | 906444 | 908153 | Anhinga anhinga 56067 | AAG|GTTGGTTATG...TTTTCTTTTGCT/ATATCACTCAGC...TGCAG|CTT | 2 | 1 | 90.547 | 
| 9478755 | GT-AG | 0 | 1.0071769139614386 | 1484 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 48 | 904779 | 906262 | Anhinga anhinga 56067 | TGT|GTATGTTGCT...TTTTTTTTAATT/TTTTTTTTAATT...AACAG|CTG | 0 | 1 | 93.856 | 
| 9478756 | GT-AG | 0 | 1.3054184871887166e-05 | 1041 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 49 | 903617 | 904657 | Anhinga anhinga 56067 | CAG|GTAAGCTGCT...CTTTTTTTCATT/CTTTTTTTCATT...CTAAG|GAT | 1 | 1 | 96.069 | 
| 9478757 | GT-AG | 0 | 3.278121383142226e-05 | 1282 | rna-gnl|WGS:WBMU|ANHANH_R10054_mrna 1668784 | 50 | 902192 | 903473 | Anhinga anhinga 56067 | ATG|GTAAGTTCTG...GTCGTTTTAATA/GTCGTTTTAATA...TGCAG|CGC | 0 | 1 | 98.683 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- Table "introns": one row per intron.
-- The per-column notes restate the published column descriptions for this table.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1, or 2; null for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g., UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column.
-- NOTE(review): presumably these back the filter/facet lookups on each column — confirm.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");