introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
41 rows where transcript_id = 10378390
This data as json, CSV (advanced)
Suggested facets: dinucleotide_pair, score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 57022000 | GT-AG | 0 | 3.914211389666558 | 220 | rna-XM_025140998.1 10378390 | 1 | 21026730 | 21026949 | Cynara cardunculus 4265 | TAT|GTATCTCTTC...GTTTTTCTATAA/TCACGATTAACT...AAAAG|GTC | 1 | 1 | 3.491 | 
| 57022001 | GT-AG | 0 | 0.0865443199024387 | 1463 | rna-XM_025140998.1 10378390 | 2 | 21025166 | 21026628 | Cynara cardunculus 4265 | CGG|GTACCCAGCT...GAAACCCTAATC/GAAACCCTAATC...ATCAG|GAA | 0 | 1 | 5.236 | 
| 57022002 | GT-AG | 0 | 1.000000099473604e-05 | 120 | rna-XM_025140998.1 10378390 | 3 | 21024924 | 21025043 | Cynara cardunculus 4265 | TAG|GTAAATTGAT...TTGCTGTTAATG/TTAATGTTAATC...ATCAG|AGC | 2 | 1 | 7.344 | 
| 57022003 | GT-AG | 0 | 9.742533606871092e-05 | 84 | rna-XM_025140998.1 10378390 | 4 | 21024743 | 21024826 | Cynara cardunculus 4265 | GAT|GTCAGTTTCC...GTTTCCTTATAA/CGTTTCCTTATA...TTTAG|ATC | 0 | 1 | 9.02 | 
| 57022004 | GT-AG | 0 | 0.0062363223477547 | 90 | rna-XM_025140998.1 10378390 | 5 | 21024542 | 21024631 | Cynara cardunculus 4265 | GAG|GTGCCCACTC...AAGTTTTTAATT/AAGTTTTTAATT...TACAG|ATT | 0 | 1 | 10.938 | 
| 57022005 | GC-AG | 0 | 1.000000099473604e-05 | 113 | rna-XM_025140998.1 10378390 | 6 | 21024300 | 21024412 | Cynara cardunculus 4265 | CAG|GCATGTGGTC...TATCTTTTAACA/TATCTTTTAACA...TCCAG|AGA | 0 | 1 | 13.167 | 
| 57022006 | GC-AG | 0 | 1.000000099473604e-05 | 370 | rna-XM_025140998.1 10378390 | 7 | 21023837 | 21024206 | Cynara cardunculus 4265 | AAG|GCATGGACTT...GGCTACTTAATT/TAATTTCTAAAA...TGCAG|CTT | 0 | 1 | 14.774 | 
| 57022007 | GT-AG | 0 | 1.000000099473604e-05 | 113 | rna-XM_025140998.1 10378390 | 8 | 21023632 | 21023744 | Cynara cardunculus 4265 | AAG|GTGAGTAGTG...CGTGCTTTATAA/CTTGTGTTAATG...TGCAG|GCT | 2 | 1 | 16.364 | 
| 57022008 | GT-AG | 0 | 3.195162500745275e-05 | 109 | rna-XM_025140998.1 10378390 | 9 | 21023396 | 21023504 | Cynara cardunculus 4265 | AAT|GTAAGTATTT...AAGCTCCTGACC/AAGCTCCTGACC...TTCAG|ATG | 0 | 1 | 18.559 | 
| 57022009 | GT-AG | 0 | 0.0010721728907839 | 87 | rna-XM_025140998.1 10378390 | 10 | 21023171 | 21023257 | Cynara cardunculus 4265 | CAG|GTACCACTTG...TCGATTTTATTA/ATGGTGCTCATT...TCTAG|GAA | 0 | 1 | 20.943 | 
| 57022010 | GT-AG | 0 | 1.000000099473604e-05 | 89 | rna-XM_025140998.1 10378390 | 11 | 21023005 | 21023093 | Cynara cardunculus 4265 | CTG|GTAAGGTCTT...TATCTTTTGATA/TATCTTTTGATA...TATAG|GTC | 2 | 1 | 22.274 | 
| 57022011 | GT-AG | 0 | 7.956963019278065e-05 | 79 | rna-XM_025140998.1 10378390 | 12 | 21022847 | 21022925 | Cynara cardunculus 4265 | CAG|GTTCACATCT...TACTTTTTGATT/TACTTTTTGATT...GTCAG|GGG | 0 | 1 | 23.639 | 
| 57022012 | GT-AG | 0 | 1.000000099473604e-05 | 76 | rna-XM_025140998.1 10378390 | 13 | 21022645 | 21022720 | Cynara cardunculus 4265 | CAG|GTTAGAAACA...TAATTATTAATT/TAATTATTAATT...TGCAG|GTT | 0 | 1 | 25.816 | 
| 57022013 | GT-AG | 0 | 0.0494565195678297 | 3552 | rna-XM_025140998.1 10378390 | 14 | 21018978 | 21022529 | Cynara cardunculus 4265 | AAA|GTATGTTCTT...TATTACTTAACC/ATATTACTTAAC...TGTAG|GTA | 1 | 1 | 27.804 | 
| 57022014 | GT-AG | 0 | 0.0045260822425997 | 813 | rna-XM_025140998.1 10378390 | 15 | 21017821 | 21018633 | Cynara cardunculus 4265 | CAG|GTATACCATG...ATGTCCTTTGTC/AAGTAATTCATC...TGCAG|CCC | 0 | 1 | 33.748 | 
| 57022015 | GT-AG | 0 | 0.0217474569664767 | 76 | rna-XM_025140998.1 10378390 | 16 | 21017692 | 21017767 | Cynara cardunculus 4265 | AAA|GTATGTACTT...ATTTCTTTGACA/AGTTATCTTACT...AATAG|GTA | 2 | 1 | 34.664 | 
| 57022016 | GT-AG | 0 | 0.0014501601163352 | 80 | rna-XM_025140998.1 10378390 | 17 | 21017551 | 21017630 | Cynara cardunculus 4265 | CAG|GTATTGTTCT...TCTTTCTTTTCG/AATGGAATAACA...CTTAG|ATA | 0 | 1 | 35.718 | 
| 57022017 | GT-AG | 0 | 0.0067734795333728 | 71 | rna-XM_025140998.1 10378390 | 18 | 21017398 | 21017468 | Cynara cardunculus 4265 | AAG|GTATGTTTTG...CTTTTCTTCTTT/ATTAATTTTATA...TGCAG|CTA | 1 | 1 | 37.135 | 
| 57022018 | GT-AG | 0 | 0.0002875227556113 | 131 | rna-XM_025140998.1 10378390 | 19 | 21017217 | 21017347 | Cynara cardunculus 4265 | TTG|GTGTGTTATA...TTAATTTTAACA/TTAATTTTAACA...CCCAG|GTT | 0 | 1 | 37.999 | 
| 57022019 | GT-AG | 0 | 1.000000099473604e-05 | 1418 | rna-XM_025140998.1 10378390 | 20 | 21015712 | 21017129 | Cynara cardunculus 4265 | GAG|GTACTGCATT...GTGGTCTTTTTT/GGTTGTCTCATG...CACAG|ATA | 0 | 1 | 39.502 | 
| 57022020 | GT-AG | 0 | 0.0001311728838433 | 89 | rna-XM_025140998.1 10378390 | 21 | 21015503 | 21015591 | Cynara cardunculus 4265 | GAG|GTACATTTTG...ACTATTCTACTG/AGAAATCTGATG...AATAG|GTT | 0 | 1 | 41.576 | 
| 57022021 | GT-AG | 0 | 3.0071909468546863e-05 | 74 | rna-XM_025140998.1 10378390 | 22 | 21015326 | 21015399 | Cynara cardunculus 4265 | GCT|GTTTGACCAA...TGAAACTTAACT/TTGTTTATCACT...GGTAG|TTA | 1 | 1 | 43.356 | 
| 57022022 | GT-AG | 0 | 1.000000099473604e-05 | 72 | rna-XM_025140998.1 10378390 | 23 | 21015156 | 21015227 | Cynara cardunculus 4265 | AAG|GTTGGTTTAG...CATCCTTTGGCT/CTTTGGCTGATT...TTTAG|ATC | 0 | 1 | 45.049 | 
| 57022023 | GT-AG | 0 | 1.000000099473604e-05 | 507 | rna-XM_025140998.1 10378390 | 24 | 21014488 | 21014994 | Cynara cardunculus 4265 | AAG|GTTGTCCATG...AGAACCTTATTC/AAGAACCTTATT...GACAG|GAT | 2 | 1 | 47.831 | 
| 57022024 | GT-AG | 0 | 1.000000099473604e-05 | 82 | rna-XM_025140998.1 10378390 | 25 | 21014282 | 21014363 | Cynara cardunculus 4265 | TTG|GTGAGTACTT...TAGTTGTTAACT/AGTAAACTCATT...TGCAG|AAA | 0 | 1 | 49.974 | 
| 57022025 | GT-AG | 0 | 1.000000099473604e-05 | 100 | rna-XM_025140998.1 10378390 | 26 | 21014087 | 21014186 | Cynara cardunculus 4265 | TCG|GTTAGTGACC...CTTCTCTTATAT/TCTTCTCTTATA...TTCAG|TGA | 2 | 1 | 51.616 | 
| 57022026 | GT-AG | 0 | 1.000000099473604e-05 | 106 | rna-XM_025140998.1 10378390 | 27 | 21013869 | 21013974 | Cynara cardunculus 4265 | CAG|GTTATACTTA...CACCATTTAACT/ACTGTTATCATT...CACAG|ATA | 0 | 1 | 53.551 | 
| 57022027 | GT-AG | 0 | 1.000000099473604e-05 | 409 | rna-XM_025140998.1 10378390 | 28 | 21013308 | 21013716 | Cynara cardunculus 4265 | TAG|GTAAAACAAA...AATGTTTTAACT/ATTATATTCACT...TGCAG|TGT | 2 | 1 | 56.178 | 
| 57022028 | GT-AG | 0 | 1.000000099473604e-05 | 91 | rna-XM_025140998.1 10378390 | 29 | 21013107 | 21013197 | Cynara cardunculus 4265 | CAG|GTTTGGATAT...ATTATTTTACTT/TATTATTTTACT...TTCAG|ATG | 1 | 1 | 58.078 | 
| 57022029 | GT-AG | 0 | 1.000000099473604e-05 | 78 | rna-XM_025140998.1 10378390 | 30 | 21012903 | 21012980 | Cynara cardunculus 4265 | CAG|GTACATGGAA...GGAATTTTAGTT/TTTTAGTTCAAT...TCCAG|TTA | 1 | 1 | 60.256 | 
| 57022030 | GC-AG | 0 | 1.000000099473604e-05 | 858 | rna-XM_025140998.1 10378390 | 31 | 21011976 | 21012833 | Cynara cardunculus 4265 | AAG|GCAAGAACAT...TTGTCCCTAACT/TTGTCCCTAACT...AGCAG|AAA | 1 | 1 | 61.448 | 
| 57022031 | GT-AG | 0 | 9.707299152931954e-05 | 85 | rna-XM_025140998.1 10378390 | 32 | 21011701 | 21011785 | Cynara cardunculus 4265 | TCA|GTAAGTATTT...GCTTTCTTCCCG/TTTGTGGTCAAT...TACAG|CAA | 2 | 1 | 64.731 | 
| 57022032 | GT-AG | 0 | 1.000000099473604e-05 | 105 | rna-XM_025140998.1 10378390 | 33 | 21011484 | 21011588 | Cynara cardunculus 4265 | CAG|GTGATTGACA...CATGTTTTTTCT/ATGATATTCATA...TGTAG|GAA | 0 | 1 | 66.667 | 
| 57022033 | GT-AG | 0 | 0.0033145419890776 | 72 | rna-XM_025140998.1 10378390 | 34 | 21011292 | 21011363 | Cynara cardunculus 4265 | CAA|GTATATCCCC...TAATTGTTGACT/TAATTGTTGACT...CTCAG|GAC | 0 | 1 | 68.74 | 
| 57022034 | GT-AG | 0 | 1.000000099473604e-05 | 81 | rna-XM_025140998.1 10378390 | 35 | 21011095 | 21011175 | Cynara cardunculus 4265 | AAG|GTTGGATAGA...TTTTGTTTAAAT/ATATGACTCATA...TGCAG|TGT | 2 | 1 | 70.745 | 
| 57022035 | GT-AG | 0 | 0.1283840547009129 | 361 | rna-XM_025140998.1 10378390 | 36 | 21010650 | 21011010 | Cynara cardunculus 4265 | GAA|GTATGTTTTA...CCTTCCATAATT/CCATAATTCATT...TACAG|GGT | 2 | 1 | 72.196 | 
| 57022036 | GT-AG | 0 | 7.63911980142888e-05 | 114 | rna-XM_025140998.1 10378390 | 37 | 21010423 | 21010536 | Cynara cardunculus 4265 | CAG|GTAGATTTGT...TACTCATTGACA/TGGATACTCATT...TGTAG|GGT | 1 | 1 | 74.149 | 
| 57022037 | GT-AG | 0 | 0.0001604324580075 | 488 | rna-XM_025140998.1 10378390 | 38 | 21009705 | 21010192 | Cynara cardunculus 4265 | ATG|GTAAATTTCT...TTCCTCCTAGCT/CTGACATTGATT...TCCAG|ATG | 0 | 1 | 78.123 | 
| 57022038 | GT-AG | 0 | 1.000000099473604e-05 | 89 | rna-XM_025140998.1 10378390 | 39 | 21008818 | 21008906 | Cynara cardunculus 4265 | TTG|GTAAGCACAA...TTGATCTGAACC/AACTGTTTGATC...TACAG|GTG | 0 | 1 | 91.913 | 
| 57022039 | GT-AG | 0 | 1.000000099473604e-05 | 93 | rna-XM_025140998.1 10378390 | 40 | 21008674 | 21008766 | Cynara cardunculus 4265 | AAG|GTCAGTCACT...GTATTTTTAGAT/TTTAGATTCAAG...TGCAG|ATT | 0 | 1 | 92.794 | 
| 57022040 | GT-AG | 0 | 1.000000099473604e-05 | 107 | rna-XM_025140998.1 10378390 | 41 | 21008381 | 21008487 | Cynara cardunculus 4265 | CAG|GTCGTCTGCA...GTAACTTGAATT/TTCATTTTCATT...TGCAG|ATA | 0 | 1 | 96.008 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per annotated intron. Each intron belongs to a parent transcript
-- and to the genome (NCBI taxonomy id) that the transcript comes from.
CREATE TABLE "introns" (
    -- Globally unique identifier for the intron.
    "id"                INTEGER PRIMARY KEY,
    -- Terminal dinucleotide sequences of the intron (e.g. GT-AG, GC-AG).
    "dinucleotide_pair" TEXT,
    -- 1 if the intron is a minor intron, 0 otherwise.
    "is_minor"          INTEGER,
    -- Probability (0-100%) of the intron being minor.
    "score"             REAL,
    -- Intron length in base pairs.
    "length"            INTEGER,
    -- Parent transcript; references transcripts(id).
    "transcript_id"     INTEGER,
    -- Ordinal position of the intron within its transcript (3 = third intron).
    "ordinal_index"     INTEGER,
    -- Genomic start and end positions of the intron.
    "start"             INTEGER,
    "end"               INTEGER,
    -- NCBI taxonomy identifier of the species; references genomes(taxonomy_id).
    "taxonomy_id"       INTEGER,
    -- Motifs that were scored for the intron.
    "scored_motifs"     TEXT,
    -- Phase within the coding sequence (0, 1 or 2); NULL outside the CDS.
    "phase"             INTEGER,
    -- 1 if the intron lies within the coding sequence, 0 otherwise (e.g. UTR introns).
    "in_cds"            INTEGER,
    -- Relative position within the transcript, as a percentage of coding length.
    "relative_position" REAL,
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Secondary single-column indexes on "introns".
-- The first two cover the foreign-key columns; the remaining five cover
-- columns holding categorical or score values.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");