introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
 - INTEGER (primary key), globally unique identifier for each intron
 - dinucleotide_pair
 - TEXT, terminal dinucleotide sequences of the intron
 - is_minor
 - INTEGER, indicates if the intron is a minor intron (1) or not (0)
 - score
 - REAL, score representing the probability (0-100%) of the intron being minor
 - length
 - INTEGER, length of the intron in base pairs
 - transcript_id
 - INTEGER (foreign key referencing transcripts(id)), parent transcript
 - ordinal_index
 - INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
 - start
 - INTEGER, start position of the intron in the genome
 - end
 - INTEGER, end position of the intron in the genome
 - taxonomy_id
 - INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
 - scored_motifs
 - TEXT, motifs scored for the intron
 - phase
 - INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
 - in_cds
 - INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
 - relative_position
 - REAL, relative position of the intron within the transcript (as a percentage of coding length)
 
34 rows where transcript_id = 19905802
This data as json, CSV (advanced)
Suggested facets: dinucleotide_pair, score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position | 
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 106495373 | GT-AG | 0 | 1.63106065722961e-05 | 19178 | rna-XM_021545589.2 19905802 | 1 | 23834181 | 23853358 | Lonchura striata 40157 | GCT|GTAAGTAACA...TTGTGTTTAATT/TTGTGTTTAATT...TGCAG|GCT | 1 | 1 | 0.485 | 
| 106495374 | GT-AG | 0 | 0.001850232316946 | 22688 | rna-XM_021545589.2 19905802 | 2 | 23853623 | 23876310 | Lonchura striata 40157 | AAG|GTACATATTA...TTTTCTTTGATA/GTTATATTAACT...TTCAG|TGC | 1 | 1 | 5.054 | 
| 106495375 | GT-AG | 0 | 1.000000099473604e-05 | 3825 | rna-XM_021545589.2 19905802 | 3 | 23876382 | 23880206 | Lonchura striata 40157 | CTG|GTAAGAGTGA...TGCTCTTTTTCC/CCATTGCTAATC...TCCAG|TGT | 0 | 1 | 6.282 | 
| 106495376 | GT-AG | 0 | 1.000000099473604e-05 | 21426 | rna-XM_021545589.2 19905802 | 4 | 23880351 | 23901776 | Lonchura striata 40157 | CTA|GTAAGTAAAG...ATGCTTTTAATT/ATGCTTTTAATT...TGTAG|GCT | 0 | 1 | 8.775 | 
| 106495377 | GT-AG | 0 | 1.000000099473604e-05 | 13107 | rna-XM_021545589.2 19905802 | 5 | 23901886 | 23914992 | Lonchura striata 40157 | ATG|GTAAGTCAGC...TGCTCTTTATTG/TCTTTATTGACG...TCCAG|GTG | 1 | 1 | 10.661 | 
| 106495378 | GT-AG | 0 | 1.000000099473604e-05 | 3818 | rna-XM_021545589.2 19905802 | 6 | 23915118 | 23918935 | Lonchura striata 40157 | CTG|GTGAGTGGCA...AGTTCTTTAAAC/CAAAAATTAACC...TGCAG|CTG | 0 | 1 | 12.825 | 
| 106495379 | GT-AG | 0 | 1.000000099473604e-05 | 13123 | rna-XM_021545589.2 19905802 | 7 | 23919062 | 23932184 | Lonchura striata 40157 | CAG|GTAAGGCATG...CTGGTTTTGCCC/TCCCATTTCAAA...TTTAG|ACC | 0 | 1 | 15.005 | 
| 106495380 | GT-AG | 0 | 1.000000099473604e-05 | 1314 | rna-XM_021545589.2 19905802 | 8 | 23932261 | 23933574 | Lonchura striata 40157 | CAG|GTAGGTGAAA...ATTTTCTTGTCT/TCTTGTCTGATA...CTTAG|ATG | 1 | 1 | 16.321 | 
| 106495381 | GT-AG | 0 | 1.5342646065023918e-05 | 7569 | rna-XM_021545589.2 19905802 | 9 | 23933729 | 23941297 | Lonchura striata 40157 | ACT|GTAAGTAAGT...ATTGCTTTATTG/GCTTTATTGATT...TGTAG|GAA | 2 | 1 | 18.986 | 
| 106495382 | GT-AG | 0 | 1.000000099473604e-05 | 5969 | rna-XM_021545589.2 19905802 | 10 | 23941449 | 23947417 | Lonchura striata 40157 | CAG|GTAACAGAAT...GTGACTTTATTT/ATTTCTCTAATT...TCTAG|ATC | 0 | 1 | 21.599 | 
| 106495383 | GT-AG | 0 | 1.000000099473604e-05 | 2794 | rna-XM_021545589.2 19905802 | 11 | 23947529 | 23950322 | Lonchura striata 40157 | TAT|GTGAGTTGCT...TATTACTTAATA/TTATTACTTAAT...TTCAG|ACC | 0 | 1 | 23.52 | 
| 106495384 | GT-AG | 0 | 9.03842469337754e-05 | 2560 | rna-XM_021545589.2 19905802 | 12 | 23950389 | 23952948 | Lonchura striata 40157 | ATG|GTAAGCATTC...ATAATTTTAATT/ATAATTTTAATT...TTCAG|GTC | 0 | 1 | 24.663 | 
| 106495385 | GT-AG | 0 | 1.000000099473604e-05 | 4752 | rna-XM_021545589.2 19905802 | 13 | 23953077 | 23957828 | Lonchura striata 40157 | CAG|GTGAAAATTT...TCTTCCTTGCCT/CTAGCACTGATT...TGCAG|TGG | 2 | 1 | 26.878 | 
| 106495386 | GT-AG | 0 | 2.232621043565205e-05 | 1840 | rna-XM_021545589.2 19905802 | 14 | 23957935 | 23959774 | Lonchura striata 40157 | CAT|GTAAGTAGCA...ACTTCTTTAATA/TCTCTTTTTACT...TGCAG|GTA | 0 | 1 | 28.712 | 
| 106495387 | GT-AG | 0 | 1.000000099473604e-05 | 5967 | rna-XM_021545589.2 19905802 | 15 | 23959893 | 23965859 | Lonchura striata 40157 | CAG|GTAAGTATCA...TTAAGTTTAGAA/GATGAGTTTATA...ATCAG|CTA | 1 | 1 | 30.755 | 
| 106495388 | GT-AG | 0 | 1.000000099473604e-05 | 23549 | rna-XM_021545589.2 19905802 | 16 | 23966008 | 23989556 | Lonchura striata 40157 | CAG|GTAGGAAAAC...CCAGCCTTGTAA/AGCCTTGTAAAT...TGCAG|GTA | 2 | 1 | 33.316 | 
| 106495389 | GT-AG | 0 | 5.200950048888225e-05 | 3295 | rna-XM_021545589.2 19905802 | 17 | 23989669 | 23992963 | Lonchura striata 40157 | CTG|GTAAGTTACA...TTATCTTTAATT/TTATCTTTAATT...TGCAG|GAG | 0 | 1 | 35.254 | 
| 106495390 | GT-AG | 0 | 1.000000099473604e-05 | 775 | rna-XM_021545589.2 19905802 | 18 | 23993082 | 23993856 | Lonchura striata 40157 | AAG|GTCAGTAGGA...ATTTTCTTTTCC/TCAGTCTTCACA...TTCAG|TGG | 1 | 1 | 37.297 | 
| 106495391 | GT-AG | 0 | 1.9332300955995883e-05 | 676 | rna-XM_021545589.2 19905802 | 19 | 23993929 | 23994604 | Lonchura striata 40157 | AAG|GTAATCTGCT...TCTGCTTTTTCT/CACACTTTCATC...CTTAG|GAG | 1 | 1 | 38.543 | 
| 106495392 | GT-AG | 0 | 1.000000099473604e-05 | 9072 | rna-XM_021545589.2 19905802 | 20 | 23994747 | 24003818 | Lonchura striata 40157 | CAG|GTAGGAGTGC...GAATTCTTATTA/GTATTATTCACT...CCCAG|TGA | 2 | 1 | 41.0 | 
| 106495393 | GC-AG | 0 | 1.000000099473604e-05 | 9376 | rna-XM_021545589.2 19905802 | 21 | 24003892 | 24013267 | Lonchura striata 40157 | CAG|GCAAGTGTGG...TTTTTCTTCATT/TTTTTCTTCATT...AATAG|CTG | 0 | 1 | 42.264 | 
| 106495394 | GT-AG | 0 | 1.8994786765492848e-05 | 562 | rna-XM_021545589.2 19905802 | 22 | 24013421 | 24013982 | Lonchura striata 40157 | CAG|GTAGTTTCCA...TCTCCCGTATAA/CAAAATTCTATT...TTCAG|AAA | 0 | 1 | 44.912 | 
| 106495395 | GT-AG | 0 | 1.000000099473604e-05 | 8423 | rna-XM_021545589.2 19905802 | 23 | 24014184 | 24022606 | Lonchura striata 40157 | AGG|GTAAGTTGTT...TGGTCATTACTA/TCATTACTAATG...TATAG|GTT | 0 | 1 | 48.39 | 
| 106495396 | GT-AG | 0 | 1.000000099473604e-05 | 2709 | rna-XM_021545589.2 19905802 | 24 | 24022683 | 24025391 | Lonchura striata 40157 | AAA|GTAAGTAAAT...TATATTTTATCT/TATTTTTTTATT...GCCAG|CAA | 1 | 1 | 49.706 | 
| 106495397 | GT-AG | 0 | 1.000000099473604e-05 | 4265 | rna-XM_021545589.2 19905802 | 25 | 24025568 | 24029832 | Lonchura striata 40157 | AAG|GTAAGAATTT...CCTATCTTGAGA/CCTATCTTGAGA...CACAG|CTG | 0 | 1 | 52.752 | 
| 106495398 | GT-AG | 0 | 1.000000099473604e-05 | 251 | rna-XM_021545589.2 19905802 | 26 | 24029914 | 24030164 | Lonchura striata 40157 | AGG|GTCAGTGAAC...TAATTATTGATA/TAATTATTGATA...CCCAG|AAA | 0 | 1 | 54.154 | 
| 106495399 | GT-AG | 0 | 1.000000099473604e-05 | 18111 | rna-XM_021545589.2 19905802 | 27 | 24030371 | 24048481 | Lonchura striata 40157 | AAG|GTAAATTCTT...TTCTGCTGATTT/CTTCTGCTGATT...TCTAG|GTA | 2 | 1 | 57.719 | 
| 106495400 | GT-AG | 0 | 1.000000099473604e-05 | 12440 | rna-XM_021545589.2 19905802 | 28 | 24048585 | 24061024 | Lonchura striata 40157 | CAG|GTTTGTGATC...ATTTTGTTGATG/TTTGGCTTCATT...TTTAG|ATA | 0 | 1 | 59.502 | 
| 106495401 | GT-AG | 0 | 5.6897563770698895e-05 | 5315 | rna-XM_021545589.2 19905802 | 29 | 24061122 | 24066436 | Lonchura striata 40157 | AAG|GTAACAGTTA...CTGTCTTTCACT/CTGTCTTTCACT...GGCAG|TTG | 1 | 1 | 61.18 | 
| 106495402 | GT-AG | 0 | 1.000000099473604e-05 | 1804 | rna-XM_021545589.2 19905802 | 30 | 24066684 | 24068487 | Lonchura striata 40157 | AAG|GTAAGATGAG...TATTGCTTGAAT/TTCATTGTTATT...TTCAG|AGC | 2 | 1 | 65.455 | 
| 106495403 | GT-AG | 0 | 1.000000099473604e-05 | 1806 | rna-XM_021545589.2 19905802 | 31 | 24068796 | 24070601 | Lonchura striata 40157 | AAG|GTTAGACATA...CTGACTTTAACT/ACCTTTTTCACT...CCTAG|TAC | 1 | 1 | 70.786 | 
| 106495404 | GT-AG | 0 | 1.000000099473604e-05 | 17170 | rna-XM_021545589.2 19905802 | 32 | 24071805 | 24088974 | Lonchura striata 40157 | AAG|GTAAGATAGT...CATTTTTTCTCT/CTGACAATCATT...GTCAG|GTG | 1 | 1 | 91.606 | 
| 106495405 | GT-AG | 0 | 1.000000099473604e-05 | 2485 | rna-XM_021545589.2 19905802 | 33 | 24089134 | 24091618 | Lonchura striata 40157 | ATG|GTAAGTAGTT...TATAATTTAATA/TATAATTTAATA...TTTAG|GAT | 1 | 1 | 94.358 | 
| 106495406 | GT-AG | 0 | 1.000000099473604e-05 | 14915 | rna-XM_021545589.2 19905802 | 34 | 24091711 | 24106625 | Lonchura striata 40157 | CAG|GTAAATATTT...TTATTATTATTT/ATTATTATTATT...CACAG|GTA | 0 | 1 | 95.95 | 
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per annotated intron. Column notes restate the field descriptions
-- published alongside this table.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- unique intron identifier (primary key, declared below)
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences, e.g. GT-AG
    "is_minor"          INTEGER,  -- 1 = minor intron, 0 = not
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier of the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1, or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 = within the coding sequence, 0 = not (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");