introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron within the coding sequence (0, 1, or 2); NULL for introns outside of the coding sequence
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
22 rows where transcript_id = 32210473
This data as json, CSV (advanced)
Suggested facets: score, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 179851948 | GT-AG | 0 | 1.000000099473604e-05 | 139631 | rna-XM_047254284.1 32210473 | 1 | 73447441 | 73587071 | Schistocerca piceifrons 274613 | ATG|GTAAGTCAGC...CCTCTTTTGGCC/CCGCCACTGACT...TGCAG|TGG | 0 | 1 | 0.371 |
| 179851949 | GT-AG | 0 | 1.000000099473604e-05 | 8157 | rna-XM_047254284.1 32210473 | 2 | 73587368 | 73595524 | Schistocerca piceifrons 274613 | CAG|GTAAACAAAC...TACGTCTGACTT/ATACGTCTGACT...CGCAG|GCA | 2 | 1 | 2.204 |
| 179851950 | GT-AG | 0 | 0.0001784983689982 | 16239 | rna-XM_047254284.1 32210473 | 3 | 73595730 | 73611968 | Schistocerca piceifrons 274613 | CAG|GTACACGGCG...CATCCTTTAAAG/AAAGGAATCATT...CACAG|GTG | 0 | 1 | 3.473 |
| 179851951 | GT-AG | 0 | 1.000000099473604e-05 | 3206 | rna-XM_047254284.1 32210473 | 4 | 73622022 | 73625227 | Schistocerca piceifrons 274613 | ATG|GTGAGTGTGG...ATTTTCTAATTT/GATTTTCTAATT...CGCAG|TTG | 0 | 1 | 65.713 |
| 179851952 | GT-AG | 0 | 1.000000099473604e-05 | 145826 | rna-XM_047254284.1 32210473 | 5 | 73627332 | 73773157 | Schistocerca piceifrons 274613 | CTG|GTAAGTCCAA...CAGAGCTGGACG/GTGGTGGTGAGC...CGCAG|TGA | 1 | 1 | 78.739 |
| 179851953 | GT-AG | 0 | 1.000000099473604e-05 | 9383 | rna-XM_047254284.1 32210473 | 6 | 73773329 | 73782711 | Schistocerca piceifrons 274613 | CAG|GTACAGTCGC...AGTGGCTTGCCC/CCAGAGGTGAAA...TGCAG|ACT | 1 | 1 | 79.798 |
| 179851954 | GT-AG | 0 | 1.000000099473604e-05 | 3306 | rna-XM_047254284.1 32210473 | 7 | 73782961 | 73786266 | Schistocerca piceifrons 274613 | TTC|GTGAGTAGCG...TAGAATTTAACT/ATTATACTGATT...TTCAG|GTG | 1 | 1 | 81.34 |
| 179851955 | GT-AG | 0 | 1.000000099473604e-05 | 8332 | rna-XM_047254284.1 32210473 | 8 | 73786465 | 73794796 | Schistocerca piceifrons 274613 | CAA|GTGAGTGTAG...TGTGTCTTGATA/TGTGTCTTGATA...TACAG|GTG | 1 | 1 | 82.566 |
| 179851956 | GT-AG | 0 | 1.000000099473604e-05 | 619 | rna-XM_047254284.1 32210473 | 9 | 73794851 | 73795469 | Schistocerca piceifrons 274613 | CAG|GTAACAGAGA...AAATTTTCAAAT/CAAATTTTCAAA...CACAG|GCG | 1 | 1 | 82.9 |
| 179851957 | GT-AG | 0 | 1.000000099473604e-05 | 5596 | rna-XM_047254284.1 32210473 | 10 | 73795626 | 73801221 | Schistocerca piceifrons 274613 | GAG|GTCAGTAAAT...ATTTATTTATCT/CATTTATTTATC...TTCAG|GTG | 1 | 1 | 83.866 |
| 179851958 | GT-AG | 0 | 0.0010164363004662 | 864 | rna-XM_047254284.1 32210473 | 11 | 73802485 | 73803348 | Schistocerca piceifrons 274613 | CTG|GTATGTACTG...GGAGACTTAACA/GGAGACTTAACA...CACAG|CTG | 1 | 1 | 91.685 |
| 179851959 | GT-AG | 0 | 0.0005236472954305 | 4754 | rna-XM_047254284.1 32210473 | 12 | 73803478 | 73808231 | Schistocerca piceifrons 274613 | CAG|GTAACTAACA...GTTCTTTTAATC/AGATTTCTTACT...GTCAG|GCT | 1 | 1 | 92.484 |
| 179851960 | GT-AG | 0 | 1.000000099473604e-05 | 2468 | rna-XM_047254284.1 32210473 | 13 | 73808397 | 73810864 | Schistocerca piceifrons 274613 | AGG|GTAAGTTGTA...TCTTTTTTATAA/TTCTTTTTTATA...AACAG|GTG | 1 | 1 | 93.505 |
| 179851961 | GT-AG | 0 | 1.000000099473604e-05 | 64590 | rna-XM_047254284.1 32210473 | 14 | 73811029 | 73875618 | Schistocerca piceifrons 274613 | AAG|GTAGGAAAGA...GAATTCATGAAA/TTGGAATTCATG...TGCAG|ACT | 0 | 1 | 94.521 |
| 179851962 | GT-AG | 0 | 1.000000099473604e-05 | 4954 | rna-XM_047254284.1 32210473 | 15 | 73875697 | 73880650 | Schistocerca piceifrons 274613 | CTT|GTAAGACAAC...CTACTTTTAAAT/CTTGTATTAATA...TTCAG|CTT | 0 | 1 | 95.004 |
| 179851963 | GT-AG | 0 | 1.4801905505116551e-05 | 1269 | rna-XM_047254284.1 32210473 | 16 | 73880727 | 73881995 | Schistocerca piceifrons 274613 | AAG|GTACGTCTGA...CTTTTTATGATT/ATTTAGTTCATT...TCCAG|CAT | 1 | 1 | 95.474 |
| 179851964 | GT-AG | 0 | 1.000000099473604e-05 | 11070 | rna-XM_047254284.1 32210473 | 17 | 73882122 | 73893191 | Schistocerca piceifrons 274613 | AGG|GTGAGTCCTC...TTATTTTTAAAG/ATTATTTTTAAA...CATAG|GCC | 1 | 1 | 96.254 |
| 179851965 | GT-AG | 0 | 1.000000099473604e-05 | 88 | rna-XM_047254284.1 32210473 | 18 | 73893255 | 73893342 | Schistocerca piceifrons 274613 | AAG|GTATGAACAA...TTAGTATTACTG/GTATTACTGATT...TGCAG|TAA | 1 | 1 | 96.644 |
| 179851966 | GT-AG | 0 | 1.000000099473604e-05 | 7141 | rna-XM_047254284.1 32210473 | 19 | 73893403 | 73900543 | Schistocerca piceifrons 274613 | GAG|GTAATAAACT...TGTTCCTTTGTC/ATCTATTTTACA...CATAG|CTC | 1 | 1 | 97.016 |
| 179851967 | GT-AG | 0 | 1.000000099473604e-05 | 4375 | rna-XM_047254284.1 32210473 | 20 | 73900620 | 73904994 | Schistocerca piceifrons 274613 | AAG|GTAAGAACTG...CAGTTCTTGACA/CTCTAACTAACC...TGCAG|CTC | 2 | 1 | 97.486 |
| 179851968 | GT-AG | 0 | 1.000000099473604e-05 | 610 | rna-XM_047254284.1 32210473 | 21 | 73905125 | 73905734 | Schistocerca piceifrons 274613 | AAG|GTACAAAAGC...TTTTTCTTACTT/ATTTTTCTTACT...TATAG|AAC | 0 | 1 | 98.291 |
| 179851969 | GT-AG | 0 | 0.000256099582292 | 398 | rna-XM_047254284.1 32210473 | 22 | 73905887 | 73906284 | Schistocerca piceifrons 274613 | TGA|GTAAGTTCTA...ATGTTCTCAACA/TATGTTCTCAAC...TTCAG|TGA | 2 | 1 | 99.232 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each row links to its parent transcript and to the
-- genome (by NCBI taxonomy identifier) it was annotated in.
CREATE TABLE "introns" (
    "id"                 INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair"  TEXT,     -- terminal dinucleotide sequences of the intron (e.g. GT-AG)
    "is_minor"           INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"              REAL,     -- probability (0-100%) of the intron being minor
    "length"             INTEGER,  -- length of the intron in base pairs
    "transcript_id"      INTEGER,  -- parent transcript, references transcripts(id)
    "ordinal_index"      INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"              INTEGER,  -- start position of the intron in the genome
    "end"                INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"        INTEGER,  -- NCBI taxonomy identifier, references genomes(taxonomy_id)
    "scored_motifs"      TEXT,     -- motifs scored for the intron
    "phase"              INTEGER,  -- phase in coding sequence (0, 1 or 2); NULL outside the CDS
    "in_cds"             INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position"  REAL,     -- relative position within the transcript, as % of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Secondary single-column indexes on the introns table.
-- Foreign-key columns:
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
-- Attribute columns:
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");