introns
Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)
- id
- INTEGER (primary key), globally unique identifier for each intron
- dinucleotide_pair
- TEXT, terminal dinucleotide sequences of the intron
- is_minor
- INTEGER, indicates if the intron is a minor intron (1) or not (0)
- score
- REAL, score representing the probability (0-100%) of the intron being minor
- length
- INTEGER, length of the intron in base pairs
- transcript_id
- INTEGER (foreign key referencing transcripts(id)), parent transcript
- ordinal_index
- INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
- start
- INTEGER, start position of the intron in the genome
- end
- INTEGER, end position of the intron in the genome
- taxonomy_id
- INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
- scored_motifs
- TEXT, motifs scored for the intron
- phase
- INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
- in_cds
- INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
- relative_position
- REAL, relative position of the intron within the transcript (as a percentage of coding length)
24 rows where transcript_id = 32671991
This data as json, CSV (advanced)
Suggested facets: score, length, phase
| id ▼ | dinucleotide_pair | is_minor | score | length | transcript_id | ordinal_index | start | end | taxonomy_id | scored_motifs | phase | in_cds | relative_position |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 182503373 | GT-AG | 0 | 1.000000099473604e-05 | 44856 | rna-XM_030239200.1 32671991 | 1 | 17587956 | 17632811 | Serinus canaria 9135 | CAG|GTAGGAACGG...CTATCTTTTTCT/TTTGCAATGATC...TTTAG|GCA | 0 | 1 | 1.448 |
| 182503374 | GT-AG | 0 | 1.000000099473604e-05 | 5881 | rna-XM_030239200.1 32671991 | 2 | 17632995 | 17638875 | Serinus canaria 9135 | AAA|GTAAGTGGAA...GAATTTTTAATA/CATTTATTGAAT...TTTAG|GAT | 0 | 1 | 4.493 |
| 182503375 | GT-AG | 0 | 0.0006869864564507 | 11078 | rna-XM_030239200.1 32671991 | 3 | 17638901 | 17649978 | Serinus canaria 9135 | AAG|GTATGTCTTA...TATTCTTTCTTT/ATGCTATTAAGA...CTCAG|GAA | 1 | 1 | 4.909 |
| 182503376 | GT-AG | 0 | 1.7924695576668065e-05 | 3136 | rna-XM_030239200.1 32671991 | 4 | 17650072 | 17653207 | Serinus canaria 9135 | CAG|GTACTGTTCA...TCAGTTATAACT/ACTAATTTCAGT...TACAG|GTG | 1 | 1 | 6.457 |
| 182503377 | GT-AG | 0 | 1.000000099473604e-05 | 5502 | rna-XM_030239200.1 32671991 | 5 | 17653287 | 17658788 | Serinus canaria 9135 | CAG|GTAAGATAAT...TTATCTGTGATA/TTGAAAATCACT...TTCAG|TGA | 2 | 1 | 7.772 |
| 182503378 | GT-AG | 0 | 0.0031582468464849 | 7902 | rna-XM_030239200.1 32671991 | 6 | 17658844 | 17666745 | Serinus canaria 9135 | TTG|GTATGTTAAT...CTGTCTTTACAT/GCAGTTTTTACT...GCCAG|CTG | 0 | 1 | 8.687 |
| 182503379 | GT-AG | 0 | 1.000000099473604e-05 | 1552 | rna-XM_030239200.1 32671991 | 7 | 17666776 | 17668327 | Serinus canaria 9135 | CTG|GTAAGAAATG...ACTCACTTAATC/TGAATACTCACT...CACAG|GCA | 0 | 1 | 9.186 |
| 182503380 | GT-AG | 0 | 1.000000099473604e-05 | 14579 | rna-XM_030239200.1 32671991 | 8 | 17670282 | 17684860 | Serinus canaria 9135 | TTG|GTGAGTTAAA...AATATGTTAATA/ATTTGATTAATG...TGTAG|ATG | 1 | 1 | 41.704 |
| 182503381 | GT-AG | 0 | 1.000000099473604e-05 | 154 | rna-XM_030239200.1 32671991 | 9 | 17685020 | 17685173 | Serinus canaria 9135 | ATG|GTGAGCGTTG...ATTTCCTGCATA/ATGTAATTCAAT...TGTAG|AAT | 1 | 1 | 44.35 |
| 182503382 | GT-AG | 0 | 1.000000099473604e-05 | 88 | rna-XM_030239200.1 32671991 | 10 | 17685277 | 17685364 | Serinus canaria 9135 | ATC|GTGAGTTCAT...CTCATTTTAACA/TAAATTCTCATT...AACAG|GTC | 2 | 1 | 46.064 |
| 182503383 | GT-AG | 0 | 1.000000099473604e-05 | 515 | rna-XM_030239200.1 32671991 | 11 | 17685402 | 17685916 | Serinus canaria 9135 | AAG|GTAGGTAAAT...CTTTCTGTGATG/CTTTCTGTGATG...TCTAG|GTC | 0 | 1 | 46.68 |
| 182503384 | GT-AG | 0 | 0.0078528392613708 | 746 | rna-XM_030239200.1 32671991 | 12 | 17686043 | 17686788 | Serinus canaria 9135 | AAG|GTACCTGTCA...GACACCTTGGTT/AGCAATCTGACA...TTCAG|CGA | 0 | 1 | 48.777 |
| 182503385 | GT-AG | 0 | 1.000000099473604e-05 | 1084 | rna-XM_030239200.1 32671991 | 13 | 17687074 | 17688157 | Serinus canaria 9135 | GAG|GTGATTGTAT...TCTTTCTCAATT/GTCTTTCTCAAT...TCTAG|GAT | 0 | 1 | 53.52 |
| 182503386 | GT-AG | 0 | 1.000000099473604e-05 | 81 | rna-XM_030239200.1 32671991 | 14 | 17688223 | 17688303 | Serinus canaria 9135 | GAG|GTGGGTGAAT...GAGTTTTTATTT/AGAGTTTTTATT...TTCAG|TTC | 2 | 1 | 54.601 |
| 182503387 | GT-AG | 0 | 0.0001381372808619 | 1488 | rna-XM_030239200.1 32671991 | 15 | 17688453 | 17689940 | Serinus canaria 9135 | AAG|GTCTGTATGT...TCTTCTTTATTT/TTCTTCTTTATT...AAAAG|ATG | 1 | 1 | 57.081 |
| 182503388 | GT-AG | 0 | 6.818233244972986e-05 | 85 | rna-XM_030239200.1 32671991 | 16 | 17690081 | 17690165 | Serinus canaria 9135 | AAA|GTATGGAAGT...TACCTTTTAAAT/TTTTAAATCACC...TCCAG|TAT | 0 | 1 | 59.411 |
| 182503389 | GT-AG | 0 | 0.0002343278535146 | 108 | rna-XM_030239200.1 32671991 | 17 | 17690322 | 17690429 | Serinus canaria 9135 | GAT|GTAAGTCTTT...TCTCTTTTAAAC/GCATGTCTGACC...CATAG|AAA | 0 | 1 | 62.007 |
| 182503390 | GT-AG | 0 | 1.000000099473604e-05 | 442 | rna-XM_030239200.1 32671991 | 18 | 17690509 | 17690950 | Serinus canaria 9135 | ATG|GTAGGTGGTT...TAGATCTAAAAA/TAAAAACTCATA...AACAG|ACA | 1 | 1 | 63.322 |
| 182503391 | GT-AG | 0 | 0.0001138601677161 | 85 | rna-XM_030239200.1 32671991 | 19 | 17691025 | 17691109 | Serinus canaria 9135 | CTG|GTAAACTAAA...GTGTTCTGAATA/TGAATATTGATT...TTCAG|ATT | 0 | 1 | 64.553 |
| 182503392 | GT-AG | 0 | 1.000000099473604e-05 | 1931 | rna-XM_030239200.1 32671991 | 20 | 17691200 | 17693130 | Serinus canaria 9135 | AAG|GTATTAGAAA...ATTTTCTCATTA/TATTTTCTCATT...CTTAG|ATG | 0 | 1 | 66.051 |
| 182503393 | GT-AG | 0 | 1.000000099473604e-05 | 193 | rna-XM_030239200.1 32671991 | 21 | 17693257 | 17693449 | Serinus canaria 9135 | AAA|GTAAGTGGAT...TTTATTTTAACT/TTTATTTTAACT...TTTAG|CAT | 0 | 1 | 68.148 |
| 182503394 | GT-AG | 0 | 4.8562719692175714e-05 | 327 | rna-XM_030239200.1 32671991 | 22 | 17693492 | 17693818 | Serinus canaria 9135 | CTT|GTAAGTATTA...AGATCTTTGTTT/TCTTTGTTTATT...TGTAG|ACA | 0 | 1 | 68.847 |
| 182503395 | GT-AG | 0 | 0.005808909093488 | 1751 | rna-XM_030239200.1 32671991 | 23 | 17693925 | 17695675 | Serinus canaria 9135 | CAG|GTAACTCTTG...AATTTTTTGAAT/AATTTTTTGAAT...CACAG|ATT | 1 | 1 | 70.611 |
| 182503396 | GT-AG | 0 | 1.000000099473604e-05 | 1526 | rna-XM_030239200.1 32671991 | 24 | 17695708 | 17697233 | Serinus canaria 9135 | AAG|GTAAATAATT...TTGACTTTAATT/TTGACTTTAATT...AACAG|GGT | 0 | 1 | 71.143 |
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per intron. Each intron belongs to a parent transcript and to a
-- genome identified by its NCBI taxonomy id.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences, e.g. GT-AG
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column:
-- the two foreign-key columns first, then the other indexed columns.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");