home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

21 rows where transcript_id = 35103551

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: dinucleotide_pair, score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
197658080 GT-AG 0 0.0018506546821522 79 rna-XM_007049403.2 35103551 1 14090087 14090165 Theobroma cacao 3641 CAG|GTATTTTCTT...TTGCCTTTGGTT/TAAAATTTGACT...TGCAG|GGC 0 1 1.373
197658081 GT-AG 0 1.000000099473604e-05 545 rna-XM_007049403.2 35103551 2 14089074 14089618 Theobroma cacao 3641 CAT|GTAAGGAGAA...TTTTTTTTGGTT/TTTTGGTTGATG...TGTAG|GGA 0 1 14.764
197658082 GT-AG 0 1.000000099473604e-05 130 rna-XM_007049403.2 35103551 3 14088699 14088828 Theobroma cacao 3641 AAG|GTGCTGTAGT...ATTTCTTTACCA/AATTTCTTTACC...TGCAG|AGT 2 1 21.774
197658083 GT-AG 0 1.000000099473604e-05 110 rna-XM_007049403.2 35103551 4 14088499 14088608 Theobroma cacao 3641 CAG|GTGCAATCTA...TTAGTCTTATAT/ATATTCTTCATC...TGCAG|TGG 2 1 24.349
197658084 GT-AG 0 4.918815162138485e-05 89 rna-XM_007049403.2 35103551 5 14088275 14088363 Theobroma cacao 3641 TGG|GTAGGTTCTG...TTTTCTTTTTCT/TTTCTTGTAATT...TATAG|TCT 2 1 28.212
197658085 GT-AG 0 1.000000099473604e-05 217 rna-XM_007049403.2 35103551 6 14087939 14088155 Theobroma cacao 3641 AAG|GTAAGGCCAA...CTTCTCTTATAT/ACTTCTCTTATA...TGCAG|TGA 1 1 31.617
197658086 GT-AG 0 0.0001882742107286 340 rna-XM_007049403.2 35103551 7 14087434 14087773 Theobroma cacao 3641 AAG|GTTTGTATTT...CCTACCTTAATG/TGTCTCTTCATA...TGCAG|AAC 1 1 36.338
197658087 GT-AG 0 7.268055988162866e-05 192 rna-XM_007049403.2 35103551 8 14087136 14087327 Theobroma cacao 3641 CTT|GTAAGTTGCT...AAAATCTTACAA/AAAAATCTTACA...TTTAG|TTT 2 1 39.371
197658088 GT-AG 0 0.0121316480831795 118 rna-XM_007049403.2 35103551 9 14086912 14087029 Theobroma cacao 3641 CCC|GTATGTGTTG...TTGGATTTGATT/ATTTGATTGACT...TACAG|AAT 0 1 42.403
197658089 GT-AG 0 0.0260673021002576 628 rna-XM_007049403.2 35103551 10 14086173 14086800 Theobroma cacao 3641 AAG|GTATTTTTCA...GTTTTCTTCACC/GTTTTCTTCACC...TTTAG|AGT 0 1 45.579
197658090 GT-AG 0 1.000000099473604e-05 99 rna-XM_007049403.2 35103551 11 14085910 14086008 Theobroma cacao 3641 GAG|GTAGTTCTAA...AATGTATTAACT/AATGTATTAACT...TGTAG|GTA 2 1 50.272
197658091 GT-AG 0 4.7364634299963054e-05 1145 rna-XM_007049403.2 35103551 12 14084647 14085791 Theobroma cacao 3641 GAG|GTAGGCATCT...TTTTTCTGAGAT/GTTTTTCTGAGA...TCCAG|AAA 0 1 53.648
197658092 GT-AG 0 2.1205963674462543e-05 441 rna-XM_007049403.2 35103551 13 14083981 14084421 Theobroma cacao 3641 CAG|GTAATTTCAG...TTTGTTTTGATA/TTTGTTTTGATA...TGCAG|ACT 0 1 60.086
197658093 GT-AG 0 1.000000099473604e-05 212 rna-XM_007049403.2 35103551 14 14083578 14083789 Theobroma cacao 3641 CAG|GTACAGGCAC...TGCGTTCTAACA/TGCGTTCTAACA...TCCAG|TTC 2 1 65.551
197658094 GT-AG 0 1.000000099473604e-05 148 rna-XM_007049403.2 35103551 15 14083262 14083409 Theobroma cacao 3641 CAG|GTGTGTGATT...TGTGTCTTACAC/CTGTGTCTTACA...TTCAG|TTC 2 1 70.358
197658095 GT-AG 0 0.0518063120381526 279 rna-XM_007049403.2 35103551 16 14082877 14083155 Theobroma cacao 3641 AAG|GTATACTTAA...ATCAACTTATTT/GATCAACTTATT...ATCAG|GTG 0 1 73.391
197658096 GT-AG 0 0.0002985652568602 210 rna-XM_007049403.2 35103551 17 14082529 14082738 Theobroma cacao 3641 AAT|GTAATTTCTA...CATTTCATAATT/TACTTCTTCATC...TGAAG|GCT 0 1 77.339
197658097 GT-AG 0 1.000000099473604e-05 138 rna-XM_007049403.2 35103551 18 14082232 14082369 Theobroma cacao 3641 CAG|GTGAGTGCAC...CATATCTTACCA/GTGGTTCTTACA...TCCAG|TTA 0 1 81.888
197658098 GT-AG 0 3.479480835100348e-05 312 rna-XM_007049403.2 35103551 19 14081713 14082024 Theobroma cacao 3641 AAT|GTAAGTCCTA...TCATCCTTAAGC/TACTTGTTCATC...TTCAG|ACA 0 1 87.811
197658099 GT-AG 0 1.000000099473604e-05 92 rna-XM_007049403.2 35103551 20 14081426 14081517 Theobroma cacao 3641 CAG|GTGAAGACAA...ATTGTTTTAATT/ATTGTTTTAATT...ACCAG|ATT 0 1 93.391
197658100 GC-AG 0 1.000000099473604e-05 149 rna-XM_007049403.2 35103551 21 14081205 14081353 Theobroma cacao 3641 GGG|GCAAGTGCTC...TTTCTCATAACA/CAGTTTCTCATA...TGTAG|ATA 0 1 95.451

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- One row per intron, linked to its parent transcript and to the genome
-- (by NCBI taxonomy identifier) it belongs to.
CREATE TABLE "introns" (
    -- Globally unique identifier for each intron.
    "id" INTEGER,
    -- Terminal dinucleotide sequences of the intron.
    "dinucleotide_pair" TEXT,
    -- 1 if the intron is a minor intron, 0 otherwise.
    "is_minor" INTEGER,
    -- Score representing the probability (0-100%) of the intron being minor.
    "score" REAL,
    -- Length of the intron in base pairs.
    "length" INTEGER,
    -- Parent transcript.
    "transcript_id" INTEGER,
    -- Ordinal position of the intron within the transcript
    -- (e.g., 3 for the third intron).
    "ordinal_index" INTEGER,
    -- Start position of the intron in the genome.
    "start" INTEGER,
    -- End position of the intron in the genome.
    "end" INTEGER,
    -- NCBI taxonomy identifier for the species.
    "taxonomy_id" INTEGER,
    -- Motifs scored for the intron.
    "scored_motifs" TEXT,
    -- Phase of the intron in the coding sequence (0, 1, or 2);
    -- null for introns outside the coding sequence.
    "phase" INTEGER,
    -- 1 if the intron is within the coding sequence, 0 otherwise
    -- (e.g., UTR introns).
    "in_cds" INTEGER,
    -- Relative position of the intron within the transcript,
    -- as a percentage of coding length.
    "relative_position" REAL,
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns"; each index is named
-- idx_introns_<column> after the one column it covers.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 27.177ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)