home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

16 rows where transcript_id = 35103525

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
197657776 GT-AG 0 0.7540847670667695 84 rna-XM_007052040.2 35103525 1 35514855 35514938 Theobroma cacao 3641 ATC|GTACTCTCTC...TAACTTTTAATC/CTTTTAATCATT...CCCAG|ATG 0 1 5.425
197657777 GT-AG 0 0.0202354688890096 114 rna-XM_007052040.2 35103525 2 35515493 35515606 Theobroma cacao 3641 CAG|GTATTTTTCC...GTTACCTTTGTT/AGTTACTTCATG...TTCAG|CTT 2 1 19.942
197657778 GT-AG 0 1.000000099473604e-05 310 rna-XM_007052040.2 35103525 3 35515710 35516019 Theobroma cacao 3641 AAG|GTTCGTTTTT...TACTATTTATTA/ATCAATCTCATT...GTCAG|GCT 0 1 22.642
197657779 GT-AG 0 1.000000099473604e-05 358 rna-XM_007052040.2 35103525 4 35516197 35516554 Theobroma cacao 3641 GTG|GTCAGTATTG...GTTTTTTTGTCA/TTTTTTGTCACC...TGTAG|GGA 0 1 27.28
197657780 GT-AG 0 0.0018825676412397 529 rna-XM_007052040.2 35103525 5 35516747 35517275 Theobroma cacao 3641 ACG|GTATGTCTTA...TCTCTTTTAGAC/GCTGGTTTGATT...TGTAG|GAT 0 1 32.311
197657781 GT-AG 0 0.0219360257489073 168 rna-XM_007052040.2 35103525 6 35517393 35517560 Theobroma cacao 3641 GAG|GTATGCTGAT...CCATCTTTAGCT/TATGTAATGATT...TCCAG|GGA 0 1 35.377
197657782 GT-AG 0 1.000000099473604e-05 215 rna-XM_007052040.2 35103525 7 35517666 35517880 Theobroma cacao 3641 AAG|GTTGTGTGGT...TGATTATTAGAA/TATTTGCTGATT...GACAG|GCA 0 1 38.129
197657783 GT-AG 0 1.000000099473604e-05 109 rna-XM_007052040.2 35103525 8 35518052 35518160 Theobroma cacao 3641 GAG|GTGCTGACCT...TTAGTCTTATTT/ATTAGTCTTATT...ATTAG|GTT 0 1 42.61
197657784 GT-AG 0 0.0006087395516112 895 rna-XM_007052040.2 35103525 9 35518377 35519271 Theobroma cacao 3641 TGG|GTATGGTCTG...TGAATTTTAATT/TTTTAATTAATT...TTCAG|GAT 0 1 48.27
197657785 GT-AG 0 0.0005812034044176 657 rna-XM_007052040.2 35103525 10 35519471 35520127 Theobroma cacao 3641 GCG|GTACGCCACT...AAATCCATAAAT/CTTGTGTTTATA...TTCAG|ATA 1 1 53.485
197657786 GT-AG 0 0.0004609874173406 98 rna-XM_007052040.2 35103525 11 35520334 35520431 Theobroma cacao 3641 CAG|GTACTTCTTT...TTGATTTTGATA/GATATTCTGATT...TACAG|AAT 0 1 58.884
197657787 GT-AG 0 4.599769607124481e-05 94 rna-XM_007052040.2 35103525 12 35520657 35520750 Theobroma cacao 3641 GAG|GTGCACTTGC...CGATGTTTGACT/CGATGTTTGACT...TGCAG|GAT 0 1 64.78
197657788 GT-AG 0 1.000000099473604e-05 85 rna-XM_007052040.2 35103525 13 35521318 35521402 Theobroma cacao 3641 GGA|GTAAGTAATT...CTTACGTTAATG/TTGGATCTTACG...TGTAG|GTA 0 1 79.638
197657789 GT-AG 0 0.0003684426009174 158 rna-XM_007052040.2 35103525 14 35521664 35521821 Theobroma cacao 3641 AAG|GTAACTGAAC...TTTTTCTTATTT/TTTTTTCTTATT...TGCAG|ACA 0 1 86.478
197657790 GT-AG 0 1.000000099473604e-05 410 rna-XM_007052040.2 35103525 15 35521867 35522276 Theobroma cacao 3641 GAG|GTTAGTTTCA...CTTTCTTTAGAA/TGAATATTAATT...TGCAG|GCT 0 1 87.657
197657791 GT-AG 0 6.580024167542074e-05 159 rna-XM_007052040.2 35103525 16 35522463 35522621 Theobroma cacao 3641 AAG|GTTTGTTGTG...ATATCTTTCATC/ATATCTTTCATC...GCCAG|ATT 0 1 92.531

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- One row per intron; each row belongs to a parent transcript and a genome.
CREATE TABLE "introns" (
    "id" INTEGER,                -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,    -- terminal dinucleotide sequences of the intron
    "is_minor" INTEGER,          -- 1 if the intron is a minor intron, 0 otherwise
    "score" REAL,                -- probability (0-100%) of the intron being minor
    "length" INTEGER,            -- length of the intron in base pairs
    "transcript_id" INTEGER,     -- parent transcript
    "ordinal_index" INTEGER,     -- ordinal position within the transcript (3 = third intron)
    "start" INTEGER,             -- start position of the intron in the genome
    "end" INTEGER,               -- end position of the intron in the genome
    "taxonomy_id" INTEGER,       -- NCBI taxonomy identifier for the species
    "scored_motifs" TEXT,        -- motifs scored for the intron
    "phase" INTEGER,             -- 0, 1, or 2; null for introns outside of the coding sequence
    "in_cds" INTEGER,            -- 1 if within the coding sequence, 0 otherwise (e.g., UTR introns)
    "relative_position" REAL,    -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column indexes on "introns", one per indexed column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 30.273ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)