home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

17 rows where transcript_id = 35103538

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: dinucleotide_pair, is_minor, score, length, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
197657945 GT-AG 0 1.000000099473604e-05 119 rna-XM_007050228.2 35103538 1 27345040 27345158 Theobroma cacao 3641 CAG|GTAATTTTGT...AATTTTGTGAAT/TTGTGAATAATT...CTTAG|GGT 0 1 11.987
197657946 GT-AG 0 0.0011891154690484 85 rna-XM_007050228.2 35103538 2 27345396 27345480 Theobroma cacao 3641 CTG|GTATGATTAA...TTTTTCTTTTTT/CTTTTTTGGACA...TGCAG|AAA 0 1 18.473
197657947 GT-AG 0 1.000000099473604e-05 1651 rna-XM_007050228.2 35103538 3 27345715 27347365 Theobroma cacao 3641 AGT|GTGAGTTCTT...TTTTTTTTATAT/TTTTTTTTTATA...TGCAG|CAA 0 1 24.877
197657948 GT-AG 0 0.0001040101505148 1346 rna-XM_007050228.2 35103538 4 27347605 27348950 Theobroma cacao 3641 AAT|GTAAGTTCTT...TTCTGTTTAATA/TTCTGTTTAATA...TTCAG|TAA 2 1 31.418
197657949 GT-AG 0 1.000000099473604e-05 160 rna-XM_007050228.2 35103538 5 27349218 27349377 Theobroma cacao 3641 CAG|GTTAATCAAG...CCCACTTTGAAT/CCTGTGCTTATC...TGTAG|ATC 2 1 38.725
197657950 GT-AG 0 0.0002122207713317 877 rna-XM_007050228.2 35103538 6 27349649 27350525 Theobroma cacao 3641 AAG|GTCTGCTACT...TAATCCTGATTG/TTAATCCTGATT...TACAG|TAT 0 1 46.141
197657951 AT-AA 1 99.99999505058524 1342 rna-XM_007050228.2 35103538 7 27350651 27351992 Theobroma cacao 3641 CCA|ATATCCTTTA...GTGAACTTAACT/CATATGCTCATA...CGTAA|ATT 2 1 49.562
197657952 GT-AG 0 1.000000099473604e-05 86 rna-XM_007050228.2 35103538 8 27352103 27352188 Theobroma cacao 3641 AAG|GTGAATATTA...TCGATGTTAATC/TATAGATTCATG...ATTAG|TTG 1 1 52.573
197657953 GT-AG 0 1.000000099473604e-05 64 rna-XM_007050228.2 35103538 9 27352297 27352360 Theobroma cacao 3641 AAG|GTTGGTTTTA...GCCTTTTTATTA/ATAATATTAACT...TACAG|GTC 1 1 55.528
197657954 GT-AG 0 0.0002645922770834 1121 rna-XM_007050228.2 35103538 10 27352501 27353621 Theobroma cacao 3641 AAG|GTAGCTCGAC...TTTTATTTACCA/TTACCACTGATC...TGCAG|AAA 0 1 59.36
197657955 GT-AG 0 1.000000099473604e-05 74 rna-XM_007050228.2 35103538 11 27353712 27353785 Theobroma cacao 3641 AAG|GTGATTTATG...ACACTTTTACTC/ATGGGTTTAATT...TGCAG|TTA 0 1 61.823
197657956 GT-AG 0 0.3498438988581239 910 rna-XM_007050228.2 35103538 12 27353995 27354904 Theobroma cacao 3641 CCA|GTATGTTTTC...AGCTGCTTGACA/AGCTGCTTGACA...TCCAG|GTT 2 1 67.542
197657957 GT-AG 0 0.0018821769144363 687 rna-XM_007050228.2 35103538 13 27355075 27355761 Theobroma cacao 3641 AGG|GTATGGTTTT...TTTTCCCTATTT/TTGATGTTTATT...GGTAG|AGT 1 1 72.195
197657958 GT-AG 0 1.000000099473604e-05 102 rna-XM_007050228.2 35103538 14 27355872 27355973 Theobroma cacao 3641 AAG|GTCTGAAGAT...CTTTCCCTGATT/CTTTCCCTGATT...TACAG|GAG 0 1 75.205
197657959 GT-AG 0 2.251045030834975e-05 411 rna-XM_007050228.2 35103538 15 27356351 27356761 Theobroma cacao 3641 GAG|GTACTAAACT...CTTTTTTTAATG/CTTTTTTTAATG...TGCAG|ATA 2 1 85.523
197657960 GT-AG 0 1.000000099473604e-05 402 rna-XM_007050228.2 35103538 16 27357014 27357415 Theobroma cacao 3641 CAG|GTAGAGCTCT...TCTTGTTTAATT/TCTTGTTTAATT...TTCAG|CTA 2 1 92.419
197657961 GT-AG 0 1.000000099473604e-05 102 rna-XM_007050228.2 35103538 17 27357644 27357745 Theobroma cacao 3641 GAG|GTAAGTTGTT...ATATCCTTTCTC/TCCTTTCTCATT...TACAG|CTG 2 1 98.659

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- introns: one row per intron, linked to its parent transcript and to the
-- genome (species) it comes from.
CREATE TABLE "introns" (
    -- Globally unique identifier for each intron.
    "id" INTEGER,
    -- Terminal dinucleotide sequences of the intron.
    "dinucleotide_pair" TEXT,
    -- 1 if the intron is a minor intron, 0 otherwise.
    "is_minor" INTEGER,
    -- Probability (0-100%) of the intron being minor.
    "score" REAL,
    -- Length of the intron in base pairs.
    "length" INTEGER,
    -- Parent transcript.
    "transcript_id" INTEGER,
    -- Ordinal position of the intron within the transcript
    -- (e.g., 3 for the third intron).
    "ordinal_index" INTEGER,
    -- Start position of the intron in the genome.
    "start" INTEGER,
    -- End position of the intron in the genome.
    "end" INTEGER,
    -- NCBI taxonomy identifier for the species.
    "taxonomy_id" INTEGER,
    -- Motifs scored for the intron.
    "scored_motifs" TEXT,
    -- Phase of the intron in the coding sequence (0, 1, or 2);
    -- null for introns outside the coding sequence.
    "phase" INTEGER,
    -- 1 if the intron is within the coding sequence, 0 if not
    -- (e.g., UTR introns).
    "in_cds" INTEGER,
    -- Relative position of the intron within the transcript,
    -- as a percentage of coding length.
    "relative_position" REAL,
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 26.759ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)