home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron in coding sequence (0, 1, or 2 or null for introns outside of coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

18 rows where transcript_id = 12801885

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: score, length, scored_motifs, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
68111150 GT-AG 0 0.0001195047742701 1959 rna-XM_029511039.1 12801885 1 3620546 3622504 Echeneis naucrates 173247 GAG|GTAACGTTGC...GCTGCCCTATTT/TATTTACTGATT...AATAG|GAT 0 1 0.173
68111151 GT-AG 0 1.000000099473604e-05 99 rna-XM_029511039.1 12801885 2 3620278 3620376 Echeneis naucrates 173247 ATC|GTGAGTGGAA...GTTACTTTGTCT/TGATTTGTCACA...GATAG|ATA 1 1 3.424
68111152 GT-AG 0 0.001336483957996 512 rna-XM_029511039.1 12801885 3 3619293 3619804 Echeneis naucrates 173247 ACA|GTATGTAGAA...AGGACATTAAAA/AACCTGTTCACC...TTCAG|ACT 0 1 12.522
68111153 GT-AG 0 4.570013914130094e-05 369 rna-XM_029511039.1 12801885 4 3618740 3619108 Echeneis naucrates 173247 CCA|GTAAGTTATT...CCAGGCTTGATT/CTTGATTTGAAC...TACAG|GAG 1 1 16.061
68111154 GT-AG 0 5.56152130566834e-05 630 rna-XM_029511039.1 12801885 5 3618057 3618686 Echeneis naucrates 173247 AAG|GTAATTTGTT...TTTTTTTTAATC/TTTTTTTTAATC...CACAG|GGC 0 1 17.08
68111155 GT-AG 0 1.000000099473604e-05 93 rna-XM_029511039.1 12801885 6 3617798 3617890 Echeneis naucrates 173247 GTG|GTAAACGGGA...GTTTTCTTTTTG/GCAGTTCTGATG...AGCAG|GAA 1 1 20.273
68111156 GT-AG 0 1.000000099473604e-05 119 rna-XM_029511039.1 12801885 7 3617592 3617710 Echeneis naucrates 173247 CTG|GTGAGTGGGA...CTTTCCATATTA/TCCATATTAAAA...TAAAG|TAA 1 1 21.947
68111157 GT-AG 0 1.000000099473604e-05 77 rna-XM_029511039.1 12801885 8 3617440 3617516 Echeneis naucrates 173247 GAA|GTGAGTTTGA...ATATGCTTATTT/TATATGCTTATT...TACAG|TAT 1 1 23.389
68111158 GT-AG 0 0.0002414886775584 175 rna-XM_029511039.1 12801885 9 3617178 3617352 Echeneis naucrates 173247 CCA|GTAAGCCAAG...GTTTTTTTAAAT/GTTTTTTTAAAT...AACAG|CAA 1 1 25.063
68111159 GT-AG 0 1.000000099473604e-05 210 rna-XM_029511039.1 12801885 10 3616896 3617105 Echeneis naucrates 173247 CTG|GTAGGAGCAA...TTCTTTTTACCA/GTTCTTTTTACC...CGCAG|GGA 1 1 26.447
68111160 GT-AG 0 1.000000099473604e-05 343 rna-XM_029511039.1 12801885 11 3616310 3616652 Echeneis naucrates 173247 TAG|GTGAGAGCTC...TCTGCTTTATCT/CTCTGCTTTATC...TGAAG|GTC 1 1 31.121
68111161 GT-AG 0 1.7108755741557557e-05 5315 rna-XM_029511039.1 12801885 12 3610311 3615625 Echeneis naucrates 173247 AGG|GTCTGCGGCA...CAGACTGTGATA/TCCATGTTCAGA...CTCAG|CAG 1 1 44.278
68111162 GT-AG 0 1.000000099473604e-05 132 rna-XM_029511039.1 12801885 13 3609706 3609837 Echeneis naucrates 173247 GAG|GTAGTGACAA...AGATTCTTGCCT/TTTATTCTCATG...TATAG|ATG 0 1 53.376
68111163 GT-AG 0 0.0011689985907994 93 rna-XM_029511039.1 12801885 14 3609435 3609527 Echeneis naucrates 173247 GTG|GTACTCAAAC...TGCATTTTAACA/TGCATTTTAACA...CATAG|AGC 1 1 56.799
68111164 GT-AG 0 1.000000099473604e-05 227 rna-XM_029511039.1 12801885 15 3609079 3609305 Echeneis naucrates 173247 ACT|GTAAGAAAAT...TGTTTCGTAGCA/TCCCTGTTTATC...TCCAG|TGA 1 1 59.281
68111165 GT-AG 0 1.000000099473604e-05 132 rna-XM_029511039.1 12801885 16 3607826 3607957 Echeneis naucrates 173247 GAG|GTAGTGACAA...AGATTCTTGCCT/TTTATTCTCATG...TATAG|ATG 0 1 80.842
68111166 GT-AG 0 0.0011412336555677 93 rna-XM_029511039.1 12801885 17 3607555 3607647 Echeneis naucrates 173247 GTG|GTACTCAAAC...TGAATTTTAACA/TGAATTTTAACA...CATAG|AGC 1 1 84.266
68111167 GT-AG 0 1.000000099473604e-05 227 rna-XM_029511039.1 12801885 18 3607199 3607425 Echeneis naucrates 173247 ACT|GTAAGAAAAT...TGTTTCGTAGCA/TCCCTGTTTATC...TCCAG|TGA 1 1 86.747

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

CREATE TABLE "introns" (
"id" INTEGER,
  "dinucleotide_pair" TEXT,
  "is_minor" INTEGER,
  "score" REAL,
  "length" INTEGER,
  "transcript_id" INTEGER,
  "ordinal_index" INTEGER,
  "start" INTEGER,
  "end" INTEGER,
  "taxonomy_id" INTEGER,
  "scored_motifs" TEXT,
  "phase" INTEGER,
  "in_cds" INTEGER,
  "relative_position" REAL
  ,PRIMARY KEY ([id]),
   FOREIGN KEY([transcript_id]) REFERENCES [transcripts]([id]),
   FOREIGN KEY([taxonomy_id]) REFERENCES [genomes]([taxonomy_id])
);
CREATE INDEX [idx_introns_transcript_id]
    ON [introns] ([transcript_id]);
CREATE INDEX [idx_introns_taxonomy_id]
    ON [introns] ([taxonomy_id]);
CREATE INDEX [idx_introns_phase]
    ON [introns] ([phase]);
CREATE INDEX [idx_introns_is_minor]
    ON [introns] ([is_minor]);
CREATE INDEX [idx_introns_dinucleotide_pair]
    ON [introns] ([dinucleotide_pair]);
CREATE INDEX [idx_introns_score]
    ON [introns] ([score]);
CREATE INDEX [idx_introns_in_cds]
    ON [introns] ([in_cds]);
Powered by Datasette · Queries took 33.291ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)