home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

19 rows where transcript_id = 12917198

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
68846879 GT-AG 0 1.000000099473604e-05 20134 rna-XM_009639391.2 12917198 1 457344 477477 Egretta garzetta 188379 AGG|GTGAGTATTA...GTAATATTAACA/GTAATATTAACA...TGTAG|GAT 2 1 1.66
68846880 GT-AG 0 0.0007691296167247 514 rna-XM_009639391.2 12917198 2 456706 457219 Egretta garzetta 188379 AAG|GTATGTCATA...GAGTCTTTGATT/CTTTGATTTATT...TTTAG|AGT 0 1 7.077
68846881 GT-AG 0 1.000000099473604e-05 2891 rna-XM_009639391.2 12917198 3 453686 456576 Egretta garzetta 188379 GAG|GTTGGTTAAC...GTAACTTCAACC/TGTAACTTCAAC...TTCAG|TGC 0 1 12.713
68846882 GT-AG 0 1.288811985592205e-05 1378 rna-XM_009639391.2 12917198 4 452191 453568 Egretta garzetta 188379 ATG|GTAAGTTTAA...AATTATTTGATT/AATTATTTGATT...ACTAG|GTA 0 1 17.824
68846883 GT-AG 0 1.000000099473604e-05 2230 rna-XM_009639391.2 12917198 5 449840 452069 Egretta garzetta 188379 GAG|GTGAGCCCAA...TCACTCCTAATT/TTTCTATTCACT...TTCAG|AAT 1 1 23.111
68846884 GT-AG 0 0.0029075049338935 547 rna-XM_009639391.2 12917198 6 449149 449695 Egretta garzetta 188379 TGG|GTATGTCTGC...ATTTTTTTGTCT/GTCTTCCAAATT...GGCAG|AGA 1 1 29.401
68846885 GT-AG 0 1.000000099473604e-05 592 rna-XM_009639391.2 12917198 7 448454 449045 Egretta garzetta 188379 GAA|GTAAGAAAGT...TTTTTTTTATTA/TTTTTTTTTATT...TTAAG|ATA 2 1 33.901
68846886 GT-AG 0 3.1115392241057325e-05 6504 rna-XM_009639391.2 12917198 8 441786 448289 Egretta garzetta 188379 ATC|GTAAGTACAA...GATGTTTTGATT/TATTTTTTTATA...AACAG|CAT 1 1 41.066
68846887 GT-AG 0 1.000000099473604e-05 1004 rna-XM_009639391.2 12917198 9 440690 441693 Egretta garzetta 188379 CTG|GTAAGATAAT...AATTCTTTTACT/CACTTATTAATT...TTTAG|GAA 0 1 45.085
68846888 GT-AG 0 1.000000099473604e-05 414 rna-XM_009639391.2 12917198 10 440035 440448 Egretta garzetta 188379 CTG|GTAAGGCTAG...ATAGCCTTACAT/CTTACATTGACC...TACAG|AAG 1 1 55.614
68846889 GT-AG 0 1.000000099473604e-05 371 rna-XM_009639391.2 12917198 11 439494 439864 Egretta garzetta 188379 CAG|GTAAGAAGGG...AGAGATTTATCG/GAGAGATTTATC...GTTAG|GTG 0 1 63.041
68846890 GT-AG 0 1.000000099473604e-05 5487 rna-XM_009639391.2 12917198 12 433912 439398 Egretta garzetta 188379 CAG|GTAAATCTGT...TCAACCTTCTTG/GTTCCTGTCAAC...TGCAG|GTT 2 1 67.191
68846891 GT-AG 0 1.000000099473604e-05 1126 rna-XM_009639391.2 12917198 13 432745 433870 Egretta garzetta 188379 AGG|GTTAGCATCT...TCAGCTTTACAA/TTCAGCTTTACA...TTCAG|ATG 1 1 68.982
68846892 GT-AG 0 1.000000099473604e-05 373 rna-XM_009639391.2 12917198 14 432246 432618 Egretta garzetta 188379 AAT|GTAAGTAAAA...GTACTTTTATCA/ACTTTTATCATA...TGTAG|GCC 1 1 74.487
68846893 GT-AG 0 0.0008080214376072 880 rna-XM_009639391.2 12917198 15 431187 432066 Egretta garzetta 188379 AAA|GTATGTAGAT...AACTTCTTGTTT/GCACAACTAAAC...CACAG|CAC 0 1 82.307
68846894 GT-AG 0 1.000000099473604e-05 616 rna-XM_009639391.2 12917198 16 430475 431090 Egretta garzetta 188379 GAG|GTAAGGGTGG...GGTCTCTTACAA/TGGTCTCTTACA...TTCAG|ATT 0 1 86.501
68846895 GT-AG 0 0.0016343095371895 724 rna-XM_009639391.2 12917198 17 429669 430392 Egretta garzetta 188379 ATG|GTATGTATAG...TTTTTCTTTCCC/CTATCCATCATT...CCTAG|ATT 1 1 90.083
68846896 GT-AG 0 6.274152212958768e-05 113 rna-XM_009639391.2 12917198 18 429475 429587 Egretta garzetta 188379 AAG|GTAAGTTTTA...TTTGTGTTAATA/TTTGTGTTAATA...AACAG|TTA 1 1 93.622
68846897 GT-AG 0 1.000000099473604e-05 550 rna-XM_009639391.2 12917198 19 428840 429389 Egretta garzetta 188379 CAG|GTTCGTAGAT...TTGTTTTTATCT/TTTGTTTTTATC...TTCAG|ATA 2 1 97.335

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- introns: one row per intron. Every intron points at its parent transcript
-- and at the genome (keyed by NCBI taxonomy identifier) it belongs to.
-- Column notes below restate the dataset's published column descriptions.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron (e.g. GT-AG)
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (described as 0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript; see the foreign key below
    "ordinal_index"     INTEGER,  -- position of the intron within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier of the species; see the foreign key below
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside of the coding sequence
    "in_cds"            INTEGER,  -- 1 if the intron lies within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length

    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", each named idx_introns_<column>.

-- Columns that participate in the table's foreign keys.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");

-- Classification and scoring columns.
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 196.331ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)