home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

18 rows where transcript_id = 12917268

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
68847546 GT-AG 0 4.659841001762222e-05 4271 rna-XM_009643206.2 12917268 3 2038864 2043134 Egretta garzetta 188379 CAG|GTACCAAATT...TAGGTTTGAGCA/GCAATGATGATT...TTTAG|GAG 1 1 46.125
68847547 GT-AG 0 2.4014515336753052e-05 868 rna-XM_009643206.2 12917268 4 2043220 2044087 Egretta garzetta 188379 TCG|GTAAGTTGGG...TATGTCTGAACT/ATATGTCTGAAC...TGCAG|TCA 2 1 48.428
68847548 GT-AG 0 0.0001629990696607 6538 rna-XM_009643206.2 12917268 5 2044173 2050710 Egretta garzetta 188379 AAG|GTATGTACAA...TAACTTTTAAAT/TAACTTTTAAAT...TACAG|ACT 0 1 50.732
68847549 GT-AG 0 1.000000099473604e-05 1806 rna-XM_009643206.2 12917268 6 2050787 2052592 Egretta garzetta 188379 TAG|GTATGGGCAT...CTTTCTTTCATT/CTTTCTTTCATT...TCTAG|AAA 1 1 52.791
68847550 GT-AG 0 1.000000099473604e-05 1264 rna-XM_009643206.2 12917268 7 2052635 2053898 Egretta garzetta 188379 GTA|GTAAGTGAGA...TTTTGTTTAATT/TTTTGTTTAATT...GATAG|ATG 1 1 53.93
68847551 GT-AG 0 1.000000099473604e-05 2581 rna-XM_009643206.2 12917268 8 2054023 2056603 Egretta garzetta 188379 TAG|GTAAGAGCCT...TGTGACTTAACC/CTGTGACTTAAC...ATTAG|AGT 2 1 57.29
68847552 GT-AG 0 0.0004833018007646 1054 rna-XM_009643206.2 12917268 9 2056851 2057904 Egretta garzetta 188379 GAG|GTATGTCTGT...GTTTCTTTTGTT/CTACATATAACG...TTTAG|GAA 0 1 63.984
68847553 GT-AG 0 1.000000099473604e-05 89 rna-XM_009643206.2 12917268 10 2058068 2058156 Egretta garzetta 188379 GAG|GTACGGTTGA...TGTCTATTGACA/TGTCTATTGACA...TGTAG|TGG 1 1 68.401
68847554 GT-AG 0 1.000000099473604e-05 231 rna-XM_009643206.2 12917268 11 2058290 2058520 Egretta garzetta 188379 TAA|GTAAGTTCAC...ACATTTTTCTCT/CTGCATCTAACA...TTCAG|ACT 2 1 72.005
68847555 GT-AG 0 0.0035720810362494 1942 rna-XM_009643206.2 12917268 12 2058576 2060517 Egretta garzetta 188379 CAC|GTATGTACGC...GTGGTTTTAATT/GTGGTTTTAATT...TCTAG|GGA 0 1 73.496
68847556 GT-AG 0 1.000000099473604e-05 1936 rna-XM_009643206.2 12917268 13 2060611 2062546 Egretta garzetta 188379 AAG|GTAAAGATGA...TGGTGCTTAATT/GTAGTTTTCAGT...CAAAG|AAA 0 1 76.016
68847557 GT-AG 0 0.0361391537051987 1113 rna-XM_009643206.2 12917268 14 2062625 2063737 Egretta garzetta 188379 AAG|GTATTTTTCT...TATTTGTTAATT/TATTTGTTAATT...TTCAG|CTG 0 1 78.13
68847558 GT-AG 0 0.0015997716980438 781 rna-XM_009643206.2 12917268 15 2063778 2064558 Egretta garzetta 188379 ATG|GTATGTACTA...TTTGTTTTGATT/TTTGTTTTGATT...TTTAG|CAT 1 1 79.214
68847559 GT-AG 0 4.319317557426482e-05 907 rna-XM_009643206.2 12917268 16 2064621 2065527 Egretta garzetta 188379 AGA|GTAAGCAGTG...GGTGTCTTCATA/GGTGTCTTCATA...TTCAG|GTC 0 1 80.894
68847560 GT-AG 0 1.000000099473604e-05 977 rna-XM_009643206.2 12917268 17 2065594 2066570 Egretta garzetta 188379 AGG|GTTAGTAAAT...ATAATTTTAGTA/GTTAATTTAAAT...TATAG|GAT 0 1 82.683
68847561 GT-AG 0 1.0780602518277224e-05 1141 rna-XM_009643206.2 12917268 18 2066708 2067848 Egretta garzetta 188379 AAT|GTAAGTTGAG...TTTTTCATAGAT/TGCTTTTTCATA...GACAG|GGT 2 1 86.396
68847562 GT-AG 0 4.767812144550039e-05 343 rna-XM_009643206.2 12917268 19 2067985 2068327 Egretta garzetta 188379 CTG|GTAAGCTGAC...TGGATTTTAATT/TGGATTTTAATT...TTCAG|GGA 0 1 90.081
68847563 GT-AG 0 2.4969732477084884e-05 6233 rna-XM_009643206.2 12917268 20 2068489 2074721 Egretta garzetta 188379 CAG|GTACTTCACT...TTTTTCTTTTCT/GTTATACTGATA...TCCAG|GAT 2 1 94.444

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- introns: one row per intron, linked to its parent transcript and to the
-- genome (species) it belongs to.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- length of the intron in base pairs
    "transcript_id"     INTEGER,  -- parent transcript, references transcripts(id)
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier, references genomes(taxonomy_id)
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; null for introns outside of coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column.
-- The first two cover the foreign-key columns; the rest cover plain
-- attribute columns (presumably for filtering/faceting -- confirm against
-- the queries actually run).
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 156.041ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)