home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

20 rows where transcript_id = 12917197

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: dinucleotide_pair, is_minor, score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
68846859 GT-AG 1 96.80414134400526 11625 rna-XM_009637515.2 12917197 1 388143 399767 Egretta garzetta 188379 CAC|GTATCCTAAT...TATTCCTTAACT/TTATGTCTCATG...GTCAG|TCA 2 1 6.006
68846860 GT-AG 0 1.000000099473604e-05 1138 rna-XM_009637515.2 12917197 2 399943 401080 Egretta garzetta 188379 AAG|GTAAGATGGG...TGTACCTTAAAG/TTGTACCTTAAA...TTCAG|GAT 0 1 13.514
68846861 GT-AG 0 9.665750968594886e-05 1304 rna-XM_009637515.2 12917197 3 401249 402552 Egretta garzetta 188379 TCA|GTAAGTAGCT...TTTTCTTTATTC/GTTTTCTTTATT...TCTAG|CTT 0 1 20.721
68846862 GT-AG 0 0.0006419410000213 1032 rna-XM_009637515.2 12917197 4 402604 403635 Egretta garzetta 188379 CAG|GTATATACAT...TGACTTTTAATC/CTGTGCTTGACT...CTAAG|GTA 0 1 22.909
68846863 GT-AG 0 1.000000099473604e-05 682 rna-XM_009637515.2 12917197 5 403727 404408 Egretta garzetta 188379 ATG|GTAAATGAGA...TTGTCATTACTT/AATTTTGTCATT...TGTAG|TGG 1 1 26.813
68846864 GT-AG 0 1.000000099473604e-05 3989 rna-XM_009637515.2 12917197 6 404573 408561 Egretta garzetta 188379 AAG|GTAAGTTACT...ATGTTTATATCT/TTCATGTTTATA...TGTAG|GCT 0 1 33.848
68846865 GT-AG 0 1.000000099473604e-05 3635 rna-XM_009637515.2 12917197 7 408725 412359 Egretta garzetta 188379 AAG|GTAAGGAGAT...TTTTTTTTTTTT/ATAGTACAAATA...TCCAG|ACT 1 1 40.841
68846866 GC-AG 0 1.000000099473604e-05 2267 rna-XM_009637515.2 12917197 8 412491 414757 Egretta garzetta 188379 AAT|GCAAGTATTC...TGGGTTGTAAAA/TGGGTTGTAAAA...TGCAG|GAT 0 1 46.461
68846867 GT-AG 0 1.000000099473604e-05 94 rna-XM_009637515.2 12917197 9 414866 414959 Egretta garzetta 188379 AAA|GTAAGTATAT...TCTTTTGTGATT/CAAAATTTCACT...TATAG|GCT 0 1 51.094
68846868 GT-AG 0 1.000000099473604e-05 1146 rna-XM_009637515.2 12917197 10 415067 416212 Egretta garzetta 188379 AAG|GTACGTCCTC...TTTACTTCAGCA/TTTTACTTCAGC...TGCAG|CTC 2 1 55.684
68846869 GT-AG 0 0.0001407091570844 516 rna-XM_009637515.2 12917197 11 416262 416777 Egretta garzetta 188379 GTG|GTAAGTTGTC...TTCTTCTTACCT/GTTCTTCTTACC...TCCAG|ATG 0 1 57.786
68846870 GT-AG 0 1.000000099473604e-05 563 rna-XM_009637515.2 12917197 12 416910 417472 Egretta garzetta 188379 AAA|GTGAGTATTC...GTGCTTTTAAAA/GTCTTGCTGATA...TACAG|CAA 0 1 63.449
68846871 GT-AG 0 1.000000099473604e-05 706 rna-XM_009637515.2 12917197 13 417591 418296 Egretta garzetta 188379 ATT|GTAAGTAATA...AGGCTCTTCACC/AGGCTCTTCACC...TCCAG|TGG 1 1 68.511
68846872 GT-AG 0 1.000000099473604e-05 744 rna-XM_009637515.2 12917197 14 418374 419117 Egretta garzetta 188379 GAG|GTGAGGCGCT...ATTTATTTATTG/CATTTATTTATT...TACAG|TTA 0 1 71.815
68846873 GT-AG 0 1.000000099473604e-05 1369 rna-XM_009637515.2 12917197 15 419250 420618 Egretta garzetta 188379 CAG|GTAAGGATAA...CTCCCCTTCATT/CATTTTCTGATT...GTTAG|GCA 0 1 77.477
68846874 GT-AG 0 1.000000099473604e-05 1320 rna-XM_009637515.2 12917197 16 420712 422031 Egretta garzetta 188379 ATG|GTAGTGACTT...TTTTTTGTAATT/TTTTTTGTAATT...TGTAG|GAC 0 1 81.467
68846875 GT-AG 0 4.356505219332046e-05 90 rna-XM_009637515.2 12917197 17 422080 422169 Egretta garzetta 188379 CTT|GTAAGTACTC...TTTGTTTTATTT/TATTTATTTATT...TGCAG|GTT 0 1 83.526
68846876 GT-AG 0 1.000000099473604e-05 1489 rna-XM_009637515.2 12917197 18 422253 423741 Egretta garzetta 188379 AAA|GTAAGGAAAA...TGGTTTTTAAAC/GATTGTTTTACT...CACAG|CAA 2 1 87.087
68846877 GT-AG 0 2.278026459045368e-05 749 rna-XM_009637515.2 12917197 19 423848 424596 Egretta garzetta 188379 CAG|GTGACTTGCA...TGCTCCTAAGCA/TTGCTCCTAAGC...TGCAG|GCT 0 1 91.634
68846878 GT-AG 0 1.0090932086786702e-05 898 rna-XM_009637515.2 12917197 20 424711 425608 Egretta garzetta 188379 AAG|GTATGTGAGA...CACCGCTTACAT/CCACCGCTTACA...TGCAG|AAA 0 1 96.525

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- introns: one row per intron, identified by a globally unique id.
-- Every row points at its parent transcript and at the genome
-- (NCBI taxonomy identifier) it was annotated in.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for the intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript, references transcripts(id)
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier, references genomes(taxonomy_id)
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside of coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    -- Kept as a table-level constraint, exactly as in the original definition.
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns".
-- The two foreign-key columns come first, followed by the remaining
-- indexed columns in the same order as the original definitions.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 54.592ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)