home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside of the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

24 rows where transcript_id = 1341764

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: score, phase, in_cds

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
7217599 GT-AG 0 1.000000099473604e-05 1226 rna-XM_020676409.1 1341764 1 3258231 3259456 Amborella trichopoda 13333 CTG|GTCAGTGTTT...CCTTTTTTATAT/TTGTTTGTCATC...TTCAG|GCT 0 1 4.842
7217600 GT-AG 0 1.000000099473604e-05 150 rna-XM_020676409.1 1341764 2 3257937 3258086 Amborella trichopoda 13333 GAG|GTCAGTTGAG...CTTCTCTTGATT/CTTCTCTTGATT...TATAG|GAG 0 1 10.248
7217601 GT-AG 0 0.0001432361195379 655 rna-XM_020676409.1 1341764 3 3257174 3257828 Amborella trichopoda 13333 GAG|GTTTGTTTGA...TATTCATTACCT/GGTGTATTCATT...TGCAG|GGA 0 1 14.302
7217602 GT-AG 0 1.315021358205468e-05 1014 rna-XM_020676409.1 1341764 4 3256064 3257077 Amborella trichopoda 13333 AAG|GTGCTTTGCC...TTGTTCTTATCT/TTTGTTCTTATC...TGCAG|GTT 0 1 17.905
7217603 GT-AG 0 0.0058091456812097 2488 rna-XM_020676409.1 1341764 5 3253445 3255932 Amborella trichopoda 13333 CAG|GTATGTTGAT...TTCTCTTTGACC/TTCTCTTTGACC...CTTAG|GGA 2 1 22.823
7217604 GT-AG 0 0.000860791429776 280 rna-XM_020676409.1 1341764 6 3253104 3253383 Amborella trichopoda 13333 TTG|GTAATCTCCT...TAATTTTTACCT/TTAATTTTTACC...TGCAG|GCC 0 1 25.113
7217605 GT-AG 0 3.5990558663526694e-05 836 rna-XM_020676409.1 1341764 7 3252101 3252936 Amborella trichopoda 13333 CAA|GTAAGCAAGA...TATGTTTTGACA/TATGTTTTGACA...TGCAG|GAG 2 1 31.381
7217606 GT-AG 0 0.0147125535785017 205 rna-XM_020676409.1 1341764 8 3251790 3251994 Amborella trichopoda 13333 CAG|GTATATTCTC...GAATCTTTGAAT/TTTCTTCTGATT...TGCAG|CTT 0 1 35.36
7217607 GT-AG 0 1.000000099473604e-05 1097 rna-XM_020676409.1 1341764 9 3250615 3251711 Amborella trichopoda 13333 CAT|GTAAGTGGGT...TATTTCTTTTTT/GATATATTGAGT...AACAG|AAG 0 1 38.288
7217608 GT-AG 0 2.95189058736062e-05 4415 rna-XM_020676409.1 1341764 10 3246138 3250552 Amborella trichopoda 13333 TAG|GTATGACTTC...TAATTTTCAATA/ATAATTTTCAAT...TGCAG|GTC 2 1 40.616
7217609 GT-AG 0 1.015062496063412e-05 2182 rna-XM_020676409.1 1341764 11 3243883 3246064 Amborella trichopoda 13333 AAG|GTAGATCTAC...TTATTTTTACAA/TTTATTTTTACA...TACAG|ATA 0 1 43.356
7217610 GT-AG 0 0.0002139253972753 105 rna-XM_020676409.1 1341764 12 3243712 3243816 Amborella trichopoda 13333 ACT|GTAAGTCTCT...ACTCCATTAACT/ATATTGTTAACA...TACAG|CCT 0 1 45.833
7217611 GT-AG 0 0.0001202220280029 4350 rna-XM_020676409.1 1341764 13 3239218 3243567 Amborella trichopoda 13333 ACG|GTATGGTCAC...GAAGTTTTACTT/TTCGTATTAATT...TGTAG|CTG 0 1 51.239
7217612 GT-AG 0 1.000000099473604e-05 645 rna-XM_020676409.1 1341764 14 3238515 3239159 Amborella trichopoda 13333 TTG|GTAAGTGGTC...TATACTTTAGAC/ATTAAAGTGATT...AGCAG|GCT 1 1 53.416
7217613 GT-AG 0 2.603718404912766e-05 1518 rna-XM_020676409.1 1341764 15 3236970 3238487 Amborella trichopoda 13333 CAA|GTTCTTTTGT...ATTTTCCAAAAG/TCAGAAGTGATA...AAGAG|TGA 1 1 54.429
7217614 GT-AG 0 1.000000099473604e-05 12415 rna-XM_020676409.1 1341764 17 3220227 3232641 Amborella trichopoda 13333 TAG|GTGAATGCAA...ACTTTCTTGACT/ACTTTCTTGACT...TGCAG|TTA 1 1 57.47
7217615 GT-AG 0 1.000000099473604e-05 191 rna-XM_020676409.1 1341764 19 3219973 3220163 Amborella trichopoda 13333 GTG|GTAAGCACAT...TTTTTCTCAATA/TTTTTTCTAAGA...TTCAG|GAT 2 1 59.76
7217616 GT-AG 0 0.0566815568808868 348 rna-XM_020676409.1 1341764 20 3219456 3219803 Amborella trichopoda 13333 CAG|GTATATTTTG...TTGTTCTAAATA/TATGTTCTCACG...TACAG|TTA 0 1 66.104
7217617 GT-AG 0 0.083405565090615 132 rna-XM_020676409.1 1341764 21 3219259 3219390 Amborella trichopoda 13333 CAA|GTATGGTTCT...TTTTCCTTACTT/TTTTTCCTTACT...GTCAG|CTA 2 1 68.544
7217618 GT-AG 0 1.455064224333089e-05 145 rna-XM_020676409.1 1341764 22 3219023 3219167 Amborella trichopoda 13333 CAG|GTAACAAAAA...AAACTTTTATCC/AAAACTTTTATC...CCCAG|AGC 0 1 71.959
7217619 GT-AG 0 0.0001701053170966 567 rna-XM_020676409.1 1341764 23 3218369 3218935 Amborella trichopoda 13333 TTG|GTAATCTCCA...TTCCATTTAGCA/ACTTTTTCCATT...TGCAG|GTG 0 1 75.225
7217620 GT-AG 0 1.000000099473604e-05 1419 rna-XM_020676409.1 1341764 24 3216872 3218290 Amborella trichopoda 13333 GAG|GTCAGGACTC...CATCTTTTATTC/TCATCTTTTATT...GACAG|GTC 0 1 78.153
7217621 GT-AG 0 7.740895056307258e-05 156 rna-XM_020676409.1 1341764 25 3216678 3216833 Amborella trichopoda 13333 AAG|GTGTGCCTTT...TCTTTCTTTCCC/ATGTATTTCAGA...TACAG|CTC 2 1 79.58
7218062 GT-AG 0 0.0001886527547527 391 rna-XM_020676409.1 1341764 26 3216187 3216577 Amborella trichopoda 13333 GAG|GTAATCAGCA...CTTTTCTTGATA/GGTTTCTTCACT...CGTAG|AAA   0 83.333

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- One row per intron. Identifiers are double-quoted throughout because
-- "start" and "end" would otherwise collide with SQL keywords.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- intron length in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1 or 2; NULL for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Secondary indexes on "introns": one single-column index per indexed column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 141.867ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)