home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

31 rows where transcript_id = 22544186

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
122194066 GT-AG 0 1.000000099473604e-05 11235 rna-XM_021176114.1 22544186 1 85640855 85652089 Mus caroli 10089 AAG|GTCAGTGAAG...GGGCCCATAAGA/CCAGGGCCCATA...TTCAG|AAG 0 1 1.585
122194067 GT-AG 0 1.000000099473604e-05 909 rna-XM_021176114.1 22544186 2 85652241 85653149 Mus caroli 10089 CAG|GTGAGGCTGA...CTGGCCTCATCT/CCTGGCCTCATC...CACAG|CGC 1 1 4.654
122194068 GT-AG 0 1.000000099473604e-05 2146 rna-XM_021176114.1 22544186 3 85653299 85655444 Mus caroli 10089 AGG|GTGAGTGTGC...TCATACTTAGAT/GGTGGGCTCACA...GCCAG|CTG 0 1 7.683
122194069 GT-AG 0 1.000000099473604e-05 1489 rna-XM_021176114.1 22544186 4 85655552 85657040 Mus caroli 10089 GAG|GTGAGACCCA...TGGGTTTTGTCC/TGGGAAGTCACC...TTTAG|GAG 2 1 9.858
122194070 GT-AG 0 1.000000099473604e-05 3482 rna-XM_021176114.1 22544186 5 85657183 85660664 Mus caroli 10089 GAG|GTGCATCACT...ATGGCCTGAGTA/CATGGCCTGAGT...CTCAG|AGC 0 1 12.744
122194071 GT-AG 0 1.000000099473604e-05 538 rna-XM_021176114.1 22544186 6 85660769 85661306 Mus caroli 10089 GAG|GTAAGCAGAT...CTACTCTCATAT/ACTACTCTCATA...CCCAG|GGG 2 1 14.858
122194072 GT-AG 0 1.000000099473604e-05 341 rna-XM_021176114.1 22544186 7 85661505 85661845 Mus caroli 10089 CAG|GTGGGCCACC...GTCACCCTGATT/TTCATCGTCACC...TCCAG|ACT 2 1 18.882
122194073 GT-AG 0 1.000000099473604e-05 81 rna-XM_021176114.1 22544186 8 85661943 85662023 Mus caroli 10089 CTG|GTTTGTGGGA...GGTGCTTTGCCG/GCTCGGCTCAGG...CACAG|AAA 0 1 20.854
122194074 GT-AG 0 1.8044964237215645e-05 141 rna-XM_021176114.1 22544186 9 85662114 85662254 Mus caroli 10089 GAG|GTATGGCCTT...CTCTCTGTGATC/CTCTCTGTGATC...CAAAG|GTG 0 1 22.683
122194075 GT-AG 0 1.000000099473604e-05 233 rna-XM_021176114.1 22544186 10 85662462 85662694 Mus caroli 10089 CAG|GTGGGTGACC...TGGTCCTCACTG/CTGGTCCTCACT...GGCAG|GAG 0 1 26.89
122194076 GT-AG 0 1.000000099473604e-05 950 rna-XM_021176114.1 22544186 11 85662895 85663844 Mus caroli 10089 AAG|GTGAGGGAAG...CCACCCCTGAAG/GACAGTCTCAGG...CCCAG|GGA 2 1 30.955
122194077 GT-AG 0 1.000000099473604e-05 349 rna-XM_021176114.1 22544186 12 85664028 85664376 Mus caroli 10089 CAG|GTGGGTTGTG...TGCCCTTTGGCC/AGACCACTCAAC...CTCAG|CCA 2 1 34.675
122194078 GT-AG 0 1.000000099473604e-05 264 rna-XM_021176114.1 22544186 13 85664522 85664785 Mus caroli 10089 CAG|GTATGTGCAC...AAACTCTGAAAC/CTCTGGGTGACC...CACAG|GCT 0 1 37.622
122194079 GT-AG 0 1.000000099473604e-05 258 rna-XM_021176114.1 22544186 14 85664933 85665190 Mus caroli 10089 CAG|GTAAGGCAAG...GTATTCCCACCT/CACAGATTAAAT...TGCAG|CTG 0 1 40.61
122194080 GT-AG 0 1.000000099473604e-05 2763 rna-XM_021176114.1 22544186 15 85665422 85668184 Mus caroli 10089 CAG|GTGAGACCAG...TCCCTCTTTCCT/CTGTGGCACATG...CCTAG|GTC 0 1 45.305
122194081 GT-AG 0 2.8869330700377816e-05 2747 rna-XM_021176114.1 22544186 16 85668379 85671125 Mus caroli 10089 GAG|GTACCAGTGT...GACACCTCAGGA/TGCTATCTGATG...CACAG|GGC 2 1 49.248
122194082 GT-AG 0 1.000000099473604e-05 242 rna-XM_021176114.1 22544186 17 85671254 85671495 Mus caroli 10089 AAG|GTGCTACATG...AGCACCGTGATG/ACACATCTGACC...CACAG|TGG 1 1 51.85
122194083 GT-AG 0 1.000000099473604e-05 777 rna-XM_021176114.1 22544186 18 85671666 85672442 Mus caroli 10089 AAG|GTCCGTCTTC...CATTCCTGATCT/CCTGATCTCACA...GCCAG|GAC 0 1 55.305
122194084 GT-AG 0 1.000000099473604e-05 3082 rna-XM_021176114.1 22544186 19 85672620 85675701 Mus caroli 10089 CAG|GTGATGCAGC...ACTCTCTTTCCT/TCTTTCCTCATG...TTCAG|GCC 0 1 58.902
122194085 GT-AG 0 1.000000099473604e-05 3231 rna-XM_021176114.1 22544186 20 85675816 85679046 Mus caroli 10089 GAG|GTGAGCCCCA...CCTCCCTCAAAC/TCAGGTCTCAGA...CCCAG|GCT 0 1 61.22
122194086 GT-AG 0 1.000000099473604e-05 3416 rna-XM_021176114.1 22544186 21 85679191 85682606 Mus caroli 10089 GAG|GTGAGACGGG...TGGTCCCCAGCT/CAGCTGGTCACT...CTTAG|GCT 0 1 64.146
122194087 GT-AG 0 0.003589917369774 516 rna-XM_021176114.1 22544186 22 85682825 85683340 Mus caroli 10089 CAG|GTATCACAGT...AAGCTCTCAGCC/GAAGCTCTCAGC...CTCAG|TTT 2 1 68.577
122194088 GT-AG 0 1.000000099473604e-05 359 rna-XM_021176114.1 22544186 23 85683501 85683859 Mus caroli 10089 CAG|GTGAGGGGAC...GACCCCTCAGCC/AGGCTTCTCAGT...CCTAG|GTA 0 1 71.829
122194089 GT-AG 0 1.000000099473604e-05 1183 rna-XM_021176114.1 22544186 24 85684028 85685210 Mus caroli 10089 GAG|GTAGGAAAGC...CCAGCCTAGATA/CTACATCTGAGC...TCCAG|GTT 0 1 75.244
122194090 GT-AG 0 1.000000099473604e-05 222 rna-XM_021176114.1 22544186 25 85685566 85685787 Mus caroli 10089 CAG|GTAAGTGTTT...CTGCCTCTACCC/CCTCTACCCACA...TGCAG|GCA 1 1 82.459
122194091 GT-AG 0 1.000000099473604e-05 792 rna-XM_021176114.1 22544186 26 85685970 85686761 Mus caroli 10089 CGG|GTAGGATAGG...TCCCTCTTGCCT/GCTGAGTTCATT...CCTAG|GAC 0 1 86.159
122194092 GT-AG 0 1.000000099473604e-05 667 rna-XM_021176114.1 22544186 27 85686883 85687549 Mus caroli 10089 AAG|GTGAACCCCT...TGCTTCTTCCCC/AAGAGCCTCAGG...CACAG|GCC 1 1 88.618
122194093 GT-AG 0 1.000000099473604e-05 5662 rna-XM_021176114.1 22544186 28 85687684 85693345 Mus caroli 10089 CAG|GTAGGACTCC...CTCTCCTTCCCT/CCTTCTCTCCTT...CCTAG|GAG 0 1 91.341
122194094 GT-AG 0 1.000000099473604e-05 432 rna-XM_021176114.1 22544186 29 85693445 85693876 Mus caroli 10089 CAG|GTGAGGGGGC...GTTCATGTAACC/CCCATGTTCATG...CTCAG|GTG 0 1 93.354
122194095 GT-AG 0 0.0011033659912364 2419 rna-XM_021176114.1 22544186 30 85694003 85696421 Mus caroli 10089 CAG|GTATATGTTT...TGAGTCTTGCCA/AAGACCCTGAGT...TGCAG|ACA 0 1 95.915
122194096 GT-AG 0 1.000000099473604e-05 2044 rna-XM_021176114.1 22544186 31 85696554 85698597 Mus caroli 10089 CAG|GTGAGCCAGT...CCCTCCTCACCT/TCCCTCCTCACC...TCCAG|GTA 0 1 98.598

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- One row per intron. Each row references its parent transcript and the
-- genome (by NCBI taxonomy id) it was annotated in.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- length of the intron in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position of the intron within the transcript
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1, or 2; null for introns outside the coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column indexes on introns: the two foreign-key columns first,
-- then the columns commonly used for filtering and faceting.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 25.446ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)