home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron in the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

41 rows where transcript_id = 35103474

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: dinucleotide_pair, score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
197657050 GT-AG 0 0.0009189249511626 1314 rna-XM_007048819.2 35103474 1 9968545 9969858 Theobroma cacao 3641 TCT|GTAAGCTCAT...TAGGCCTTGCTT/AATTTACTCATT...TTTAG|GCC 1 1 3.559
197657051 GT-AG 0 0.0010913443650504 1943 rna-XM_007048819.2 35103474 2 9966501 9968443 Theobroma cacao 3641 GAG|GTATATCTTG...TTGAATTTGATT/TTGAATTTGATT...TGCAG|GAA 0 1 5.338
197657052 GT-AG 0 1.000000099473604e-05 92 rna-XM_007048819.2 35103474 3 9966296 9966387 Theobroma cacao 3641 ACC|GTGAGGCTTT...TTGCCCTTATAC/TGTTTGCTTACT...TGAAG|GGA 2 1 7.329
197657053 GT-AG 0 1.4123672627805704e-05 101 rna-XM_007048819.2 35103474 4 9966107 9966207 Theobroma cacao 3641 AAG|GTTTGATTTA...TCATTATTGATT/TCATTATTGATT...CACAG|ACC 0 1 8.879
197657054 GT-AG 0 1.000000099473604e-05 91 rna-XM_007048819.2 35103474 5 9965905 9965995 Theobroma cacao 3641 GAG|GTTGTATATA...ACAACATTGATT/GTGGATCTCACA...TACAG|ATC 0 1 10.835
197657055 GT-AG 0 1.000000099473604e-05 2213 rna-XM_007048819.2 35103474 6 9963563 9965775 Theobroma cacao 3641 CAG|GTAGTGCAAT...TCTTTTTTATTT/ATCTTTTTTATT...TGAAG|AAA 0 1 13.108
197657056 GT-AG 0 1.000000099473604e-05 133 rna-XM_007048819.2 35103474 7 9963340 9963472 Theobroma cacao 3641 GAG|GTGAATCATT...CTTTTGTTGATG/CTTTTGTTGATG...TGCAG|CTT 0 1 14.693
197657057 GT-AG 0 16.002547870181633 139 rna-XM_007048819.2 35103474 8 9963106 9963244 Theobroma cacao 3641 AAG|GTATCTTTTG...GAAACTTTAACT/GTTTTTCTTATG...TGTAG|GTA 2 1 16.367
197657058 GT-AG 0 0.0001375069558864 1854 rna-XM_007048819.2 35103474 9 9961128 9962981 Theobroma cacao 3641 AAT|GTAAGTTACC...TTTTTCATGATT/TATTTTTTCATG...AGAAG|ATG 0 1 18.552
197657059 GT-AG 0 0.0001983607465304 91 rna-XM_007048819.2 35103474 10 9960905 9960995 Theobroma cacao 3641 AAG|GTAATCTCTA...AGCTTCATAGCT/TAAAGCTTCATA...GAAAG|GAA 0 1 20.877
197657060 GT-AG 0 1.000000099473604e-05 77 rna-XM_007048819.2 35103474 11 9960751 9960827 Theobroma cacao 3641 CTG|GTGAGTTTTT...ATTCTTTTGTCT/TTTGTCTACACC...TCTAG|GTC 2 1 22.234
197657061 GT-AG 0 0.0359682265769615 609 rna-XM_007048819.2 35103474 12 9960054 9960662 Theobroma cacao 3641 GAG|GTAGCTTCTT...CTTATTTTATTT/CCTTATTTTATT...TTCAG|ATT 0 1 23.784
197657062 GT-AG 0 0.3838385748886729 104 rna-XM_007048819.2 35103474 13 9959827 9959930 Theobroma cacao 3641 CAG|GTACCTTTCA...ATTTTTTTATTT/TATTTTTTTATT...TTCAG|GCT 0 1 25.951
197657063 GT-AG 0 1.000000099473604e-05 250 rna-XM_007048819.2 35103474 14 9959459 9959708 Theobroma cacao 3641 AAG|GTAACAGAAG...GTATGTTTGATG/ATGAATTTCATC...TGCAG|CTA 1 1 28.03
197657064 GC-AG 0 1.000000099473604e-05 148 rna-XM_007048819.2 35103474 15 9958979 9959126 Theobroma cacao 3641 CAG|GCAAGCATAT...TAATTTTTATTT/ATAATTTTTATT...TCCAG|CCA 0 1 33.879
197657065 GT-AG 0 1.000000099473604e-05 115 rna-XM_007048819.2 35103474 16 9958811 9958925 Theobroma cacao 3641 AAA|GTAAGAGACA...TGTATTTTAATA/TGTATTTTAATA...CTCAG|GTA 2 1 34.813
197657066 GT-AG 0 1.000000099473604e-05 1592 rna-XM_007048819.2 35103474 17 9957158 9958749 Theobroma cacao 3641 GAG|GTGATTTCTC...TGCTTCTAAGCT/CTTACTTTTATT...TTAAG|ATT 0 1 35.888
197657067 GT-AG 0 1.000000099473604e-05 106 rna-XM_007048819.2 35103474 18 9956970 9957075 Theobroma cacao 3641 ACG|GTAATACATT...ACCTTCTTATAT/ATGGAATTTACT...TGTAG|TTG 1 1 37.333
197657068 GT-AG 0 1.000000099473604e-05 110 rna-XM_007048819.2 35103474 19 9956810 9956919 Theobroma cacao 3641 TTG|GTAAGTAAGC...AGTGTTTTACTC/GTTTTACTCATG...CATAG|GTT 0 1 38.214
197657069 GT-AG 0 0.0422524213184853 236 rna-XM_007048819.2 35103474 20 9956487 9956722 Theobroma cacao 3641 GAG|GTATGCTGTA...ACTTTCGTAACT/TTTGCTCTCATC...CTTAG|ATA 0 1 39.746
197657070 GT-AG 0 1.000000099473604e-05 221 rna-XM_007048819.2 35103474 21 9956161 9956381 Theobroma cacao 3641 TTG|GTAGTGCCGA...ATTTTCTTTTCC/TTTTGGCTAAAG...GGCAG|GAT 0 1 41.596
197657071 GT-AG 0 1.000000099473604e-05 71 rna-XM_007048819.2 35103474 22 9955995 9956065 Theobroma cacao 3641 TAG|GTGAGGACTT...ACTCTTTTATTT/GTAAATCTCATC...TCCAG|GGA 2 1 43.27
197657072 GT-AG 0 1.121289743551525e-05 88 rna-XM_007048819.2 35103474 23 9955825 9955912 Theobroma cacao 3641 AAG|GTAAACACTG...TATGTTATAATT/TTATAATTTATT...GACAG|ATT 0 1 44.715
197657073 GT-AG 0 1.000000099473604e-05 148 rna-XM_007048819.2 35103474 24 9955513 9955660 Theobroma cacao 3641 GAA|GTAAGGCTGC...TTTCTCTCAATT/TGTCTTCTAATT...AATAG|GAT 2 1 47.604
197657074 GT-AG 0 0.0002746198076565 110 rna-XM_007048819.2 35103474 25 9955279 9955388 Theobroma cacao 3641 TTG|GTAACAATCG...TTCTTGTTGACA/TTCTTGTTGACA...TACAG|ATG 0 1 49.789
197657075 GT-AG 0 0.0001578259267258 477 rna-XM_007048819.2 35103474 26 9954698 9955174 Theobroma cacao 3641 GAA|GTAAGCACTG...ATTTCCTTGTCT/TGAGTCTTCATC...TGTAG|AAC 2 1 51.621
197657076 GC-AG 0 1.000000099473604e-05 82 rna-XM_007048819.2 35103474 27 9954516 9954597 Theobroma cacao 3641 AAG|GCACTGAACT...TGCTTTTTATTA/TTGCTTTTTATT...TATAG|GTC 0 1 53.383
197657077 GT-AG 0 1.000000099473604e-05 299 rna-XM_007048819.2 35103474 28 9954065 9954363 Theobroma cacao 3641 CAG|GTCAGTGACC...TATTTCTTGATT/TATTTCTTGATT...TTCAG|TGT 2 1 56.061
197657078 GT-AG 0 1.000000099473604e-05 85 rna-XM_007048819.2 35103474 29 9953870 9953954 Theobroma cacao 3641 CAG|GTGAGTTCTG...ATGGACTTATTA/CATGGACTTATT...ATTAG|ATG 1 1 57.999
197657079 GT-AG 0 1.000000099473604e-05 109 rna-XM_007048819.2 35103474 30 9953662 9953770 Theobroma cacao 3641 CAG|GTCTGGATGA...AGATATTTGATA/AGATATTTGATA...GTCAG|TGC 1 1 59.743
197657080 GT-AG 0 1.708437158296535e-05 142 rna-XM_007048819.2 35103474 31 9953451 9953592 Theobroma cacao 3641 ATG|GTTTGTCGCT...TATATATTAACT/TATATATTAACT...TGCAG|CTA 1 1 60.958
197657081 GT-AG 0 0.0005099570027098 94 rna-XM_007048819.2 35103474 32 9953203 9953296 Theobroma cacao 3641 AAT|GTAAGTTATC...CACTCCTTATTT/CTTATTTTAATA...TACAG|GCA 2 1 63.672
197657082 GT-AG 0 1.000000099473604e-05 826 rna-XM_007048819.2 35103474 33 9952256 9953081 Theobroma cacao 3641 AGG|GTAAGTGCTA...ACATCCTTATAC/TATACATTCATT...TCTAG|GAA 0 1 65.803
197657083 GT-AG 0 0.0495623089690066 71 rna-XM_007048819.2 35103474 34 9952062 9952132 Theobroma cacao 3641 CAG|GTAGCTTTTT...CATCTTTTAATA/CATCTTTTAATA...TTTAG|GAT 0 1 67.97
197657084 GT-AG 0 1.000000099473604e-05 141 rna-XM_007048819.2 35103474 35 9951802 9951942 Theobroma cacao 3641 AAG|GTTAGTCTGA...TACTTTTTAATT/TACTTTTTAATT...TACAG|TGT 2 1 70.067
197657085 GT-AG 0 2.0447300322321507 642 rna-XM_007048819.2 35103474 36 9951076 9951717 Theobroma cacao 3641 GAG|GTACCCTTAA...ATGATCTTATTT/ATTTCTTTCATA...TGCAG|GGT 2 1 71.547
197657086 GT-AG 0 5.2282300533947926e-05 72 rna-XM_007048819.2 35103474 37 9950891 9950962 Theobroma cacao 3641 CAG|GTAATCTTCA...TGGTGGTTAATT/ATCTAACTAACT...TTCAG|GGT 1 1 73.538
197657087 GT-AG 0 1.000000099473604e-05 371 rna-XM_007048819.2 35103474 38 9950290 9950660 Theobroma cacao 3641 ATG|GTGAGCAAAC...CTGTTTTTGGCA/TTTGGCATTACA...TTCAG|GTT 0 1 77.59
197657088 GT-AG 0 0.000304620117934 137 rna-XM_007048819.2 35103474 39 9949355 9949491 Theobroma cacao 3641 CTG|GTATAATATG...AAGCGTTTAACC/AAGCGTTTAACC...TGCAG|GTT 0 1 91.649
197657089 GT-AG 0 4.698759461113103e-05 239 rna-XM_007048819.2 35103474 40 9949065 9949303 Theobroma cacao 3641 AAG|GTATGTGATG...GGTTTTTTGCTT/CTTGTTGTGATC...TGCAG|ATT 0 1 92.548
197657090 GT-AG 0 0.0018955198553618 316 rna-XM_007048819.2 35103474 41 9948563 9948878 Theobroma cacao 3641 CTT|GTAAGTTTCA...ATTTCCTTGTCC/TATTACCTAACA...CCAAG|CTG 0 1 95.825

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- One row per intron. Column notes restate the field descriptions published
-- alongside this table.
CREATE TABLE "introns" (
    -- Globally unique identifier for each intron.
    "id" INTEGER,
    -- Terminal dinucleotide sequences of the intron.
    "dinucleotide_pair" TEXT,
    -- 1 if the intron is a minor intron, 0 if not.
    "is_minor" INTEGER,
    -- Probability (0-100%) of the intron being minor.
    "score" REAL,
    -- Intron length in base pairs.
    "length" INTEGER,
    -- Parent transcript.
    "transcript_id" INTEGER,
    -- Ordinal position within the transcript (e.g., 3 for the third intron).
    "ordinal_index" INTEGER,
    -- Start position of the intron in the genome.
    "start" INTEGER,
    -- End position of the intron in the genome.
    "end" INTEGER,
    -- NCBI taxonomy identifier for the species.
    "taxonomy_id" INTEGER,
    -- Motifs scored for the intron.
    "scored_motifs" TEXT,
    -- Phase in the coding sequence: 0, 1, or 2; NULL outside the coding sequence.
    "phase" INTEGER,
    -- 1 if the intron lies within the coding sequence, 0 if not (e.g., UTR introns).
    "in_cds" INTEGER,
    -- Relative position within the transcript, as a percentage of coding length.
    "relative_position" REAL,
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns".
-- Foreign-key columns:
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
-- Per-intron attribute columns:
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 31.02ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)