home / WtMTA

introns

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

id
INTEGER (primary key), globally unique identifier for each intron
dinucleotide_pair
TEXT, terminal dinucleotide sequences of the intron
is_minor
INTEGER, indicates if the intron is a minor intron (1) or not (0)
score
REAL, score representing the probability (0-100%) of the intron being minor
length
INTEGER, length of the intron in base pairs
transcript_id
INTEGER (foreign key referencing transcripts(id)), parent transcript
ordinal_index
INTEGER, ordinal position of the intron within the transcript (e.g., 3 for the third intron)
start
INTEGER, start position of the intron in the genome
end
INTEGER, end position of the intron in the genome
taxonomy_id
INTEGER (foreign key referencing genomes(taxonomy_id)), NCBI taxonomy identifier for species
scored_motifs
TEXT, motifs scored for the intron
phase
INTEGER, phase of the intron within the coding sequence (0, 1, or 2; null for introns outside the coding sequence)
in_cds
INTEGER, indicates if the intron is within the coding sequence (1) or not (0; e.g., UTR introns)
relative_position
REAL, relative position of the intron within the transcript (as a percentage of coding length)

18 rows where transcript_id = 12917271

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: score, phase

id ▼ dinucleotide_pair is_minor score length transcript_id ordinal_index start end taxonomy_id scored_motifs phase in_cds relative_position
68847579 GT-AG 0 1.000000099473604e-05 1179 rna-XM_009640831.2 12917271 1 2861577 2862755 Egretta garzetta 188379 TAA|GTGAGTAAGC...TTATTCTTATTT/CTTATTCTTATT...TGAAG|GAG 2 1 3.768
68847580 GT-AG 0 1.6374055561335734e-05 270 rna-XM_009640831.2 12917271 2 2861268 2861537 Egretta garzetta 188379 GCG|GTAATTCTAT...GTAATTTTAATA/ATATAACTCACT...CTTAG|GGG 2 1 6.258
68847581 GT-AG 0 1.000000099473604e-05 3686 rna-XM_009640831.2 12917271 3 2857528 2861213 Egretta garzetta 188379 ACA|GTAAGTCCTT...TCTGTTTTGTTT/TGGGTAATAATC...TATAG|TGC 2 1 9.706
68847582 GT-AG 0 1.000000099473604e-05 1011 rna-XM_009640831.2 12917271 4 2856474 2857484 Egretta garzetta 188379 AAG|GTAAGAGAGG...GATGCTTTGAAT/TGGTTTTTCATT...TTCAG|CCT 0 1 12.452
68847583 GT-AG 0 1.000000099473604e-05 960 rna-XM_009640831.2 12917271 5 2855351 2856310 Egretta garzetta 188379 TAG|GTAATAAGAG...ACATTTTTAAAT/ACATTTTTAAAT...TCTAG|GTA 1 1 22.861
68847584 GT-AG 0 0.0123850103192778 1779 rna-XM_009640831.2 12917271 6 2853462 2855240 Egretta garzetta 188379 CTG|GTATGTATTT...TACTTTTTAACT/TTTTAACTTATT...TCTAG|AAA 0 1 29.885
68847585 GT-AG 0 1.000000099473604e-05 2485 rna-XM_009640831.2 12917271 7 2850935 2853419 Egretta garzetta 188379 CAC|GTGAGTATTA...ATATTTTTAATT/ATTGTTTTTACT...TACAG|ATG 0 1 32.567
68847586 GT-AG 0 1.157227322437042e-05 1189 rna-XM_009640831.2 12917271 8 2849661 2850849 Egretta garzetta 188379 GAG|GTAGTATATT...CCTTCCTTAAGT/CCTTCCTTAAGT...TGCAG|ATC 1 1 37.995
68847587 GT-AG 0 0.0805635648753803 2193 rna-XM_009640831.2 12917271 9 2847388 2849580 Egretta garzetta 188379 CAG|GTATATTTCT...TTTTCCTTCCCT/CTGTATATCAAA...ATCAG|CTA 0 1 43.103
68847588 GT-AG 0 1.000000099473604e-05 86 rna-XM_009640831.2 12917271 10 2847241 2847326 Egretta garzetta 188379 CTG|GTAAGTTACT...TGTTTTCTAATT/TGTTTTCTAATT...CCCAG|GTA 1 1 46.999
68847589 GT-AG 0 1.000000099473604e-05 2598 rna-XM_009640831.2 12917271 11 2844525 2847122 Egretta garzetta 188379 CAG|GTAAATATAT...ATTGTTTTAGTT/TCTGTATTTATA...TGTAG|GAA 2 1 54.534
68847590 GT-AG 0 1.000000099473604e-05 2686 rna-XM_009640831.2 12917271 12 2841780 2844465 Egretta garzetta 188379 TTG|GTAAGTAAAG...ATTTGCTTAGTA/TATTTGCTTAGT...GGCAG|TGA 1 1 58.301
68847591 GT-AG 0 1.000000099473604e-05 801 rna-XM_009640831.2 12917271 13 2840875 2841675 Egretta garzetta 188379 AAG|GTAATATTAT...TTTCCCTTCTAA/TCCCTTCTAATA...TCTAG|CAC 0 1 64.943
68847592 GT-AG 0 1.000000099473604e-05 2537 rna-XM_009640831.2 12917271 14 2838166 2840702 Egretta garzetta 188379 CAG|GTTTGTGTGC...ATGTTATGAACT/TATGAACTAACT...TATAG|ACA 1 1 75.926
68847593 GT-AG 0 0.000155614910087 115 rna-XM_009640831.2 12917271 15 2837982 2838096 Egretta garzetta 188379 ATT|GTAAGTTTTA...TCCTATTTATTG/ATCCTATTTATT...TATAG|GCT 1 1 80.332
68847594 GT-AG 0 1.000000099473604e-05 1908 rna-XM_009640831.2 12917271 16 2835981 2837888 Egretta garzetta 188379 TAG|GTAAGTTGGA...ATGTTCTTTGTT/TCAGAACTGATT...ACCAG|TCT 1 1 86.271
68847595 GT-AG 0 1.000000099473604e-05 3141 rna-XM_009640831.2 12917271 17 2832769 2835909 Egretta garzetta 188379 GAG|GTAAGTACTG...CTTCTCTTATTT/CTTATTTTTATT...TCTAG|ATC 0 1 90.805
68847596 GT-AG 0 1.3069170455245913e-05 2421 rna-XM_009640831.2 12917271 18 2830292 2832712 Egretta garzetta 188379 CAG|GTATGAATAG...GCTTACTTGACA/GGCTTTTTCATT...TTTAG|GGT 2 1 94.381

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- One row per intron; each row points at its parent transcript and at the
-- genome (by NCBI taxonomy identifier) it was annotated in.
CREATE TABLE "introns" (
    "id"                INTEGER,  -- globally unique identifier for each intron
    "dinucleotide_pair" TEXT,     -- terminal dinucleotide sequences of the intron
    "is_minor"          INTEGER,  -- 1 if the intron is a minor intron, 0 otherwise
    "score"             REAL,     -- probability (0-100%) of the intron being minor
    "length"            INTEGER,  -- length of the intron in base pairs
    "transcript_id"     INTEGER,  -- parent transcript
    "ordinal_index"     INTEGER,  -- ordinal position within the transcript (3 = third intron)
    "start"             INTEGER,  -- start position of the intron in the genome
    "end"               INTEGER,  -- end position of the intron in the genome
    "taxonomy_id"       INTEGER,  -- NCBI taxonomy identifier for the species
    "scored_motifs"     TEXT,     -- motifs scored for the intron
    "phase"             INTEGER,  -- 0, 1, or 2; null for introns outside of coding sequence
    "in_cds"            INTEGER,  -- 1 if within the coding sequence, 0 otherwise (e.g. UTR introns)
    "relative_position" REAL,     -- position within the transcript, as a percentage of coding length
    PRIMARY KEY ("id"),
    FOREIGN KEY ("transcript_id") REFERENCES "transcripts" ("id"),
    FOREIGN KEY ("taxonomy_id") REFERENCES "genomes" ("taxonomy_id")
);
-- Single-column secondary indexes on "introns", one per indexed column.
CREATE INDEX "idx_introns_transcript_id" ON "introns" ("transcript_id");
CREATE INDEX "idx_introns_taxonomy_id" ON "introns" ("taxonomy_id");
CREATE INDEX "idx_introns_phase" ON "introns" ("phase");
CREATE INDEX "idx_introns_is_minor" ON "introns" ("is_minor");
CREATE INDEX "idx_introns_dinucleotide_pair" ON "introns" ("dinucleotide_pair");
CREATE INDEX "idx_introns_score" ON "introns" ("score");
CREATE INDEX "idx_introns_in_cds" ON "introns" ("in_cds");
Powered by Datasette · Queries took 681.294ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)