home / WtMTA

genomes

Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)

taxonomy_id
INTEGER (primary key), unique identifier for each species
species
TEXT, binomial name of the species
family
TEXT, taxonomic family of the species
order
TEXT, taxonomic order of the species
phylum
TEXT, taxonomic phylum of the species
accession
TEXT, accession number of the genome assembly
n_minor_introns
INTEGER, total number of minor introns in the genome
n_major_introns
INTEGER, total number of major introns in the genome
percent_minor_introns
REAL, percentage of minor introns in the genome
busco_score
REAL, BUSCO score assessing the genome assembly completeness (vs. eukaryota_odb10)
minor_snRNAs
TEXT, minor snRNAs found in the annotated transcriptome
genome_version
TEXT, version of the genome assembly
source_url
TEXT, URL for the source genome/annotation files
source_metadata
TEXT, additional metadata from the original data source
minor_intron+
INTEGER, indicates if the species is inferred to contain real minor introns (1) or not (0)

27 rows where busco_score = "94.5" and minor_snRNAs contains "u11" sorted by percent_minor_introns descending

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: family, order, phylum, n_minor_introns, minor_snRNAs, genome_version, minor_snRNAs (array)

taxonomy_id species family order phylum accession n_minor_introns n_major_introns percent_minor_introns ▲ busco_score minor_snRNAs genome_version source_url source_metadata minor_intron+
1868482 Carlito syrichta Tarsiidae Primates Chordata GCF_000164805.1 621 174099 0.3554258241758242 94.5 ["u11", "u12", "u4atac", "u6atac"] Tarsius_syrichta-2.0.1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/164/805/GCF_000164805.1_Tarsius_syrichta-2.0.1 GCF_000164805.1;PRJNA236776;SAMN02445010;ABRT00000000.2;representative genome;1868482;1868482;Carlito syrichta;;Samal-C Ts95f;latest;Scaffold;Major;Full;2013/09/18;Tarsius_syrichta-2.0.1;Washington University (WashU);GCA_000164805.2;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/164/805/GCF_000164805.1_Tarsius_syrichta-2.0.1;;;na 1
7918 Lepisosteus oculatus Lepisosteidae Semionotiformes Chordata GCF_000242695.1 632 185220 0.340055528054581 94.5 ["u11", "u12", "u4atac", "u6atac"] LepOcu1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/242/695/GCF_000242695.1_LepOcu1 GCF_000242695.1;PRJNA221149;SAMN00706774;AHAT00000000.1;representative genome;7918;7918;Lepisosteus oculatus;;Spotted Gar 1;latest;Chromosome;Major;Full;2012/01/13;LepOcu1;Broad Institute;GCA_000242695.1;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/242/695/GCF_000242695.1_LepOcu1;;;na 1
10020 Dipodomys ordii Heteromyidae Rodentia Chordata GCF_000151885.1 595 175998 0.3369329475120757 94.5 ["u11", "u12", "u4atac", "u6atac"] Dord_2.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/151/885/GCF_000151885.1_Dord_2.0 GCF_000151885.1;PRJNA287906;SAMN02900551;ABRO00000000.2;representative genome;10020;10020;Dipodomys ordii;;6190;latest;Scaffold;Major;Full;2014/12/12;Dord_2.0;Baylor College of Medicine;GCA_000151885.2;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/151/885/GCF_000151885.1_Dord_2.0;;;na 1
68294 Corvus kubaryi Corvidae Passeriformes Chordata GCF_017639235.1 559 166404 0.3348047172127956 94.5 ["u11", "u12", "u4atac", "u6atac"] C.kubaryi_AGA036_p1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/017/639/235/GCF_017639235.1_C.kubaryi_AGA036_p1.0 GCF_017639235.1;PRJNA735849;SAMN16883221;JAEMUS000000000.1;representative genome;68294;68294;Corvus kubaryi;;FWS band 111438036;latest;Scaffold;Major;Full;2021/03/30;C.kubaryi_AGA036_p1.0;United States Geological Survey;GCA_017639235.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/017/639/235/GCF_017639235.1_C.kubaryi_AGA036_p1.0;;;na 1
9874 Odocoileus virginianus Cervidae Artiodactyla Chordata GCF_002102435.1 635 193274 0.3274731961899654 94.5 ["u11", "u12", "u4atac", "u6atac"] Ovir.te_1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/002/102/435/GCF_002102435.1_Ovir.te_1.0 GCF_002102435.1;PRJNA384059;SAMN05363940;MLBE00000000.1;representative genome;9880;9874;Odocoileus virginianus texanus;;animal Pink-7;latest;Scaffold;Major;Full;2017/04/20;Ovir.te_1.0;Baylor College of Medicine;GCA_002102435.1;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/002/102/435/GCF_002102435.1_Ovir.te_1.0;;;na 1
9568 Mandrillus leucophaeus Cercopithecidae Primates Chordata GCF_000951045.1 619 188438 0.3274144834626594 94.5 ["u11", "u12", "u4atac", "u6atac"] Mleu.le_1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/951/045/GCF_000951045.1_Mleu.le_1.0 GCF_000951045.1;PRJNA279492;SAMN03121813;JYKQ00000000.1;representative genome;9568;9568;Mandrillus leucophaeus;;KB7577;latest;Scaffold;Major;Full;2015/03/12;Mleu.le_1.0;Baylor College of Medicine;GCA_000951045.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/951/045/GCF_000951045.1_Mleu.le_1.0;;;na 1
61621 Rhinopithecus bieti Cercopithecidae Primates Chordata GCF_001698545.1 611 194371 0.3133622590803253 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM169854v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/698/545/GCF_001698545.1_ASM169854v1 GCF_001698545.1;PRJNA339282;SAMN02786331;MCGX00000000.1;representative genome;61621;61621;Rhinopithecus bieti;;Rb0;latest;Scaffold;Major;Full;2016/08/03;ASM169854v1;Laboratory for conservation and utilization of Bio-resource;GCA_001698545.1;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/698/545/GCF_001698545.1_ASM169854v1;;;na 1
658196 Glomus cerebriforme Glomeraceae Glomerales Mucoromycota GCA_003550305.1 179 64868 0.2751856350023829 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM355030v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/003/550/305/GCA_003550305.1_ASM355030v1 GCA_003550305.1;PRJNA430010;SAMN08364855;QKYT00000000.1;representative genome;658196;658196;Glomus cerebriforme;strain=DAOM 227022;;latest;Scaffold;Major;Full;2018/09/12;ASM355030v1;INRA;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/003/550/305/GCA_003550305.1_ASM355030v1;;;na 1
588596 Rhizophagus irregularis Glomeraceae Glomerales Mucoromycota GCF_000439145.1 205 75172 0.2719662496517505 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM43914v3 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/439/145/GCF_000439145.1_ASM43914v3 GCF_000439145.1;PRJNA471752;SAMN02744054;AUPC00000000.2;representative genome;747089;588596;Rhizophagus irregularis DAOM 181602=DAOM 197198;strain=DAOM 197198;;latest;Scaffold;Major;Full;2018/01/30;ASM43914v3;DOE Joint Genome Institute;GCA_000439145.3;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/439/145/GCF_000439145.1_ASM43914v3;;;na 1
175797 Silurus meridionalis Siluridae Siluriformes Chordata GCA_014805685.1 518 208766 0.2475105598134592 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM1480568v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/014/805/685/GCA_014805685.1_ASM1480568v1 GCA_014805685.1;PRJNA623722;SAMN14558653;JABFDY000000000.1;representative genome;175797;175797;Silurus meridionalis;;SWU-2019-XX;latest;Chromosome;Major;Full;2020/10/02;ASM1480568v1;Southwest University;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/014/805/685/GCA_014805685.1_ASM1480568v1;;;na 1
10228 Trichoplax adhaerens Trichoplacidae   Placozoa GCF_000150275.1 211 93076 0.2261837126287693 94.5 ["u11", "u12", "u4atac", "u6atac"] v1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/150/275/GCF_000150275.1_v1.0 GCF_000150275.1;PRJNA30931;SAMN02953699;ABGP00000000.1;representative genome;10228;10228;Trichoplax adhaerens;strain=Grell-BS-1999;;latest;Scaffold;Major;Full;2008/06/17;v1.0;US DOE Joint Genome Institute (JGI-PGF);GCA_000150275.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/150/275/GCF_000150275.1_v1.0;;;na 1
2448454 Pyrus ussuriensis x pyrus communis Rosaceae Rosales Streptophyta GCA_008932095.1 392 183686 0.2129532046197807 94.5 ["u11", "u12", "u6atac"] ASM893209v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/008/932/095/GCA_008932095.1_ASM893209v1 GCA_008932095.1;PRJNA494996;SAMN10188208;SMOL00000000.1;representative genome;2448454;2448454;Pyrus ussuriensis x Pyrus communis;cultivar=Zhongai 1;S2;latest;Chromosome;Major;Full;2019/10/11;ASM893209v1;Research Institute of Pomology Chinese Academy of Agricultural Sciences;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/008/932/095/GCA_008932095.1_ASM893209v1;;;na 1
300111 Temnothorax curvispinosus Formicidae Hymenoptera Arthropoda GCF_003070985.1 155 80644 0.1918340573521949 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM307098v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/003/070/985/GCF_003070985.1_ASM307098v1 GCF_003070985.1;PRJNA453998;SAMN08906336;QBEX00000000.1;representative genome;300111;300111;Temnothorax curvispinosus;;PA1;latest;Scaffold;Major;Full;2018/04/24;ASM307098v1;University of Pennsylvania;GCA_003070985.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/003/070/985/GCF_003070985.1_ASM307098v1;;;na 1
103762 Zizania palustris Poaceae Poales Streptophyta GCA_019279435.1 305 163903 0.1857400370262106 94.5 ["u11", "u12", "u6atac"] ASM1927943v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/019/279/435/GCA_019279435.1_ASM1927943v1 GCA_019279435.1;PRJNA600525;SAMN13825534;JAAALK000000000.1;representative genome;103762;103762;Zizania palustris;cultivar=Itasca-C12;;latest;Scaffold;Major;Full;2021/07/19;ASM1927943v1;University of Minnesota;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/019/279/435/GCA_019279435.1_ASM1927943v1;;;na 1
400682 Amphimedon queenslandica Niphatidae Haplosclerida Porifera GCF_000090795.1 263 149226 0.1759326773207393 94.5 ["u11", "u12", "u4atac", "u6atac"] v1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/090/795/GCF_000090795.1_v1.0 GCF_000090795.1;PRJNA66531;SAMN02743868;ACUQ00000000.1;representative genome;400682;400682;Amphimedon queenslandica;;;latest;Scaffold;Major;Full;2010/05/28;v1.0;US DOE Joint Genome Institute (JGI-PGF);GCA_000090795.1;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/090/795/GCF_000090795.1_v1.0;;;na 1
106549 Malus baccata Rosaceae Rosales Streptophyta GCA_006547085.1 258 155534 0.1656054226147684 94.5 ["u11", "u12", "u6atac"] Malus_baccata_v1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/006/547/085/GCA_006547085.1_Malus_baccata_v1.0 GCA_006547085.1;PRJNA428857;SAMN08323692;VIEB00000000.1;representative genome;106549;106549;Malus baccata;cultivar=Shandingzi;;latest;Scaffold;Major;Full;2019/07/03;Malus_baccata_v1.0;Northwest A&F University;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/006/547/085/GCA_006547085.1_Malus_baccata_v1.0;;;na 1
121224 Pediculus humanus Pediculidae Phthiraptera Arthropoda GCA_000006295.1 88 57955 0.1516117361266647 94.5 ["u11", "u12", "u4atac", "u6atac"] PhumU2 ftp://ftp.ensemblgenomes.org/pub/metazoa/release-52/fasta/pediculus_humanus/dna/Pediculus_humanus.PhumU2.dna.toplevel.fa.gz; ftp://ftp.ensemblgenomes.org/pub/metazoa/release-52/gtf/pediculus_humanus/Pediculus_humanus.PhumU2.52.gtf.gz Pediculus humanus;pediculus_humanus;EnsemblMetazoa;121224;PhumU2;GCA_000006295.1;PhumU2.5;N;N;Y;Y;N;Y;pediculus_humanus_core_52_105_2;1 1
63057 Trema orientale Cannabaceae Rosales Streptophyta GCA_002914845.1 147 102565 0.1431186229457123 94.5 ["u11", "u12", "u6atac"] TorRG33x02_asm01 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/914/845/GCA_002914845.1_TorRG33x02_asm01 GCA_002914845.1;PRJNA272482;SAMN03322532;JXTC00000000.1;representative genome;63057;63057;Trema orientale;;RG33-2;latest;Scaffold;Major;Full;2018/02/02;TorRG33x02_asm01;Wageningen University;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/914/845/GCA_002914845.1_TorRG33x02_asm01;;;na 1
3476 Parasponia andersonii Cannabaceae Rosales Streptophyta GCA_002914805.1 144 101195 0.1420973169263561 94.5 ["u11", "u12", "u6atac"] PanWU01x14_asm01 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/914/805/GCA_002914805.1_PanWU01x14_asm01 GCA_002914805.1;PRJNA272473;SAMN03317003;JXTB00000000.1;representative genome;3476;3476;Parasponia andersonii;;WU1-14;latest;Scaffold;Major;Full;2018/02/02;PanWU01x14_asm01;Wageningen University;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/914/805/GCA_002914805.1_PanWU01x14_asm01;;;na 1
76194 Papilio polytes Papilionidae Lepidoptera Arthropoda GCF_000836215.1 97 78758 0.123010589055862 94.5 ["u11", "u12", "u4atac", "u6atac"] Ppol_1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/836/215/GCF_000836215.1_Ppol_1.0 GCF_000836215.1;PRJNA291535;SAMD00018697;BBJD00000000.1;representative genome;76194;76194;Papilio polytes;;;latest;Scaffold;Major;Full;2015/02/02;Ppol_1.0;Tokyo Institute of Technology;GCA_000836215.1;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/836/215/GCF_000836215.1_Ppol_1.0;;;na 1
151541 Danaus chrysippus Nymphalidae Lepidoptera Arthropoda GCA_916720795.1 98 83894 0.1166777788360796 94.5 ["u11", "u12", "u4atac", "u6atac"] Dchry2.2 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/916/720/795/GCA_916720795.1_Dchry2.2 GCA_916720795.1;PRJEB47812;SAMEA9973796;CAKASE000000000.1;representative genome;151541;151541;Danaus chrysippus;;;latest;Contig;Major;Full;2021/11/13;Dchry2.2;UNIVERSITY OF EDINBURGH;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/916/720/795/GCA_916720795.1_Dchry2.2;;;na 1
47600 Gossypium anomalum Malvaceae Malvales Streptophyta GCA_019455425.1 179 170605 0.1048107551058647 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM1945542v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/019/455/425/GCA_019455425.1_ASM1945542v1 GCA_019455425.1;PRJNA421337;SAMN08140125;JAHUZN000000000.1;representative genome;47600;47600;Gossypium anomalum;;JFW-Udall;latest;Chromosome;Major;Full;2021/08/09;ASM1945542v1;NCGR;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/019/455/425/GCA_019455425.1_ASM1945542v1;;;na 1
139456 Penaeus chinensis Penaeidae Decapoda Arthropoda GCF_019202785.1 103 133021 0.0773714732129443 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM1920278v2 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/019/202/785/GCF_019202785.1_ASM1920278v2 GCF_019202785.1;PRJNA822080;SAMN17293200;JAGKSU000000000.1;representative genome;139456;139456;Penaeus chinensis;breed=Huanghai No. 1;;latest;Chromosome;Major;Full;2021/07/13;ASM1920278v2;Yellow Sea Fisheries Research Institute, Chinese Academy of Fishery Sciences;GCA_019202785.2;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/019/202/785/GCF_019202785.1_ASM1920278v2;;;na 1
41427 Anopheles atroparvus Culicidae Diptera Arthropoda GCA_000473505.1 16 45311 0.035299049131864 94.5 ["u11", "u12", "u4atac", "u6atac"] AatrE3 ftp://ftp.ensemblgenomes.org/pub/metazoa/release-51/fasta/anopheles_atroparvus/dna/Anopheles_atroparvus.AatrE3.dna.toplevel.fa.gz; ftp://ftp.ensemblgenomes.org/pub/metazoa/release-51/gtf/anopheles_atroparvus/Anopheles_atroparvus.AatrE3.51.gtf.gz Anopheles atroparvus;anopheles_atroparvus;EnsemblMetazoa;41427;AatrE3;GCA_000473505.1;AatrE3.2;N;N;N;Y;Y;Y;anopheles_atroparvus_core_51_104_3;1 1
6954 Dermatophagoides farinae Pyroglyphidae Sarcoptiformes Arthropoda GCF_020809275.1 10 30775 0.0324833522819554 94.5 ["u11", "u4atac", "u6atac"] ASM2080927v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/020/809/275/GCF_020809275.1_ASM2080927v1 GCF_020809275.1;PRJNA811591;SAMN10743607;SDOV00000000.1;representative genome;6954;6954;Dermatophagoides farinae;;JKM2019;latest;Contig;Major;Full;2021/11/09;ASM2080927v1;EasyATGC;GCA_020809275.1;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/020/809/275/GCF_020809275.1_ASM2080927v1;;;na 1
2054153 Mucor circinatus Mucoraceae Mucorales Mucoromycota GCA_016758965.1 5 50679 0.009865046168416 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM1675896v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/016/758/965/GCA_016758965.1_ASM1675896v1 GCA_016758965.1;PRJNA668042;SAMN16393841;JAEPRB000000000.1;representative genome;2054153;2054153;Mucor circinatus;strain=CBS 142.35;;latest;Scaffold;Major;Full;2021/01/27;ASM1675896v1;University of Warsaw;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/016/758/965/GCA_016758965.1_ASM1675896v1;;;na 1
104782 Adineta vaga Adinetidae Adinetida Rotifera GCA_021613535.1 10 137682 0.0072625860616448 94.5 ["u11", "u12", "u4atac", "u6atac"] ASM2161353v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/021/613/535/GCA_021613535.1_ASM2161353v1 GCA_021613535.1;PRJNA680543;SAMN16913262;;representative genome;104782;104782;Adineta vaga;breed=AD008;;latest;Chromosome;Major;Full;2022/01/26;ASM2161353v1;University of Namur;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/021/613/535/GCA_021613535.1_ASM2161353v1;genome length too small;;na 1

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- genomes: one row per species genome assembly, keyed by taxonomy id.
-- Identifiers use ANSI double quotes; "order" (reserved word) and
-- "minor_intron+" (non-identifier character) cannot be written unquoted.
CREATE TABLE "genomes" (
    "taxonomy_id"           INTEGER,  -- unique identifier for each species (primary key)
    "species"               TEXT,     -- binomial name of the species
    "family"                TEXT,     -- taxonomic family of the species
    "order"                 TEXT,     -- taxonomic order of the species
    "phylum"                TEXT,     -- taxonomic phylum of the species
    "accession"             TEXT,     -- accession number of the genome assembly
    "n_minor_introns"       INTEGER,  -- total number of minor introns in the genome
    "n_major_introns"       INTEGER,  -- total number of major introns in the genome
    "percent_minor_introns" REAL,     -- percentage of minor introns in the genome
    "busco_score"           REAL,     -- BUSCO assembly-completeness score (vs. eukaryota_odb10)
    "minor_snRNAs"          TEXT,     -- minor snRNAs found in the annotated transcriptome,
                                      -- stored as JSON array text, e.g. ["u11", "u12"]
    "genome_version"        TEXT,     -- version of the genome assembly
    "source_url"            TEXT,     -- URL for the source genome/annotation files
    "source_metadata"       TEXT,     -- additional metadata from the original data source
    "minor_intron+"         INTEGER,  -- 1 if the species is inferred to contain real minor introns, else 0
    PRIMARY KEY ("taxonomy_id")
);
-- Secondary index on genomes.phylum for lookups/grouping by phylum.
CREATE INDEX "idx_genomes_phylum" ON "genomes" ("phylum");
-- Secondary index on genomes."order" for lookups/grouping by taxonomic order.
-- The column name is a reserved word, so it must remain quoted.
CREATE INDEX "idx_genomes_order" ON "genomes" ("order");
-- Secondary index on genomes.family for lookups/grouping by family.
CREATE INDEX "idx_genomes_family" ON "genomes" ("family");
Powered by Datasette · Queries took 85.679ms · Data license: ODbL · Data source: Larue & Roy, 2023 · About: Minor Intron Database (WtMTA)