home / WtMTA

genomes

Data license: ODbL · Data source: Larue & Roy, 2023

taxonomy_id
INTEGER (primary key), unique identifier for each species
species
TEXT, binomial name of the species
family
TEXT, taxonomic family of the species
order
TEXT, taxonomic order of the species
phylum
TEXT, taxonomic phylum of the species
accession
TEXT, accession number of the genome assembly
n_minor_introns
INTEGER, total number of minor introns in the genome
n_major_introns
INTEGER, total number of major introns in the genome
percent_minor_introns
REAL, percentage of minor introns in the genome
busco_score
REAL, BUSCO score assessing the genome assembly completeness (vs. eukaryota_odb10)
minor_snRNAs
TEXT, minor snRNAs found in the annotated transcriptome
genome_version
TEXT, version of the genome assembly
source_url
TEXT, URL for the source genome/annotation files
source_metadata
TEXT, additional metadata from the original data source
minor_intron+
INTEGER, indicates if the species is inferred to contain real minor introns (1) or not (0)

27 rows where minor_snRNAs = '["u12", "u4atac", "u6atac"]' sorted by percent_minor_introns descending

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: family, order, phylum, n_minor_introns, busco_score, minor_snRNAs (array)

taxonomy_id species family order phylum accession n_minor_introns n_major_introns percent_minor_introns ▲ busco_score minor_snRNAs genome_version source_url source_metadata minor_intron+
57397 Apaloderma vittatum Trogonidae Trogoniformes Chordata GCF_000703405.1 423 113269 0.3720578404813003 55.7 ["u12", "u4atac", "u6atac"] ASM70340v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/703/405/GCF_000703405.1_ASM70340v1 GCF_000703405.1;PRJNA263608;SAMN02318033;JMFV00000000.1;representative genome;57397;57397;Apaloderma vittatum;;BGI_N311;latest;Scaffold;Major;Full;2014/06/16;ASM70340v1;BGI;GCA_000703405.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/703/405/GCF_000703405.1_ASM70340v1;;;na 1
48883 Geospiza fortis Thraupidae Passeriformes Chordata GCF_000277835.1 525 147101 0.3556284123392898 84.7 ["u12", "u4atac", "u6atac"] GeoFor_1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/277/835/GCF_000277835.1_GeoFor_1.0 GCF_000277835.1;PRJNA217051;SAMN00839579;AKZB00000000.1;representative genome;48883;48883;Geospiza fortis;;;latest;Scaffold;Major;Full;2012/07/25;GeoFor_1.0;Beijing Genomics Institute;GCA_000277835.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/277/835/GCF_000277835.1_GeoFor_1.0;;;na 1
30464 Nothoprocta perdicaria Tinamidae Tinamiformes Chordata GCF_003342845.1 552 154817 0.3552832289581576 92.9 ["u12", "u4atac", "u6atac"] notPer1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/003/342/845/GCF_003342845.1_notPer1 GCF_003342845.1;PRJNA484763;SAMN08476459;PTEW00000000.1;representative genome;30464;30464;Nothoprocta perdicaria;;Ctin4;latest;Scaffold;Major;Full;2018/07/26;notPer1;Harvard University;GCA_003342845.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/003/342/845/GCF_003342845.1_notPer1;;;na 1
8663 Notechis scutatus Elapidae Squamata Chordata GCF_900518725.1 607 171967 0.3517331695388645 95.3 ["u12", "u4atac", "u6atac"] TS10Xv2-PRI https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/900/518/725/GCF_900518725.1_TS10Xv2-PRI GCF_900518725.1;PRJNA494227;SAMEA4800209;ULFQ00000000.1;representative genome;8663;8663;Notechis scutatus;;;latest;Scaffold;Major;Full;2018/09/24;TS10Xv2-PRI;UNIVERSITY OF NEW SOUTH WALES;GCA_900518725.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/900/518/725/GCF_900518725.1_TS10Xv2-PRI;;;na 1
9244 Calypte anna Trochilidae Apodiformes Chordata GCF_003957555.1 537 153405 0.3488326772420781 94.9 ["u12", "u4atac", "u6atac"] bCalAnn1_v1.p https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/003/957/555/GCF_003957555.1_bCalAnn1_v1.p GCF_003957555.1;PRJNA558503;SAMN02265252;RRCD00000000.1;representative genome;9244;9244;Calypte anna;;BGI_N300;latest;Chromosome;Major;Full;2019/05/16;bCalAnn1_v1.p;Vertebrate Genomes Project;GCA_003957555.2;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/003/957/555/GCF_003957555.1_bCalAnn1_v1.p;;;na 1
328815 Manacus vitellinus Pipridae Passeriformes Chordata GCF_001715985.3 519 149246 0.3465429172370046 87.5 ["u12", "u4atac", "u6atac"] ASM171598v3 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/715/985/GCF_001715985.3_ASM171598v3 GCF_001715985.3;PRJNA341382;SAMN02299332;MCBO00000000.3;representative genome;328815;328815;Manacus vitellinus;;BGI_N305;latest;Scaffold;Major;Full;2019/07/03;ASM171598v3;Smithsonian Institution National Museum of Natural History;GCA_001715985.3;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/715/985/GCF_001715985.3_ASM171598v3;;;na 1
1754191 Piromyces finnis Neocallimastigaceae Neocallimastigales Chytridiomycota GCA_002104945.1 147 43177 0.3393038500600129 88.2 ["u12", "u4atac", "u6atac"] Piromyces sp. finnis v3.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/104/945/GCA_002104945.1_Piromyces_sp._finnis_v3.0 GCA_002104945.1;PRJNA330696;SAMN05421903;MCFH00000000.1;representative genome;1754191;1754191;Piromyces finnis;strain=finn;;latest;Contig;Major;Full;2017/04/20;Piromyces sp. finnis v3.0;DOE Joint Genome Institute;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/104/945/GCA_002104945.1_Piromyces_sp._finnis_v3.0;;assembly from type material;na 1
321398 Lepidothrix coronata Pipridae Passeriformes Chordata GCF_001604755.1 554 162800 0.3391407617811623 94.9 ["u12", "u4atac", "u6atac"] Lepidothrix_coronata-1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/604/755/GCF_001604755.1_Lepidothrix_coronata-1.0 GCF_001604755.1;PRJNA338288;SAMN04274560;LVWP00000000.1;representative genome;321398;321398;Lepidothrix coronata;;B3197;latest;Scaffold;Major;Full;2016/03/31;Lepidothrix_coronata-1.0;McDonnell Genome Institute;GCA_001604755.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/604/755/GCF_001604755.1_Lepidothrix_coronata-1.0;;;na 1
8496 Alligator mississippiensis Alligatoridae Crocodylia Chordata GCF_000281125.3 644 193122 0.3323596502998462 99.6 ["u12", "u4atac", "u6atac"] ASM28112v4 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/281/125/GCF_000281125.3_ASM28112v4 GCF_000281125.3;PRJNA221578;SAMN02981418;AKHW00000000.3;representative genome;8496;8496;Alligator mississippiensis;;KSC_2009_1;latest;Scaffold;Major;Full;2016/03/28;ASM28112v4;International Crocodilian Genomes Working Group;GCA_000281125.4;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/281/125/GCF_000281125.3_ASM28112v4;;;na 1
40210 Spizella passerina Passerellidae Passeriformes Chordata GCA_013401375.1 105 37509 0.2791513798053916 44.7 ["u12", "u4atac", "u6atac"] ASM1340137v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/401/375/GCA_013401375.1_ASM1340137v1 GCA_013401375.1;PRJNA545868;SAMN12253929;WBNQ00000000.1;representative genome;40210;40210;Spizella passerina;;B10K-DU-023-52;latest;Scaffold;Major;Full;2020/07/10;ASM1340137v1;B10K Consortium;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/401/375/GCA_013401375.1_ASM1340137v1;;;na 1
1754190 Neocallimastix californiae Neocallimastigaceae Neocallimastigales Chytridiomycota GCA_002104975.1 183 65380 0.2791208455988896 88.6 ["u12", "u4atac", "u6atac"] Neocallimastix sp. G1 v1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/104/975/GCA_002104975.1_Neocallimastix_sp._G1_v1.0 GCA_002104975.1;PRJNA262392;SAMN05428678;MCOG00000000.1;representative genome;1754190;1754190;Neocallimastix californiae;strain=G1;;latest;Contig;Major;Full;2017/04/20;Neocallimastix sp. G1 v1.0;DOE Joint Genome Institute;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/104/975/GCA_002104975.1_Neocallimastix_sp._G1_v1.0;;assembly from type material;na 1
172689 Lophotis ruficrista Otididae Gruiformes Chordata GCA_013396455.1 304 108749 0.2787635369957726 86.7 ["u12", "u4atac", "u6atac"] ASM1339645v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/396/455/GCA_013396455.1_ASM1339645v1 GCA_013396455.1;PRJNA545868;SAMN12253761;VWYV00000000.1;representative genome;172689;172689;Lophotis ruficrista;;B10K-CU-031-23;latest;Scaffold;Major;Full;2020/07/10;ASM1339645v1;B10K Consortium;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/396/455/GCA_013396455.1_ASM1339645v1;;;na 1
114276 Cephalopterus ornatus Cotingidae Passeriformes Chordata GCA_013396775.1 298 106670 0.2785879889312692 83.9 ["u12", "u4atac", "u6atac"] ASM1339677v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/396/775/GCA_013396775.1_ASM1339677v1 GCA_013396775.1;PRJNA545868;SAMN12253765;VZRE00000000.1;representative genome;114276;114276;Cephalopterus ornatus;;B10K-DU-001-01;latest;Scaffold;Major;Full;2020/07/10;ASM1339677v1;B10K Consortium;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/396/775/GCA_013396775.1_ASM1339677v1;;;na 1
1961834 Ceuthmochares aereus Cuculidae Cuculiformes Chordata GCA_013398935.1 245 88218 0.2769519460113268 72.2 ["u12", "u4atac", "u6atac"] ASM1339893v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/398/935/GCA_013398935.1_ASM1339893v1 GCA_013398935.1;PRJNA545868;SAMN12253749;VWPQ00000000.1;representative genome;1961834;1961834;Ceuthmochares aereus;;B10K-CU-031-02;latest;Scaffold;Major;Full;2020/07/10;ASM1339893v1;B10K Consortium;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/398/935/GCA_013398935.1_ASM1339893v1;;;na 1
425643 Ibidorhyncha struthersii Charadriidae Charadriiformes Chordata GCA_013398815.1 298 108054 0.2750295333727112 83.9 ["u12", "u4atac", "u6atac"] ASM1339881v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/398/815/GCA_013398815.1_ASM1339881v1 GCA_013398815.1;PRJNA545868;SAMN12253964;VZSZ00000000.1;representative genome;425643;425643;Ibidorhyncha struthersii;;B10K-DU-030-25;latest;Scaffold;Major;Full;2020/07/10;ASM1339881v1;B10K Consortium;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/398/815/GCA_013398815.1_ASM1339881v1;;;na 1
89386 Ardeotis kori Otididae Gruiformes Chordata GCA_013396375.1 292 107619 0.270593359342421 82.0 ["u12", "u4atac", "u6atac"] ASM1339637v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/396/375/GCA_013396375.1_ASM1339637v1 GCA_013396375.1;PRJNA545868;SAMN12253748;VWPR00000000.1;representative genome;89386;89386;Ardeotis kori;;B10K-CU-031-01;latest;Scaffold;Major;Full;2020/07/10;ASM1339637v1;B10K Consortium;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/396/375/GCA_013396375.1_ASM1339637v1;;;na 1
1754192 Anaeromyces robustus Neocallimastigaceae Neocallimastigales Chytridiomycota GCA_002104895.1 126 46705 0.269052550660887 84.3 ["u12", "u4atac", "u6atac"] Anaeromyces sp. S4 v1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/104/895/GCA_002104895.1_Anaeromyces_sp._S4_v1.0 GCA_002104895.1;PRJNA330692;SAMN05421914;MCFG00000000.1;representative genome;1754192;1754192;Anaeromyces robustus;strain=S4;;latest;Contig;Major;Full;2017/04/20;Anaeromyces sp. S4 v1.0;DOE Joint Genome Institute;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/002/104/895/GCA_002104895.1_Anaeromyces_sp._S4_v1.0;;assembly from type material;na 1
227192 Pedionomus torquatus Pedionomidae Charadriiformes Chordata GCA_013398155.1 269 100994 0.2656449048517227 79.2 ["u12", "u4atac", "u6atac"] ASM1339815v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/398/155/GCA_013398155.1_ASM1339815v1 GCA_013398155.1;PRJNA545868;SAMN12253960;VZRU00000000.1;representative genome;227192;227192;Pedionomus torquatus;;B10K-DU-029-80;latest;Scaffold;Major;Full;2020/07/10;ASM1339815v1;B10K Consortium;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/013/398/155/GCA_013398155.1_ASM1339815v1;;;na 1
2767002 Neocallimastix sp. jgi-2020a Neocallimastigaceae Neocallimastigales Chytridiomycota GCA_016946835.1 192 98056 0.1954238254213826 89.8 ["u12", "u4atac", "u6atac"] ASM1694683v1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/016/946/835/GCA_016946835.1_ASM1694683v1 GCA_016946835.1;PRJNA658393;SAMN15902602;JACVTC000000000.1;representative genome;2767002;2767002;Neocallimastix sp. JGI-2020a;strain=sp3;;latest;Contig;Major;Full;2021/02/24;ASM1694683v1;DOE Joint Genome Institute;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/016/946/835/GCA_016946835.1_ASM1694683v1;;;na 1
197043 Homalodisca vitripennis Cicadellidae Hemiptera Arthropoda GCF_021130785.1 214 120126 0.1778294831311284 89.8 ["u12", "u4atac", "u6atac"] UT_GWSS_2.1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/021/130/785/GCF_021130785.1_UT_GWSS_2.1 GCF_021130785.1;PRJNA801498;SAMN22783162;JAJKGG000000000.2;representative genome;197043;197043;Homalodisca vitripennis;;AUS2020;latest;Chromosome;Major;Full;2022/01/26;UT_GWSS_2.1;University of Texas at Austin;GCA_021130785.2;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/021/130/785/GCF_021130785.1_UT_GWSS_2.1;;;na 1
742174 Melanaphis sacchari Aphididae Hemiptera Arthropoda GCF_002803265.2 136 82634 0.1643107406064999 98.8 ["u12", "u4atac", "u6atac"] SCAv2.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/002/803/265/GCF_002803265.2_SCAv2.0 GCF_002803265.2;PRJNA421017;SAMN07757676;PDEX00000000.2;representative genome;742174;742174;Melanaphis sacchari;strain=LSU;;latest;Scaffold;Major;Full;2018/06/22;SCAv2.0;USDA-ARS Center for Grain and Animal Health Research;GCA_002803265.2;different;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/002/803/265/GCF_002803265.2_SCAv2.0;;;na 1
2340872 Endogone sp. flas-f59071 Endogonaceae Endogonales Mucoromycota GCA_003990785.1 43 34757 0.1235632183908045 63.1 ["u12", "u4atac", "u6atac"] Endsp1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/003/990/785/GCA_003990785.1_Endsp1 GCA_003990785.1;PRJNA331665;SAMN05444560;RBNK00000000.1;representative genome;2340872;2340872;Endogone sp. FLAS-F59071;strain=FLAS-F59071;;latest;Contig;Major;Full;2019/01/02;Endsp1;DOE Joint Genome Institute;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/003/990/785/GCA_003990785.1_Endsp1;;;na 1
6185 Schistosoma haematobium Schistosomatidae Strigeidida Platyhelminthes GCF_000699445.2 59 62370 0.0945073603613705 76.1 ["u12", "u4atac", "u6atac"] SchHae_2.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/699/445/GCF_000699445.2_SchHae_2.0 GCF_000699445.2;PRJNA273970;SAMN11431408;AMPZ00000000.2;representative genome;6185;6185;Schistosoma haematobium;;;latest;Scaffold;Major;Full;2020/01/28;SchHae_2.0;The University of Melbourne;GCA_000699445.2;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/699/445/GCF_000699445.2_SchHae_2.0;;;na 1
35570 Stomoxys calcitrans Muscidae Diptera Arthropoda GCF_001015335.1 20 53063 0.0376768456944784 98.4 ["u12", "u4atac", "u6atac"] Stomoxys_calcitrans-1.0.1 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/015/335/GCF_001015335.1_Stomoxys_calcitrans-1.0.1 GCF_001015335.1;PRJNA288986;SAMN03486548;LDNW00000000.1;representative genome;35570;35570;Stomoxys calcitrans;breed=8C7A2A5H3J4;;latest;Scaffold;Major;Full;2015/05/31;Stomoxys_calcitrans-1.0.1;Glossina Genomes Consortium;GCA_001015335.1;identical;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/001/015/335/GCF_001015335.1_Stomoxys_calcitrans-1.0.1;;;na 1
114742 Pythium insidiosum Pythiaceae Pythiales Oomycota GCA_001029375.1 4 30975 0.012911972626618 87.1 ["u12", "u4atac", "u6atac"] Pythium_insidiosum_1.0 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/001/029/375/GCA_001029375.1_Pythium_insidiosum_1.0 GCA_001029375.1;PRJDB3817;SAMD00028776;BBXB00000000.1;representative genome;114742;114742;Pythium insidiosum;strain=Pi-s;;latest;Scaffold;Major;Full;2015/05/08;Pythium_insidiosum_1.0;King Mongkut's University of Technology Thonburi;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/001/029/375/GCA_001029375.1_Pythium_insidiosum_1.0;;;na 1
104778 Seison nebaliae Seisonidae Seisonacea Rotifera GCA_023231475.1 3 38785 0.0077343508301536 75.7 ["u12", "u4atac", "u6atac"] GA2.2 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/023/231/475/GCA_023231475.1_GA2.2 GCA_023231475.1;PRJEB43415;SAMN27400648;JALJEE000000000.1;representative genome;104778;104778;Seison nebaliae;;594-2016;latest;Contig;Major;Full;2022/05/03;GA2.2;Institute of Organismic and Molecular Evolution (iomE), Johannes Gutenberg University Mainz;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/023/231/475/GCA_023231475.1_GA2.2;;;na 1
39272 Allacma fusca Sminthuridae Symphypleona Arthropoda GCA_910591605.1 5 152197 0.0032851079486471 90.2 ["u12", "u4atac", "u6atac"] Afus1_asm01 https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/910/591/605/GCA_910591605.1_Afus1_asm01 GCA_910591605.1;PRJEB44694;SAMEA8803696;CAJVCH000000000.1;representative genome;39272;39272;Allacma fusca;;;latest;Scaffold;Major;Full;2021/08/13;Afus1_asm01;THE UNIVERSITY OF EDINBURGH;na;na;https://ftp.ncbi.nlm.nih.gov/genomes/all/GCA/910/591/605/GCA_910591605.1_Afus1_asm01;;;na 1

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- One row per species / genome assembly, keyed by taxonomy ID.
-- "order" (an SQL keyword) and "minor_intron+" (contains '+') must stay quoted.
CREATE TABLE "genomes" (
    "taxonomy_id"           INTEGER,  -- unique identifier for each species
    "species"               TEXT,     -- binomial name of the species
    "family"                TEXT,     -- taxonomic family of the species
    "order"                 TEXT,     -- taxonomic order of the species
    "phylum"                TEXT,     -- taxonomic phylum of the species
    "accession"             TEXT,     -- accession number of the genome assembly
    "n_minor_introns"       INTEGER,  -- total number of minor introns in the genome
    "n_major_introns"       INTEGER,  -- total number of major introns in the genome
    "percent_minor_introns" REAL,     -- percentage of minor introns in the genome
    "busco_score"           REAL,     -- BUSCO completeness score (vs. eukaryota_odb10)
    "minor_snRNAs"          TEXT,     -- minor snRNAs found in the annotated transcriptome
    "genome_version"        TEXT,     -- version of the genome assembly
    "source_url"            TEXT,     -- URL for the source genome/annotation files
    "source_metadata"       TEXT,     -- additional metadata from the original data source
    "minor_intron+"         INTEGER,  -- 1 if inferred to contain real minor introns, else 0
    PRIMARY KEY ("taxonomy_id")
);
-- Single-column indexes on the taxonomic rank columns of "genomes"
-- (phylum, order, family).
CREATE INDEX "idx_genomes_phylum" ON "genomes" ("phylum");
CREATE INDEX "idx_genomes_order"  ON "genomes" ("order");
CREATE INDEX "idx_genomes_family" ON "genomes" ("family");
Powered by Datasette · Queries took 46.517ms · Data license: ODbL · Data source: Larue & Roy, 2023