Rows: 221,085
Columns: 95
$ pr2_accession <chr> "AB353770.1.1740_U", "AB284159.1.1765_U…
$ domain <chr> "Eukaryota", "Eukaryota", "Eukaryota", …
$ supergroup <chr> "TSAR", "TSAR", "Obazoa", "Obazoa", "Ob…
$ division <chr> "Alveolata", "Alveolata", "Opisthokonta…
$ subdivision <chr> "Dinoflagellata", "Dinoflagellata", "Fu…
$ class <chr> "Dinophyceae", "Dinophyceae", "Ascomyco…
$ order <chr> "Peridiniales", "Peridiniales", "Pezizo…
$ family <chr> "Kryptoperidiniaceae", "Protoperidiniac…
$ genus <chr> "Unruhdinium", "Protoperidinium", "Sord…
$ species <chr> "Unruhdinium_kevei", "Protoperidinium_b…
$ genbank_accession <chr> "AB353770", "AB284159", "AY123745", "FJ…
$ start <dbl> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, …
$ end <dbl> 1740, 1765, 924, 1907, 853, 1731, 1627,…
$ label <chr> "U", "U", "UC", "U", "U", "U", "U", "U"…
$ gene <chr> "18S_rRNA", "18S_rRNA", "18S_rRNA", "18…
$ organelle <chr> "nucleus", "nucleus", "nucleus", "nucle…
$ reference_sequence <int> 1, 1, NA, NA, NA, NA, NA, NA, NA, 1, NA…
$ added_version <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ edited_version <chr> "4.9.0", "4.10.0", NA, NA, NA, NA, NA, …
$ edited_by <chr> "Mordret S.", "Vaulot D.", NA, NA, NA, …
$ edited_remark <chr> NA, "length of sequence fixed (before t…
$ remark <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, "re…
$ taxo_id <int> 49091, 2087, 13926, 12048, 13926, 41939…
$ taxo_edited_version <chr> "4.9.0", "4.9.0", "4.5", NA, "4.5", NA,…
$ taxo_edited_by <chr> "Mordret S.", "Mordret S.", NA, NA, NA,…
$ taxo_remark <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ reference <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ mixoplankton <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ worms_id <int> 1380090, NA, NA, NA, NA, NA, NA, NA, NA…
$ worms_marine <chr> "0", NA, NA, NA, NA, NA, NA, NA, NA, "0…
$ worms_brackish <int> 0, NA, NA, NA, NA, NA, NA, NA, NA, 0, N…
$ worms_freshwater <int> 1, NA, NA, NA, NA, NA, NA, NA, NA, 1, N…
$ worms_terrestrial <int> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ seq_id <int> 5, 8, 10, 11, 14, 15, 16, 17, 18, 19, 2…
$ sequence <chr> "ATGCTTGTCTCAAAGATTAAGCCATGCATGTCTCAGTA…
$ sequence_length <int> 1740, 1765, 924, 1907, 853, 1731, 1627,…
$ ambiguities <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, …
$ sequence_hash <chr> "26c3890d597f9d39e45e91eaa4f01ba6c603b6…
$ gb_date <chr> "04-SEP-2007", "22-MAY-2007", "07-AUG-2…
$ gb_division <chr> "PLN", "PLN", "ENV", "PLN", "ENV", "ENV…
$ gb_definition <chr> "Peridiniopsis cf. kevei gene for 18S r…
$ gb_organism <chr> "Peridiniopsis cf. kevei", NA, "uncultu…
$ gb_organelle <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ gb_taxonomy <chr> "Eukaryota; Sar; Alveolata; Dinophyceae…
$ gb_strain <chr> NA, NA, NA, "CBS 120353", NA, NA, NA, N…
$ gb_culture_collection <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ gb_clone <chr> NA, NA, NA, NA, "G913P33FB4.T0", "SType…
$ gb_isolate <chr> NA, NA, NA, NA, NA, NA, NA, NA, "145Br"…
$ gb_isolation_source <chr> NA, "seawater sample", "soil", NA, "air…
$ gb_specimen_voucher <chr> NA, NA, NA, NA, NA, NA, "Ed Biffin 9102…
$ gb_host <chr> NA, NA, NA, NA, NA, NA, NA, "yellow cat…
$ gb_collection_date <chr> "26-juil.-03", NA, NA, NA, "17-May-2006…
$ gb_environmental_sample <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ gb_country <chr> "Japan: Toyama, Tomi-iwa Canal Park", "…
$ gb_lat_lon <chr> NA, NA, NA, NA, "40.01 N 105.27 W", NA,…
$ gb_collected_by <chr> NA, NA, NA, NA, "Noah Fierer", NA, NA, …
$ gb_note <chr> NA, "acquired from 2 individual cells c…
$ gb_publication <chr> "Serial replacement of diatom endosymbi…
$ gb_authors <chr> "Takano,Y.", "Yamaguchi,A., Kawamura,H.…
$ gb_journal <chr> "Unpublished", "Unpublished", "Phytopat…
$ eukref_name <chr> NA, NA, NA, NA, NA, NA, NA, "YCRPS2", N…
$ eukref_source <chr> NA, NA, NA, NA, NA, NA, NA, "Environmen…
$ eukref_env_material <chr> NA, NA, NA, NA, NA, NA, NA, "ruminal fl…
$ eukref_env_biome <chr> "freshwater biome", "marine pelagic bio…
$ eukref_biotic_relationship <chr> "host of diatom symbiont", NA, NA, NA, …
$ eukref_specific_host <chr> NA, NA, NA, NA, NA, NA, NA, "yellow cat…
$ eukref_geo_loc_name <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ eukref_notes <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ pr2_sample_type <chr> NA, NA, "environmental", "culture", "en…
$ pr2_sample_method <chr> "single cell isolation", "single cell i…
$ pr2_latitude <dbl> NA, NA, NA, NA, 40.010, NA, NA, NA, NA,…
$ pr2_longitude <dbl> NA, NA, NA, NA, -105.270, NA, NA, NA, N…
$ pr2_depth <dbl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ pr2_ocean <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ pr2_sea <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ pr2_sea_lat <dbl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ pr2_sea_lon <dbl> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ pr2_country <chr> "Japan", "Japan", NA, NA, "United State…
$ pr2_location <chr> "Toyama, Tomi-iwa Canal Park", "Hokkaid…
$ pr2_location_geoname <chr> NA, NA, NA, NA, "Boulder", "Glasgow", N…
$ pr2_location_geotype <chr> NA, NA, NA, NA, "seat of a second-order…
$ pr2_location_lat <dbl> NA, NA, NA, NA, 40, 56, NA, NA, NA, NA,…
$ pr2_location_lon <dbl> NA, NA, NA, NA, -105, -4, NA, NA, NA, N…
$ pr2_sequence_origin <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ metadata_remark <chr> "Metadata from DinoRef (Mordret S.)", "…
$ pr2_continent <chr> "Asia", "Asia", NA, NA, NA, NA, NA, NA,…
$ pr2_country_geocode <chr> "JP", "JP", NA, NA, NA, NA, NA, NA, "PT…
$ pr2_country_lat <dbl> 36, 36, NA, NA, NA, NA, NA, NA, 40, NA,…
$ pr2_country_lon <dbl> 140, 140, NA, NA, NA, NA, NA, NA, -8, N…
$ eukribo_UniEuk_taxonomy_string <chr> "Eukaryota|Diaphoretickes|Sar|Alveolata…
$ eukribo_V4 <chr> "yes - complete", "yes - complete", NA,…
$ eukribo_V9 <chr> "yes - partial", "yes - complete", NA, …
$ silva_taxonomy <chr> "Eukaryota;SAR;Alveolata;Dinoflagellata…
$ organelle_code <chr> "", "", "", "", "", "", "", "", "", "",…
$ species_url <glue> "<a href='https://www.marinespecies.or…