From c12440aecdb6272cffeba49f7ef427021c998f44 Mon Sep 17 00:00:00 2001 From: Francesco Sabatini <francesco.sabatini@idiv.de> Date: Tue, 10 Mar 2020 14:38:43 +0100 Subject: [PATCH] Modified Taxonomic Backbone, manual check before TNRS - rerunning --- code/03_TaxonomicBackbone.Rmd | 1081 +++++++++++++++++---------------- code/07_buildCWMs.Rmd | 17 +- 2 files changed, 558 insertions(+), 540 deletions(-) diff --git a/code/03_TaxonomicBackbone.Rmd b/code/03_TaxonomicBackbone.Rmd index b9a057f..58a3076 100644 --- a/code/03_TaxonomicBackbone.Rmd +++ b/code/03_TaxonomicBackbone.Rmd @@ -70,24 +70,14 @@ DT0 <- readr::read_delim("../sPlot_data_export/sPlot_3_0_2_species_test.csv", ) ) ``` -Create list of species, and exclude fungi -```{r eval=T, echo=F} -## fungi genera #NOT COMPLETE LIST -mushroom <- c("Mycena", "Boletus", "Russula","Calocybe","Collybia","Amanita","Amanitopsis","Coprinus", - "Galerina","Geoglossum","Hebeloma","Hydnum","Lactarius","Leucocarpia","Naucoria","Otidea","Polyporus", - "Sarcodom","Sarcoscyphus","Scleroderma","Stropharia","Tylopilus","Typhula", "Calyptella", "Chrysopsora", "Lacrymaria", "Dermoloma", - "Agaricus","Alnicola", "Amanitina", "Bovista", "Cheilymenia","Clavulinopsis", "Clitocybe", "Entoloma", "Geaster", "Inocybe", "Paxillus", - "Laccaria", "Laetiporus", "Lepista", "Macrolepiota", "Macrolepis", "Marasmius", "Panaeolus", "Psathyrella", "Psilocybe", - "Rickenella", "Sarcoscypha", "Vascellum", "Ramaria", "Agrocybe", - "Flammulaster", "Phaeocollybia", "Cortinarius", "Lepiota", "Cystoderma", - "Armillaria", "Athelia", "Ceraceomyces", "Chlorociboria", "Clavariaceae", - "Cystoderma", "Dacrymyces","Dendrographa","Dirina", "Flammulaster","Fomes","Gyrophora", - "Kirschsteiniothelia", "Lepiota","Llimoniella","Mazosia","Mollisia", - "Multiclavula","Phaeocollybia","Phellinus","Plectocarpon","Pleospora","Ramariopsis","Reinkella", - "Roccella","Roccellina","Sigridea","Stereum","Tremella","Tulostoma","Unguiculariopsis" , - "Xanthoconium") + +## Import lists 
of species classified into groups
+These objects are defined in the appendix
+```{r}
+load("../derived/taxa_manual.RData")
 ```
+
 ```{r eval=F}
 splot.species <- DT0 %>%
   rename(Species.original=`Turboveg2 concept`, Matched.concept=`Matched concept`) %>%
@@ -223,6 +213,491 @@ spec.list.TRY.sPlot <- spec.list.TRY.sPlot %>%
   distinct()
 ```
+## Manual cleaning
+Fix known issues in some species names. Rules are applied top to bottom, so specific patterns must come before the generic ones they overlap with.
+```{r}
+# Manual cleaning: lower-case Species and re-capitalise it with firstup() (defined elsewhere; presumably upper-cases only the first letter - confirm), strip placeholders/digits/"sp" suffixes, then apply the corrections below in order. After this normalisation every pattern must be lower-case beyond its first character or it can never match.
+spec.list.TRY.sPlot <- spec.list.TRY.sPlot %>%
+  mutate(Species=tolower(Species)) %>%
+  mutate(Species=firstup(Species)) %>%
+  mutate(Species=gsub("^Str ", "", Species)) %>%
+  mutate(Species=gsub("^Unknown ", "", Species)) %>%
+  mutate(Species=firstup(Species)) %>%
+  mutate(Species=gsub(" [0-9]*$", "", Species)) %>% #delete digits at end of object
+  mutate(Species=gsub("^\\d+|\\d+$", "", Species)) %>% #delete digits at the beginning or end of a string
+  mutate(Species=gsub(" sp.$", "", Species)) %>% # NOTE(review): unescaped "." also strips " sp" + any one character (e.g. " spp"); confirm intended
+  mutate(Species=gsub(" sp$", "", Species)) %>%
+  mutate(Species=gsub(" species$", "", Species)) %>%
+  mutate(Species=gsub(" *$", "", Species)) %>%
+  mutate(Species=gsub(" #$", "", Species)) %>%
+  mutate(Species=gsub(" m$", "", Species)) %>%
+  mutate(Species=gsub("acea ", "aceae ", Species)) %>%
+  mutate(Species=gsub('^Agropyrum', 'Agropyron', Species)) %>%
+  mutate(Species=gsub('^Anno ', 'Annona ', Species)) %>%
+  mutate(Species=gsub('Adpdytes dimidiata', 'Apodytes dimidiata', Species)) %>%
+  mutate(Species=gsub('Adenostorna fasciculaturn', 'Adenostoma fasciculatum', Species)) %>%
+  mutate(Species=gsub('Arctostapliylos glallca', 'Arctostaphylos glauca', Species)) %>%
+  mutate(Species=gsub('Bituminosa bituminosa', 'Bituminaria bituminosa', Species)) %>%
+  mutate(Species=gsub('Causurina equisitifolia', 'Casuarina equisetifolia', Species)) %>% # replacement spelling fixed (was 'Causuarina')
+  mutate(Species=gsub('Convulvus arvensis', 'Convolvulus arvensis', Species)) %>%
+  mutate(Species=gsub('Diospyrus dygina', 'Diospyros digyna', Species)) %>% # epithet fixed here; this rule used to emit 'dygina' and shadow the later correction
+  mutate(Species=gsub('^Dodoea', 'Dodonaea', Species)) %>%
+  mutate(Species=gsub('^Boheravia', 'Boerhavia', Species)) %>%
+  mutate(Species=gsub('Centaria maculosa', 'Centaurea maculosa', Species)) %>%
+  mutate(Species=gsub('Chamrenerium angustifolium', 'Chamaenerion angustifolium', Species)) %>%
+  mutate(Species=gsub('^Chicorium', 'Cichorium', Species)) %>%
+  mutate(Species=gsub('^Cirsiumum', 'Cirsium', Species)) %>%
+  mutate(Species=gsub('^Colubrium', 'Colubrina', Species)) %>%
+  mutate(Species=gsub('^Corymbium', 'Corymbia', Species)) %>%
+  mutate(Species=gsub('Cosmos bipinnata', 'Cosmos bipinnatus', Species)) %>%
+  mutate(Species=gsub('Diospyros dygina', 'Diospyros digyna', Species)) %>% # was an unreachable duplicate of the rule above; now catches the half-corrected spelling
+  mutate(Species=gsub('Diospyros egbert$', 'Diospyros egbert-walkeri', Species)) %>% # "$" keeps a complete 'egbert-walkeri' from gaining a second suffix
+  mutate(Species=gsub('Dispyrus halesioides', 'Diospyros halesioides', Species)) %>%
+  mutate(Species=gsub('^Drymis', 'Drimys', Species)) %>%
+  mutate(Species=gsub('^Dysoxylon', 'Dysoxylum', Species)) %>%
+  mutate(Species=gsub('^Eleaegnus', 'Elaeagnus', Species)) %>%
+  mutate(Species=gsub('^Eleutherant\\b', 'Eleutheranthera', Species)) %>% # \\b: only the truncated genus; replacement spelling fixed (was 'Eleutherantera')
+  mutate(Species=gsub('^Echicea', 'Echinacea', Species)) %>%
+  mutate(Species=gsub('Gauteria foliolata', 'Gaultheria foliolosa', Species)) %>%
+  mutate(Species=gsub('^Geophylla', 'Geophyla', Species)) %>%
+  mutate(Species=gsub('Gloichidion insignis', 'Glochidion insigne', Species)) %>%
+  mutate(Species=gsub('^Glycium', 'Glycine', Species)) %>%
+  mutate(Species=gsub('^Hammalis', 'Hamamelis', Species)) %>%
+  mutate(Species=gsub('^Hippochoeris', 'Hypochaeris', Species)) %>%
+  mutate(Species=gsub('Ilix tephrohylla', 'Ilex tephrophylla', Species)) %>%
+  mutate(Species=gsub('^Jasininum', 'Jasminum', Species)) %>%
+  mutate(Species=gsub('Jenipa conjuta', 'Jenipa conjunta', Species)) %>%
+  mutate(Species=gsub('^Lechytis', 'Lecythis', Species)) %>%
+  mutate(Species=gsub('Lespedeza juncus', 'Lespedeza juncea', Species)) %>%
+  mutate(Species=gsub('Licania apelata', 'Licania apetala', Species)) %>%
+  mutate(Species=gsub('Limeum arenicola', 'Limeum arenicolum', Species)) %>%
+  mutate(Species=gsub('^Maniota', 'Manihot', Species)) %>%
+  mutate(Species=gsub('^Menta', 'Mentha', Species)) %>%
+  mutate(Species=gsub('Metophyum brownei', 'Metopium brownei', Species)) %>%
+  mutate(Species=gsub('Miliusa tomentosum', 'Miliusa tomentosa', Species)) %>%
+  mutate(Species=gsub('Mimululus ringens', 'Mimulus ringens', Species)) %>%
+  mutate(Species=gsub('Nardus strictus', 'Nardus stricta', Species)) %>%
+  mutate(Species=gsub('Neea glomeratha', 'Neea glomerata', Species)) %>%
+  mutate(Species=gsub('^Onopordon', 'Onopordum', Species)) %>%
+  mutate(Species=gsub('^Orbigynia', 'Orbignya', Species)) %>%
+  mutate(Species=gsub('Orites excelsa', 'Orites excelsus', Species)) %>%
+  mutate(Species=gsub('Paedorata lutea', 'Paederota lutea', Species)) %>%
+  mutate(Species=gsub('Palaquin ellipticum', 'Palaquium ellipticum', Species)) %>%
+  mutate(Species=gsub('Palmeria arfakensis', 'Palmeria arfakiana', Species)) %>%
+  mutate(Species=gsub('Petalostcmum purpureum', 'Petalostemum purpureum', Species)) %>%
+  mutate(Species=gsub('Petalostimum purpureum', 'Petalostemum purpureum', Species)) %>%
+  mutate(Species=gsub('^Petrosileum', 'Petroselinum', Species)) %>%
+  mutate(Species=gsub('Phlomis herba$', 'Phlomis herba-venti', Species)) %>% # "$" keeps a complete 'herba-venti' from gaining a second suffix
+  mutate(Species=gsub('^Phyllirea', 'Phillyrea', Species)) %>%
+  mutate(Species=gsub('Physilus pumula', 'Physalus pumila', Species)) %>%
+  mutate(Species=gsub('Picea maria\\b', 'Picea mariana', Species)) %>% # \\b: without it a correct 'Picea mariana' became 'Picea marianana'
+  mutate(Species=gsub('Picea retroxexa', 'Picea retroflexa', Species)) %>% # pattern lower-cased; 'retroXexa' could never match after tolower()
+  mutate(Species=gsub('Pilayella litoralis', 'Pilayella littoralis', Species)) %>%
+  mutate(Species=gsub('Placocarpus schaereri', 'Platecarpus schaerer', Species)) %>%
+  mutate(Species=gsub('Placocarpus schraereri', 'Platecarpus schaerer', Species)) %>%
+  mutate(Species=gsub('^Pulteea', 'Pultenaea', Species)) %>%
+  mutate(Species=gsub('Quercus rubrum', 'Quercus rubra', Species)) %>%
+  mutate(Species=gsub('Rubus fruticosa', 'Rubus fruticosus', Species)) %>%
+  mutate(Species=gsub('Rubus saxatile', 'Rubus saxatilis', Species)) %>%
+  mutate(Species=gsub('Rubus sylvatici', 'Rubus sylvaticus', Species)) %>%
+  mutate(Species=gsub('^Sanguiria', 'Sanguinaria', Species)) %>%
+  mutate(Species=gsub('Sarauja nepaulensis', 'Sarauja nepalensis', Species)) %>%
+  mutate(Species=gsub('^Sateria', 'Setaria', Species)) %>%
+  mutate(Species=gsub('Sauraiea nepulensis', 'Saurauia nepalensis', Species)) %>%
+  mutate(Species=gsub('Schneckia australis', 'Schenckia australis', Species)) %>%
+  mutate(Species=gsub('Smirnium oleastrum', 'Smyrnium olusatrum', Species)) %>%
+  mutate(Species=gsub('Solms laubachia', 'Solms-laubachia himalayensis', Species)) %>%
+  mutate(Species=gsub('Stellaria chamaejasme', 'Stellera chamaejasme', Species)) %>%
+  mutate(Species=gsub('Steraria parviflora', 'Setaria parviflora', Species)) %>%
+  mutate(Species=gsub('^Stuartia', 'Stewartia', Species)) %>%
+  mutate(Species=gsub('Sycops sinensis', 'Sycopsis sinensis', Species)) %>%
+  mutate(Species=gsub('Tacetum vulgare', 'Tanacetum vulgare', Species)) %>%
+  mutate(Species=gsub('Talinurn angustissimun', 'Talinun angustissimun', Species)) %>%
+  mutate(Species=gsub('Talloma hodgsoni', 'Talauma hodgsonii', Species)) %>%
+  mutate(Species=gsub('Taraxacum albo', 'Taraxacum album', Species)) %>%
+  mutate(Species=gsub('Tetragonia falcata', 'Tetragona falcata', Species)) %>%
+  mutate(Species=gsub('Trapogogon', 'Tragopogon', Species)) %>%
+  mutate(Species=gsub('Zyzyphus saeri', 'Zizyphus saeri', Species)) %>%
+  mutate(Species=gsub('^Helicrysum', 'Helichrysum', Species)) %>%
+  mutate(Species=gsub('^Diceropappus rhinocerotis', 'Elytropappus rhinocerotis', Species)) %>%
+  mutate(Species=gsub('^Euphorbiace ', 'Euphorbiaceae ', Species)) %>% # replacement spelling fixed (was 'Euphorbiacaea')
+  mutate(Species=gsub('^Gloecapsa', 'Gloeocapsa', Species)) %>%
+  mutate(Species=gsub('Glycirhiza', 'Glycyrrhiza', Species)) %>%
+  mutate(Species=gsub('Abiesnordmannia', 'Abies nordmannia', Species)) %>%
+  mutate(Species=gsub('Alnus inca\\b', 'Alnus incana', Species)) %>% # \\b: without it a correct 'Alnus incana' became 'Alnus incanana'
+  mutate(Species=gsub('Amalencier alnifolia', 'Amalenchier alnifolia', Species)) %>%
+  mutate(Species=gsub('Antylis barba-jovis', 'Anthyllis barba-jovis', Species)) %>%
+  mutate(Species=gsub('^Albizzia ', 'Albizia ', Species)) %>% # stray '"' removed from the pattern; it made the rule unmatchable
+  mutate(Species=gsub('^Ipomoena ', 'Ipomoea ', Species)) %>%
+  mutate(Species=gsub('^Ipomea ', 'Ipomoea ', Species)) %>%
+  mutate(Species=gsub('Ipomo wolco', 'Ipomoea wolcottiana', Species)) %>%
+  ## additional manual cleaning from UJ, BJA, HB
+  mutate(Species=gsub('Abacaba palm', 'Oenocarpus balickii', Species)) %>%
+  mutate(Species=gsub('Acerkuomeii', 'Acer kuomeii', Species)) %>%
+  mutate(Species=gsub('Alder$', 'Alnus', Species)) %>%
+  mutate(Species=gsub('Amapa$', 'Tabebuia', Species)) %>%
+  mutate(Species=gsub('Amapa amargoso', 'Parahancornia amapa', Species)) %>%
+  mutate(Species=gsub('Amapa doce$', 'Tabebuia', Species)) %>%
+  mutate(Species=gsub('Amapai$', 'Tabebuia', Species)) %>%
+  mutate(Species=gsub('Amapaí$', 'Tabebuia', Species)) %>%
+  mutate(Species=gsub('Amapa m1', 'Tabebuia', Species)) %>%
+  mutate(Species=gsub('Amaranth$', 'Amaranthus', Species)) %>%
+  mutate(Species=gsub('Amophora fruticosa', 'Amorpha fruticosa', Species)) %>%
+  mutate(Species=gsub('Anacardiace ', 'Anacardiaceae ', Species)) %>%
+  mutate(Species=gsub('Anagallisarvensis', 'Anagallis arvensis', Species)) %>%
+  mutate(Species=gsub('Anemonenarcissiflora var.', 'Anemone narcissiflora', Species)) %>%
+  mutate(Species=gsub('Anenome ', 'Anemone ', Species)) %>% # keep the separating space; it used to glue genus and epithet together
+  mutate(Species=gsub('Anona ', 'Annona ', Species)) %>%
+  mutate(Species=gsub('Antylis ', 'Anthyllis ', Species)) %>% # keep the separating space; it used to glue genus and epithet together
+  mutate(Species=gsub('Apocyncadea gelbblueh$', 'Apocynaceae', Species)) %>%
+  mutate(Species=gsub('Aracium', 'Crepis', Species)) %>%
+  mutate(Species=gsub('Ardis mexic', 'Ardisia mexicana subsp. siltepecana', Species)) %>%
+  mutate(Species=gsub('Ardis verap', 'Ardisia verapazensis', Species)) %>%
+  mutate(Species=gsub('Argenomne hummemannii', 'Argemone hunnemanni', Species)) %>%
+  mutate(Species=gsub('Artabotus', 'Artabotrys', Species)) %>%
+  mutate(Species=gsub('Artemisiaintegrifolia', 'Artemisia integrifolia', Species)) %>%
+  mutate(Species=gsub('Asclepiacea$', 'Asclepiadaceae', Species)) %>%
+  mutate(Species=gsub('Asclep. klimmer', 'Asclepiadaceae', Species)) %>%
+  mutate(Species=gsub('Astartoseris triquetra', 'Lactuca triquetra', Species)) %>%
+  mutate(Species=gsub('Asteracee ', 'Asteraceae ', Species)) %>%
+  mutate(Species=gsub('Avenula glauc$', 'Avenula', Species)) %>%
+  mutate(Species=gsub('Baikea plurijuga', 'Baikiaea plurijuga', Species)) %>%
+  mutate(Species=gsub('Binse rundbl', 'Juncaceae', Species)) %>%
+  mutate(Species=gsub('Blättrige fabaceae th', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Bonel macro$', 'Bonellia macrocarpa subsp. macrocarpa', Species)) %>%
+  mutate(Species=gsub('Boraginacee samtig', 'Boraginaceae', Species)) %>%
+  mutate(Species=gsub('Bri¢fitos', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Bryophyte$', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Bryopsida', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Carallia macrophylla', 'Carallia', Species)) %>%
+  mutate(Species=gsub('Carexectabilis', 'Carex spectabilis', Species)) %>%
+  mutate(Species=gsub('Carex fein', 'Carex', Species)) %>%
+  mutate(Species=gsub('Cerania vermicularis', 'Thamnolia vermicularis', Species)) %>%
+  mutate(Species=gsub('Chamelauci merredin', 'Chamelaucium', Species)) %>%
+  mutate(Species=gsub('Chamelau drummon', 'Chamelaucium', Species)) %>%
+  mutate(Species=gsub('Charophyta', 'Characeae', Species)) %>%
+  mutate(Species=gsub('Cheiridopsis-keimlinge', 'Cheiridopsis', Species)) %>%
+  mutate(Species=gsub('Chenopodiacee$', 'Chenopodiaceae', Species)) %>%
+  mutate(Species=gsub('Chiangioden mexicanum', 'Chiangiodendron mexicanum', Species)) %>%
+  mutate(Species=gsub('Chiranthode pentadactylon', 'Chiranthodendron pentadactylon', Species)) %>%
+  mutate(Species=gsub('Chrysobalan ', 'Chrysobalanus ', Species)) %>%
+  mutate(Species=gsub('Cladapodiella', 'Cladopodiella', Species)) %>%
+  mutate(Species=gsub('Cleidium ', 'Cleidion ', Species)) %>%
+  mutate(Species=gsub('Collema/leptogium lichenoides', 'Collemataceae', Species)) %>%
+  mutate(Species=gsub('Comarostaph discolor', 'Comarostaphylis discolor', Species)) %>%
+  mutate(Species=gsub('Combretdodendrum africana', 'Combretodendrum africanum', Species)) %>%
+  mutate(Species=gsub('Commelinacaea floscopa', 'Floscopa glomerata', Species)) %>%
+  mutate(Species=gsub('Coyncia setigera', 'Coincya setigera', Species)) %>%
+  mutate(Species=gsub('Crataeva', 'Crateva', Species)) %>%
+  mutate(Species=gsub('Craterosperma', 'Rubiaceae', Species)) %>%
+  mutate(Species=gsub('Crespicium', 'Burseraceae', Species)) %>%
+  mutate(Species=gsub('Critoniadel nubigenus', 'Critoniadelphus nubigenus', Species)) %>%
+  mutate(Species=gsub('Crotalaria/vigna\\??', 'Fabaceae', Species)) %>% # "?" escaped: it was a quantifier on "a", leaving a literal "?" behind
+  mutate(Species=gsub('Croto billb', 'Croton billbergianus subsp. pyramidalis', Species)) %>%
+  mutate(Species=gsub('Dana„ racemosa', 'Danae racemosa', Species)) %>%
+  mutate(Species=gsub('Deehasia', 'Dehaasia', Species)) %>%
+  mutate(Species=gsub('Dichapetala\\b', 'Dichapetalum', Species)) %>% # \\b: do not rewrite the family name 'Dichapetalaceae'
+  mutate(Species=gsub('Distel bractea', 'Asteraceae', Species)) %>% # replacement spelling fixed (was 'Asteracaea')
+  mutate(Species=gsub('Distelig asteraceae', 'Asteraceae', Species)) %>% # replacement spelling fixed (was 'Asteracaea')
+  mutate(Species=gsub('Dodon visco', 'Dodonaea viscosa', Species)) %>%
+  mutate(Species=gsub('Doldenbluetler', 'Apiaceae', Species)) %>%
+  mutate(Species=gsub('Echinosurus capitatus', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Einähriges gras$', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Einähriges gras von gestern$', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Einblütiges rispengras', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Eiovaltrichtergrundblatt orchidee', 'Orchidaceae', Species)) %>%
+  mutate(Species=gsub('Elongata subsp.', 'Pohlia elongata', Species)) %>%
+  mutate(Species=gsub('Enriquebelt ', 'Enriquebeltrania ', Species)) %>%
+  mutate(Species=gsub('Entermorpha ', 'Enteromorpha ', Species)) %>%
+  mutate(Species=gsub('Erodiurn$', 'Erodium', Species)) %>%
+  mutate(Species=gsub('Euc. chloroclada x camaldulensis', 'Eucalyptus', Species)) %>%
+  mutate(Species=gsub('Euphorbiacée ipatouduluga gouduatché', 'Euphorbiaceae', Species)) %>%
+  mutate(Species=gsub('Fabacee kleeblatt stengel schwarzdrüsi', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Fabaceenstrauch wie 132446 f', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Fabaceenstr kleinbltrg', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Fabacee wie lotus f', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Farn cystopteris', 'Cystopteris', Species)) %>% # moved above the generic 'Farn' rule, which used to shadow it
+  mutate(Species=gsub('^Farn\\b', 'Pteridophyta', Species)) %>% # whole word only, so genera merely starting with "Farn" are untouched
+  mutate(Species=gsub('^Fern\\b', 'Pteridophyta', Species)) %>% # whole word only, so genera such as Fernandoa are untouched
+  mutate(Species=replace(Species, list=word(Species, 1)=="Fingergras", values="Digitaria")) %>%
+  mutate(Species=replace(Species, list=word(Species, 1)=="Fingerhirse", values="Digitaria")) %>%
+  mutate(Species=gsub('Gelbe onagraceae', 'Onagraceae', Species)) %>%
+  mutate(Species=gsub('^Gramineae?\\b', 'Poaceae', Species)) %>% # longest variant first; 'Gramine' used to fire first and yield 'Poaceaea'
+  mutate(Species=gsub('^Gramine\\b', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('^Graminia\\b', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Grannenquecke', 'Poaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Gras",
+                         values="Poaceae")) %>%
+  mutate(Species=gsub('Gynostachi dicanthus', 'Gymnostachium diacanthus', Species)) %>%
+  mutate(Species=gsub('Hafer haarkranz', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Hapolosiphon', 'Hapalosiphon', Species)) %>%
+  mutate(Species=gsub('Heliocrysum', 'Helichrysum', Species)) %>%
+  mutate(Species=replace(Species, list=word(Species, 1)=="Hepaticae", values="Bryophyta")) %>%
+  mutate(Species=gsub('Hepaticas', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Hepatophyta', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Hermerocalis', 'Hemerocallis', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Hirse",
+                         values="Poaceae")) %>%
+  mutate(Species=gsub('Hirte trian', 'Hirtella triandra subsp. media', Species)) %>%
+  mutate(Species=replace(Species, list=word(Species, 1)=="Hohlzahn", values="Lamiaceae")) %>%
+  mutate(Species=gsub('Hondurodend urceolatum', 'Hondurodendron urceolatum', Species)) %>%
+  mutate(Species=gsub('Hornklee gelb', 'Fabaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Horstgras",
+                         values="Poaceae")) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Huehnerhirse",
+                         values="Digitaria")) %>%
+  mutate(Species=gsub('Hydrocoleus lyngbyaceus', 'Hydrocoleum lyngbyaceum', Species)) %>%
+  mutate(Species=gsub('Hyernima nipensis', 'Hieronyma nipensis', Species)) %>%
+  mutate(Species=gsub('Hyeronima', 'Hieronyma', Species)) %>%
+  mutate(Species=gsub('Hypocal angusti', 'Hypocalymma angustifolium', Species)) %>%
+  mutate(Species=gsub('Hypocalym nambung', 'Hypocalymma', Species)) %>%
+  mutate(Species=gsub('Hyprium', 'Hypericum', Species)) %>%
+  mutate(Species=gsub('Igelkolben', 'Sparganium', Species)) %>%
+  mutate(Species=gsub('Ilexã‚â paraguariensis', 'Ilex', Species)) %>%
+  mutate(Species=gsub('Ipomea', 'Ipomoea', Species)) %>%
+  mutate(Species=gsub('Ipomoena', 'Ipomoea', Species)) %>%
+  mutate(Species=gsub('Jm kürbis stark behaart', 'Cucurbitaceae', Species)) %>%
+  mutate(Species=gsub('Juncaginacee/triglochin', 'Triglochin', Species)) %>%
+  mutate(Species=gsub('Juncas', 'Juncus', Species)) %>%
+  mutate(Species=gsub('Keilblatt cyperus', 'Cyperus', Species)) %>%
+  mutate(Species=gsub('Khh 3010 polygalacee', 'Polygalaceae', Species)) %>%
+  mutate(Species=gsub('Khh 3014 liliacee 3f„ch. kapsel schwarze samen', 'Liliaceae', Species)) %>% # leading space dropped: a capital letter only occurs at position 1, so ' Khh' never matched
+  mutate(Species=gsub('Khh 3024 brachiaria', 'Brachiaria', Species)) %>%
+  mutate(Species=gsub('Khh 3025 liliaceae gelbe blten breite bl„tter', 'Liliaceae', Species)) %>%
+  mutate(Species=gsub('Khh 3037 ficus', 'Ficus', Species)) %>%
+  mutate(Species=gsub('Khh 3054 ficus iteophylla miq.', 'Ficus', Species)) %>%
+  mutate(Species=gsub('Kl. borstgras', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Kleine malvaceae', 'Malvaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Kletter",
+                         values="Asteraceae")) %>%
+  mutate(Species=gsub('Klimmer asclepiadaceae', 'Asclepiadaceae', Species)) %>%
+  mutate(Species=gsub('Klimmer curcuvitaceae', 'Cucurbitaceae', Species)) %>%
+  mutate(Species=gsub('Kl. sauergras', 'Cyperaceae', Species)) %>%
+  mutate(Species=gsub('Knabenkraut gefleckt', 'Orchis', Species)) %>%
+  mutate(Species=gsub('Knubbelblüt. gras haarkranz vgl f', 'Poaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Koenigskerze",
+                         values="Verbascum")) %>%
+  mutate(Species=gsub('Kriechgras zynodon', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Kürbis', 'Cucurbitaceae', Species)) %>%
+  mutate(Species=gsub('Lamiaceen strauch', 'Lamiaceae', Species)) %>%
+  mutate(Species=gsub('Lamiacee orange', 'Lamiaceae', Species)) %>%
+  mutate(Species=gsub('Lamiales orobanchaceae + phrymaceae + plantaginaceae + scrophulariaceae', 'Orobanchaceae', Species, fixed=TRUE)) %>% # fixed=TRUE: "+" is a regex quantifier, so the literal text never matched
+  mutate(Species=gsub('Lantanacamara wandelrösschen', 'Lantana camara', Species)) %>%
+  mutate(Species=gsub('Lasiopeta watheroo k. shepherd & c. wilkins ks', 'Lasiopetalum', Species)) %>%
+  mutate(Species=gsub('Leg-inderteminada', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Legu 1fiedrig groá schlank', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Legume$', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Leguminosae spgm', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Leguminosea', 'Fabaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Leguminose",
+                         values="Fabaceae")) %>%
+  mutate(Species=gsub('Leheelo grass', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Lepid carra', 'Lepiderema', Species)) %>%
+  mutate(Species=gsub('Lich caloplaca', 'Caloplaca', Species)) %>%
+  mutate(Species=gsub('Liliacee', 'Liliaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Lilie",
+                         values="Liliaceae")) %>%
+  mutate(Species=gsub('Liliengewächs', 'Liliaceae', Species)) %>%
+  mutate(Species=gsub('Lisea', 'Litsea', Species)) %>%
+  mutate(Species=gsub('Lisymachia', 'Lysimachia', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Liverwort",
+                         values="Bryophyta")) %>%
+  mutate(Species=gsub('Livwort', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Lonicerachrysantha', 'Lonicera chrysantha', Species)) %>%
+  mutate(Species=gsub('Lycoctamnus barbatus', 'Aconitum barbatum', Species)) %>%
+  mutate(Species=gsub('Lygopus', 'Lycopus', Species)) %>%
+  mutate(Species=gsub('Maitenus', 'Maytenus', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Malpighiace",
+                         values="Malpighiaceae")) %>%
+  mutate(Species=gsub('Malpighiales chrysobalanaceae + humiriaceae', 'Malpighiaceae', Species, fixed=TRUE)) %>% # fixed=TRUE: "+" is a regex quantifier, so the literal text never matched
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Malve",
+                         values="Malvaceae")) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Mammutgras",
+                         values="Poaceae")) %>%
+  mutate(Species=gsub('Mammutgrass', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Maqui guian', 'Maquira guianensis subsp. costaricana', Species)) %>%
+  mutate(Species=gsub('Marchantiophyta', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Mariana aphylla', 'Maireana aphylla', Species)) %>%
+  mutate(Species=gsub('Mehrfingeriges ährengras', 'Poaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Melastomata",
+                         values="Melastomataceae")) %>%
+  mutate(Species=gsub('Mesembr minibl', 'Mesembryanthemum', Species)) %>%
+  mutate(Species=gsub('Mesostomma kotschyanum', 'Mesostemma kotschyana', Species)) %>%
+  mutate(Species=gsub('Microhepatics', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Micromeria micrantha', 'Micromeria graeca subsp. micrantha', Species)) %>%
+  mutate(Species=gsub('Mimose minifiedrig f', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Miniepilobium', 'Epilobium', Species)) %>%
+  mutate(Species=gsub('Minimargerite', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Miniochna', 'Ochna', Species)) %>%
+  mutate(Species=gsub('Minischilf 132466 f', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Mistletoe', 'Viscum', Species)) %>%
+  mutate(Species=gsub('Mniaecia', 'Mniaceae', Species)) %>%
+  mutate(Species=gsub('Molemo', 'Turraea', Species)) %>%
+  mutate(Species=gsub('Molses', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Momisa pigra', 'Mimosa pigra', Species)) %>%
+  mutate(Species=gsub('Monandrus squarrosus', 'Cyperus squarrosus', Species)) %>%
+  mutate(Species=gsub('Monchema debile', 'Monechma debile', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Monochna",
+                         values="Polygalaceae")) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Moos",
+                         values="Bryophyta")) %>%
+  mutate(Species=gsub('Moospolster grau-grün', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Mortonioden ', 'Mortoniodendron ', Species)) %>%
+  mutate(Species=gsub('Mos onbekend', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Mossen overige', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Mougetia', 'Mougeotia', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Musci",
+                         values="Bryophyta")) %>%
+  mutate(Species=gsub('Myciantes', 'Myrcianthes', Species)) %>%
+  mutate(Species=gsub('Myrciaã‚â pulchra', 'Myrcia pulchra', Species)) %>%
+  mutate(Species=gsub('Myrcianov.', 'Myrcia', Species, fixed = TRUE)) %>%
+  mutate(Species=gsub('Myrsi coria', 'Myrsine coriacea', Species)) %>%
+  mutate(Species=gsub('Myrtaceenstrauch', 'Myrtaceae', Species)) %>%
+  mutate(Species=gsub('Nachtkerze fru dreispaltig', 'Onagraceae', Species)) %>% # replacement spelling fixed (was 'Onagracaee')
+  mutate(Species=gsub('Neobartsia crenoloba', 'Bartsia crenoloba', Species)) %>%
+  mutate(Species=gsub('None$', 'Nonea', Species)) %>%
+  mutate(Species=gsub('Ocos adenophylla', 'Symplocos adenophylla', Species)) %>%
+  mutate(Species=gsub('Officinale subsp. group', 'Taraxacum officinale s.l.', Species)) %>%
+  mutate(Species=gsub('Orch$', 'Orchidaceae', Species)) %>%
+  mutate(Species=gsub('^Orchids?\\b', 'Orchidaceae', Species)) %>% # whole word only: bare 'Orchid' turned 'Orchidaceae' into 'Orchidaceaeaceae' and hid 'Orchidee' from the next rule
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Orchidee",
+                         values="Orchidaceae")) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1) %in% c("Papilonacea", "Papilionacea"),
+                         values="Fabaceae")) %>%
+  mutate(Species=gsub('Pasania dodoniifolia', 'Lithocarpus dodonaeifolius', Species)) %>%
+  mutate(Species=gsub('Phoebengmoensis', 'Phoebe hungmoensis', Species)) %>%
+  mutate(Species=gsub('Picra antid$', 'Picramnia antidesma subsp. fessonia', Species)) %>%
+  mutate(Species=gsub('Pinopsida', 'Coniferae', Species)) %>%
+  mutate(Species=gsub('Pisonianov.', 'Pisonia', Species, fixed=TRUE)) %>%
+  mutate(Species=gsub('Pithecellob ', 'Pithecellobium ', Species)) %>%
+  mutate(Species=gsub('Pithecocten\\b', 'Pithecoctenium', Species)) %>% # \\b: a complete 'Pithecoctenium' used to become 'Pithecocteniumium'
+  mutate(Species=gsub('Pleradenoph longicuspis', 'Pleradenophora longicuspis', Species)) %>%
+  mutate(Species=gsub('Pleuranthod ', 'Pleuranthodendron ', Species)) %>%
+  mutate(Species=gsub('Poales', 'Poaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1) %in% c("Polygalacea", "Polygalacee"),
+                         values="Polygalaceae")) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1) %in% c("Polygonaceae", "Polygonacee"),
+                         values="Polygonaceae")) %>%
+  mutate(Species=gsub('Polygonumlongisetum', 'Polygonum longisetum', Species)) %>%
+  mutate(Species=gsub('Posoq coria subsp. maxima', 'Posoqueria coriacea subsp. maxima', Species)) %>%
+  mutate(Species=gsub('Prosthecidi ', 'Prosthecidiscus ', Species)) %>%
+  mutate(Species=gsub('Pseudo bidens', '', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1) %in%
+                           c("Pseudobriza", "Pseudofingergras",
+                             "Pseudogerste", "Puschelgras", "Quecke",
+                             "Queckenblatt", "Queckengras",
+                             "Roggen/hafer", "Ruchgras", "Silbergras",
+                             "Suessgras"),
+                         values="Poaceae")) %>%
+  mutate(Species=gsub('Ptarmica', 'Achillea', Species)) %>%
+  mutate(Species=gsub('Pterost cauline leaves n. gibson & m.n. lyons', 'Pterostegia', Species)) %>%
+  mutate(Species=gsub('Quararibeaã‚â guianensis', 'Quararibea guianensis', Species)) %>%
+  mutate(Species=gsub('Rainfarn f', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Ranke ipomoea', 'Ipomoea', Species)) %>%
+  mutate(Species=gsub('Ranke rubiaceae', 'Rubiaceae', Species)) %>%
+  mutate(Species=gsub('Rauwolfia', 'Rauvolfia', Species)) %>%
+  mutate(Species=gsub('Rheinfarn', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Rhodostemon kunthiana', 'Rhodostemonodaphne kunthiana', Species)) %>%
+  mutate(Species=gsub('Riccardia/aneura', 'Bryophyta', Species)) %>%
+  mutate(Species=gsub('Rietgras steril 134051a', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Rosenbergio formosum', 'Rosenbergiodendron formosum', Species)) %>%
+  mutate(Species=gsub('Rotes puschelgras', 'Poaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Rubiacea",
+                         values="Rubiaceae")) %>%
+  mutate(Species=gsub('Rytidospe goomallin a.g. gunness et al. oakp 10/', 'Rytidosperma', Species)) %>%
+  mutate(Species=gsub('Salacia idoensis', 'Salacia', Species)) %>%
+  mutate(Species=gsub('Samphire', 'Amaranthaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1) %in%
+                           c("Sauergras", "Schlanksegge", "Sedge",
+                             "Segge", "Simse"),
+                         values="Cyperaceae")) %>%
+  mutate(Species=gsub('Scaev repen subsp. north sandp r.j. cranf & p.j. spenc', 'Scaevola repens', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Schachtelhalm",
+                         values="Equisetaceae")) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Schnittlauch",
+                         values="Amaryllidaceae")) %>%
+  mutate(Species=gsub('Schwertlilie trocken', 'Iridaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1) %in% c("Scropholacea", "Scrophulariacea", "Scroph."),
+                         values="Scrophulariaceae")) %>% # replacement spelling fixed (was 'Scrophulariacea')
+  mutate(Species=gsub('Sitzende onagraceae', 'Onagraceae', Species)) %>%
+  mutate(Species=gsub('Sonnenblume', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Stachelgurke', 'Cucurbitaceae', Species)) %>%
+  mutate(Species=gsub('Stark behaarte malve', 'Malvaceae', Species)) %>%
+  mutate(Species=gsub('Staude asteraceae bl watteweich f', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Staude crotalaria unterseite silber', 'Crotalaria', Species)) %>%
+  mutate(Species=gsub('Staude solanum', 'Solanaceae', Species)) %>%
+  mutate(Species=gsub('Staude tephrosia', 'Tephrosia', Species)) %>%
+  mutate(Species=gsub('Stipagrosist panicle gross', 'Stipagrostis', Species)) %>%
+  mutate(Species=gsub('Asteraceae u silber', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Stratonostoc communeá', 'Stratonostoc commune', Species)) %>%
+  mutate(Species=gsub('Strauch asteraceae nadelblätt.', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Strauch blatt wie salix reticulata astera 132534b', 'Asteraceae', Species)) %>% # longer variant first; the shorter rule used to leave ' 132534b' behind
+  mutate(Species=gsub('Strauch blatt wie salix reticulata astera', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Strauch fabaceae gerieft schote', 'Fabaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Strauch" &
+                           word(Species,2)=="rubiaceae", # lower-case: only the first letter of Species is capitalised
+                         values="Rubiaceae")) %>%
+  mutate(Species=gsub('Fabaceae samtig bl lanzettlich', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('Ochna mini', 'Ochna', Species)) %>%
+  mutate(Species=gsub('Stryphnoden microstachyum', 'Stryphnodendron microstachyum', Species)) %>%
+  mutate(Species=gsub('Sumpfgladiole haarig', 'Gladiolus', Species)) %>%
+  mutate(Species=gsub('Sygnum ramphicarpa', 'Scrophulariaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1)=="Symplococar",
+                         values="Symplococarpon")) %>%
+  mutate(Species=gsub('Sysirinchium', 'Sisyrinchium', Species)) %>%
+  mutate(Species=gsub('Syzigium accuminatisima', 'Syzygium acuminatissimum', Species)) %>%
+  mutate(Species=gsub('Tabernaemon ', 'Tabernaemontana ', Species)) %>%
+  mutate(Species=gsub('Thalassodend\\b', 'Thalassodendron', Species)) %>% # \\b: a complete 'Thalassodendron' used to become 'Thalassodendronron'
+  mutate(Species=gsub('Thinouia canescens', 'Thinouia', Species)) %>%
+  mutate(Species=gsub('Thistle', 'Asteraceae', Species)) %>%
+  mutate(Species=gsub('Trisetumicatum', 'Trisetum spicatum', Species)) %>%
+  mutate(Species=gsub('Undetermined sedge', 'Cyperaceae', Species)) %>%
+  mutate(Species=replace(Species,
+                         list=word(Species, 1) %in%
+                           c("Liverwort", "Liverworts", "Moss"),
+                         values="Bryophyta")) %>%
+  mutate(Species=gsub('Vismi bacci', 'Vismia baccifera subsp. ferruginea', Species)) %>%
+  mutate(Species=gsub('Weidenr”schen', 'Onagraceae', Species)) %>%
+  mutate(Species=gsub('Weißpelziger brauner spross asteraceae?', 'Asteraceae', Species)) %>% # pattern lower-cased so it can match after tolower()
+  mutate(Species=gsub('Wie stipagrostis', 'Poaceae', Species)) %>%
+  mutate(Species=gsub('Wincassia', 'Fabaceae', Species)) %>%
+  mutate(Species=gsub('^[Xx]dactyloden st-quintinii?', 'Dactylodenia st-quintinii', Species)) %>% # case fixed for the normalised string; optional final "i" avoids 'quintiniii'
+  mutate(Species=gsub('Zizyphus sp1 iucn', 'Zizyphus', Species)) %>% # lower-cased, and the trailing digit is already stripped by the \\d+$ rule above
+  mutate(Species=gsub('Zwiebel lilaceae steril', 'Liliaceae', Species)) %>% # pattern lower-cased; replacement spelling fixed (was 'Lilaceae')
+  mutate(Species=gsub('Zwstr faurea', 'Faurea', Species)) %>%
+  mutate(Species=gsub('Quercus crispla', 'Quercus crispula', Species)) %>%
+  mutate(Species=gsub('Corallorrhiza', 'Corallorhiza', Species)) %>%
+  mutate(Species=gsub('Brunella vulgaris', 'Prunella vulgaris', Species))
+```
+
 A total of `r nrow(spec.list.TRY.sPlot %>% filter(OriginalNames != Species))` species names were modified. Although substantially improved, the species list has still quite a lot of inconsistencies.
 The total list submitted to TNRS contains `r length(unique(spec.list.TRY.sPlot$Species))` species names.
@@ -437,492 +912,11 @@ save(tnrs.res.certain, tnrs.res.uncertain, file="../_derived/TNRS_submit/tnrs.it
 ```
-### Manual cleaning, delete subspecies information and rerun match in TNRS
+### Delete subspecies information and rerun match in TNRS
 Many unmatched records do contain subspecies information which could not be retrieved in TNRS, although genus and species seem to be spelled correctly. Also, sometimes the mismatch derives from having the word 'species' or 'sp' at the end of the name.
```{r} -#Manual cleaning tnrs.submit.iter2 <- data.frame(old=tnrs.res.uncertain$Name_submitted) %>% - mutate(new=old) %>% - mutate(new=tolower(new)) %>% - mutate(new=firstup(new)) %>% - mutate(new=gsub("^Str ", "", new)) %>% - mutate(new=gsub("^Unknown ", "", new)) %>% - mutate(new=firstup(new)) %>% - mutate(new=gsub(" [0-9]*$", "", new)) %>% #delete digits at end of object - mutate(new=gsub("^\\d+|\\d+$", "", new)) %>% #delete digits at the beginning or end of a string - mutate(new=gsub(" sp.$", "", new)) %>% - mutate(new=gsub(" sp$", "", new)) %>% - mutate(new=gsub(" species$", "", new)) %>% - mutate(new=gsub(" *$", "", new)) %>% - mutate(new=gsub(" #$", "", new)) %>% - mutate(new=gsub(" m$", "", new)) %>% - mutate(new=gsub("acea ", "aceae ", new)) %>% - mutate(new=gsub('^Agropyrum', 'Agropyron', new)) %>% - mutate(new=gsub('^Anno ', 'Annona ', new)) %>% - mutate(new=gsub('Adpdytes dimidiata', 'Apodytes dimidiata', new)) %>% - mutate(new=gsub('Adenostorna fasciculaturn', 'Adenostoma fasciculatum', new)) %>% - mutate(new=gsub('Arctostapliylos glallca', 'Arctostaphylos glauca', new)) %>% - mutate(new=gsub('Bituminosa bituminosa', 'Bituminaria bituminosa', new)) %>% - mutate(new=gsub('Causurina equisitifolia', 'Causuarina equisetifolia', new)) %>% - mutate(new=gsub('Convulvus arvensis', 'Convolvulus arvensis', new)) %>% - mutate(new=gsub('Diospyrus dygina', 'Diospyros dygina', new)) %>% - mutate(new=gsub('^Dodoea', 'Dodonaea', new)) %>% - mutate(new=gsub('^Boheravia', 'Boerhavia', new)) %>% - mutate(new=gsub('Centaria maculosa', 'Centaurea maculosa', new)) %>% - mutate(new=gsub('Chamrenerium angustifolium', 'Chamaenerion angustifolium', new)) %>% - mutate(new=gsub('^Chicorium', 'Cichorium', new)) %>% - mutate(new=gsub('^Cirsiumum', 'Cirsium', new)) %>% - mutate(new=gsub('^Colubrium', 'Colubrina', new)) %>% - mutate(new=gsub('^Corymbium', 'Corymbia', new)) %>% - mutate(new=gsub('Cosmos bipinnata', 'Cosmos bipinnatus', new)) %>% - mutate(new=gsub('Diospyrus dygina', 
'Diospyros digyna', new)) %>% - mutate(new=gsub('Diospyros egbert', 'Diospyros egbert-walkeri', new)) %>% - mutate(new=gsub('Dispyrus halesioides', 'Diospyros halesioides', new)) %>% - mutate(new=gsub('^Drymis', 'Drimys', new)) %>% - mutate(new=gsub('^Dysoxylon', 'Dysoxylum', new)) %>% - mutate(new=gsub('^Eleaegnus', 'Elaeagnus', new)) %>% - mutate(new=gsub('^Eleutherant', 'Eleutherantera', new)) %>% - mutate(new=gsub('^Echicea', 'Echinacea', new)) %>% - mutate(new=gsub('Gauteria foliolata', 'Gaultheria foliolosa', new)) %>% - mutate(new=gsub('^Geophylla', 'Geophyla', new)) %>% - mutate(new=gsub('Gloichidion insignis', 'Glochidion insigne', new)) %>% - mutate(new=gsub('^Glycium', 'Glycine', new)) %>% - mutate(new=gsub('^Hammalis', 'Hamamelis', new)) %>% - mutate(new=gsub('^Hippochoeris', 'Hypochaeris', new)) %>% - mutate(new=gsub('Ilix tephrohylla', 'Ilex tephrophylla', new)) %>% - mutate(new=gsub('^Jasininum', 'Jasminum', new)) %>% - mutate(new=gsub('Jenipa conjuta', 'Jenipa conjunta', new)) %>% - mutate(new=gsub('^Lechytis', 'Lecythis', new)) %>% - mutate(new=gsub('Lespedeza juncus', 'Lespedeza juncea', new)) %>% - mutate(new=gsub('Licania apelata', 'Licania apetala', new)) %>% - mutate(new=gsub('Limeum arenicola', 'Limeum arenicolum', new)) %>% - mutate(new=gsub('^Maniota', 'Manihot', new)) %>% - mutate(new=gsub('^Menta', 'Mentha', new)) %>% - mutate(new=gsub('Metophyum brownei', 'Metopium brownei', new)) %>% - mutate(new=gsub('Miliusa tomentosum', 'Miliusa tomentosa', new)) %>% - mutate(new=gsub('Mimululus ringens', 'Mimulus ringens', new)) %>% - mutate(new=gsub('Nardus strictus', 'Nardus stricta', new)) %>% - mutate(new=gsub('Neea glomeratha', 'Neea glomerata', new)) %>% - mutate(new=gsub('^Onopordon', 'Onopordum', new)) %>% - mutate(new=gsub('^Orbigynia', 'Orbignya', new)) %>% - mutate(new=gsub('Orites excelsa', 'Orites excelsus', new)) %>% - mutate(new=gsub('Paedorata lutea', 'Paederota lutea', new)) %>% - mutate(new=gsub('Palaquin ellipticum', 'Palaquium 
ellipticum', new)) %>% - mutate(new=gsub('Palmeria arfakensis', 'Palmeria arfakiana', new)) %>% - mutate(new=gsub('Petalostcmum purpureum', 'Petalostemum purpureum', new)) %>% - mutate(new=gsub('Petalostimum purpureum', 'Petalostemum purpureum', new)) %>% - mutate(new=gsub('^Petrosileum', 'Petroselinum', new)) %>% - mutate(new=gsub('Phlomis herba', 'Phlomis herba-venti', new)) %>% - mutate(new=gsub('^Phyllirea', 'Phillyrea', new)) %>% - mutate(new=gsub('Physilus pumula', 'Physalus pumila', new)) %>% - mutate(new=gsub('Picea maria', 'Picea mariana', new)) %>% - mutate(new=gsub('Picea retroXexa', 'Picea retroflexa', new)) %>% - mutate(new=gsub('Pilayella litoralis', 'Pilayella littoralis', new)) %>% - mutate(new=gsub('Placocarpus schaereri', 'Platecarpus schaerer', new)) %>% - mutate(new=gsub('Placocarpus schraereri', 'Platecarpus schaerer', new)) %>% - mutate(new=gsub('^Pulteea', 'Pultenaea', new)) %>% - mutate(new=gsub('Quercus rubrum', 'Quercus rubra', new)) %>% - mutate(new=gsub('Rubus fruticosa', 'Rubus fruticosus', new)) %>% - mutate(new=gsub('Rubus saxatile', 'Rubus saxatilis', new)) %>% - mutate(new=gsub('Rubus sylvatici', 'Rubus sylvaticus', new)) %>% - mutate(new=gsub('^Sanguiria', 'Sanguinaria', new)) %>% - mutate(new=gsub('Sarauja nepaulensis', 'Sarauja nepalensis', new)) %>% - mutate(new=gsub('^Sateria', 'Setaria', new)) %>% - mutate(new=gsub('Sauraiea nepulensis', 'Saurauia nepalensis', new)) %>% - mutate(new=gsub('Schneckia australis', 'Schenckia australis', new)) %>% - mutate(new=gsub('Smirnium oleastrum', 'Smyrnium olusatrum', new)) %>% - mutate(new=gsub('Solms laubachia', 'Solms-laubachia himalayensis', new)) %>% - mutate(new=gsub('Stellaria chamaejasme', 'Stellera chamaejasme', new)) %>% - mutate(new=gsub('Steraria parviflora', 'Setaria parviflora', new)) %>% - mutate(new=gsub('^Stuartia', 'Stewartia', new)) %>% - mutate(new=gsub('Sycops sinensis', 'Sycopsis sinensis', new)) %>% - mutate(new=gsub('Tacetum vulgare', 'Tanacetum vulgare', new)) %>% - 
mutate(new=gsub('Talinurn angustissimun', 'Talinun angustissimun', new)) %>% - mutate(new=gsub('Talloma hodgsoni', 'Talauma hodgsonii', new)) %>% - mutate(new=gsub('Taraxacum albo', 'Taraxacum album', new)) %>% - mutate(new=gsub('Tetragonia falcata', 'Tetragona falcata', new)) %>% - mutate(new=gsub('Trapogogon', 'Tragopogon', new)) %>% - mutate(new=gsub('Zyzyphus saeri', 'Zizyphus saeri', new)) %>% - mutate(new=gsub('^Helicrysum', 'Helichrysum', new)) %>% - mutate(new=gsub('^Diceropappus rhinocerotis', 'Elytropappus rhinocerotis', new)) %>% - mutate(new=gsub('^Euphorbiace ', 'Euphorbiacaea ', new)) %>% - mutate(new=gsub('^Gloecapsa', 'Gloeocapsa', new)) %>% - mutate(new=gsub('Glycirhiza', 'Glycyrrhiza', new)) %>% - mutate(new=gsub('Abiesnordmannia', 'Abies nordmannia', new)) %>% - mutate(new=gsub('Alnus inca', 'Alnus incana', new)) %>% - mutate(new=gsub('Amalencier alnifolia', 'Amalenchier alnifolia', new)) %>% - mutate(new=gsub('Antylis barba-jovis', 'Anthyllis barba-jovis', new)) %>% - mutate(new=gsub('^Albizzia "', 'Albizia ', new)) %>% - mutate(new=gsub('^Ipomoena ', 'Ipomoea ', new)) %>% - mutate(new=gsub('^Ipomea ', 'Ipomoea ', new)) %>% - mutate(new=gsub('Ipomo wolco', 'Ipomoea wolcottiana', new)) %>% - ## additional manual cleaning from UJ, BJA, HB - mutate(new=gsub('Abacaba palm', 'Oenocarpus balickii', new)) %>% - mutate(new=gsub('Acerkuomeii', 'Acer kuomeii', new)) %>% - mutate(new=gsub('Adelphacme minima', '', new)) %>% - mutate(new=gsub('Alder$', 'Alnus', new)) %>% - mutate(new=gsub('Amapa$', 'Tabebuia', new)) %>% - mutate(new=gsub('Amapa amargoso', 'Parahancornia amapa', new)) %>% - mutate(new=gsub('Amapa doce$', 'Tabebuia', new)) %>% - mutate(new=gsub('Amapai$', 'Tabebuia', new)) %>% - mutate(new=gsub('Amapaí$', 'Tabebuia', new)) %>% - mutate(new=gsub('Amapa m1', 'Tabebuia', new)) %>% - mutate(new=gsub('Amaranth$', 'Amaranthus', new)) %>% - mutate(new=gsub('Amophora fruticosa', 'Amorpha fruticosa', new)) %>% - mutate(new=gsub('Anacardiace ', 
'Anacardiaceae ', new)) %>% - mutate(new=gsub('Anagallisarvensis', 'Anagallis arvensis', new)) %>% - mutate(new=gsub('Anemonenarcissiflora var.', 'Anemone narcissiflora', new)) %>% - mutate(new=gsub('Anenome ', 'Anemone', new)) %>% - mutate(new=gsub('Anona ', 'Annona ', new)) %>% - mutate(new=gsub('Antylis ', 'Anthyllis', new)) %>% - mutate(new=gsub('Apocyncadea gelbblueh$', 'Apocynaceae', new)) %>% - mutate(new=gsub('Aracium', 'Crepis', new)) %>% - mutate(new=gsub('Ardis mexic', 'Ardisia mexicana subsp. siltepecana', new)) %>% - mutate(new=gsub('Ardis verap', 'Ardisia verapazensis', new)) %>% - mutate(new=gsub('Argenomne hummemannii', 'Argemone hunnemanni', new)) %>% - mutate(new=gsub('Artabotus', 'Artabotrys', new)) %>% - mutate(new=gsub('Artemisiaintegrifolia', 'Artemisia integrifolia', new)) %>% - mutate(new=gsub('Asclepiacea$', 'Asclepiadaceae', new)) %>% - mutate(new=gsub('Asclep. klimmer', 'Asclepiadaceae', new)) %>% - mutate(new=gsub('Astartoseris triquetra', 'Lactuca triquetra', new)) %>% - mutate(new=gsub('Asteracee ', 'Asteraceae ', new)) %>% - mutate(new=gsub('Avenula glauc$', 'Avenula', new)) %>% - mutate(new=gsub('Baikea plurijuga', 'Baikiaea plurijuga', new)) %>% - mutate(new=gsub('Binse rundbl', 'Juncaceae', new)) %>% - mutate(new=gsub('Blättrige fabaceae th', 'Fabaceae', new)) %>% - mutate(new=gsub('Bonel macro$', 'Bonellia macrocarpa subsp. 
macrocarpa', new)) %>% - mutate(new=gsub('Boraginacee samtig', 'Boraginaceae', new)) %>% - mutate(new=gsub('Bri¢fitos', 'Bryophyta', new)) %>% - mutate(new=gsub('Bryophyte$', 'Bryophyta', new)) %>% - mutate(new=gsub('Bryopsida', 'Bryophyta', new)) %>% - mutate(new=gsub('Carallia macrophylla', 'Carallia', new)) %>% - mutate(new=gsub('Carexectabilis', 'Carex spectabilis', new)) %>% - mutate(new=gsub('Carex fein', 'Carex', new)) %>% - mutate(new=gsub('Cerania vermicularis', 'Thamnolia vermicularis', new)) %>% - mutate(new=gsub('Chamelauci merredin', 'Chamelaucium', new)) %>% - mutate(new=gsub('Chamelau drummon', 'Chamelaucium', new)) %>% - mutate(new=gsub('Charophyta', 'Characeae', new)) %>% - mutate(new=gsub('Cheiridopsis-keimlinge', 'Cheiridopsis', new)) %>% - mutate(new=gsub('Chenopodiacee$', 'Chenopodiaceae', new)) %>% - mutate(new=gsub('Chiangioden mexicanum', 'Chiangiodendron mexicanum', new)) %>% - mutate(new=gsub('Chiranthode pentadactylon', 'Chiranthodendron pentadactylon', new)) %>% - mutate(new=gsub('Chrysobalan ', 'Chrysobalanus ', new)) %>% - mutate(new=gsub('Cladapodiella', 'Cladopodiella', new)) %>% - mutate(new=gsub('Cleidium ', 'Cleidion ', new)) %>% - mutate(new=gsub('Collema/leptogium lichenoides', 'Collemataceae', new)) %>% - mutate(new=gsub('Comarostaph discolor', 'Comarostaphylis discolor', new)) %>% - mutate(new=gsub('Combretdodendrum africana', 'Combretodendrum africanum', new)) %>% - mutate(new=gsub('Commelinacaea floscopa', 'Floscopa glomerata', new)) %>% - mutate(new=gsub('Coyncia setigera', 'Coincya setigera', new)) %>% - mutate(new=gsub('Crataeva', 'Crateva', new)) %>% - mutate(new=gsub('Craterosperma', 'Rubiaceae', new)) %>% - mutate(new=gsub('Crespicium', 'Burseraceae', new)) %>% - mutate(new=gsub('Critoniadel nubigenus', 'Critoniadelphus nubigenus', new)) %>% - mutate(new=gsub('Crotalaria/vigna?', 'Fabaceae', new)) %>% - mutate(new=gsub('Croto billb', 'Croton billbergianus subsp. 
pyramidalis', new)) %>% - mutate(new=gsub('Dana„ racemosa', 'Danae racemosa', new)) %>% - mutate(new=gsub('Deehasia', 'Dehaasia', new)) %>% - mutate(new=gsub('Dichapetala', 'Dichapetalum', new)) %>% - mutate(new=gsub('Distel bractea', 'Asteracaea', new)) %>% - mutate(new=gsub('Distelig asteraceae', 'Asteracaea', new)) %>% - mutate(new=gsub('Dodon visco', 'Dodonaea viscosa', new)) %>% - mutate(new=gsub('Doldenbluetler', 'Apiaceae', new)) %>% - mutate(new=gsub('Echinosurus capitatus', 'Poaceae', new)) %>% - mutate(new=gsub('Einähriges gras$', 'Poaceae', new)) %>% - mutate(new=gsub('Einähriges gras von gestern$', 'Poaceae', new)) %>% - mutate(new=gsub('Einblütiges rispengras', 'Poaceae', new)) %>% - mutate(new=gsub('Eiovaltrichtergrundblatt orchidee', 'Orchidaceae', new)) %>% - mutate(new=gsub('Elongata subsp.', 'Pohlia elongata', new)) %>% - mutate(new=gsub('Enriquebelt ', 'Enriquebeltrania ', new)) %>% - mutate(new=gsub('Entermorpha ', 'Enteromorpha ', new)) %>% - mutate(new=gsub('Erodiurn$', 'Erodium', new)) %>% - mutate(new=gsub('Euc. 
chloroclada x camaldulensis', 'Eucalyptus', new)) %>% - mutate(new=gsub('Euphorbiacée ipatouduluga gouduatché', 'Euphorbiaceae', new)) %>% - mutate(new=gsub('Fabacee kleeblatt stengel schwarzdrüsi', 'Fabaceae', new)) %>% - mutate(new=gsub('Fabaceenstrauch wie 132446 f', 'Fabaceae', new)) %>% - mutate(new=gsub('Fabaceenstr kleinbltrg', 'Fabaceae', new)) %>% - mutate(new=gsub('Fabacee wie lotus f', 'Fabaceae', new)) %>% - mutate(new=gsub('Farn', 'Pteridophyta', new)) %>% - mutate(new=gsub('Farn cystopteris', 'Cystopteris', new)) %>% - mutate(new=gsub('Fern', 'Pteridophyta', new)) %>% - mutate(new=replace(new, list=word(new, 1)=="Fingergras", values="Digitaria")) %>% - mutate(new=replace(new, list=word(new, 1)=="Fingerhirse", values="Digitaria")) %>% - mutate(new=gsub('Gelbe onagraceae', 'Onagraceae', new)) %>% - mutate(new=gsub('Gramine', 'Poaceae', new)) %>% - mutate(new=gsub('Graminea', 'Poaceae', new)) %>% - mutate(new=gsub('Graminia', 'Poaceae', new)) %>% - mutate(new=gsub('Grannenquecke', 'Poaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Gras", - values="Poaceae")) %>% - mutate(new=gsub('Gynostachi dicanthus', 'Gymnostachium diacanthus', new)) %>% - mutate(new=gsub('Hafer haarkranz', 'Poaceae', new)) %>% - mutate(new=gsub('Hapolosiphon', 'Hapalosiphon', new)) %>% - mutate(new=gsub('Heliocrysum', 'Helichrysum', new)) %>% - mutate(new=replace(new, list=word(new, 1)=="Hepaticae", values="Bryophyta")) %>% - mutate(new=gsub('Hepaticas', 'Bryophyta', new)) %>% - mutate(new=gsub('Hepatophyta', 'Bryophyta', new)) %>% - mutate(new=gsub('Hermerocalis', 'Hemerocallis', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Hirse", - values="Poaceae")) %>% - mutate(new=gsub('Hirte trian', 'Hirtella triandra subsp. 
media', new)) %>% - mutate(new=replace(new, list=word(new, 1)=="Hohlzahn", values="Lamiaceae")) %>% - mutate(new=gsub('Hondurodend urceolatum', 'Hondurodendron urceolatum', new)) %>% - mutate(new=gsub('Hornklee gelb', 'Fabaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Horstgras", - values="Poaceae")) %>% - mutate(new=replace(new, - list=word(new, 1)=="Huehnerhirse", - values="Digitaria")) %>% - mutate(new=gsub('Hydrocoleus lyngbyaceus', 'Hydrocoleum lyngbyaceum', new)) %>% - mutate(new=gsub('Hyernima nipensis', 'Hieronyma nipensis', new)) %>% - mutate(new=gsub('Hyeronima', 'Hieronyma', new)) %>% - mutate(new=gsub('Hypocal angusti', 'Hypocalymma angustifolium', new)) %>% - mutate(new=gsub('Hypocalym nambung', 'Hypocalymma', new)) %>% - mutate(new=gsub('Hyprium', 'Hypericum', new)) %>% - mutate(new=gsub('Igelkolben', 'Sparganium', new)) %>% - mutate(new=gsub('Ilexã‚â paraguariensis', 'Ilex', new)) %>% - mutate(new=gsub('Ipomea', 'Ipomoea', new)) %>% - mutate(new=gsub('Ipomoena', 'Ipomoea', new)) %>% - mutate(new=gsub('Jm kürbis stark behaart', 'Cucurbitaceae', new)) %>% - mutate(new=gsub('Juncaginacee/triglochin', 'Triglochin', new)) %>% - mutate(new=gsub('Juncas', 'Juncus', new)) %>% - mutate(new=gsub('Keilblatt cyperus', 'Cyperus', new)) %>% - mutate(new=gsub('Khh 3010 polygalacee', 'Polygalaceae', new)) %>% - mutate(new=gsub(' Khh 3014 liliacee 3f„ch. kapsel schwarze samen', 'Liliaceae', new)) %>% - mutate(new=gsub('Khh 3024 brachiaria', 'Brachiaria', new)) %>% - mutate(new=gsub('Khh 3025 liliaceae gelbe blten breite bl„tter', 'Liliaceae', new)) %>% - mutate(new=gsub('Khh 3037 ficus', 'Ficus', new)) %>% - mutate(new=gsub('Khh 3054 ficus iteophylla miq.', 'Ficus', new)) %>% - mutate(new=gsub('Kl. 
borstgras', 'Poaceae', new)) %>% - mutate(new=gsub('Kleine malvaceae', 'Malvaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Kletter", - values="Asteraceae")) %>% - mutate(new=gsub('Klimmer asclepiadaceae', 'Asclepiadaceae', new)) %>% - mutate(new=gsub('Klimmer curcuvitaceae', 'Cucurbitaceae', new)) %>% - mutate(new=gsub('Kl. sauergras', 'Cyperaceae', new)) %>% - mutate(new=gsub('Knabenkraut gefleckt', 'Orchis', new)) %>% - mutate(new=gsub('Knubbelblüt. gras haarkranz vgl f', 'Poaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Koenigskerze", - values="Verbascum")) %>% - mutate(new=gsub('Kriechgras zynodon', 'Poaceae', new)) %>% - mutate(new=gsub('Kürbis', 'Cucurbitaceae', new)) %>% - mutate(new=gsub('Lamiaceen strauch', 'Lamiaceae', new)) %>% - mutate(new=gsub('Lamiacee orange', 'Lamiaceae', new)) %>% - mutate(new=gsub('Lamiales orobanchaceae + phrymaceae + plantaginaceae + scrophulariaceae', 'Orobanchaceae', new)) %>% - mutate(new=gsub('Lantanacamara wandelrösschen', 'Lantana camara', new)) %>% - mutate(new=gsub('Lasiopeta watheroo k. shepherd & c. 
wilkins ks', 'Lasiopetalum', new)) %>% - mutate(new=gsub('Leg-inderteminada', 'Fabaceae', new)) %>% - mutate(new=gsub('Legu 1fiedrig groá schlank', 'Fabaceae', new)) %>% - mutate(new=gsub('Legume$', 'Fabaceae', new)) %>% - mutate(new=gsub('Leguminosae spgm', 'Fabaceae', new)) %>% - mutate(new=gsub('Leguminosea', 'Fabaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Leguminose", - values="Fabaceae")) %>% - mutate(new=gsub('Leheelo grass', 'Poaceae', new)) %>% - mutate(new=gsub('Lepid carra', 'Lepiderema', new)) %>% - mutate(new=gsub('Lich caloplaca', 'Caloplaca', new)) %>% - mutate(new=gsub('Liliacee', 'Liliaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Lilie", - values="Liliaceae")) %>% - mutate(new=gsub('Liliengewächs', 'Liliaceae', new)) %>% - mutate(new=gsub('Lisea', 'Litsea', new)) %>% - mutate(new=gsub('Lisymachia', 'Lysimachia', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Liverwort", - values="Bryophyta")) %>% - mutate(new=gsub('Livwort', 'Bryophyta', new)) %>% - mutate(new=gsub('Lonicerachrysantha', 'Lonicera chrysantha', new)) %>% - mutate(new=gsub('Lycoctamnus barbatus', 'Aconitum barbatum', new)) %>% - mutate(new=gsub('Lygopus', 'Lycopus', new)) %>% - mutate(new=gsub('Maitenus', 'Maytenus', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Malpighiace", - values="Malpighiaceae")) %>% - mutate(new=gsub('Malpighiales chrysobalanaceae + humiriaceae', 'Malpighiaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Malve", - values="Malvaceae")) %>% - mutate(new=replace(new, - list=word(new, 1)=="Mammutgras", - values="Poaceae")) %>% - mutate(new=gsub('Mammutgrass', 'Poaceae', new)) %>% - mutate(new=gsub('Maqui guian', 'Maquira guianensis subsp. 
costaricana', new)) %>% - mutate(new=gsub('Marchantiophyta', 'Bryophyta', new)) %>% - mutate(new=gsub('Mariana aphylla', 'Maireana aphylla', new)) %>% - mutate(new=gsub('Mehrfingeriges ährengras', 'Poaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Melastomata", - values="Melastomataceae")) %>% - mutate(new=gsub('Mesembr minibl', 'Mesembryanthemum', new)) %>% - mutate(new=gsub('Mesostomma kotschyanum', 'Mesostemma kotschyana', new)) %>% - mutate(new=gsub('Microhepatics', 'Bryophyta', new)) %>% - mutate(new=gsub('Micromeria micrantha', 'Micromeria graeca subsp. micrantha', new)) %>% - mutate(new=gsub('Mimose minifiedrig f', 'Fabaceae', new)) %>% - mutate(new=gsub('Miniepilobium', 'Epilobium', new)) %>% - mutate(new=gsub('Minimargerite', 'Asteraceae', new)) %>% - mutate(new=gsub('Miniochna', 'Ochna', new)) %>% - mutate(new=gsub('Minischilf 132466 f', 'Poaceae', new)) %>% - mutate(new=gsub('Mistletoe', 'Viscum', new)) %>% - mutate(new=gsub('Mniaecia', 'Mniaceae', new)) %>% - mutate(new=gsub('Molemo', 'Turraea', new)) %>% - mutate(new=gsub('Molses', 'Bryophyta', new)) %>% - mutate(new=gsub('Momisa pigra', 'Mimosa pigra', new)) %>% - mutate(new=gsub('Monandrus squarrosus', 'Cyperus squarrosus', new)) %>% - mutate(new=gsub('Monchema debile', 'Monechma debile', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Monochna", - values="Polygalaceae")) %>% - mutate(new=replace(new, - list=word(new, 1)=="Moos", - values="Bryophyta")) %>% - mutate(new=gsub('Moospolster grau-grün', 'Bryophyta', new)) %>% - mutate(new=gsub('Mortonioden ', 'Mortoniodendron ', new)) %>% - mutate(new=gsub('Mos onbekend', 'Bryophyta', new)) %>% - mutate(new=gsub('Mossen overige', 'Bryophyta', new)) %>% - mutate(new=gsub('Mougetia', 'Mougeotia', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Musci", - values="Bryophyta")) %>% - mutate(new=gsub('Myciantes', 'Myrcianthes', new)) %>% - mutate(new=gsub('Myrciaã‚â pulchra', 'Myrcia pulchra', new)) %>% - 
mutate(new=gsub('Myrcianov.', 'Myrcia', new, fixed = T)) %>% - mutate(new=gsub('Myrsi coria', 'Myrsine coriacea', new)) %>% - mutate(new=gsub('Myrtaceenstrauch', 'Myrtaceae', new)) %>% - mutate(new=gsub('Nachtkerze fru dreispaltig', 'Onagracaee', new)) %>% - mutate(new=gsub('Neobartsia crenoloba', 'Bartsia crenoloba', new)) %>% - mutate(new=gsub('None$', 'Nonea', new)) %>% - mutate(new=gsub('Ocos adenophylla', 'Symplocos adenophylla', new)) %>% - mutate(new=gsub('Officinale subsp. group', 'Taraxacum officinale s.l.', new)) %>% - mutate(new=gsub('Orch$', 'Orchidaceae', new)) %>% - mutate(new=gsub('Orchid', 'Orchidaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Orchidee", - values="Orchidaceae")) %>% - mutate(new=replace(new, - list=word(new, 1) %in% c("Papilonacea", "Papilionacea"), - values="Fabaceae")) %>% - mutate(new=gsub('Pasania dodoniifolia', 'Lithocarpus dodonaeifolius', new)) %>% - mutate(new=gsub('Phoebengmoensis', 'Phoebe hungmoensis', new)) %>% - mutate(new=gsub('Picra antid$', 'Picramnia antidesma subsp. fessonia', new)) %>% - mutate(new=gsub('Pinopsida', 'Coniferae', new)) %>% - mutate(new=gsub('Pisonianov.', 'Pisonia', new, fixed=T)) %>% - mutate(new=gsub('Pithecellob ', 'Pithecellobium ', new)) %>% - mutate(new=gsub('Pithecocten', 'Pithecoctenium', new)) %>% - mutate(new=gsub('Pleradenoph longicuspis', 'Pleradenophora longicuspis', new)) %>% - mutate(new=gsub('Pleuranthod ', 'Pleuranthodendron ', new)) %>% - mutate(new=gsub('Poales', 'Poaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1) %in% c("Polygalacea", "Polygalacee"), - values="Polygalaceae")) %>% - mutate(new=replace(new, - list=word(new, 1) %in% c("Polygonaceae", "Polygonacee"), - values="Polygonaceae")) %>% - mutate(new=gsub('Polygonumlongisetum', 'Polygonum longisetum', new)) %>% - mutate(new=gsub('Posoq coria subsp. maxima', 'Posoqueria coriacea subsp. 
maxima', new)) %>% - mutate(new=gsub('Prosthecidi ', 'Prosthecidiscus ', new)) %>% - mutate(new=gsub('Pseudo bidens', '', new)) %>% - mutate(new=replace(new, - list=word(new, 1) %in% - c("Pseudobriza", "Pseudofingergras", - "Pseudogerste", "Puschelgras", "Quecke", - "Queckenblatt", "Queckengras", - "Roggen/hafer", "Ruchgras", "Silbergras", - "Suessgras"), - values="Poaceae")) %>% - mutate(new=gsub('Ptarmica', 'Achillea', new)) %>% - mutate(new=gsub('Pterost cauline leaves n. gibson & m.n. lyons', 'Pterostegia', new)) %>% - mutate(new=gsub('Quararibeaã‚â guianensis', 'Quararibea guianensis', new)) %>% - mutate(new=gsub('Rainfarn f', 'Asteraceae', new)) %>% - mutate(new=gsub('Ranke ipomoea', 'Ipomoea', new)) %>% - mutate(new=gsub('Ranke rubiaceae', 'Rubiaceae', new)) %>% - mutate(new=gsub('Rauwolfia', 'Rauvolfia', new)) %>% - mutate(new=gsub('Rheinfarn', 'Asteraceae', new)) %>% - mutate(new=gsub('Rhodostemon kunthiana', 'Rhodostemonodaphne kunthiana', new)) %>% - mutate(new=gsub('Riccardia/aneura', 'Bryophyta', new)) %>% - mutate(new=gsub('Rietgras steril 134051a', 'Poaceae', new)) %>% - mutate(new=gsub('Rosenbergio formosum', 'Rosenbergiodendron formosum', new)) %>% - mutate(new=gsub('Rotes puschelgras', 'Poaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Rubiacea", - values="Rubiaceae")) %>% - mutate(new=gsub('Rytidospe goomallin a.g. gunness et al. oakp 10/', 'Rytidosperma', new)) %>% - mutate(new=gsub('Salacia idoensis', 'Salacia', new)) %>% - mutate(new=gsub('Samphire', 'Amaranthaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1) %in% - c("Sauergras", "Schlanksegge", "Sedge", - "Segge", "Simse"), - values="Cyperaceae")) %>% - mutate(new=gsub('Scaev repen subsp. north sandp r.j. cranf & p.j. 
spenc', 'Scaevola repens', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Schachtelhalm", - values="Equisetaceae")) %>% - mutate(new=replace(new, - list=word(new, 1)=="Schnittlauch", - values="Amaryllidaceae")) %>% - mutate(new=gsub('Schwertlilie trocken', 'Iridaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1) %in% c("Scropholacea", "Scrophulariacea", "Scroph."), - values="Scrophulariacea")) %>% - mutate(new=gsub('Sitzende onagraceae', 'Onagraceae', new)) %>% - mutate(new=gsub('Sonnenblume', 'Asteraceae', new)) %>% - mutate(new=gsub('Stachelgurke', 'Cucurbitaceae', new)) %>% - mutate(new=gsub('Stark behaarte malve', 'Malvaceae', new)) %>% - mutate(new=gsub('Staude asteraceae bl watteweich f', 'Asteraceae', new)) %>% - mutate(new=gsub('Staude crotalaria unterseite silber', 'Crotalaria', new)) %>% - mutate(new=gsub('Staude solanum', 'Solanaceae', new)) %>% - mutate(new=gsub('Staude tephrosia', 'Tephrosia', new)) %>% - mutate(new=gsub('Stipagrosist panicle gross', 'Stipagrostis', new)) %>% - mutate(new=gsub('Asteraceae u silber', 'Asteraceae', new)) %>% - mutate(new=gsub('Stratonostoc communeá', 'Stratonostoc commune', new)) %>% - mutate(new=gsub('Strauch asteraceae nadelblätt.', 'Asteraceae', new)) %>% - mutate(new=gsub('Strauch blatt wie salix reticulata astera', 'Asteraceae', new)) %>% - mutate(new=gsub('Strauch blatt wie salix reticulata astera 132534b', 'Asteraceae', new)) %>% - mutate(new=gsub('Strauch fabaceae gerieft schote', 'Fabaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1)=="Strauch" & - word(new,2)=="Rubiaceae", - values="Rubiaceae")) %>% - mutate(new=gsub('Fabaceae samtig bl lanzettlich', 'Fabaceae', new)) %>% - mutate(new=gsub('Ochna mini', 'Ochna', new)) %>% - mutate(new=gsub('Stryphnoden microstachyum', 'Stryphnodendron microstachyum', new)) %>% - mutate(new=gsub('Sumpfgladiole haarig', 'Gladiolus', new)) %>% - mutate(new=gsub('Sygnum ramphicarpa', 'Scrophulariaceae', new)) %>% - mutate(new=replace(new, - 
list=word(new, 1)=="Symplococar", - values="Symplococarpon")) %>% - mutate(new=gsub('Sysirinchium', 'Sisyrinchium', new)) %>% - mutate(new=gsub('Syzigium accuminatisima', 'Syzygium acuminatissimum', new)) %>% - mutate(new=gsub('Tabernaemon ', 'Tabernaemontana ', new)) %>% - mutate(new=gsub('Thalassodend', 'Thalassodendron', new)) %>% - mutate(new=gsub('Thinouia canescens', 'Thinouia', new)) %>% - mutate(new=gsub('Thistle', 'Asteraceae', new)) %>% - mutate(new=gsub('Trisetumicatum', 'Trisetum spicatum', new)) %>% - mutate(new=gsub('Undetermined sedge', 'Cyperaceae', new)) %>% - mutate(new=replace(new, - list=word(new, 1) %in% - c("Liverwort", "Liverworts", "Moss"), - values="Bryophyta")) %>% - mutate(new=gsub('Vismi bacci', 'Vismia baccifera subsp. ferruginea', new)) %>% - mutate(new=gsub('Weidenr”schen', 'Onagraceae', new)) %>% - mutate(new=gsub('Weißpelziger brauner Spross Asteracea', 'Asteraceae', new)) %>% - mutate(new=gsub('Wie stipagrostis', 'Poaceae', new)) %>% - mutate(new=gsub('Wincassia', 'Fabaceae', new)) %>% - mutate(new=gsub('xDactyloden st-quintini', 'Dactylodenia st-quintinii', new)) %>% - mutate(new=gsub('Zizyphus sp1 IUCN1', 'Zizyphus', new)) %>% - mutate(new=gsub('Zwiebel Lilaceae steril', 'Lilaceae', new)) %>% - mutate(new=gsub('Zwstr faurea', 'Faurea', new)) %>% - mutate(new=gsub('Quercus crispla', 'Quercus crispula', new)) %>% - mutate(new=gsub('Corallorrhiza', 'Corallorhiza', new)) - - + mutate(new=old) # delete remaining records of mushroom species tnrs.submit.iter2 <- tnrs.submit.iter2 %>% @@ -1620,40 +1614,6 @@ Backbone <- Backbone %>% Create fields `is_vascular_species` and `Taxon group` based on list of family manually classified, and on phyla from `The Catalogue of Life`. 
Assign all families that belong to `Tracheophyta` to category `is_vascular_species`, based on ```{r} -vascular <- c("Leguminosae" , "Alliaceae", "Bombacaceae" ,"Taxodiaceae", - "Aceraceae", "Centrolepidaceae","Callitrichaceae" ,"Flacourtiaceae", - "Compositae", "Asclepiadaceae", "Papilionaceae","Tiliaceae", - "Mimosaceae" , "Xanthorrhoeaceae","Arthropteridaceae", - "Valerianaceae", "Grammitidaceae" ,"Anarthriaceae", "Caesalpiniaceae", - "Chenopodiaceae", "Corylaceae", "Diervillaceae", "Dipsacaceae","Guttiferae", - "Haptanthaceae", "Hymenophyllopsidaceae", "Isoëtaceae","Labiatae", - "Lactoridaceae","Lemnaceae","Selaginaceae","Sterculiaceae","Myoporaceae", - "Myrsinaceae" ,"Pyrolaceae", "Rhoipteleaceae" ,"Xanthoceraceae") -lichens <- c("Acarosporaceae" , "Parmeliaceae", "Physciaceae", "Lichinaceae", - "Caliciaceae", "Lecanoraceae", "Venturiaceae" ,"Sphaerophoraceae" , - "Verrucariaceae", "Tricholomataceae","Baeomycetaceae", - "Catillariaceae" ,"Megasporaceae","Ramalinaceae","Pilocarpaceae" , - "Teloschistaceae","Candelariaceae","Rhizocarpaceae","Lecideaceae", - "Icmadophilaceae","Cladoniaceae","Collemataceae","Pannariaceae" , - "Lobariaceae", "Ophioparmaceae" ,"Psoraceae","Stereocaulaceae", - "Massalongiaceae","Peltigeraceae","Nephromataceae", "Umbilicariaceae" ) -lichen.genera <- c("Amygdalaria", "Anamylospora", "Arthonia", "Pertusaria", "Pyrenula","Opegrapha", - "Ochrolechia", "Graphis", "Micarea", "Porpidia", "Arthopyrenia", "Graphina", "Anisomeridium", - "Mycobilimbia","Peltula", "Thelotrema", "Arthothelium", "Diploschistes", "Strigula", - "Trichothelium", "Melaspilea", "Phaeographis", "Thelenella", "Chaenothecopsis","Fuscidea", - "Dactylospora", "Gyalecta", "Myriotrema", "Placynthium", "Umbilicaria", - "Lasallia", "Microthelia", "Lichenochora", "Roselliniopsis", "Homostegia", - "Verrucaria", "Leptorhaphis") -mosses <- c("Pilotrichaceae", "Chonecoleaceae", "Hypopterygiaceae", "Scorpidiaceae", - "Balantiopsaceae", "Mesoptychiaceae","Octoblepharaceae" 
,"Takakiaceae") -algae_diatoms <- c("Sargassaceae", "Chordaceae", "Cocconeidaceae", "Desmarestiaceae", - "Chordariaceae", "Dinobryaceae", "Diploneidaceae", "Ectocarpaceae", - "Fragilariaceae","Sphacelariaceae","Vaucheriaceae" , - "Amphipleuraceae", "Fucaceae", "Gomphonemataceae", "Melosiraceae", - "Laminariaceae","Acinetosporaceae" ,"Botryochloridaceae", - #diatoms below - "Thalassiosiraceae", "Cymbellaceae", "Naviculaceae","Bacillariaceae") - Backbone <- Backbone %>% mutate(is_vascular_species=ifelse(phylum=="Tracheophyta", T, F)) %>% mutate(is_vascular_species=replace(is_vascular_species, @@ -1975,6 +1935,61 @@ length(unique(Backbone$Family_correct)) **Done!** -------------------- +# Appendix +## Create lists of genera manually classified into taxonomic groups +```{r eval=T, echo=F} +## fungi genera #NOT COMPLETE LIST +mushroom <- c("Mycena", "Boletus", "Russula","Calocybe","Collybia","Amanita","Amanitopsis","Coprinus", + "Galerina","Geoglossum","Hebeloma","Hydnum","Lactarius","Leucocarpia","Naucoria","Otidea","Polyporus", + "Sarcodom","Sarcoscyphus","Scleroderma","Stropharia","Tylopilus","Typhula", "Calyptella", "Chrysopsora", "Lacrymaria", "Dermoloma", + "Agaricus","Alnicola", "Amanitina", "Bovista", "Cheilymenia","Clavulinopsis", "Clitocybe", "Entoloma", "Geaster", "Inocybe", "Paxillus", + "Laccaria", "Laetiporus", "Lepista", "Macrolepiota", "Macrolepis", "Marasmius", "Panaeolus", "Psathyrella", "Psilocybe", + "Rickenella", "Sarcoscypha", "Vascellum", "Ramaria", "Agrocybe", + "Flammulaster", "Phaeocollybia", "Cortinarius", "Lepiota", "Cystoderma", + "Armillaria", "Athelia", "Ceraceomyces", "Chlorociboria", "Clavariaceae", + "Cystoderma", "Dacrymyces","Dendrographa","Dirina", "Flammulaster","Fomes","Gyrophora", + "Kirschsteiniothelia", "Lepiota","Llimoniella","Mazosia","Mollisia", + "Multiclavula","Phaeocollybia","Phellinus","Plectocarpon","Pleospora","Ramariopsis","Reinkella", + 
"Roccella","Roccellina","Sigridea","Stereum","Tremella","Tulostoma","Unguiculariopsis" , + "Xanthoconium") + +vascular <- c("Leguminosae" , "Alliaceae", "Bombacaceae" ,"Taxodiaceae", + "Aceraceae", "Centrolepidaceae","Callitrichaceae" ,"Flacourtiaceae", + "Compositae", "Asclepiadaceae", "Papilionaceae","Tiliaceae", + "Mimosaceae" , "Xanthorrhoeaceae","Arthropteridaceae", + "Valerianaceae", "Grammitidaceae" ,"Anarthriaceae", "Caesalpiniaceae", + "Chenopodiaceae", "Corylaceae", "Diervillaceae", "Dipsacaceae","Guttiferae", + "Haptanthaceae", "Hymenophyllopsidaceae", "Isoëtaceae","Labiatae", + "Lactoridaceae","Lemnaceae","Selaginaceae","Sterculiaceae","Myoporaceae", + "Myrsinaceae" ,"Pyrolaceae", "Rhoipteleaceae" ,"Xanthoceraceae") +lichens <- c("Acarosporaceae" , "Parmeliaceae", "Physciaceae", "Lichinaceae", + "Caliciaceae", "Lecanoraceae", "Venturiaceae" ,"Sphaerophoraceae" , + "Verrucariaceae", "Tricholomataceae","Baeomycetaceae", + "Catillariaceae" ,"Megasporaceae","Ramalinaceae","Pilocarpaceae" , + "Teloschistaceae","Candelariaceae","Rhizocarpaceae","Lecideaceae", + "Icmadophilaceae","Cladoniaceae","Collemataceae","Pannariaceae" , + "Lobariaceae", "Ophioparmaceae" ,"Psoraceae","Stereocaulaceae", + "Massalongiaceae","Peltigeraceae","Nephromataceae", "Umbilicariaceae" ) +lichen.genera <- c("Amygdalaria", "Anamylospora", "Arthonia", "Pertusaria", "Pyrenula","Opegrapha", + "Ochrolechia", "Graphis", "Micarea", "Porpidia", "Arthopyrenia", "Graphina", "Anisomeridium", + "Mycobilimbia","Peltula", "Thelotrema", "Arthothelium", "Diploschistes", "Strigula", + "Trichothelium", "Melaspilea", "Phaeographis", "Thelenella", "Chaenothecopsis","Fuscidea", + "Dactylospora", "Gyalecta", "Myriotrema", "Placynthium", "Umbilicaria", + "Lasallia", "Microthelia", "Lichenochora", "Roselliniopsis", "Homostegia", + "Verrucaria", "Leptorhaphis") +mosses <- c("Pilotrichaceae", "Chonecoleaceae", "Hypopterygiaceae", "Scorpidiaceae", + "Balantiopsaceae", "Mesoptychiaceae","Octoblepharaceae" 
,"Takakiaceae") +algae_diatoms <- c("Sargassaceae", "Chordaceae", "Cocconeidaceae", "Desmarestiaceae", + "Chordariaceae", "Dinobryaceae", "Diploneidaceae", "Ectocarpaceae", + "Fragilariaceae","Sphacelariaceae","Vaucheriaceae" , + "Amphipleuraceae", "Fucaceae", "Gomphonemataceae", "Melosiraceae", + "Laminariaceae","Acinetosporaceae" ,"Botryochloridaceae", + #diatoms below + "Thalassiosiraceae", "Cymbellaceae", "Naviculaceae","Bacillariaceae") + +save(mushroom, vascular, lichens, lichen.genera, mosses, algae_diatoms, file="../derived/taxa_manual.RData") + +``` # `R`-settings diff --git a/code/07_buildCWMs.Rmd b/code/07_buildCWMs.Rmd index 68e590f..1c4aa8c 100644 --- a/code/07_buildCWMs.Rmd +++ b/code/07_buildCWMs.Rmd @@ -492,13 +492,14 @@ sum(is.na(DT.gf$GrowthForm)) ``` Step 2: Select most common species without growth-trait information to export and check manually -```{r, eval=F} +```{r} top.gf.nas <- DT.gf %>% filter(is.na(GrowthForm)) %>% group_by(species) %>% summarize(n=n()) %>% arrange(desc(n)) - +``` +```{r, eval=F} write_csv(top.gf.nas %>% filter(n>1000), path="../_derived/Species_missingGF.csv") @@ -524,8 +525,8 @@ Step 3: Import additional data on growth-form from TRY (Accessed 10 March 2020). 
#sed "s/'/\\'/g" 8854.txt > 8854_test.csv ``` -```{r} -all.gf <- read_delim("../_input/TRY5.0_v1.1/8854_test.txt", delim="\t") +```{r, message=F} +all.gf0 <- read_delim("../_input/TRY5.0_v1.1/8854_test.txt", delim="\t") all.gf <- all.gf0 %>% filter(TraitID==42) %>% @@ -534,9 +535,11 @@ all.gf <- all.gf0 %>% mutate(GrowthForm0=tolower(GrowthForm0)) %>% filter(AccSpeciesName %in% sPlot.species$species) %>% mutate(GrowthForm_simplified= GrowthForm0) %>% - mutate(GrowthForm_simplified=replace(GrowthForm_simplified, list=str_detect(GrowthForm0, - "vine|climber|liana|carnivore|epiphyte|^succulent|lichen|parasite| - hydrohalophyte|aquatic|cactous|parasitic|hydrophytes|carnivorous"), "other")) %>% + mutate(GrowthForm_simplified=replace(GrowthForm_simplified, + list=str_detect(GrowthForm0, + "vine|climber|liana|carnivore|epiphyte|^succulent|lichen|parasite| + hydrohalophyte|aquatic|cactous|parasitic|hydrophytes|carnivorous"), + "other")) %>% mutate(GrowthForm_simplified=replace(GrowthForm_simplified, list=str_detect(GrowthForm0, "tree|conifer|^woody$|palmoid|mangrove|gymnosperm"), "tree")) %>% mutate(GrowthForm_simplified=replace(GrowthForm_simplified, list=str_detect(GrowthForm0, "shrub|scrub|bamboo"), "shrub")) %>% mutate(GrowthForm_simplified=replace(GrowthForm_simplified, list=str_detect(GrowthForm0, "herb|sedge|graminoid|fern|forb|herbaceous|grass|chaemaephyte|geophyte|annual"), "herb")) %>% -- GitLab