rotl/0000755000176200001440000000000013543642072011240 5ustar liggesusersrotl/NAMESPACE0000644000176200001440000000631313543632526012465 0ustar liggesusers# Generated by roxygen2: do not edit by hand S3method(`[`,otl_ott_id) S3method(candidate_for_synth,study_meta) S3method(flags,match_names) S3method(flags,taxon_info) S3method(flags,taxon_mrca) S3method(get_publication,study_meta) S3method(get_study_year,study_meta) S3method(get_tree_ids,study_meta) S3method(inspect,match_names) S3method(is_in_tree,default) S3method(is_in_tree,otl_ott_id) S3method(is_suppressed,match_names) S3method(is_suppressed,taxon_info) S3method(is_suppressed,taxon_mrca) S3method(list_trees,matched_studies) S3method(ott_id,match_names) S3method(ott_id,taxon_info) S3method(ott_id,taxon_mrca) S3method(ott_id,tol_mrca) S3method(ott_id,tol_node) S3method(ott_id,tol_summary) S3method(print,study_external_data) S3method(print,study_ids) S3method(print,study_meta) S3method(print,tnrs_contexts) S3method(print,tol_mrca) S3method(print,tol_node) S3method(print,tol_summary) S3method(source_list,tol_mrca) S3method(source_list,tol_node) S3method(source_list,tol_summary) S3method(synonyms,match_names) S3method(synonyms,taxon_info) S3method(tax_lineage,taxon_info) S3method(tax_lineage,tol_node) S3method(tax_name,match_names) S3method(tax_name,taxon_info) S3method(tax_name,taxon_mrca) S3method(tax_name,tol_mrca) S3method(tax_name,tol_node) S3method(tax_name,tol_summary) S3method(tax_rank,match_names) S3method(tax_rank,taxon_info) S3method(tax_rank,taxon_mrca) S3method(tax_rank,tol_mrca) S3method(tax_rank,tol_node) S3method(tax_rank,tol_summary) S3method(tax_sources,match_names) S3method(tax_sources,taxon_info) S3method(tax_sources,taxon_mrca) S3method(tax_sources,tol_mrca) S3method(tax_sources,tol_node) S3method(tax_sources,tol_summary) S3method(tol_lineage,tol_node) S3method(unique_name,match_names) S3method(unique_name,taxon_info) S3method(unique_name,taxon_mrca) S3method(unique_name,tol_mrca) S3method(unique_name,tol_node) S3method(unique_name,tol_summary) S3method(update,match_names) export(candidate_for_synth) export(flags) export(get_publication) export(get_study) export(get_study_meta) export(get_study_subtree) export(get_study_tree) export(get_study_year) export(get_tree_ids) export(inspect) export(is_in_tree) export(is_suppressed) export(list_trees) export(ott_id) export(source_list) export(strip_ott_ids) export(studies_find_studies) export(studies_find_trees) export(studies_properties) export(study_external_IDs) export(synonyms) export(tax_lineage) export(tax_name) export(tax_rank) export(tax_sources) export(taxon_external_IDs) export(taxonomy_about) export(taxonomy_mrca) export(taxonomy_subtree) export(taxonomy_taxon_info) export(tnrs_contexts) export(tnrs_infer_context) export(tnrs_match_names) export(tol_about) export(tol_induced_subtree) export(tol_lineage) export(tol_mrca) export(tol_node_info) export(tol_subtree) export(unique_name) import(ape) importFrom(assertthat,assert_that) importFrom(assertthat,is.flag) importFrom(assertthat,is.string) importFrom(httr,GET) importFrom(httr,POST) importFrom(httr,content) importFrom(httr,parse_url) importFrom(jsonlite,fromJSON) importFrom(jsonlite,toJSON) importFrom(jsonlite,unbox) importFrom(rentrez,entrez_link) importFrom(rentrez,entrez_search) importFrom(rncl,read_newick_phylo) importFrom(stats,na.omit) importFrom(stats,setNames) importFrom(stats,update) rotl/LICENSE0000644000176200001440000000011713056156657012254 0ustar liggesusersYEAR: 2017 COPYRIGHT HOLDER: Francois Michonneau, Joseph W. Brown, David Winterrotl/README.md0000644000176200001440000001455613543633314012531 0ustar liggesusers [![Build Status](https://travis-ci.org/ropensci/rotl.svg?branch=master)](https://travis-ci.org/ropensci/rotl) [![Build status](https://ci.appveyor.com/api/projects/status/qr4k9a8wlrjl65rp?svg=true)](https://ci.appveyor.com/project/ropensci/rotl) [![codecov.io](https://codecov.io/github/ropensci/rotl/coverage.svg?branch=master)](https://codecov.io/github/ropensci/rotl?branch=master) [![](http://www.r-pkg.org/badges/version/rotl)](http://www.r-pkg.org/pkg/rotl) [![CRAN RStudio mirror downloads](http://cranlogs.r-pkg.org/badges/rotl)](http://www.r-pkg.org/pkg/rotl) [![](https://badges.ropensci.org/17_status.svg)](https://github.com/ropensci/onboarding/issues/17) [![Project Status: Active – The project has reached a stable, usable state and is being actively developed.](https://www.repostatus.org/badges/latest/active.svg)](https://www.repostatus.org/#active) # An R interface to Open Tree API `rotl` is an R package to interact with the Open Tree of Life data APIs. It was initially developed as part of the [NESCENT/OpenTree/Arbor hackathon](http://blog.opentreeoflife.org/2014/06/11/apply-for-tree-for-all-a-hackathon-to-access-opentree-resources/). Client libraries to interact with the Open Tree of Life API also exists for [Python](https://github.com/OpenTreeOfLife/pyopentree) and [Ruby](https://github.com/SpeciesFileGroup/bark). ## Installation The current stable version is available from CRAN, and can be installed by typing the following at the prompt in R: ``` r install.packages("rotl") ``` If you want to test the development version, you first need to install the `remotes` package. ``` r install.packages("remotes") ``` Then you can install `rotl` using: ``` r remotes::install_github("ropensci/rotl") ``` ## Vignettes There are three vignettes: - Start by checking out the “How to use `rotl`?” by typing: `vignette("rotl", package="rotl")` after installing the package. - Then explore how you can use `rotl` with other packages to combine your data with trees from the Open Tree of Life project by typing: `vignette("data_mashups", package="rotl")`. - The vignette “Using the Open Tree Synthesis in a comparative analsysis” demonstrates how you can reproduce an analysis of a published paper by downloading the tree they used, and data from the supplementary material: `vignette("meta-analysis", package="rotl")`. The vignettes are also available from CRAN: [How to use `rotl`?](https://cran.r-project.org/package=rotl/vignettes/rotl.html), [Data mashups](https://cran.r-project.org/package=rotl/vignettes/data_mashups.html), and [Using the Open Tree synthesis in a comparative analysis](https://cran.r-project.org/package=rotl/vignettes/meta-analysis.html). ## Quick start ### Get a little bit of the big Open Tree tree Taxonomic names are represented in the Open Tree by numeric identifiers, the `ott_ids` (Open Tree Taxonomy identifiers). To extract a portion of a tree from the Open Tree, you first need to find `ott_ids` for a set of names using the `tnrs_match_names` function: ``` r library(rotl) apes <- c("Pongo", "Pan", "Gorilla", "Hoolock", "Homo") (resolved_names <- tnrs_match_names(apes)) ``` ## search_string unique_name approximate_match ott_id is_synonym flags ## 1 pongo Pongo FALSE 417949 FALSE ## 2 pan Pan FALSE 417957 FALSE ## 3 gorilla Gorilla FALSE 417969 FALSE ## 4 hoolock Hoolock FALSE 712902 FALSE ## 5 homo Homo FALSE 770309 FALSE ## number_matches ## 1 2 ## 2 2 ## 3 1 ## 4 1 ## 5 1 Now we can get the tree with just those tips: ``` r tr <- tol_induced_subtree(ott_ids = ott_id(resolved_names)) ``` ## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes ## with labels: Ponginae ott1082538, Hylobatidae ott166544 ``` r plot(tr) ``` ![](https://i.imgur.com/KTApZbS.png) The code above can be summarized in a single pipe: ``` r library(magrittr) ## or expressed as a pipe: c("Pongo", "Pan", "Gorilla", "Hoolock", "Homo") %>% tnrs_match_names() %>% ott_id() %>% tol_induced_subtree() %>% plot() ``` ## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes ## with labels: Ponginae ott1082538, Hylobatidae ott166544 ![](https://i.imgur.com/1TCS3iA.png) ## Citation and Manuscript To cite `rotl` in publications pleases use: > Michonneau, F., Brown, J. W. and Winter, D. J. (2016), rotl: an R > package to interact with the Open Tree of Life data. Methods in > Ecology and Evolution. 7(12):1476-1481. doi: > [10.1111/2041-210X.12593](https://doi.org/10.1111/2041-210X.12593) You may also want to cite the paper for the Open Tree of Life > Hinchliff, C. E., et al. (2015). Synthesis of phylogeny and taxonomy > into a comprehensive tree of life. Proceedings of the National Academy > of Sciences 112.41 (2015): 12764-12769 doi: > [10.1073/pnas.1423041112](https://doi.org/10.1073/pnas.1423041112) The manuscript in *Methods in Ecology and Evolution* includes additional examples on how to use the package. The manuscript and the code it contains are also hosted on GitHub at: ## Versioning Starting with v3.0.0 of the package, the major and minor version numbers (the first 2 digits of the version number) will be matched to those of the API. The patch number (the 3rd digit of the version number) will be used to reflect bug fixes and other changes that are independent from changes to the API. `rotl` can be used to access other versions of the API (if they are available) but most likely the high level functions will not work. Instead, you will need to parse the output yourself using the “raw” returns from the unexported low-level functions (all prefixed with a `.`). For instance to use the `tnrs/match_names` endpoint for `v2` of the API: ``` r rotl:::.tnrs_match_names(c("pan", "pango", "gorilla", "hoolock", "homo"), otl_v = "v2") ``` ### Code of Conduct Please note that this project is released with a [Contributor Code of Conduct](https://github.com/ropensci/rotl/blob/master/CONDUCT.md). By participating in this project you agree to abide by its terms. [![](http://ropensci.org/public_images/github_footer.png)](http://ropensci.org) rotl/man/0000755000176200001440000000000013543637134012016 5ustar liggesusersrotl/man/get_study_tree.Rd0000644000176200001440000000436113543603103015324 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies.R \name{get_study_tree} \alias{get_study_tree} \title{Study Tree} \usage{ get_study_tree( study_id = NULL, tree_id = NULL, object_format = c("phylo"), tip_label = c("original_label", "ott_id", "ott_taxon_name"), file_format, file, deduplicate = TRUE, ... ) } \arguments{ \item{study_id}{the identifier of a study (character)} \item{tree_id}{the identifier of a tree within the study} \item{object_format}{the class of the object to be returned (default and currently only possible value \code{phylo} from the \code{\link[ape]{ape}} package).} \item{tip_label}{the format of the tip labels. \dQuote{\code{original_label}} (default) returns the original labels as provided in the study, \dQuote{\code{ott_id}} labels are replaced by their ott IDs, \dQuote{\code{ott_taxon_name}} labels are replaced by their Open Tree Taxonomy taxon name.} \item{file_format}{the format of the file to be generated (\code{newick} default, \code{nexus}, or \code{json}).} \item{file}{the file name where the output of the function will be saved.} \item{deduplicate}{logical (default \code{TRUE}). If the tree returned by the study contains duplicated taxon names, should they be made unique? It is normally illegal for NEXUS/Newick tree strings to contain duplicated tip names. This is a workaround to circumvent this requirement. If \code{TRUE}, duplicated tip labels will be appended \code{_1}, \code{_2}, etc.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ if \code{file_format} is missing, an object of class \code{phylo}, otherwise a logical indicating whether the file was successfully created. } \description{ Returns a specific tree from within a study } \examples{ \dontrun{ tree <- get_study_tree(study_id="pg_1144", tree_id="tree2324") ## comparison of the first few tip labels depending on the options used head(get_study_tree(study_id="pg_1144", tree_id="tree2324", tip_label="original_label")$tip.label) head(get_study_tree(study_id="pg_1144", tree_id="tree2324", tip_label="ott_id")$tip.label) head(get_study_tree(study_id="pg_1144", tree_id="tree2324", tip_label="ott_taxon_name")$tip.label) } } rotl/man/rotl.Rd0000644000176200001440000000365613543603103013264 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/rotl-package.R \docType{package} \name{rotl} \alias{rotl} \title{An Interface to the Open Tree of Life API} \description{ The Open Tree of Life is an NSF funded project that is generating an online, comprehensive phylogenetic tree for 1.8 million species. \code{rotl} provides an interface that allows you to query and retrieve the parts of the tree of life that is of interest to you. } \details{ \code{rotl} provides function to most of the end points the API provides. The documentation of the API is available at: \url{https://github.com/OpenTreeOfLife/opentree/wiki/Open-Tree-of-Life-APIs} } \section{Customizing API calls}{ All functions that use API end points can take 2 arguments to customize the API call and are passed as \code{...} arguments. \itemize{ \item{ \code{otl_v} } { This argument controls which version of the API your call is using. The default value for this argument is a call to the non-exported function \code{otl_version()} which returns the current version of the Open Tree of Life APIs (v2).} \item{ \code{dev_url} } { This argument controls whether to use the development version of the API. By default, \code{dev_url} is set to \code{FALSE}, using \code{dev_url = TRUE} in your function calls will use the development version.} } For example, to use the development version of the API, you could use: \code{tnrs_match_names("anas", dev_url=TRUE)} Additional arguments can also be passed to the \code{\link[httr]{GET}} and \code{\link[httr]{POST}} methods. } \section{Acknowledgments}{ This package was started during the Open Tree of Life \href{http://blog.opentreeoflife.org/2014/06/11/apply-for-tree-for-all-a-hackathon-to-access-opentree-resources/}{Hackathon} organized by OpenTree, the NESCent Hackathon Interoperability Phylogenetic group, and Arbor. } rotl/man/studies_find_trees.Rd0000644000176200001440000000563113543603103016161 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies.R \name{studies_find_trees} \alias{studies_find_trees} \title{Find Trees} \usage{ studies_find_trees( property = NULL, value = NULL, verbose = FALSE, exact = FALSE, detailed = TRUE, ... ) } \arguments{ \item{property}{The property to be searched on (character)} \item{value}{The property-value to be searched on (character)} \item{verbose}{Should the output include all metadata? (logical, default \code{FALSE})} \item{exact}{Should exact matching be used for the value? (logical, default \code{FALSE})} \item{detailed}{Should a detailed report be provided? If \code{TRUE} (default), the output will include metadata about the study that include trees matching the property. Otherwise, only information about the trees will be provided.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ A data frame that summarizes the trees found (and their associated studies) for the requested criteria. If a study has more than 5 trees, the \code{tree_ids} of the first ones will be shown, followed by \code{...} to indicate that more are present. If \code{detailed=FALSE}, the data frame will include the study ids of the study (\code{study_ids}), the number of trees in this study that match the search criteria (\code{n_matched_trees}), the tree ids that match the search criteria (\code{match_tree_ids}). If \code{detailed=TRUE}, in addition of the fields listed above, the data frame will also contain the total number of trees associated with the study (\code{n_trees}), all the tree ids associated with the study (\code{tree_ids}), the tree id that is a potential candidate for inclusion in the synthetic tree (if any) (\code{candidate}), the year the study was published (\code{study_year}), the title of the study (\code{title}), the DOI for the study (\code{study_doi}). } \description{ Return a list of studies for which trees match a given set of properties } \details{ The list of possible values to be used as values for the argument \code{property} can be found using the function \code{\link{studies_properties}}. } \examples{ \dontrun{ res <- studies_find_trees(property="ot:ottTaxonName", value="Drosophilia", detailed=FALSE) ## summary of the trees and associated studies that match this criterion res ## With metadata about the studies (default) res <- studies_find_trees(property="ot:ottTaxonName", value="Drosophilia", detailed=TRUE) ## The list of trees for each study that match the search criteria list_trees(res) ## the trees for a given study list_trees(res, study_id = "pg_2769") } } \seealso{ \code{\link{studies_properties}} which lists properties the studies can be searched on. \code{\link{list_trees}} for listing the trees that match the query. } rotl/man/taxonomy_taxon_info.Rd0000644000176200001440000000445713543603103016406 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/taxonomy.R \name{taxonomy_taxon_info} \alias{taxonomy_taxon_info} \alias{tax_rank.taxon_info} \alias{tax_name.taxon_info} \alias{unique_name.taxon_info} \alias{synonyms.taxon_info} \alias{ott_id.taxon_info} \alias{tax_sources.taxon_info} \alias{is_suppressed.taxon_info} \alias{flags.taxon_info} \title{Taxon information} \usage{ taxonomy_taxon_info( ott_ids, include_children = FALSE, include_lineage = FALSE, include_terminal_descendants = FALSE, ... ) \method{tax_rank}{taxon_info}(tax, ...) \method{tax_name}{taxon_info}(tax, ...) \method{unique_name}{taxon_info}(tax, ...) \method{synonyms}{taxon_info}(tax, ...) \method{ott_id}{taxon_info}(tax, ...) \method{tax_sources}{taxon_info}(tax, ...) \method{is_suppressed}{taxon_info}(tax, ...) \method{flags}{taxon_info}(tax, ...) } \arguments{ \item{ott_ids}{the ott ids of the taxon of interest (numeric or character containing only numbers)} \item{include_children}{whether to include information about all the children of this taxon. Default \code{FALSE}.} \item{include_lineage}{whether to include information about all the higher level taxa that include the \code{ott_ids}. Default \code{FALSE}.} \item{include_terminal_descendants}{whether to include the list of terminal \code{ott_ids} contained in the \code{ott_ids} provided.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} \item{tax}{an object generated by the \code{taxonomy_taxon_info} function} } \value{ \code{taxonomy_taxon_info} returns a list detailing information about the taxa. \code{tax_rank} and \code{tax_name} return a vector. \code{synonyms} returns a list whose elements are the synonyms for each of the \code{ott_id} requested. } \description{ Information about taxa. } \details{ Given a vector of ott ids, \code{taxonomy_taxon_info} returns information about the specified taxa. The functions \code{tax_rank}, \code{tax_name}, and \code{synonyms} can extract this information from an object created by the \code{taxonomy_taxon_info()}. } \examples{ \dontrun{ req <- taxonomy_taxon_info(ott_id=515698) tax_rank(req) tax_name(req) synonyms(req) } } \seealso{ \code{\link{tnrs_match_names}} to obtain \code{ott_id} from a taxonomic name. } rotl/man/tol_subtree.Rd0000644000176200001440000000302013543603103014614 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tol.R \name{tol_subtree} \alias{tol_subtree} \title{Extract a subtree from the synthetic tree} \usage{ tol_subtree(ott_id = NULL, node_id = NULL, label_format = NULL, file, ...) } \arguments{ \item{ott_id}{Numeric. The ott id of the node in the tree that should serve as the root of the tree returned.} \item{node_id}{Character. The node id of the node in the tree that should serve as the root of the tree returned.} \item{label_format}{Character. Defines the label type; one of \dQuote{\code{name}}, \dQuote{\code{id}}, or \dQuote{\code{name_and_id}} (the default).} \item{file}{If specified, the function will write the subtree to a file in newick format.} \item{...}{additional arguments to customize the API call (see \code{\link{rotl}} for more information).} } \value{ If no value is specified to the \code{file} argument (default), a phylogenetic tree of class \code{phylo}. Otherwise, the function returns invisibly a logical indicating whether the file was successfully created. } \description{ Extract a subtree from the synthetic tree from an Open Tree node id. } \details{ Given a node, return the subtree of the synthetic tree descended from that node. The start node may be specified using either a node id or an ott id, but not both. If the specified node is not in the synthetic tree an error will be returned. There is a size limit of 25000 tips for this method. } \examples{ \dontrun{ res <- tol_subtree(ott_id=241841)} } rotl/man/source_list.Rd0000644000176200001440000000151113055075704014633 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/methods.R, R/tol.R \name{source_list} \alias{source_list} \alias{source_list.tol_summary} \title{List of studies used in the Tree of Life} \usage{ source_list(tax, ...) \method{source_list}{tol_summary}(tax, ...) } \arguments{ \item{tax}{a list containing a \code{source_id_map} slot.} \item{...}{additional arguments (currently unused)} } \value{ a data frame } \description{ Retrieve the detailed information for the list of studies used in the Tree of Life. } \details{ This function takes the object resulting from \code{tol_about(study_list = TRUE)}, \code{tol_mrca()}, \code{tol_node_info()}, and returns a data frame listing the \code{tree_id}, \code{study_id} and \code{git_sha} for the studies currently included in the Tree of Life. } rotl/man/studies_properties.Rd0000644000176200001440000000220313055075704016233 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies.R \name{studies_properties} \alias{studies_properties} \title{Properties of the Studies} \usage{ studies_properties(...) } \arguments{ \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ A list of the study properties that can be used to find studies and trees that are contributing to the synthetic tree. } \description{ Return the list of study properties that can be used to search studies and trees used in the synthetic tree. } \details{ The list returned has 2 elements \code{tree_properties} and \code{studies_properties}. Each of these elements lists additional arguments to customize the API request properties that can be used to search for trees and studies that are contributing to the synthetic tree. The definitions of these properties are available from \url{https://github.com/OpenTreeOfLife/phylesystem-api/wiki/NexSON} } \examples{ \dontrun{ all_the_properties <- studies_properties() unlist(all_the_properties$tree_properties) } } \seealso{ \code{\link{studies_find_trees}} } rotl/man/taxonomy_subtree.Rd0000644000176200001440000000440013543603103015677 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/taxonomy.R \name{taxonomy_subtree} \alias{taxonomy_subtree} \title{Taxonomy subtree} \usage{ taxonomy_subtree( ott_id = NULL, output_format = c("taxa", "newick", "phylo", "raw"), label_format = NULL, file, ... ) } \arguments{ \item{ott_id}{The ott id of the taxon of interest.} \item{output_format}{the format of the object to be returned. See the \sQuote{Return} section.} \item{label_format}{Character. Defines the label type; one of \dQuote{\code{name}}, \dQuote{\code{id}}, or \dQuote{\code{name_and_id}} (the default).} \item{file}{the file name where to save the output of the function. Ignored unless \code{output_format} is set to \dQuote{\code{phylo}}.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ If the \code{file} argument is missing: \itemize{ \item{\dQuote{\code{taxa}}} { a list of the taxa names (species) in slot \code{tip_label}, and higher-level taxonomy (e.g., families, genera) in slot \code{edge_label}, descending from the taxa corresponding to the \code{ott_id} provided. } \item{\dQuote{\code{newick}}} { a character vector containing the newick formatted string corresponding to the taxonomic subtree for the \code{ott_id} provided. } \item{\dQuote{\code{phylo}}} { an object of the class \code{phylo} from the \code{\link[ape]{ape}} package. } \item{\dQuote{\code{raw}}} { the direct output from the API, i.e., a list with an element named \sQuote{newick} that contains the subtree as a newick formatted string. } } If a \code{file} argument is provided (and \code{output_format} is set to \dQuote{\code{phylo}}), a logical indicating whether the file was successfully created. } \description{ Given an ott id, return the inclusive taxonomic subtree descended from the specified taxon. } \details{ If the output of this function is exported to a file, the only possible value for the \code{output_format} argument is \dQuote{\code{newick}}. If the file provided already exists, it will be silently overwritten. } \examples{ \dontrun{ req <- taxonomy_subtree(ott_id=515698) plot(taxonomy_subtree(ott_id=515698, output_format="phylo")) } } rotl/man/synonyms.match_names.Rd0000644000176200001440000000346713057544607016476 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/match_names.R \name{synonyms.match_names} \alias{synonyms.match_names} \title{List the synonyms for a given name} \usage{ \method{synonyms}{match_names}(tax, row_number, taxon_name, ott_id, ...) } \arguments{ \item{tax}{a data frame generated by the \code{\link{tnrs_match_names}} function} \item{row_number}{the row number corresponding to the name for which to list the synonyms} \item{taxon_name}{the taxon name corresponding to the name for which to list the synonyms} \item{ott_id}{the ott id corresponding to the name for which to list the synonyms} \item{...}{currently ignored} } \value{ a list whose elements are all synonym names (as vectors of character) for the taxonomic names that match the query (the names of the elements of the list). } \description{ When querying the Taxonomic Name Resolution Services for a particular taxonomic name, the API returns as possible matches all names that include the queried name as a possible synonym. This function allows you to explore other synonyms for an accepted name, and allows you to determine why the name you queried is returning an accepted synonym. } \details{ To list synonyms for a given taxonomic name, you need to provide the object resulting from a call to the \code{\link{tnrs_match_names}} function, as well as one of either the row number corresponding to the name in this object, the name itself (as used in the original query), or the ott_id listed for this name. Otherwise, the synonyms for all the currently matched names are returned. } \examples{ \dontrun{ echino <- tnrs_match_names(c("Diadema", "Acanthaster", "Fromia")) ## These 3 calls are identical synonyms(echino, taxon_name="Acanthaster") synonyms(echino, row_number=2) synonyms(echino, ott_id=337928) } } rotl/man/taxonomy-methods.Rd0000644000176200001440000000165713055075704015632 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/methods.R \name{tax_rank} \alias{tax_rank} \alias{ott_id} \alias{synonyms} \alias{tax_sources} \alias{is_suppressed} \alias{unique_name} \alias{tax_name} \title{Methods for Taxonomy} \usage{ tax_rank(tax, ...) ott_id(tax, ...) synonyms(tax, ...) tax_sources(tax, ...) is_suppressed(tax, ...) unique_name(tax, ...) tax_name(tax, ...) } \arguments{ \item{tax}{an object returned by \code{\link{taxonomy_taxon_info}}, \code{\link{taxonomy_mrca}}, or \code{\link{tnrs_match_names}}} \item{...}{additional arguments (see \code{\link{tnrs_match_names}})} } \description{ Methods for dealing with objects containing taxonomic information (Taxonomy, TNRS endpoints) } \details{ This is the page for the generic methods. See the help pages for \code{\link{taxonomy_taxon_info}}, \code{\link{taxonomy_mrca}}, and \code{\link{tnrs_match_names}} for more information. } rotl/man/tol_induced_subtree.Rd0000644000176200001440000000406213543603103016316 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tol.R \name{tol_induced_subtree} \alias{tol_induced_subtree} \title{Subtree from the Open Tree of Life} \usage{ tol_induced_subtree( ott_ids = NULL, node_ids = NULL, label_format = NULL, file, ... ) } \arguments{ \item{ott_ids}{Numeric vector. OTT ids indicating nodes to be used as tips in the induced tree.} \item{node_ids}{Character vector. Node ids indicating nodes to be used as tips in the induced tree.} \item{label_format}{Character. Defines the label type; one of \dQuote{\code{name}}, \dQuote{\code{id}}, or \dQuote{\code{name_and_id}} (the default).} \item{file}{If specified, the function will write the subtree to a file in newick format.} \item{...}{additional arguments to customize the API call (see \code{\link{rotl}} for more information).} } \value{ If no value is specified to the \code{file} argument (default), a phylogenetic tree of class \code{phylo}. Otherwise, the function returns invisibly a logical indicating whether the file was successfully created. Note that the tree returned when specifying a file name with the \code{file} argument is the \dQuote{raw} Newick string returned by Open Tree of Life. This string contains singleton nodes, and therefore will be different from the tree returned as a \code{phylo} object which will not contain these singleton nodes. } \description{ Return the induced subtree on the synthetic tree that relates a list of nodes. } \details{ Return a tree with tips corresponding to the nodes identified in the input set that is consistent with the topology of the current synthetic tree. This tree is equivalent to the minimal subtree induced on the draft tree by the set of identified nodes. } \examples{ \dontrun{ ## Result as a `phylo` object res <- tol_induced_subtree(ott_ids = c(292466, 267845, 316878, 102710)) ## Raw Newick string from Open Tree of Life tree_file <- tempfile(fileext = ".tre") tol_induced_subtree(ott_ids = c(292466, 267845, 316878, 102710), file=tree_file) } } rotl/man/tax_lineage.Rd0000644000176200001440000000163313055075704014565 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/methods.R, R/taxonomy.R \name{tax_lineage} \alias{tax_lineage} \alias{tax_lineage.taxon_info} \title{Lineage of a taxon} \usage{ tax_lineage(tax, ...) \method{tax_lineage}{taxon_info}(tax, ...) } \arguments{ \item{tax}{an object created by \code{\link{taxonomy_taxon_info}} using the argument \code{include_lineage=TRUE}.} \item{...}{additional arguments (currently unused).} } \value{ A list with one slot per taxon that contains a data frame with 3 columns: the taxonomy rank, the name, and unique name for all taxa included in the lineage of the taxon up to the root of the tree. } \description{ Extract the lineage information (higher taxonomy) from an object returned by \code{\link{taxonomy_taxon_info}}. } \details{ The object passed to this function must have been created using the argument \code{include_lineage=TRUE}. } rotl/man/list_trees.Rd0000644000176200001440000000244113543603103014450 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies-methods.R \name{list_trees} \alias{list_trees} \alias{list_trees.matched_studies} \title{List trees ids in objects returned by \code{\link{studies_find_studies}} and \code{\link{studies_find_trees}}.} \usage{ list_trees(matched_studies, ...) \method{list_trees}{matched_studies}(matched_studies, study_id, ...) } \arguments{ \item{matched_studies}{an object created by \code{studies_find_trees} or \code{studies_find_studies}.} \item{study_id}{a \code{study_id} listed in the object returned by \code{studies_find_trees}} \item{...}{Currently unused} } \value{ \code{list_trees} returns a list of the tree_ids for each study that match the requested criteria. If a \code{study_id} is provided, then only the trees for this study are returned as a vector. } \description{ \code{list_trees} returns all trees associated with a particular study when used on an object returned by \code{\link{studies_find_studies}}, but only the trees that match the search criteria when used on objects returned by \code{\link{studies_find_trees}}. } \seealso{ \code{\link{studies_find_studies}} and \code{\link{studies_find_trees}}. The help for these functions have examples demonstrating the use of \code{list_trees}. } rotl/man/tnrs_infer_context.Rd0000644000176200001440000000177113055075704016225 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tnrs.R \name{tnrs_infer_context} \alias{tnrs_infer_context} \title{Infer the taxonomic context from a list of names} \usage{ tnrs_infer_context(names = NULL, ...) } \arguments{ \item{names}{Vector of taxon names.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ A list including the context name, the context ott id and possibly the names in the query that have an ambiguous taxonomic meaning in the query. } \description{ Return a taxonomic context given a list of taxonomic names } \details{ Find the least inclusive taxonomic context that includes all the unambiguous names in the input set. Unambiguous names are names with exact matches to non-homonym taxa. Ambiguous names (those without exact matches to non-homonym taxa) are indicated in results. } \examples{ \dontrun{ res <- tnrs_infer_context(names=c("Stellula calliope", "Struthio camelus")) } } rotl/man/match_names-methods.Rd0000644000176200001440000000355613055075704016233 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/match_names.R, R/methods.R \name{ott_id.match_names} \alias{ott_id.match_names} \alias{flags.match_names} \alias{flags} \title{\code{ott_id} and \code{flags} for taxonomic names matched by \code{tnrs_match_names}} \usage{ \method{ott_id}{match_names}(tax, row_number, taxon_name, ott_id, ...) \method{flags}{match_names}(tax, row_number, taxon_name, ott_id, ...) flags(tax, ...) } \arguments{ \item{tax}{an object returned by \code{\link{tnrs_match_names}}} \item{row_number}{the row number corresponding to the name for which to list the synonyms} \item{taxon_name}{the taxon name corresponding to the name for which to list the synonyms} \item{ott_id}{the ott id corresponding to the name for which to list the synonyms} \item{...}{currently ignored} } \value{ A list of the ott ids or flags for the taxonomic names matched with \code{\link{tnrs_match_names}}, for either one or all the names. } \description{ \code{rotl} provides a collection of functions that allows users to extract relevant information from an object generated by \code{\link{tnrs_match_names}} function. } \details{ These methods optionally accept one of the arguments \code{row_number}, \code{taxon_name} or \code{ott_id} to retrieve the corresponding information for one of the matches in the object returned by the \code{\link{tnrs_match_names}} function. If these arguments are not provided, these methods can return information for the matches currently listed in the object returned by \code{\link{tnrs_match_names}}. } \examples{ \dontrun{ rsp <- tnrs_match_names(c("Diadema", "Tyrannosaurus")) rsp$ott_id # ott id for match currently in use ott_id(rsp) # similar as above but elements are named ## flags() is useful for instance to determine if a taxon is extinct flags(rsp, taxon_name="Tyrannosaurus") } } rotl/man/tnrs_contexts.Rd0000644000176200001440000000200513055075704015214 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tnrs.R \name{tnrs_contexts} \alias{tnrs_contexts} \title{TNRS contexts} \usage{ tnrs_contexts(...) } \arguments{ \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ Returns invisibly a list for each major clades (e.g., animals, microbes, plants, fungi, life) whose elements contains the possible contexts. } \description{ This function returns a list of pre-defined taxonomic contexts (i.e. clades) which can be used to limit the scope of tnrs queries. } \details{ Taxonomic contexts are available to limit the scope of TNRS searches. These contexts correspond to uncontested higher taxa such as 'Animals' or 'Land plants'. This service returns a list containing all available taxonomic context names, which may be used as input (via the \code{context_name} argument in other functions) to limit the search scope of other services including \code{\link{tnrs_match_names}}. } rotl/man/tol_about.Rd0000644000176200001440000000766013055075704014303 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tol.R \name{tol_about} \alias{tol_about} \alias{tax_rank.tol_summary} \alias{tax_sources.tol_summary} \alias{unique_name.tol_summary} \alias{tax_name.tol_summary} \alias{ott_id.tol_summary} \title{Information about the Tree of Life} \usage{ tol_about(include_source_list = FALSE, ...) \method{tax_rank}{tol_summary}(tax, ...) \method{tax_sources}{tol_summary}(tax, ...) \method{unique_name}{tol_summary}(tax, ...) \method{tax_name}{tol_summary}(tax, ...) \method{ott_id}{tol_summary}(tax, ...) } \arguments{ \item{include_source_list}{Logical (default = \code{FALSE}). Return an ordered list of source trees.} \item{...}{additional arguments to customize the API call (see \code{\link{rotl}} for more information).} \item{tax}{an object created with a call to \code{tol_about}.} } \value{ An invisible list of synthetic tree summary statistics: \itemize{ \item {date_created} {String. The creation date of the tree.} \item {num_source_studies} {Integer. The number of studies (publications)used as sources.} \item {num_source_trees} {The number of trees used as sources (may be >1 tree per study).} \item {taxonomy_version} {The Open Tree Taxonomy version used as a source.} \item {filtered_flags} {List. Taxa with these taxonomy flags were not used in construction of the tree.} \item {root} {List. Describes the root node:} \itemize{ \item {node_id} {String. The canonical identifier of the node.} \item {num_tips} {Numeric. The number of descendent tips.} \item {taxon} {A list of taxonomic properties:} \itemize{ \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ott_id).} \item {name} {String. The taxonomic name of the queried node.} \item {unique_name} {String. The string that uniquely identifies the taxon in OTT.} \item {rank} {String. The taxonomic rank of the taxon in OTT.} \item {tax_sources} {List. A list of identifiers for taxonomic sources, such as other taxonomies, that define taxa judged equivalent to this taxon.} } } \item {source_list} {List. Present only if \code{include_source_list} is \code{TRUE}. The sourceid ordering is the precedence order for synthesis, with relationships from earlier trees in the list having priority over those from later trees in the list. See \code{source_id_map} below for study details.} \item {source_id_map} {Named list of lists. Present only if \code{include_source_list} is \code{TRUE}. Names correspond to the \sQuote{sourceids} used in \code{source_list} above. Source trees will have the following properties:} \itemize{ \item {git_sha} {String. The git SHA identifying a particular source version.} \item {tree_id} {String. The tree id associated with the study id used.} \item {study_id} {String. The study identifier. Will typically include a prefix ("pg_" or "ot_").} } \item {synth_id} {The unique string for this version of the tree.} } } \description{ Basic information about the Open Tree of Life (the synthetic tree) } \details{ Summary information about the current draft tree of life, including information about the list of trees and the taxonomy used to build it. The object returned by \code{tol_about} can be passed to the taxonomy methods (\code{tax_name()}, \code{tax_rank()}, \code{tax_sources()}, \code{ott_id}), to extract relevant taxonomic information for the root of the synthetic tree. } \examples{ \dontrun{ res <- tol_about() tax_sources(res) ott_id(res) studies <- source_list(tol_about(include_source_list=TRUE))} } \seealso{ \code{\link{source_list}} to explore the list of studies used in the synthetic tree (see example). } rotl/man/taxon_external_IDs.Rd0000644000176200001440000000167513057544607016112 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/external_data.R \name{taxon_external_IDs} \alias{taxon_external_IDs} \title{Get external identifiers for data associated with an Open Tree taxon} \usage{ taxon_external_IDs(taxon_id) } \arguments{ \item{taxon_id}{An open tree study ID} } \value{ a data.frame in which each row represents a unique record in an external database. The column "source" provides and abbreviated name for the database, and "id" the unique ID for the record. } \description{ The Open Tree taxonomy is a synthesis of multiple reference taxonomies. This function retrieves identifiers to external taxonomic records that have contributed the rank, position and definition of a given Open Tree taxon. } \examples{ \dontrun{ gibbon_IDs <- taxon_external_IDs(712902) } } \seealso{ tnrs_matchnames, which can be used to search for taxa by name. taxonomy_taxon, for more information about a given taxon. } rotl/man/get_study_subtree.Rd0000644000176200001440000000432313543603103016034 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies.R \name{get_study_subtree} \alias{get_study_subtree} \title{Study Subtree} \usage{ get_study_subtree( study_id, tree_id, subtree_id, object_format = c("phylo"), tip_label = c("original_label", "ott_id", "ott_taxon_name"), file_format, file, deduplicate = TRUE, ... ) } \arguments{ \item{study_id}{the study identifier (character)} \item{tree_id}{the tree identifier (character)} \item{subtree_id, }{either a node id that specifies a subtree or \dQuote{ingroup} which returns the ingroup for this subtree.} \item{object_format}{the class of the object returned by the function (default, and currently only possibility \code{phylo} from the \code{\link[ape]{ape}} package)} \item{tip_label}{the format of the tip labels. \dQuote{\code{original_label}} (default) returns the original labels as provided in the study, \dQuote{\code{ott_id}} labels are replaced by their ott IDs, \dQuote{\code{ott_taxon_name}} labels are replaced by their Open Tree Taxonomy taxon name.} \item{file_format}{character, the file format to use to save the results of the query (possible values, \sQuote{newick} or \sQuote{nexus}).} \item{file}{character, the path and file name where the output should be written.} \item{deduplicate}{logical (default \code{TRUE}). If the tree returned by the study contains duplicated taxon names, should they be made unique? It is normally illegal for NEXUS/Newick tree strings to contain duplicated tip names. This is a workaround to circumvent this requirement. If \code{TRUE}, duplicated tip labels will be appended \code{_1}, \code{_2}, etc.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \description{ Retrieve subtree from a specific tree in the Open Tree of Life data store } \examples{ \dontrun{ small_tr <- get_study_subtree(study_id="pg_1144", tree_id="tree5800", subtree_id="node991044") ingroup <- get_study_subtree(study_id="pg_1144", tree_id="tree5800", subtree_id="ingroup") nexus_file <- tempfile(fileext=".nex") get_study_subtree(study_id="pg_1144", tree_id="tree5800", subtree_id="ingroup", file=nexus_file, file_format="nexus") } } rotl/man/taxonomy_about.Rd0000644000176200001440000000212413057544607015356 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/taxonomy.R \name{taxonomy_about} \alias{taxonomy_about} \title{Information about the Open Tree Taxonomy} \usage{ taxonomy_about(...) } \arguments{ \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ A list with the following properties: \itemize{ \item {weburl} {String. The release page for this version of the taxonomy.} \item {author} {String. The author string.} \item {name} {String. The name of the taxonomy.} \item {source} {String. The full identifying information for this version of the taxonomy.} \item {version} {String. The version number of the taxonomy.} } } \description{ Summary information about the Open Tree Taxonomy (OTT) } \details{ Return metadata and information about the taxonomy itself. Currently, the available metadata is fairly sparse, but includes (at least) the version, and the location from which the complete taxonomy source files can be downloaded. } \examples{ \dontrun{ taxonomy_about() } } rotl/man/get_study_meta.Rd0000644000176200001440000000375013543603103015314 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies-methods.R, R/studies.R \name{get_tree_ids} \alias{get_tree_ids} \alias{get_publication} \alias{candidate_for_synth} \alias{get_study_year} \alias{get_tree_ids.study_meta} \alias{get_publication.study_meta} \alias{candidate_for_synth.study_meta} \alias{get_study_year.study_meta} \alias{get_study_meta} \title{Study Metadata} \usage{ get_tree_ids(sm) get_publication(sm) candidate_for_synth(sm) get_study_year(sm) \method{get_tree_ids}{study_meta}(sm) \method{get_publication}{study_meta}(sm) \method{candidate_for_synth}{study_meta}(sm) \method{get_study_year}{study_meta}(sm) get_study_meta(study_id, ...) } \arguments{ \item{study_id}{the study identifier (character)} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} \item{sm}{an object created by \code{get_study_meta}} } \value{ named-list containing the metadata associated with the study requested } \description{ Retrieve metadata about a study in the Open Tree of Life datastore. } \details{ \code{get_study_meta} returns a long list of attributes for the studies that are contributing to the synthetic tree. To help with the extraction of relevant information from this list, several helper functions exists: \itemize{ \item {get_tree_ids} { The identifiers of the trees associated with the study } \item {get_publication} { The citation information of the publication for the study. The DOI (or URL) for the study is available as an attribute to the returned object (i.e., \code{attr(object, "DOI")} ) }. \item {candidate_for_synth} { The identifier of the tree(s) from the study used in the synthetic tree. This is a subset of the result of \code{get_tree_ids}. \item {get_study_year} { The year of publication of the study. } } } } \examples{ \dontrun{ req <- get_study_meta("pg_719") get_tree_ids(req) candidate_for_synth(req) get_publication(req) get_study_year(req) } } rotl/man/studies_find_studies.Rd0000644000176200001440000000477613543603103016530 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies.R \name{studies_find_studies} \alias{studies_find_studies} \title{Find a Study} \usage{ studies_find_studies( property = NULL, value = NULL, verbose = FALSE, exact = FALSE, detailed = TRUE, ... ) } \arguments{ \item{property}{The property to be searched on (character)} \item{value}{The property value to be searched on (character)} \item{verbose}{Should the output include all metadata (logical default \code{FALSE})} \item{exact}{Should exact matching be used? (logical, default \code{FALSE})} \item{detailed}{If \code{TRUE} (default), the function will return a data frame that summarizes information about the study (see \sQuote{Value}). Otherwise, it only returns the study identifiers.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ If \code{detailed=TRUE}, the function returns a data frame listing the study id (\code{study_ids}), the number of trees associated with this study (\code{n_trees}), the tree ids (at most 5) associated with the studies (\code{tree_ids}), the tree id that is a candidate for the synthetic tree if any (\code{candidate}), the year of publication of the study (\code{study_year}), the title of the publication for the study (\code{title}), and the DOI (Digital Object Identifier) for the study (\code{study_doi}). If \code{detailed=FALSE}, the function returns a data frame with a single column containing the study identifiers. } \description{ Return the identifiers of studies that match given properties } \examples{ \dontrun{ ## To match a study for which the identifier is already known one_study <- studies_find_studies(property="ot:studyId", value="pg_719") list_trees(one_study) ## To find studies pertaining to Mammals mammals <- studies_find_studies(property="ot:focalCladeOTTTaxonName", value="mammalia") ## To extract the tree identifiers for each of the studies list_trees(mammals) ## ... or for a given study list_trees(mammals, "ot_308") ## Just the identifiers without other information about the studies mammals <- studies_find_studies(property="ot:focalCladeOTTTaxonName", value="mammalia", detailed=FALSE) } } \seealso{ \code{\link{studies_properties}} which lists properties against which the studies can be searched. \code{\link{list_trees}} that returns a list for all tree ids associated with a study. } rotl/man/tnrs_match_names.Rd0000644000176200001440000000607513543603103015627 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tnrs.R \name{tnrs_match_names} \alias{tnrs_match_names} \title{Match names to the Open Tree Taxonomy} \usage{ tnrs_match_names( names = NULL, context_name = NULL, do_approximate_matching = TRUE, ids = NULL, include_suppressed = FALSE, ... ) } \arguments{ \item{names}{taxon names to be queried. Currently limited to 10,000 names for exact matches and 2,500 names for approximate matches (character vector)} \item{context_name}{name of the taxonomic context to be searched (length-one character vector). Must match (case sensitive) one of the values returned by \code{\link{tnrs_contexts}}.} \item{do_approximate_matching}{A logical indicating whether or not to perform approximate string (a.k.a. \dQuote{fuzzy}) matching. Using \code{FALSE} will greatly improve speed. Default, however, is \code{TRUE}.} \item{ids}{A vector of ids to use for identifying names. These will be assigned to each name in the names array. If ids is provided, then ids and names must be identical in length.} \item{include_suppressed}{Ordinarily, some quasi-taxa, such as incertae sedis buckets and other non-OTUs, are suppressed from TNRS results. If this parameter is true, these quasi-taxa are allowed as possible TNRS results.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ A data frame summarizing the results of the query. The original query output is appended as an attribute to the returned object (and can be obtained using \code{attr(object, "original_response")}). } \description{ Match taxonomic names to the Open Tree Taxonomy. } \details{ Accepts one or more taxonomic names and returns information about potential matches for these names to known taxa in the Open Tree Taxonomy. This service uses taxonomic contexts to disambiguate homonyms and misspelled names; a context may be specified using the \code{context_name} argument. If no context is specified, then the context will be inferred (i.e., the shallowest taxonomic context that contains all unambiguous names in the input). Taxonomic contexts are uncontested higher taxa that have been selected to allow limits to be applied to the scope of TNRS searches (e.g. 'match names only within flowering plants'). Once a context has been identified (either user-specified or inferred), all taxon name matches will performed only against taxa within that context. For a list of available taxonomic contexts, see \code{\link{tnrs_contexts}}. A name is considered unambiguous if it is not a synonym and has only one exact match to any taxon name in the entire taxonomy. Several functions listed in the \sQuote{See also} section can be used to inspect and manipulate the object generated by this function. } \examples{ \dontrun{ deuterostomes <- tnrs_match_names(names=c("echinodermata", "xenacoelomorpha", "chordata", "hemichordata")) } } \seealso{ \code{\link{inspect.match_names}}, \code{\link{update.match_names}}, \code{\link{synonyms.match_names}}. } rotl/man/match_names.Rd0000644000176200001440000000500013543603103014544 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/match_names.R \name{inspect.match_names} \alias{inspect.match_names} \alias{inspect} \alias{update.match_names} \title{Inspect and Update alternative matches for a name returned by tnrs_match_names} \usage{ \method{inspect}{match_names}(response, row_number, taxon_name, ott_id, ...) inspect(response, ...) \method{update}{match_names}(object, row_number, taxon_name, ott_id, new_row_number, new_ott_id, ...) } \arguments{ \item{response}{an object generated by the \code{\link{tnrs_match_names}} function} \item{row_number}{the row number corresponding to the name to inspect} \item{taxon_name}{the taxon name corresponding to the name to inspect} \item{ott_id}{the ott id corresponding to the name to inspect} \item{...}{currently ignored} \item{object}{an object created by \code{\link{tnrs_match_names}}} \item{new_row_number}{the row number in the output of \code{\link{inspect}} to replace the taxa specified by \code{row_number}, \code{taxon_name}, or \code{ott_id}.} \item{new_ott_id}{the ott id of the taxon to replace the taxa specified by \code{row_number}, \code{taxon_name}, or \code{ott_id}.} } \value{ a data frame } \description{ Taxonomic names may have different meanings in different taxonomic contexts, as the same genus name can be applied to animals and plants for instance. Additionally, the meaning of a taxonomic name may have change throughout its history, and may have referred to a different taxon in the past. In such cases, a given names might have multiple matches in the Open Tree Taxonomy. These functions allow users to inspect (and update) alternative meaning of a given name and its current taxonomic status according to the Open Tree Taxonomy. } \details{ To inspect alternative taxonomic meanings of a given name, you need to provide the object resulting from a call to the tnrs_match_names function, as well as one of either the row number corresponding to the name in this object, the name itself (as used in the original query), or the ott_id listed for this name. To update one of the name, you also need to provide the row number in which the name to be replaced appear or its ott id. } \examples{ \dontrun{ matched_names <- tnrs_match_names(c("holothuria", "diadema", "boletus")) inspect(matched_names, taxon_name="diadema") new_matched_names <- update(matched_names, taxon_name="diadema", new_ott_id = 631176) new_matched_names } } \seealso{ \code{\link{tnrs_match_names}} } rotl/man/taxonomy_mrca.Rd0000644000176200001440000000331613055075704015165 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/taxonomy.R \name{taxonomy_mrca} \alias{taxonomy_mrca} \alias{tax_rank.taxon_mrca} \alias{tax_name.taxon_mrca} \alias{ott_id.taxon_mrca} \alias{unique_name.taxon_mrca} \alias{tax_sources.taxon_mrca} \alias{flags.taxon_mrca} \alias{is_suppressed.taxon_mrca} \title{Taxonomic MRCA} \usage{ taxonomy_mrca(ott_ids = NULL, ...) \method{tax_rank}{taxon_mrca}(tax, ...) \method{tax_name}{taxon_mrca}(tax, ...) \method{ott_id}{taxon_mrca}(tax, ...) \method{unique_name}{taxon_mrca}(tax, ...) \method{tax_sources}{taxon_mrca}(tax, ...) \method{flags}{taxon_mrca}(tax, ...) \method{is_suppressed}{taxon_mrca}(tax, ...) } \arguments{ \item{ott_ids}{a vector of ott ids for the taxa whose MRCA is to be found (numeric).} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} \item{tax}{an object generated by the \code{taxonomy_mrca} function} } \value{ \itemize{ \item{\code{taxonomy_mrca}} { returns a list about the taxonomic information relating to the MRCA for the ott_ids provided. } \item{\code{tax_rank}} { returns a character vector of the taxonomic rank for the MRCA. } \item{\code{tax_name}} { returns a character vector the Open Tree Taxonomy name for the MRCA. } \item{\code{ott_id}} { returns a numeric vector of the ott id for the MRCA. } } } \description{ Taxonomic Least Inclusive Common Ancestor (MRCA) } \details{ Given a set of OTT ids, get the taxon that is the most recent common ancestor (the MRCA) of all the identified taxa. } \examples{ \dontrun{ req <- taxonomy_mrca(ott_ids=c(515698,590452,643717)) tax_rank(req) tax_name(req) ott_id(req) } } rotl/man/get_study.Rd0000644000176200001440000000375613543603103014314 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/studies.R \name{get_study} \alias{get_study} \title{Get all the trees associated with a particular study} \usage{ get_study( study_id = NULL, object_format = c("phylo", "nexml"), file_format, file, ... ) } \arguments{ \item{study_id}{the study ID for the study of interest (character)} \item{object_format}{the class of the object the query should return (either \code{phylo} or \code{nexml}). Ignored if \code{file_format} is specified.} \item{file_format}{the format of the file to be generated (\code{newick}, \code{nexus}, \code{nexml} or \code{json}).} \item{file}{the file name where the output of the function will be saved.} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ if \code{file_format} is missing, an object of class \code{phylo} or \code{nexml}, otherwise a logical indicating whether the file was successfully created. } \description{ Returns the trees associated with a given study } \details{ If \code{file_format} is missing, the function returns an object of the class \code{phylo} from the \code{\link[ape]{ape}} package (default), or an object of the class \code{nexml} from the \code{RNeXML} package. Otherwise \code{file_format} can be either \code{newick}, \code{nexus}, \code{nexml} or \code{json}, and the function will generate a file of the selected format. In this case, a file name needs to be provided using the argument \code{file}. If a file with the same name already exists, it will be silently overwritten. } \examples{ \dontrun{ that_one_study <- get_study(study_id="pg_719", object_format="phylo") if (require(RNeXML)) { ## if RNeXML is installed get the object directly nexml_study <- get_study(study_id="pg_719", object_format="nexml") } else { ## otherwise write it to a file get_study(study_id="pg_719", file_format="nexml", file=tempfile(fileext=".nexml")) } } } \seealso{ \code{\link{get_study_meta}} } rotl/man/strip_ott_ids.Rd0000644000176200001440000000163513065231640015167 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tol.R \name{strip_ott_ids} \alias{strip_ott_ids} \title{Strip OTT ids from tip labels} \usage{ strip_ott_ids(tip_labels, remove_underscores = FALSE) } \arguments{ \item{tip_labels}{a character vector containing tip labels (most likely the \code{tip.label} element from a tree returned by \code{\link{tol_induced_subtree}}} \item{remove_underscores}{logical (defaults to FALSE). If set to TRUE underscores in tip labels are converted to spaces} } \value{ A character vector containing the contents of \code{tip_labels} with any OTT ids removed. } \description{ Strip OTT ids from tip labels } \examples{ \dontrun{ genera <- c("Perdix", "Setophaga", "Cinclus", "Struthio") tr <- tol_induced_subtree(ott_ids=c(102710, 285198, 267845, 292466)) tr$tip.label \%in\% genera tr$tip.label <- strip_ott_ids(tr$tip.label) tr$tip.label \%in\% genera } } rotl/man/tol_node_info.Rd0000644000176200001440000001041313543603103015107 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/methods.R, R/tol.R \name{tol_lineage} \alias{tol_lineage} \alias{tol_node_info} \alias{tax_rank.tol_node} \alias{tax_sources.tol_node} \alias{unique_name.tol_node} \alias{tax_name.tol_node} \alias{ott_id.tol_node} \alias{source_list.tol_node} \alias{tax_lineage.tol_node} \alias{tol_lineage.tol_node} \title{Node info} \usage{ tol_lineage(tax, ...) tol_node_info(ott_id = NULL, node_id = NULL, include_lineage = FALSE, ...) \method{tax_rank}{tol_node}(tax, ...) \method{tax_sources}{tol_node}(tax, ...) \method{unique_name}{tol_node}(tax, ...) \method{tax_name}{tol_node}(tax, ...) \method{ott_id}{tol_node}(tax, ...) \method{source_list}{tol_node}(tax, ...) \method{tax_lineage}{tol_node}(tax, ...) \method{tol_lineage}{tol_node}(tax, ...) } \arguments{ \item{ott_id}{Numeric. The OpenTree taxonomic identifier.} \item{node_id}{Character. The OpenTree node identifier.} \item{include_lineage}{Logical (default = FALSE). Whether to return the lineage of the node from the synthetic tree.} \item{...}{additional arguments to customize the API call (see ?rotl for more information)} \item{tax}{an object returned by \code{tol_node_info}.} } \value{ \code{tol_node_info} returns an invisible list of summary information about the queried node: \itemize{ \item {node_id} {String. The canonical identifier of the node.} \item {num_tips} {Numeric. The number of descendent tips.} \item {partial_path_of} {List. The edge below this synthetic tree node is compatible with the edge below each of these input tree nodes (one per tree). Each returned element is reported as sourceid:nodeid.} \item {query} { The node id that resolved to this node. This can differ from the node_id field if the query id is not canonical. } \item {taxon} {A list of taxonomic properties. Only returned if the queried node is a taxon. Each source has:} \itemize{ \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ottID).} \item {name} {String. The taxonomic name of the queried node.} \item {unique_name} {String. The string that uniquely identifies the taxon in OTT.} \item {rank} {String. The taxonomic rank of the taxon in OTT.} \item {tax_sources} {List. A list of identifiers for taxonomic sources, such as other taxonomies, that define taxa judged equivalent to this taxon.} } The following properties list support/conflict for the node across synthesis source trees. All properties involve sourceid keys and nodeid values (see \code{source_id_map} below). \item {supported_by} {List. Input tree nodes (one per tree) that support this synthetic tree node. Each returned element is reported as sourceid:nodeid.} \item {terminal} {List. Input tree nodes (one per tree) that are equivalent to this synthetic tree node (via an exact mapping, or the input tree terminal may be the only terminal descended from this synthetic tree node. Each returned element is reported as sourceid:nodeid.} \item {conflicts_with} {Named list of lists. Names correspond to sourceid keys. Each list contains input tree node ids (one or more per tree) that conflict with this synthetic node.} } \code{tol_lineage} and \code{tax_lineage} return data frames. \code{tol_lineage} indicate for each ancestor its node identifier, the number of tips descending from that node, and whether it corresponds to a taxonomic level. } \description{ Get summary information about a node in the synthetic tree } \details{ Returns summary information about a node in the graph. The node of interest may be specified using either a node id or an taxon id, but not both. If the specified node or OTT id is not in the graph, an error will be returned. If the argument \code{include_lineage=TRUE} is used, you can use \code{tax_lineage()} or \code{tol_lineage} to return the taxonomic information or the node information for all the ancestors to this node, down to the root of the tree. } \examples{ \dontrun{ birds <- tol_node_info(ott_id=81461, include_lineage=TRUE) source_list(birds) tax_rank(birds) ott_id(birds) tax_lineage(birds) tol_lineage(birds)} } rotl/man/is_in_tree.Rd0000644000176200001440000000263113056074002014413 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/is_in_tree.R \name{is_in_tree} \alias{is_in_tree} \title{Check that OTT ids occur in the Synthetic Tree} \usage{ is_in_tree(ott_ids, ...) } \arguments{ \item{ott_ids}{a vector of Open Tree Taxonomy identifiers} \item{...}{additional arguments to customize the API request (see \code{\link{rotl}} package documentation).} } \value{ A named logical vector. \code{TRUE} indicates that the OTT id is in the synthetic tree, and \code{FALSE} that it is not. } \description{ Some valid taxonomic names do not occur in the Synthetic Tree. This convenience function allows you to check whether a given Open Tree Taxonomy identifier (OTT id) is in the tree. A taxonomic name may not occur in the synthetic tree because (1) it is an extinct or invalid taxon, or (2) it is part of a group that is not monophyletic in the tree. } \examples{ \dontrun{ plant_families <- c("Asteraceae", "Solanaceae", "Poaceae", "Amaranthaceae", "Zamiaceae", "Araceae", "Juncaceae") matched_names <- tnrs_match_names(plant_families) ## This fails because some ott ids are not in the tree ## plant_tree <- tol_induced_subtree(ott_id(matched_names)) ## So let's check which ones are actually in the tree first: in_tree <- is_in_tree(ott_id(matched_names)) ## This now works: plant_tree <- tol_induced_subtree(ott_id(matched_names)[in_tree]) } } rotl/man/tol_mrca.Rd0000644000176200001440000001343613065234715014111 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/tol.R \name{tol_mrca} \alias{tol_mrca} \alias{tax_sources.tol_mrca} \alias{unique_name.tol_mrca} \alias{tax_name.tol_mrca} \alias{tax_rank.tol_mrca} \alias{ott_id.tol_mrca} \alias{source_list.tol_mrca} \title{MRCA of taxa from the synthetic tree} \usage{ tol_mrca(ott_ids = NULL, node_ids = NULL, ...) \method{tax_sources}{tol_mrca}(tax, ...) \method{unique_name}{tol_mrca}(tax, ...) \method{tax_name}{tol_mrca}(tax, ...) \method{tax_rank}{tol_mrca}(tax, ...) \method{ott_id}{tol_mrca}(tax, ...) \method{source_list}{tol_mrca}(tax, ...) } \arguments{ \item{ott_ids}{Numeric vector. The ott ids for which the MRCA is desired.} \item{node_ids}{Character vector. The node ids for which the MRCA is desired.} \item{...}{additional arguments to customize the API call (see \code{\link{rotl}} for more information).} \item{tax}{an object returned by \code{tol_mrca()}.} } \value{ An invisible list of the MRCA node properties: \itemize{ \item {mrca} {List of node properties.} \itemize{ \item {node_id} {String. The canonical identifier of the node.} \item {num_tips} {Numeric. The number of descendent tips.} \item {taxon} {A list of taxonomic properties. Only returned if the queried node is a taxon. (If the node is not a taxon, a \code{nearest_taxon} list is returned (see below)).} \itemize{ \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ottID).} \item {name} {String. The taxonomic name of the queried node.} \item {unique_name} {String. The string that uniquely identifies the taxon in OTT.} \item {rank} {String. The taxonomic rank of the taxon in OTT.} \item {tax_sources} {List. A list of identifiers for taxonomic sources, such as other taxonomies, that define taxa judged equivalent to this taxon.} } The following properties list support/conflict for the node across synthesis source trees. All properties involve sourceid keys and nodeid values (see \code{source_id_map} below) Not all properties are are present for every node. \item {partial_path_of} {List. The edge below this synthetic tree node is compatible with the edge below each of these input tree nodes (one per tree). Each returned element is reported as sourceid:nodeid.} \item {supported_by} {List. Input tree nodes (one per tree) that support this synthetic tree node. Each returned element is reported as sourceid:nodeid.} \item {terminal} {List. Input tree nodes (one per tree) that are equivalent to this synthetic tree node (via an exact mapping, or the input tree terminal may be the only terminal descended from this synthetic tree node. Each returned element is reported as sourceid:nodeid.} \item {conflicts_with} {Named list of lists. Names correspond to sourceid keys. Each list contains input tree node ids (one or more per tree) that conflict with this synthetic node.} } \item {nearest_taxon} {A list of taxonomic properties of the nearest rootward taxon node to the MRCA node. Only returned if the MRCA node is a not taxon (otherwise the \code{taxon} list above is returned).} \itemize{ \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ottID).} \item {name} {String. The taxonomic name of the queried node.} \item {unique_name} {String. The string that uniquely identifies the taxon in OTT.} \item {rank} {String. The taxonomic rank of the taxon in OTT.} \item {tax_sources} {List. A list of identifiers for taxonomic sources, such as other taxonomies, that define taxa judged equivalent to this taxon.} } \item {source_id_map} {Named list of lists. Names correspond to the sourceid keys used in the support/conflict properties of the \code{mrca} list above. Source trees will have the following properties:} \itemize{ \item {git_sha} {The git SHA identifying a particular source version.} \item {tree_id} {The tree id associated with the study id used.} \item {study_id} {The study identifier. Will typically include a prefix ("pg_" or "ot_").} } The only sourceid that does not correspond to a source tree is the taxonomy, which will have the name "ott"+`taxonomy_version`, and the value is the ott_id of the taxon in that taxonomy version. "Taxonomy" will only ever appear in \code{supported_by}. } } \description{ Most Recent Common Ancestor for a set of nodes } \details{ Get the MRCA of a set of nodes on the current synthetic tree. Accepts any combination of node ids and ott ids as input. Returns information about the most recent common ancestor (MRCA) node as well as the most recent taxonomic ancestor (MRTA) node (the closest taxonomic node to the MRCA node in the synthetic tree; the MRCA and MRTA may be the same node). If they are the same, the taxonomic information will be in the \code{mrca} slot, otherwise they will be in the \code{nearest_taxon} slot of the list. If any of the specified nodes is not in the synthetic tree an error will be returned. Taxonomic methods (\code{tax_sources()}, \code{ott_id()}, \code{unique_name()}, ...) are available on the objects returned by \code{tol_mrca()}. If the MRCA node is MRTA, the name of the object returned by these methods will start with \sQuote{ott}, otherwise it will start with \sQuote{mrca}. } \examples{ \dontrun{ birds_mrca <- tol_mrca(ott_ids=c(412129, 119214)) ott_id(birds_mrca) tax_sources(birds_mrca) } } rotl/man/study_external_IDs.Rd0000644000176200001440000000256213057544607016125 0ustar liggesusers% Generated by roxygen2: do not edit by hand % Please edit documentation in R/external_data.R \name{study_external_IDs} \alias{study_external_IDs} \title{Get external identifiers for data associated with an Open Tree study} \usage{ study_external_IDs(study_id) } \arguments{ \item{study_id}{An open tree study ID} } \value{ A study_external_data object (which inherits from a list) which contains some of the following. doi, character, the DOI for the paper describing this study external_data_url, character, a URL to an external data repository (e.g. a treebase entry) if one exists. pubmed_id character, the unique ID for this study in the NCBI's pubmed database popset_ids character, vector of IDs for the NCBI's popset database nucleotide_ids character, vector of IDs for the NCBI's nucleotide database } \description{ Data associated with studies contributing to the Open Tree synthesis may be available from other databases. In particular, trees and alignments may be available from treebase and DNA sequences and bibliographic information associated with a given study may be available from the NCBI. This function retrieves that information for a given study. } \examples{ \dontrun{ flies <- studies_find_studies(property="ot:focalCladeOTTTaxonName", value="Drosophilidae") study_external_IDs(flies[2,]$study_ids) } } \seealso{ studies_find_studies (used to discover study IDs) } rotl/DESCRIPTION0000644000176200001440000000423213543642072012747 0ustar liggesusersPackage: rotl Title: Interface to the 'Open Tree of Life' API Version: 3.0.10 Authors@R: c(person(given = "Francois", family = "Michonneau", role = c("aut", "cre"), email = "francois.michonneau@gmail.com", comment = c(ORCID = "0000-0002-9092-966X")), person(given = "Joseph", family = "Brown", role = "aut", comment = c(ORCID = "0000-0002-3835-8062")), person(given = "David", family = "Winter", role = "aut", comment = c(ORCID = "0000-0002-6165-0029")), person(given = "Scott", family = "Chamberlain", role = "rev", comment = c(ORCID = "0000-0003-1444-9135"))) Description: An interface to the 'Open Tree of Life' API to retrieve phylogenetic trees, information about studies used to assemble the synthetic tree, and utilities to match taxonomic names to 'Open Tree identifiers'. The 'Open Tree of Life' aims at assembling a comprehensive phylogenetic tree for all named species. License: BSD_2_clause + file LICENSE URL: https://github.com/ropensci/rotl BugReports: https://github.com/ropensci/rotl/issues Depends: R (>= 3.1.1) Imports: ape, assertthat (>= 0.1), httr, jsonlite, rentrez, rncl (>= 0.6.0) Suggests: fulltext (>= 0.1.6), knitr (>= 1.12), MCMCglmm, phylobase, readxl, rmarkdown (>= 0.7), RNeXML, testthat VignetteBuilder: knitr Encoding: UTF-8 LazyData: true RoxygenNote: 6.1.99.9001 X-schema.org-isPartOf: https://ropensci.org X-schema.org-keywords: metadata, ropensci, phylogenetics, independant-contrasts, biodiversity X-schema.org-relatedLink: https://codemeta.github.io/codemetar NeedsCompilation: no Packaged: 2019-09-28 11:05:00 UTC; francois Author: Francois Michonneau [aut, cre] (), Joseph Brown [aut] (), David Winter [aut] (), Scott Chamberlain [rev] () Maintainer: Francois Michonneau Repository: CRAN Date/Publication: 2019-09-28 11:30:02 UTC rotl/build/0000755000176200001440000000000013543637133012341 5ustar liggesusersrotl/build/vignette.rds0000644000176200001440000000046313543637133014703 0ustar liggesusersRMK0M? ~w{e<(7 m|&k?u&C3oo 1) expect_true(all(grepl("^(ot|pg)", source_list(req)[["study_id"]]))) expect_true(all(grepl("^tr", source_list(req)[["tree_id"]], ignore.case = TRUE))) }) test_that("tol_node tax_rank method", { skip_on_cran() expect_true(inherits( tax_rank(req), c("otl_rank", "list") )) expect_equal(tax_rank(req)[[1]], "no rank") }) test_that("tol_node ott_id method", { skip_on_cran() expect_true(inherits( ott_id(req), c("otl_ott_id", "list") )) expect_equal(ott_id(req)[[1]], 93302) expect_equal(names(ott_id(req)), "cellular organisms") }) test_that("tol_node tax_sources", { skip_on_cran() expect_true(inherits( tax_sources(req), c("otl_tax_sources", "list") )) expect_true(any(grepl("ncbi", tax_sources(req)[[1]]))) expect_equal(names(tax_sources(req)), "cellular organisms") }) test_that("tol_node unique_name", { skip_on_cran() expect_true(inherits( unique_name(req), c("otl_unique_name", "list") )) expect_equal(unique_name(req)[[1]], "cellular organisms") expect_equal(names(unique_name(req)), "cellular organisms") }) test_that("tol_node tax_name", { skip_on_cran() expect_true(inherits( tax_name(req), c("otl_name", "list") )) expect_equal(tax_name(req)[[1]], "cellular organisms") expect_equal(names(tax_name(req)), "cellular organisms") }) ### ott_id() -------------------------------------------------------------------- test_that("taxonomy_taxon_info with ott_id for tol_about", { skip_on_cran() expect_equal( ott_id(req), ott_id(taxonomy_taxon_info(ott_id(req))) ) }) ## can't do that, it's pulling the whole tree ## test_that("taxonomy_subtree with ott_id for tol_about", { ## taxonomy_subtree(ott_id = ott_id(req)) ## }) test_that("tol_node_info with ott_id for tol_about", { skip_on_cran() expect_equal( ott_id(req), ott_id(tol_node_info(ott_id(req))) ) }) ## can't do that, it's pulling the whole tree ## test_that("tol_subtree with ott_id for tol_about", { ## tol_subtree(ott_id = ott_id(req)) ## }) test_that("tol_mrca with ott_id for tol_about", { skip_on_cran() expect_equal( ott_id(req)[1], ott_id(tol_mrca(ott_id(req)))[1] ) }) test_that("tol_induced_subtree with ott_id for tol_about", { skip_on_cran() expect_error( tol_induced_subtree(ott_id(req)), "least two valid" ) }) test_that("taxonomy_mrca with ott_id for tol_about", { skip_on_cran() expect_equal( ott_id(req), ott_id(taxonomy_mrca(ott_id(req))) ) }) ############################################################################ ## tol_subtree ## ############################################################################ context("test tol_subtree") test_that("tol_subtree fails if ott_id is invalid", { skip_on_cran() expect_error(tol_subtree(ott_id = 6666666)) }) test_that("tol_subtree fails if more than one ott_id is provided", { skip_on_cran() expect_error( tol_subtree(ott_id = c(666666, 6666667)), "Please provide a single" ) }) test_that("tol_subtree fails if ott_id doesn't look like a number", { skip_on_cran() expect_error( tol_subtree(ott_id = "111A1111"), "must look like numbers" ) }) test_that("tol_subtree returns a phylo object by default", { skip_on_cran() expect_warning( expect_true(inherits(tol_subtree(ott_id = 81461), "phylo")), "Dropping" ) }) test_that("tol_subtree returns a newick file when providing a file argument", { skip_on_cran() ff <- tempfile(fileext = ".tre") tr <- tol_subtree(ott_id = 81461, file = ff) expect_true(tr) expect_true(grepl("^\\(", readLines(ff, n = 1, warn = FALSE))) }) ############################################################################ ## tol_induced_subtree ## ############################################################################ context("test tol_induced_subtree") test_that("warning for node ids that are not in TOL graph", { skip_on_cran() expect_error( tol_induced_subtree(ott_ids = c(357968, 867416, 939325, 9999999)), "not found" ) }) test_that("error if ott_ids provided don't look like numbers", { skip_on_cran() expect_error( tol_induced_subtree(ott_ids = c("13242", "kitten")), "must look like numbers" ) }) ## test_that("warning for ott ids not in tree", ## ???) test_that("tol_induced_subtree generates a newick file when providing a file argument", { skip_on_cran() ff <- tempfile(fileext = ".tre") tr <- tol_induced_subtree(ott_ids = c(292466, 267845, 292466), file = ff) expect_true(tr) expect_true(grepl("^\\(", readLines(ff, n = 1, warn = FALSE))) }) ############################################################################ ## tol_mrca ## ############################################################################ if (identical(Sys.getenv("NOT_CRAN"), "true")) { birds <- tol_mrca(ott_ids = c(412129, 292466)) hol <- tol_mrca(c(431586, 957434)) mono <- tol_mrca(ott_ids = c(962377, 79623)) } test_that("tol_mrca fails if ott_ids are not numbers", { skip_on_cran() expect_error( tol_mrca(ott_ids = c(13243, "a13415")), "must look like numbers" ) }) test_that("tol_mrca returns a list", { skip_on_cran() expect_true(inherits(birds, "list")) expect_true(inherits(birds, "tol_mrca")) expect_true(all(names(birds) %in% c( "mrca", "source_id_map", "synth_id" ))) }) test_that("methods for tol_mrca where the node is a taxon", { skip_on_cran() expect_true(inherits( tax_sources(hol), c("otl_tax_sources", "list") )) expect_true(inherits( unique_name(hol), c("otl_unique_name", "list") )) expect_true(inherits( tax_name(hol), c("otl_name", "list") )) expect_true(inherits( tax_rank(hol), c("otl_rank", "list") )) expect_true(inherits( ott_id(hol), c("otl_ott_id", "list") )) expect_true(length(tax_sources(hol)[[1]]) > 1) expect_true(any(grepl("worms", tax_sources(hol)[[1]]))) expect_equal(unique_name(hol)[[1]], "Holothuria") expect_equal(tax_name(hol)[[1]], "Holothuria") expect_equal(tax_rank(hol)[[1]], "genus") expect_equal(ott_id(hol)[[1]], 924443) expect_equal(names(tax_sources(hol)), "Holothuria") expect_true(all(names(source_list(hol)) %in% c( "tree_id", "study_id", "git_sha" ))) expect_equal(attr(tax_sources(hol), "taxon_type"), "mrca") }) test_that("methods for tol_mrca where the node is not a taxon", { skip_on_cran() expect_true(inherits(birds, "list")) expect_true(inherits( tax_sources(birds), c("otl_tax_sources", "list") )) expect_true(inherits( unique_name(birds), c("otl_unique_name", "list") )) expect_true(inherits( tax_name(birds), c("otl_name", "list") )) expect_true(inherits( tax_rank(birds), c("otl_rank", "list") )) expect_true(inherits( ott_id(birds), c("otl_ott_id", "list") )) expect_true(length(tax_sources(birds)[[1]]) >= 1) expect_true(any(grepl("ncbi", tax_sources(birds)[[1]]))) expect_equal(unique_name(birds)[[1]], "Aves") expect_equal(tax_name(birds)[[1]], "Aves") expect_equal(tax_rank(birds)[[1]], "class") expect_equal(ott_id(birds)[[1]], 81461) expect_equal(names(ott_id(birds)), "Aves") expect_true(all(names(source_list(birds)) %in% c( "tree_id", "study_id", "git_sha" ))) expect_equal(attr(tax_sources(birds), "taxon_type"), "mrca") }) ### ott_id() -------------------------------------------------------------------- test_that("taxonomy_taxon_info with ott_id for tol_mrca", { skip_on_cran() expect_equal( ott_id(mono)[1], ott_id(taxonomy_taxon_info(ott_id(mono)))[1] ) }) test_that("taxonomy_subtree with ott_id for tol_mrca", { skip_on_cran() tt <- taxonomy_subtree(ott_id = ott_id(mono)) expect_true(length(tt[["tip_label"]]) > 10) expect_true(length(tt[["edge_label"]]) > 7) }) test_that("tol_node_info with ott_id for tol_mrca", { skip_on_cran() expect_equal( ott_id(mono)[1], ott_id(tol_node_info(ott_id(mono)))[1] ) }) test_that("tol_subtree with ott_id for tol_mrca", { skip_on_cran() expect_warning( tt <- tol_subtree(ott_id = ott_id(mono)), "Dropping" ) expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) expect_true(length(tt$node.label) > 1) }) test_that("tol_mrca with ott_id for tol_mrca", { skip_on_cran() expect_equal( ott_id(mono)[1], ott_id(tol_mrca(ott_id(mono)))[1] ) }) test_that("tol_induced_subtree with ott_id for tol_mrca", { skip_on_cran() expect_error( tol_induced_subtree(ott_id(mono)), "least two valid" ) }) test_that("taxonomy_mrca with ott_id for tol_mrca", { skip_on_cran() expect_equivalent( ott_id(mono), ott_id(taxonomy_mrca(ott_id(mono))) ) }) ############################################################################ ## strip_ott_ids ## ############################################################################ test_that("OTT ids can be striped from tip labels to allow taxon-matching", { skip_on_cran() genera <- c("Perdix", "Cinclus", "Struthio") expect_warning(tr <- tol_induced_subtree(ott_ids = c(102710, 267845, 292466))) expect_true(all(strip_ott_ids(tr$tip.label) %in% genera)) }) ############################################################################ ## tol_node_info ## ############################################################################ if (identical(Sys.getenv("NOT_CRAN"), "true")) { tol_info <- tol_node_info(ott_id = 81461) tol_lin <- tol_node_info(ott_id = 81461, include_lineage = TRUE) tol_mono <- tol_node_info(ott_id = 962396) } test_that("tol node info.", { skip_on_cran() expect_true(all(names(tol_info) %in% c( "node_id", "num_tips", "partial_path_of", "query", "source_id_map", "supported_by", "synth_id", "taxon", "terminal" ))) expect_true(inherits(tol_info, "tol_node")) }) ### methods --------------------------------------------------------------------- test_that("tol_node tax_rank method", { skip_on_cran() expect_true(inherits( tax_rank(tol_info), c("otl_tax_rank", "list") )) expect_equal(tax_rank(tol_info)[[1]], "class") }) test_that("tol_node ott_id method", { skip_on_cran() expect_true(inherits( ott_id(tol_info), c("otl_ott_id", "list") )) expect_equal(ott_id(tol_info)[[1]], 81461) expect_equal(names(ott_id(tol_info)), "Aves") }) test_that("tol_node tax_sources", { skip_on_cran() expect_true(inherits( tax_sources(tol_info), c("otl_tax_sources", "list") )) expect_true(any(grepl("worms", tax_sources(tol_info)[[1]]))) expect_equal(names(tax_sources(tol_info)), "Aves") }) test_that("tol_node unique_name", { skip_on_cran() expect_true(inherits( unique_name(tol_info), c("otl_unique_name", "list") )) expect_equal(unique_name(tol_info)[[1]], "Aves") expect_equal(names(unique_name(tol_info)), "Aves") }) test_that("tol_node tax_name", { skip_on_cran() expect_true(inherits( tax_name(tol_info), c("otl_name", "list") )) expect_equal(tax_name(tol_info)[[1]], "Aves") expect_equal(names(tax_name(tol_info)), "Aves") }) test_that("tol_node source_list method", { skip_on_cran() expect_true(inherits(source_list(tol_info), "data.frame")) expect_true(all(names(source_list(tol_info)) %in% c("study_id", "tree_id", "git_sha"))) }) test_that("tol_node tol_lineage", { skip_on_cran() expect_error(tol_lineage(tol_info), "needs to be created") expect_true(inherits(tol_lineage(tol_lin), "data.frame")) expect_true(nrow(tol_lineage(tol_lin)) > 1) expect_true(all(names(tol_lineage(tol_lin)) %in% c( "node_id", "num_tips", "is_taxon" ))) expect_true(all(grepl("^(ott|mrca)", tol_lineage(tol_lin)[["node_id"]]))) }) test_that("tol_node tax_lineage", { skip_on_cran() expect_error(tax_lineage(tol_info), "needs to be created") expect_true(inherits(tax_lineage(tol_lin), "data.frame")) expect_true(nrow(tax_lineage(tol_lin)) > 1) expect_true(all(names(tax_lineage(tol_lin)) %in% c( "rank", "name", "unique_name", "ott_id" ))) expect_true(any(grepl("no rank", tax_lineage(tol_lin)[["rank"]]))) expect_true(any(grepl("cellular organisms", tax_lineage(tol_lin)[["name"]]))) }) ### ott_id() -------------------------------------------------------------------- test_that("taxonomy_taxon_info with ott_id for tol_info", { skip_on_cran() expect_equivalent( ott_id(tol_mono), ott_id(taxonomy_taxon_info(ott_id(tol_mono))) ) }) test_that("taxonomy_subtree with ott_id for tol_info", { skip_on_cran() tt <- taxonomy_subtree(ott_id = ott_id(tol_mono)) expect_true(length(tt[["tip_label"]]) > 10) expect_true(length(tt[["edge_label"]]) > 7) }) test_that("tol_node_info with ott_id for tol_info", { skip_on_cran() expect_equivalent( ott_id(tol_mono), ott_id(tol_node_info(ott_id(tol_mono))) ) }) test_that("tol_subtree with ott_id for tol_info", { skip_on_cran() expect_warning( tt <- tol_subtree(ott_id = ott_id(tol_mono)), "Dropping" ) expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) expect_true(length(tt$node.label) > 1) }) test_that("tol_mrca with ott_id for tol_info", { skip_on_cran() expect_equivalent( ott_id(tol_mono), ott_id(tol_mrca(ott_id(tol_mono))) ) }) test_that("tol_induced_subtree with ott_id for tol_info", { skip_on_cran() expect_error( tol_induced_subtree(ott_id(tol_mono)), "least two valid" ) }) test_that("taxonomy_mrca with ott_id for tol_info", { skip_on_cran() expect_equivalent( ott_id(tol_mono), ott_id(taxonomy_mrca(ott_id(tol_mono))) ) }) rotl/tests/testthat/test-api-tnrs.R0000644000176200001440000000400713543627002017074 0ustar liggesuserscontext("tnrs API") ############################################################################ ## .tnrs_match_names ## ############################################################################ test_that("names argument is provided for .tnrs_match_names", { skip_on_cran() expect_error( .tnrs_match_names(NULL, NULL, TRUE, NULL, FALSE), "must supply" ) }) test_that("names argument is character for .tnrs_match_names", { skip_on_cran() expect_error( .tnrs_match_names(TRUE, NULL, TRUE, NULL, FALSE), "character" ) }) test_that("names and ids have the same lengths for .tnrs_match_names", { skip_on_cran() expect_error( .tnrs_match_names("Felis", NULL, TRUE, c("abc", "def"), FALSE), "same length" ) }) test_that("ids must be character for .tnrs_match_names", { skip_on_cran() expect_error( .tnrs_match_names("Felis", NULL, TRUE, TRUE, FALSE), "character" ) }) test_that("do_approximate_matching is logical for .tnrs_match_names", { skip_on_cran() expect_error( .tnrs_match_names("Felis", NULL, "true", NULL, FALSE), "logical" ) }) test_that("include_suppressed is logical for .tnrs_match_names", { skip_on_cran() expect_error( .tnrs_match_names("Felis", NULL, TRUE, NULL, "true"), "logical" ) }) test_that("context_name is character for .tnrs_match_names", { skip_on_cran() expect_error( .tnrs_match_names("Felis", TRUE, TRUE, NULL, FALSE, TRUE), "character" ) }) ############################################################################ ## .tnrs_infer_context ## ############################################################################ test_that("names is not NULL for .tnrs_infer_context", { skip_on_cran() expect_error( .tnrs_infer_context(NULL), "Must supply" ) }) test_that("names is character for .tnrs_infer_context", { skip_on_cran() expect_error( .tnrs_infer_context(TRUE), "character" ) }) rotl/tests/testthat/test-api-tol.R0000644000176200001440000000433113543627003016705 0ustar liggesuserscontext("Tree of Life API") ############################################################################ ## .tol_about ## ############################################################################ test_that("include_source_list is logical for .tol_about", { skip_on_cran() expect_error( .tol_about("true"), "logical" ) }) ############################################################################ ## .tol_mrca ## ############################################################################ test_that("neither ott_ids nor node_ids are NULL for .tol_mrca", { skip_on_cran() expect_error( .tol_mrca(NULL), "Must provide" ) }) ############################################################################ ## .tol_subtree ## ############################################################################ test_that("ott_id is not NULL", { skip_on_cran() expect_error( .tol_subtree(ott_id = NULL, node_id = NULL), "Must provide" ) }) ############################################################################ ## .tol_induced_subtree ## ############################################################################ test_that("ott_ids is not NULL", { skip_on_cran() expect_error( .tol_induced_subtree(ott_ids = NULL), "Must provide" ) }) test_that("NAs are not accepted for ott_ids", { skip_on_cran() expect_error( .tol_induced_subtree(ott_ids = c(123, NA, 456)), "NAs are not allowed" ) }) #################### ## .tol_node_info ## #################### test_that("include_lineage must be logical with .tol_node_info", { skip_on_cran() expect_error( .tol_node_info(ott_id = "ott_123", include_lineage = "123"), "logical" ) }) test_that("ott_id must be a numeric with .tol_node_info", { skip_on_cran() expect_error( .tol_node_info(ott_id = "test"), "look like numbers" ) }) test_that("node_id must be a character with .tol_node_info", { skip_on_cran() expect_error( .tol_node_info(node_id = 123), "must look like" ) }) rotl/tests/testthat/test-studies.R0000644000176200001440000004521213543627031017024 0ustar liggesusersif (FALSE) { context("test of studies") ############################################################################ ## studies_properties ## ############################################################################ test_that("studies_properties is a list with 2 elements (if breaks, need to update documentation)", { skip_on_cran() expect_true(all(names(studies_properties() %in% c("tree_properties", "study_properties")))) }) ############################################################################ ## get_study ## ############################################################################ test_that("get_study returns an error when asking for a study that doesn't exist", { skip_on_cran() expect_error(get_study("tt_666666")) }) test_that("get_study generates a phylo object", { skip_on_cran() tr <- get_study("pg_719", object_format = "phylo") expect_true(inherits(tr, "multiPhylo")) expect_equal(length(tr), 3) expect_true(length(tr[[1]]$tip.label) > 1) }) test_that("get_study returns an error if file is specied but file_format is not", { skip_on_cran() expect_error( get_study("pg_719", file = "test"), "must be specified" ) }) test_that("get_study generates a nexml object", { skip_on_cran() tr <- get_study("pg_719", object_format = "nexml") expect_true(inherits(tr, "nexml")) }) test_that("get_study generates a newick file", { skip_on_cran() ff <- tempfile() tr <- get_study("pg_719", file_format = "newick", file = ff) expect_true(tr) expect_true(grepl("^\\(", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study generates a nexus file", { skip_on_cran() ff <- tempfile() tr <- get_study("pg_719", file_format = "nexus", file = ff) expect_true(tr) expect_true(grepl("^#NEXUS", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study generates a nexml file", { skip_on_cran() ff <- tempfile() tr <- get_study("pg_719", file_format = "nexml", file = ff) expect_true(tr) expect_true(grepl("^<\\?xml", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study generates a json file", { skip_on_cran() ff <- tempfile() tr <- get_study("pg_719", file_format = "json", file = ff) expect_true(tr) expect_true(grepl("^\\{", readLines(ff, n = 1, warn = FALSE))) }) ############################################################################ ## get_study_tree ## ############################################################################ test_that("get_study_tree returns error when tree doesn't exist", { skip_on_cran() expect_error(get_study_tree("2655", "tree5555")) }) test_that("get_study_tree returns error when study doesn't exist", { skip_on_cran() expect_error(get_study_tree("5555555", "tree555555")) }) test_that("get_study_tree generates nexus file", { skip_on_cran() ff <- tempfile(fileext = ".nex") tt <- get_study_tree("pg_1144", "tree2324", file_format = "nexus", file = ff ) expect_true(tt) expect_true(grepl("^#NEXUS", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study_tree generates newick file", { skip_on_cran() ff <- tempfile(fileext = ".tre") tt <- get_study_tree("pg_1144", "tree2324", file_format = "newick", file = ff ) expect_true(tt) expect_true(grepl("^\\(", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study_tree generates json file", { skip_on_cran() ff <- tempfile(fileext = ".json") tt <- get_study_tree("pg_1144", "tree2324", file_format = "json", file = ff ) expect_true(tt) expect_true(grepl("^\\{", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study_tree returns a phylo object", { skip_on_cran() tt <- get_study_tree("pg_1144", "tree2324", object_format = "phylo") expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) }) ### Test types of labels with phylo objects test_that("get_study_tree returns a phylo object and ott_id for tip labels", { skip_on_cran() tt <- get_study_tree("pg_1144", "tree2324", object_format = "phylo", tip_label = "ott_id" ) expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) expect_true(grepl("^[0-9]+$", tt$tip.label[1])) }) test_that("get_study_tree returns a phylo object and ott_taxon_names for tip labels", { skip_on_cran() tt <- get_study_tree("pg_1144", "tree2324", object_format = "phylo", tip_label = "ott_taxon_name" ) expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) expect_true(sum(!grepl("^[A-Za-z]+(_[a-z]+)?$", tt$tip.label)) < 3) }) test_that("get_study_tree returns a phylo object and original labels for tip labels", { skip_on_cran() tt <- get_study_tree("pg_1144", "tree2324", object_format = "phylo", tip_label = "original_label" ) expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) expect_equal(sum(!grepl("^[A-Za-z]+_[a-z]+$", tt$tip.label)), 45) }) ### Test types of labels with files (skipping json for now because there is no good way of doing it) test_that("get_study_tree returns an error if file is given but file format is not", { skip_on_cran() expect_error( get_study_tree(study_id = "pg_1144", tree_id = "tree2324", file = "test"), "must be specified" ) }) test_that("get_study_tree returns nexus file and ott_id for tip labels", { skip_on_cran() ff <- tempfile(fileext = ".nex") tt <- get_study_tree("pg_1144", "tree2324", file_format = "nexus", tip_label = "ott_id", file = ff ) expect_true(tt) tr <- rncl::read_nexus_phylo(ff) expect_true(length(tr$tip.label) > 1) expect_true(grepl("^[0-9]+$", tr$tip.label[1])) }) test_that("get_study_tree returns a phylo object and ott_taxon_names for tip labels", { skip_on_cran() ff <- tempfile(fileext = ".tre") tt <- get_study_tree("pg_1144", "tree2324", file_format = "newick", tip_label = "ott_taxon_name", file = ff ) expect_true(tt) tr <- rncl::read_newick_phylo(ff) expect_true(length(tr$tip.label) > 1) expect_true(sum(!grepl("^[A-Za-z]+(_[a-z]+)?$", tr$tip.label)) < 3) }) ############################################################################ ## get_study_subtree ## ############################################################################ test_that("get_study_subtree returns an error when study_id doesn't exist", { skip_on_cran() expect_error(get_study_subtree("pg_55555", "tree55555", subtree_id = "node555555")) }) test_that("get_study_subtree returns an error when tree_id doesn't exist", { skip_on_cran() expect_error(get_study_subtree("pg_1144", "tree55555", subtree_id = "node555555")) }) test_that("get_study_subtree returns an error when the subtree_id is invalid", { skip_on_cran() expect_error(get_study_subtree("pg_1144", "tree2324", "foobar")) }) test_that("get_study_subtree returns a phylo object", { skip_on_cran() tt <- get_study_subtree("pg_420", "tree522", subtree_id = "ingroup", object_format = "phylo" ) sub_tt <- get_study_subtree("pg_420", "tree522", subtree_id = "node208580", object_format = "phylo" ) expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) expect_true(inherits(sub_tt, "phylo")) expect_true(length(sub_tt$tip.label) > 1) expect_true(length(tt$tip.label) > length(sub_tt$tip.label)) }) test_that("get_study_subtree fails if file name is given but no file format", { skip_on_cran() expect_error(get_study_subtree("pg_420", "tree522", subtree_id = "ingroup", file = "test" ), "must be specified") }) test_that("get_study_subtree returns a nexus file", { skip_on_cran() ff <- tempfile(fileext = ".nex") tt <- get_study_subtree("pg_420", "tree522", subtree_id = "ingroup", file_format = "nexus", file = ff ) expect_true(tt) expect_true(grepl("^#NEXUS", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study_subtree returns a newick file", { skip_on_cran() ff <- tempfile(fileext = ".tre") tt <- get_study_subtree("pg_420", "tree522", subtree_id = "ingroup", file_format = "newick", file = ff ) expect_true(tt) expect_true(grepl("^\\(", readLines(ff, n = 1, warn = FALSE))) }) test_that("get_study_subtree can deduplicate labels", { skip_on_cran() expect_warning( get_study_subtree( study_id = "pg_710", tree_id = "tree1277", tip_label = "ott_taxon_name", subtree_id = "ingroup", deduplicate = TRUE ), "and have been modified" ) }) test_that("get_study_subtree fails with duplicate labels", { skip_on_cran() expect_error( get_study_subtree( study_id = "pg_710", tree_id = "tree1277", tip_label = "ott_taxon_name", subtree_id = "ingroup", deduplicate = FALSE ), "has already been encountered" ) }) ############################################################################ ## get_study_meta ## ############################################################################ if (identical(Sys.getenv("NOT_CRAN"), "true")) { sm <- get_study_meta("pg_719") } test_that("get_study meta returns a study_meta object", { skip_on_cran() expect_true(inherits(sm, "study_meta")) }) test_that("get_tree_ids method for study_meta", { skip_on_cran() expect_equal(get_tree_ids(sm), c("tree1294", "tree1295", "tree1296")) }) test_that("get_publication method for study_meta", { skip_on_cran() expect_equal(attr(get_publication(sm), "DOI"), "http://dx.doi.org/10.1600/036364411X605092") }) test_that("candidate_for_synth method for study_meta", { skip_on_cran() expect_true(candidate_for_synth(sm) %in% get_tree_ids(sm)) }) test_that("get_study_year method for study_meta", { skip_on_cran() expect_equal(get_study_year(sm), 2011) }) ############################################################################ ## tol_about ## ############################################################################ test_that("tol_about returns class tol_summary", { skip_on_cran() expect_true(inherits(tol_about(), "tol_summary")) }) test_that("study_about", { skip_on_cran() ta <- source_list(tol_about(TRUE)) expect_true(inherits(ta, "data.frame")) expect_true(nrow(ta) > 100) expect_equal(names(ta), c("study_id", "tree_id", "git_sha")) }) ############################################################################ ## studies_find_studies ## ############################################################################ test_that("single study detailed=TRUE", { skip_on_cran() res <- studies_find_studies( property = "ot:studyId", value = "ot_248", detailed = TRUE ) expect_true(inherits(res, "data.frame")) expect_true(inherits(res, "matched_studies")) expect_true(all(names(res) %in% c( "study_ids", "n_trees", "tree_ids", "candidate", "study_year", "title", "study_doi" ))) expect_true(nrow(res) >= 1L) expect_equal(res[["study_ids"]], "ot_248") expect_equal(res[["n_trees"]], "1") expect_equal(res[["candidate"]], "Tr76302") expect_equal(res[["study_year"]], "2014") expect_equal(res[["study_doi"]], "http://dx.doi.org/10.1016/j.cub.2014.06.060") expect_equal(res[["title"]], "'Phylogenomic Resolution of the Class Ophiuroidea Unlocks a Global Microfossil Record'") expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) test_that("single study detailed=FALSE", { skip_on_cran() res <- studies_find_studies( property = "ot:studyId", value = "ot_248", detailed = FALSE ) expect_true(inherits(res, "data.frame")) expect_true(inherits(res, "study_ids")) expect_true(inherits(res, "matched_studies")) expect_match(attr(res, "found_trees"), "list of the trees associated") expect_equal(names(res), "study_ids") expect_equal(res[1, 1], "ot_248") expect_equal(nrow(res), 1L) expect_equal(ncol(res), 1L) expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) test_that("multiple studies detailed=TRUE", { skip_on_cran() res <- studies_find_studies( property = "ot:focalCladeOTTTaxonName", value = "mammalia", detailed = TRUE ) expect_true(inherits(res, "data.frame")) expect_true(inherits(res, "matched_studies")) expect_true(all(names(res) %in% c( "study_ids", "n_trees", "tree_ids", "candidate", "study_year", "title", "study_doi" ))) expect_true(nrow(res) >= 8L) expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) test_that("multiple studies detailed=FALSE", { skip_on_cran() res <- studies_find_studies( property = "ot:focalCladeOTTTaxonName", value = "mammalia", detailed = FALSE ) expect_true(inherits(res, "study_ids")) expect_true(inherits(res, "matched_studies")) expect_true(inherits(res, "data.frame")) expect_equal(ncol(res), 1L) expect_true(nrow(res) >= 8) expect_equal(names(res), "study_ids") expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) ############################################################################ ## studies_find_trees ## ############################################################################ test_that("studies_find_trees single study detailed=FALSE", { skip_on_cran() res <- studies_find_trees( property = "ot:studyId", value = "ot_248", detailed = FALSE ) expect_true(inherits(res, "data.frame")) expect_true(inherits(res, "matched_studies")) expect_match(attr(res, "found_trees")[[1]], "Tr76302") expect_equal(names(res), c( "study_ids", "n_matched_trees", "match_tree_ids" )) expect_equal(res[1, 1], "ot_248") expect_equal(nrow(res), 1L) expect_equal(ncol(res), 3L) expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) test_that("studies_find_trees single study detailed=TRUE", { skip_on_cran() res <- studies_find_trees( property = "ot:studyId", value = "ot_248", detailed = TRUE ) expect_true(inherits(res, "data.frame")) expect_true(inherits(res, "matched_studies")) expect_equal(names(res), c( "study_ids", "n_trees", "tree_ids", "candidate", "study_year", "title", "study_doi", "n_matched_trees", "match_tree_ids" )) expect_equal(nrow(res), 1L) expect_equal(res[["study_ids"]], "ot_248") expect_equal(res[["n_trees"]], "1") expect_equal(res[["candidate"]], "Tr76302") expect_equal(res[["study_year"]], "2014") expect_equal(res[["study_doi"]], "http://dx.doi.org/10.1016/j.cub.2014.06.060") expect_equal(res[["title"]], "'Phylogenomic Resolution of the Class Ophiuroidea Unlocks a Global Microfossil Record'") expect_equal(res[["tree_ids"]], "Tr76302") expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) test_that("studies_find_trees multiple studies detailed=TRUE", { skip_on_cran() res <- studies_find_trees( property = "ot:ottTaxonName", value = "Echinodermata", detailed = TRUE ) expect_true(inherits(res, "data.frame")) expect_true(inherits(res, "matched_studies")) expect_equal(names(res), c( "study_ids", "n_trees", "tree_ids", "candidate", "study_year", "title", "study_doi", "n_matched_trees", "match_tree_ids" )) expect_true(nrow(res) >= 5L) expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) test_that("studies_find_trees multiple studies detailed=FALSE", { skip_on_cran() res <- studies_find_trees( property = "ot:ottTaxonName", value = "Echinodermata", detailed = FALSE ) expect_true(inherits(res, "data.frame")) expect_true(inherits(res, "matched_studies")) expect_equal(names(res), c( "study_ids", "n_matched_trees", "match_tree_ids" )) expect_true(nrow(res) >= 5L) expect_true(length(attr(res, "metadata")) > 0) expect_true(length(attr(res, "found_trees")) > 0) }) ############################################################################ ## list_trees ## ############################################################################ test_that("list_trees with studies_find_studies and detailed = FALSE", { skip_on_cran() expect_match( list_trees(studies_find_studies( property = "ot:focalCladeOTTTaxonName", value = "Aves", detailed = FALSE )), "If you want to get a list of the trees associated with the studies" ) }) test_that("list_trees with studies_find_studies and detailed = TRUE", { skip_on_cran() res <- studies_find_studies( property = "ot:focalCladeOTTTaxonName", value = "mammalia", detailed = TRUE ) expect_true(inherits(list_trees(res), "list")) expect_true(length(list_trees(res)) >= 8) expect_true(sum(names(list_trees(res)) %in% c( "pg_2647", "ot_308", "pg_2812", "ot_109", "pg_2582", "pg_1428", "ot_755", "pg_2550" )) >= 8) }) test_that("list_trees with studies_find_trees and detailed=FALSE", { skip_on_cran() res <- studies_find_trees( property = "ot:ottTaxonName", value = "Echinodermata", detailed = FALSE ) lt <- list_trees(res) expect_true(inherits(lt, "list")) expect_true(length(names(lt)) >= 5L) expect_true(all(sapply(lt, length) >= 1L)) }) test_that("list_trees with studies_find_trees and detailed=TRUE", { skip_on_cran() res <- studies_find_trees( property = "ot:ottTaxonName", value = "Echinodermata", detailed = TRUE ) lt <- list_trees(res) expect_true(inherits(lt, "list")) expect_true(length(names(lt)) >= 5L) expect_true(all(sapply(lt, length) >= 1L)) }) } rotl/tests/testthat/test-taxonomy.R0000644000176200001440000002731213543627040017223 0ustar liggesuserscontext("taxonomy") ############################################################################ ## taxonomy about ## ############################################################################ test_that("taxonomy_about is a list", { skip_on_cran() tt <- taxonomy_about() expect_true(inherits(tt, "list")) }) test_that("taxonomy_about has the names listed in documentation (if it breaks update documentation)", { skip_on_cran() tt <- taxonomy_about() expect_true(all(names(tt) %in% c("weburl", "author", "name", "source", "version"))) }) ############################################################################ ## taxon Info ## ############################################################################ test_that("taxonomy taxon info", { skip_on_cran() tid <- 515698 tt <- taxonomy_taxon_info(tid) expect_equal(tt[[1]][["ott_id"]], tid) expect_true(inherits(tt, "taxon_info")) }) test_that("taxonomy with include_lineage=TRUE", { skip_on_cran() tt <- taxonomy_taxon_info(515698, include_lineage = TRUE) expect_true(exists("lineage", tt[[1]])) expect_true(length(tt[[1]]$lineage) > 1) }) test_that("taxonomy with include_lineage=FALSE", { skip_on_cran() tt <- taxonomy_taxon_info(515698, include_lineage = FALSE) expect_false(exists("lineage", tt[[1]])) }) test_that("taxonomy with include_terminal_descendants=TRUE", { skip_on_cran() tt <- taxonomy_taxon_info(515698, include_terminal_descendants = TRUE) expect_true(exists("terminal_descendants", tt[[1]])) expect_true(length(tt[[1]][["terminal_descendants"]]) > 1) }) test_that("taxonomy with include_terminal_descendants=FALSE", { skip_on_cran() tt <- taxonomy_taxon_info(515698, include_terminal_descendants = FALSE) expect_false(exists("terminal_descendants", tt[[1]])) }) if (identical(Sys.getenv("NOT_CRAN"), "true")) { tid <- c(957430, 337928, 631176) tax_info <- taxonomy_taxon_info(tid) } test_that("taxonomy_taxon tax_rank method", { skip_on_cran() expect_true(inherits( tax_rank(tax_info), c("otl_tax_rank", "list") )) expect_equal( names(tax_rank(tax_info)), c( "Actinopyga", "Acanthaster", "Diadema (genus in Holozoa)" ) ) expect_equal( unlist(unname(tax_rank(tax_info))), rep("genus", 3) ) }) test_that("taxonomy_taxon ott_taxon_name method", { skip_on_cran() expect_true(inherits( tax_name(tax_info), c("otl_tax_info", "list") )) expect_equal( names(tax_name(tax_info)), c( "Actinopyga", "Acanthaster", "Diadema (genus in Holozoa)" ) ) expect_equal( unlist(unname(tax_name(tax_info))), c("Actinopyga", "Acanthaster", "Diadema") ) }) test_that("taxonomy_taxon synonyms method", { skip_on_cran() expect_true(inherits( synonyms(tax_info), c("otl_synonyms", "list") )) expect_equal( names(synonyms(tax_info)), c( "Actinopyga", "Acanthaster", "Diadema (genus in Holozoa)" ) ) expect_true(all(c("Diamema", "Centrechinus") %in% synonyms(tax_info)[[3]])) }) test_that("taxonomy_taxon is_suppressed method", { skip_on_cran() expect_true(inherits( is_suppressed(tax_info), c("otl_is_suppressed", "list") )) expect_equal( names(is_suppressed(tax_info)), c( "Actinopyga", "Acanthaster", "Diadema (genus in Holozoa)" ) ) expect_equal( unlist(unname(is_suppressed(tax_info))), c(FALSE, FALSE, FALSE) ) }) test_that("taxonomy_taxon flags method", { skip_on_cran() expect_true(inherits( flags(tax_info), c("otl_flags", "list") )) expect_equal( names(flags(tax_info)), c( "Actinopyga", "Acanthaster", "Diadema (genus in Holozoa)" ) ) expect_equal( unlist(unname(flags(tax_info))), NULL ) }) test_that("higher taxonomy method", { skip_on_cran() expect_error(tax_lineage(tax_info), "needs to be created") lg <- tax_lineage(taxonomy_taxon_info(tid, include_lineage = TRUE)) expect_true(inherits(lg, "list")) expect_true(inherits(lg[[1]], "data.frame")) expect_true(all(names(lg[[1]]) %in% c("rank", "name", "unique_name", "ott_id"))) expect_true(any(grepl("no rank", lg[[1]][["rank"]]))) expect_true(any(grep("life", lg[[1]][["name"]]))) }) ### ott_id() -------------------------------------------------------------------- test_that("taxonomy_taxon_info with ott_id for tax_info", { skip_on_cran() expect_equivalent( ott_id(tax_info), ott_id(taxonomy_taxon_info(ott_id(tax_info))) ) }) test_that("taxonomy_subtree with ott_id for tax_info", { skip_on_cran() expect_error( taxonomy_subtree(ott_id = ott_id(tax_info)), "supply one" ) }) test_that("tol_node_info with ott_id for tax_info", { skip_on_cran() expect_error( tol_node_info(ott_id(tax_info)), "provide a single" ) }) test_that("tol_subtree with ott_id for tax_info", { skip_on_cran() expect_error( tol_subtree(ott_id = ott_id(tax_info)), "provide a single" ) }) test_that("tol_mrca with ott_id for tax_info", { skip_on_cran() expect_equivalent( list("Euleutheroza" = 317277), ott_id(tol_mrca(ott_id(tax_info))) ) }) test_that("tol_induced_subtree with ott_id for tax_info", { skip_on_cran() expect_warning( expect_true(inherits( tol_induced_subtree(ott_id(tax_info)), "phylo" )) ) }) test_that("taxonomy_mrca with ott_id for tax_info", { skip_on_cran() expect_equivalent( list("Euleutheroza" = 317277), ott_id(taxonomy_mrca(ott_id(tax_info))) ) }) test_that("ott_id subset works", { skip_on_cran() expect_true(inherits(ott_id(tax_info), "otl_ott_id")) expect_true(inherits(ott_id(tax_info)[1], "otl_ott_id")) expect_true(!is.null(names(ott_id(tax_info)))) }) ############################################################################ ## taxon subtree ## ############################################################################ test_that("taxonomy subtree raw output", { skip_on_cran() tt <- taxonomy_subtree(515698, output_format = "raw") expect_true(inherits(tt, "list")) expect_identical(names(tt), "newick") }) test_that("taxonomy subtree returns warning if file is provided with something else than newick output", { skip_on_cran() expect_warning( taxonomy_subtree(515698, output_format = "raw", file = "/foo/bar"), "ignored" ) }) test_that("taxonomy subtree writes a 'valid' newick file", { skip_on_cran() ff <- tempfile(fileext = ".tre") tt <- taxonomy_subtree(515698, output_format = "newick", file = ff) expect_true(tt) expect_true(grepl("^\\(", readLines(ff, n = 1, warn = FALSE))) }) test_that("taxonomy subtree returns a valid newick string", { skip_on_cran() tt <- taxonomy_subtree(515698, output_format = "newick") expect_true(inherits(ape::read.tree(text = tt), "phylo")) }) test_that("taxonomy subtree returns a valid phylo object", { skip_on_cran() tt <- taxonomy_subtree(515698, output_format = "phylo") expect_true(inherits(tt, "phylo")) }) test_that("taxonomy subtree returns valid internal node names", { skip_on_cran() tt <- taxonomy_subtree(515698, output_format = "taxa") expect_true(inherits(tt, "list")) expect_equal(length(tt), 2) expect_equal(length(tt$tip_label), 14) expect_equal(length(tt$edge_label), 2) }) test_that("taxonomy subtree works if taxa has only 1 descendant", { skip_on_cran() tt <- taxonomy_subtree(ott_id = 3658331, output_format = "taxa") expect_true(inherits(tt, "list")) expect_equal(length(tt), 2) expect_true(inherits(tt$tip_label, "character")) }) ############################################################################ ## taxonomic MRCA ## ############################################################################ if (identical(Sys.getenv("NOT_CRAN"), "true")) { tax_mrca <- taxonomy_mrca(ott_id = c(515698, 590452, 643717)) tax_mrca_mono <- taxonomy_mrca(ott_id = c(79623, 962377)) } test_that("taxonomic most recent common ancestor", { skip_on_cran() expect_true(inherits(tax_mrca, "taxon_mrca")) expect_true(inherits(tax_mrca, "list")) }) test_that("mrca tax_rank method", { skip_on_cran() expect_equal( tax_rank(tax_mrca)[1], list("Asterales" = "order") ) }) test_that("mrca tax_name method", { skip_on_cran() expect_equal( tax_name(tax_mrca)[1], list("Asterales" = "Asterales") ) }) test_that("mrca ott_id method", { skip_on_cran() expect_equivalent( ott_id(tax_mrca)[1], list("Asterales" = 1042120) ) expect_true(inherits(ott_id(tax_mrca), "otl_ott_id")) }) test_that("mrca unique_name method", { skip_on_cran() expect_equal( unique_name(tax_mrca)[1], list("Asterales" = "Asterales") ) expect_true(inherits( unique_name(tax_mrca), "otl_unique_name" )) }) test_that("mrca tax_sources method", { skip_on_cran() ## issue with their taxonomy skip("need to fixed upstream") expect_equal( tax_sources(tax_mrca)[1], list( "Asterales" = c( "ncbi:4209", "worms:234044", "gbif:414", "irmng:10011" ) ) ) expect_true(inherits( tax_sources(tax_mrca), "otl_tax_sources" )) }) test_that("mrca is_suppressed method", { skip_on_cran() expect_true(inherits( is_suppressed(tax_mrca), c("otl_is_suppressed", "list") )) expect_equal( is_suppressed(tax_mrca)[1], list("Asterales" = FALSE) ) }) test_that("mrca flags method", { skip_on_cran() expect_true(inherits( flags(tax_mrca), c("otl_flags", "list") )) expect_equal( flags(tax_mrca)[1], list("Asterales" = NULL) ) }) ### ott_id() -------------------------------------------------------------------- test_that("taxonomy_taxon_info with ott_id for tax_mrca", { skip_on_cran() expect_equivalent( ott_id(tax_mrca_mono), ott_id(taxonomy_taxon_info(ott_id(tax_mrca_mono))) ) }) test_that("taxonomy_subtree with ott_id for tax_mrca", { skip_on_cran() tt <- taxonomy_subtree(ott_id = ott_id(tax_mrca_mono)) expect_true(length(tt[["tip_label"]]) > 10) expect_true(length(tt[["edge_label"]]) > 1) }) test_that("tol_node_info with ott_id for tax_mrca", { skip_on_cran() expect_equivalent( ott_id(tax_mrca_mono), ott_id(tol_node_info(ott_id(tax_mrca_mono))) ) }) test_that("tol_subtree with ott_id for tax_mrca", { skip_on_cran() expect_warning( tt <- tol_subtree(ott_id = ott_id(tax_mrca_mono)), "Dropping" ) expect_true(inherits(tt, "phylo")) expect_true(length(tt$tip.label) > 1) expect_true(length(tt$node.label) > 1) }) test_that("tol_mrca with ott_id for tax_mrca", { skip_on_cran() expect_equivalent( ott_id(tax_mrca_mono), ott_id(tol_mrca(ott_id(tax_mrca_mono))) ) }) test_that("tol_induced_subtree with ott_id for tax_mrca", { skip_on_cran() expect_error( tol_induced_subtree(ott_id(tax_mrca_mono)), "least two valid" ) }) test_that("taxonomy_mrca with ott_id for tax_mrca", { skip_on_cran() expect_equivalent( ott_id(tax_mrca_mono), ott_id(taxonomy_mrca(ott_id(tax_mrca_mono))) ) }) test_that("ott_id subset works", { skip_on_cran() expect_true(inherits(ott_id(tax_mrca_mono), "otl_ott_id")) expect_true(inherits(ott_id(tax_mrca_mono)[1], "otl_ott_id")) expect_true(!is.null(names(ott_id(tax_mrca_mono)))) }) ### is_in_tree() --------------------------------------------------------------- if (identical(Sys.getenv("NOT_CRAN"), "true")) { spp <- c("Tyrannosaurus rex", "Velociraptor", "Fabaceae", "Solanaceae") ot_names <- tnrs_match_names(spp) ot_ids <- ott_id(ot_names) } test_that("test is_in_tree", { skip_on_cran() in_tree <- is_in_tree(ot_ids) expect_equal(sum(in_tree), 2) expect_true(all(names(in_tree) %in% spp)) }) rotl/tests/testthat/test-deduplicate_labels.R0000644000176200001440000000313113543627007021146 0ustar liggesuserstr_string <- " ((A,A),A 1); ((B.1,B,C),B); ((D,D_1),D.1); ((('A 1','A 1'),A.1),'A 1'); ((('A A A','A A A'),A.1),'A 1'); ((((A_1:0.1,B__2:0.1)cats:0.1,(A_1:0.1,A_1:0.1)dogs:0.1)mammals:0.1):0.1)fur:0.1; " file_dup <- tempfile() cat(tr_string, file = file_dup, sep = "\n") ############################################################################ ## parse_newick ## ############################################################################ context("parse_newick") test_that("parse newick works correctly", { prsed_str <- parse_newick(file_dup) expect_true(is.character(prsed_str)) expect_equal(length(prsed_str), 6L) }) ############################################################################ ## deduplicate_labels ## ############################################################################ context("deduplicate_labels") test_that("deduplicate labels works on made up example", { expect_warning( dedup_tr <- deduplicate_labels(file_dup), "Some tip labels were duplicated" ) expect_true(file.exists(dedup_tr)) expect_warning(phylo_tr <- rncl::read_newick_phylo(file = dedup_tr), "Dropping singleton") expect_true(inherits(phylo_tr, "multiPhylo")) expect_equal(phylo_tr[[6]]$tip.label, c("A_1_1", "B__2", "A_1_2", "A_1")) }) test_that("deduplicate labels works on a OTL study", { skip_on_cran() expect_warning( get_study_tree(study_id = "pg_710", tree_id = "tree1277", tip_label = "ott_taxon_name"), "Some tip labels were duplicated" ) }) unlink(file_dup) rotl/tests/testthat/test-api-studies.R0000644000176200001440000001354013543627000017566 0ustar liggesuserscontext("studies API tests") ########################### ## .studies_find_studies ## ########################### test_that("argument verbose needs to be logical for .studies_find_studies", { skip_on_cran() expect_error( .studies_find_studies(NULL, NULL, "123", FALSE), "logical" ) }) test_that("argument exact needs to be logical for .studies_find_studies", { skip_on_cran() expect_error( .studies_find_studies(NULL, NULL, TRUE, "123"), "logical" ) }) test_that("argument property needs to be character for .studies_find_studies", { skip_on_cran() expect_error( .studies_find_studies(123, NULL, TRUE, TRUE), "character" ) }) test_that("argument value needs to be character for .studies_find_studies", { skip_on_cran() ## there is an error but not because of the argument "value" is ## character, it looks like a number so it's OK. Failure is ## because of the value doesn't exist. expect_error( .studies_find_studies("test", "123", TRUE, TRUE), "Study property test is unknown" ) }) test_that("both property & value need to be provided for .studies_find_studies", { skip_on_cran() expect_error( .studies_find_studies("test", NULL, TRUE, TRUE), "Must supply" ) }) test_that("both property & value need to be provided for .studies_find_studies", { skip_on_cran() expect_error( .studies_find_studies(NULL, "test", TRUE, TRUE), "Must supply" ) }) ########################### ## .studies_find_trees ## ########################### test_that("argument verbose needs to be logical for .studies_find_trees", { skip_on_cran() expect_error( .studies_find_trees(NULL, NULL, "123", FALSE), "logical" ) }) test_that("argument exact needs to be logical for .studies_find_trees", { skip_on_cran() expect_error( .studies_find_trees(NULL, NULL, TRUE, "123"), "logical" ) }) test_that("argument property needs to be character for .studies_find_trees", { skip_on_cran() expect_error( .studies_find_trees(123, NULL, TRUE, TRUE), "character" ) }) test_that("argument value needs to be character for .studies_find_trees", { skip_on_cran() ## there is an error but not because of the argument "value" is ## character, it looks like a number so it's OK. Failure is ## because of the value doesn't exist. expect_error(.studies_find_trees("test", "123", TRUE, TRUE)) }) test_that("both property & value need to be provided for .studies_find_trees", { skip_on_cran() expect_error( .studies_find_trees("test", NULL, TRUE, TRUE), "Must supply" ) }) test_that("both property & value need to be provided for .studies_find_trees", { skip_on_cran() expect_error( .studies_find_trees(NULL, "test", TRUE, TRUE), "Must supply" ) }) test_that("exact works as intended", { skip_on_cran() expect_equal(length(.studies_find_studies("ot:focalCladeOTTTaxonName", "felidae", exact = TRUE )$matched_studies), 0) }) test_that("exact works as intended", { skip_on_cran() expect_true(length(.studies_find_studies("ot:focalCladeOTTTaxonName", "Felidae", exact = TRUE )$matched_studies) >= 1) }) ############################################################################ ## .get_study ## ############################################################################ test_that("study_id isn't NULL for .get_study", { skip_on_cran() expect_error( .get_study(NULL, "test"), "Must supply" ) }) test_that("study_id is character for .get_study", { skip_on_cran() expect_error( .get_study(TRUE, "test"), "character" ) }) ############################################################################ ## .get_study_tree ## ############################################################################ test_that("study_id isn't NULL for .get_study_tree", { skip_on_cran() expect_error( .get_study_tree(NULL, NULL), "Must supply" ) }) test_that("study_id isn't NULL for .get_study_tree", { skip_on_cran() expect_error( .get_study_tree("123", NULL), "Must supply" ) }) test_that("study_id isn't NULL for .get_study_tree", { skip_on_cran() expect_error( .get_study_tree(NULL, "123"), "Must supply" ) }) test_that("study_id is character for .get_study", { skip_on_cran() expect_error( .get_study_tree(TRUE, "test"), "character" ) }) test_that("study_id is character for .get_study", { skip_on_cran() expect_error( .get_study_tree("test", TRUE), "character" ) }) ############################################################################ ## .get_study_subtree ## ############################################################################ test_that("study_id isn't NULL for .get_study_subtree", { skip_on_cran() expect_error( .get_study_subtree(NULL, NULL, NULL), "Must supply" ) }) test_that("tree_id isn't NULL for .get_study_subtree", { skip_on_cran() expect_error( .get_study_subtree("123", NULL, "123"), "Must supply" ) }) test_that("subtree_id isn't NULL for .get_study_subtree", { skip_on_cran() expect_error( .get_study_subtree(NULL, "123", "123"), "Must supply" ) }) test_that("study_id isn't NULL for .get_study_subtree", { skip_on_cran() expect_error( .get_study_subtree("123", "123", NULL), "Must supply" ) }) test_that("study_id is character for .get_study", { skip_on_cran() expect_error( .get_study_subtree(TRUE, "test", "test"), "character" ) }) test_that("tree_id is character for .get_study", { skip_on_cran() expect_error( .get_study_subtree("test", TRUE, "test"), "character" ) }) test_that("subtree_id is character for .get_study", { skip_on_cran() expect_error( .get_study_subtree("test", "test", TRUE), "character" ) }) rotl/tests/testthat/test-API.R0000644000176200001440000001345713543627006015765 0ustar liggesusers#### ## Making use of the shared OpenTree testing architecture #### ## The R, Python and Ruby wrappers for the Open Tree share a very similar design, ## allowing them to make use of a single test suite for the low-level functions ## (thus, the tests both checkvan individual library works as expected, and that ## the different libraries stay in line with each other). ## ## This file pulls the current version of the test from a github repo ## (https://github.com/OpenTreeOfLife/shared-api-tests) and translates the json ## files into tests that run in testthat. This takes a considerable amount of ## infrastructure so I'll briefly described the rational here. ## ## The JSON test-specificaton is defined at the github repo linked above, to ## translate these tests I have created custom testthat expectation-functionals ## (contains(), (key_has_value()... ). Because many of the test blocks in the ## JSON files have multiple expectiatoins (i.e. many key-value pairs for ## test_equals) there are functions starting with `test_` that run an entire ## test block for a given expectation. Since many of these tests require ## translation between R-objects and JSON encoded strings there is a set of ## convienence functions to automate that step and a function "test_map" that ## returns the appropriate test_* function for r given JSON test block. ## ## Finally, testthat_json_test uses the above functions to runs an entire test ## from a JSON object, and run_shared_tests() runs every tests in a JSON file. # functionals that start with a response contains <- function(key_name) { function(x) { expectation(key_name %in% names(x), sprintf("Missing key name: %s", key_name)) } } key_has_value <- function(key, value) { function(x) { if (length(value) == 0) { expectation( length(x[[key]]) == 0, paste("Key", key, "is not empty") ) } else if (length(value) == 1) { expectation( x[[key]] == value, paste("Key", key, "doesn't have value", value) ) } else { expectation( all(x[[key]] %in% value), paste("Key", key, "doesn't contain all of", value) ) } } } value_is_longer_than <- function(key, len) { function(x) { expectation( length(x[[key]]) > len, paste("Value for key", key, "is shorter than", len) ) } } value_is_error <- function(key_name) { function(x) { expectation( x[[key_name]] == "error", sprintf("Key %s is not 'error'", key_name) ) } } ## Functions to test entire test blocks with the above expectations test_contains <- function(response, test_block) { key_names <- test_block[, 1] sapply(key_names, function(k) expect_that(response, contains(k))) } test_equals <- function(response, test_block) { kv_pairs <- sapply(test_block, "[[", 1) for (i in 1:length(kv_pairs)) { expect_that(response, key_has_value(kv_pairs[[1]], kv_pairs[[2]])) } } test_of_type <- function(response, test_block) { rtype <- type_map(test_block[[1]]) expect_that(response, is_a(rtype)) } test_deep_equals <- function(response, test_block) { cat("*") expect_true(TRUE) } test_length_greater_than <- function(response, test_block) { vl_pairs <- sapply(test_block, "[[", 1) apply(vl_pairs, 2, function(v) { expect_that(response, value_is_longer_than(v[[1]], v[[2]])) }) } test_contains_error <- function(response, test_block) { errs <- test_block[, 1] sapply(errs, function(e) expect_that(reponse, contains_error(e))) } ## convience functions obj_map <- function(input) { if (is.character(input) & length(input) == 1) { switch(tolower(input), "true" = TRUE, "false" = FALSE, "null" = NULL, input ) } else { input } } json_to_r <- function(test_input) { if (length(test_input) == 0) { return(test_input) } return(lapply(test_input, obj_map)) } type_map <- function(json_type) { switch(json_type, "dict" = "list", stop(sprintf("unknown json type in testing file: %s", json_type)) ) } test_map <- function(test_type) { switch(test_type, "contains" = test_contains, "equals" = test_equals, "deep_equals" = test_deep_equals, "error" = stop("Error tests should be handled first"), "length_greater_than" = test_length_greater_than, "of_type" = test_of_type, stop(sprintf("Unkown error type in JSON test: %s", test_type)) ) } make_request <- function(json_test) { test_fxn <- paste0(".", json_test$test_function) do.call(what = test_fxn, args = json_to_r(json_test$test_input)) } testthat_json_test <- function(test_obj, test_name) { tests_to_run <- names(test_obj[[test_name]]$tests) if (length(tests_to_run) == 1) { if (grepl("error", tests_to_run)) { expect_error(make_request(test_obj[[test_name]])) } } else { response <- make_request(test_obj[[test_name]]) for (i in 1:length(tests_to_run)) { test_block <- test_obj[[test_name]]$tests[[ tests_to_run[i] ]] test_fxn <- test_map(tests_to_run[i]) test_fxn(response, test_block) } } } run_shared_test <- function(json_obj) { all_tests <- names(json_obj) for (i in 1:length(all_tests)) { test_that(all_tests[i], { skip_on_cran() testthat_json_test(json_obj, all_tests[i]) }) } } ## if (identical(Sys.getenv("NOT_CRAN"), "true")) { ## base_url <- "https://raw.githubusercontent.com/OpenTreeOfLife/shared-api-tests/master/" ## apis <- c("graph_of_life", ## "studies", ## "taxonomy", ## "tree_of_life", ## "tnrs" ## ) ## for(i in 1:length(apis)){ ## context( paste(apis[i], "API") ) ## test_text <- httr::GET(paste0(base_url, apis[i], ".json")) ## test_description <- jsonlite::fromJSON(httr::content(test_text)) ## run_shared_test(test_description) ## } ## } rotl/tests/tree_of_life.json0000644000176200001440000000705612705157664015736 0ustar liggesusers{ "test_mrca_normal_input": { "test_function": "tol_mrca", "test_input": {"ott_ids":[412129, 536234]}, "tests": { "of_type": ["dict","Response is of wrong type"] , "equals": [ [["nearest_taxon_mrca_rank","'superorder'"],"Fails that nearest_taxon_mrca_rank contains superorder"] ], "contains": [ ["nearest_taxon_mrca_ott_id","Doesn't contain nearest_taxon_mrca_ott_id"] ] } }, "test_mrca_empty_list_input": { "test_function": "tol_mrca", "test_input": {"ott_ids":[]}, "tests": { "error": [ ["ValueError","Return wrong kind of error, or did return error"] ] } }, "test_mrca_empty_list_input_two": { "test_function": "tol_mrca", "test_input": {"ott_ids":[], "node_ids":[]}, "tests": { "error": [ ["ValueError","Return wrong kind of error, or did return error"] ] } }, "test_mrca_non_existing_node": { "test_function": "tol_mrca", "test_input": {"ott_ids":[4259824365942365972436598732]}, "tests": { "error": [ ["OpenTreeService.OpenTreeError","Return wrong kind of error, or did return error"] ] } }, "test_mrca_non_existing_empty": { "test_function": "tol_mrca", "test_input": "null", "tests": { "error": [ ["ValueError","Return wrong kind of error, or did return error"] ] } }, "test_subtree_demo": { "test_function": "tol_subtree", "test_input": {"ott_id":3599390}, "tests": { "of_type": ["dict","Response is of wrong type"] , "contains": [ ["newick","Doesn't contain a newick string"] ] } }, "test_subtree_null": { "test_function": "tol_subtree", "test_input": {}, "tests": { "error": [ ["ValueError","Return wrong kind of error, or did return error"] ], "of_type": ["jfdsm"] } }, "test_induced_tree_good": { "test_function": "tol_induced_tree", "test_input": {"ott_ids":[292466, 501678, 267845, 666104, 316878, 102710, 176458]}, "tests": { "of_type": ["dict","Response is of wrong type"] , "contains": [ ["subtree","Doesn't contain a subtree string"] ] } }, "test_induced_tree_null": { "test_function": "tol_induced_tree", "test_input": {}, "tests": { "error": [ ["ValueError","Return wrong kind of error, or did return error"] ], "of_type": ["something"] } }, "test_about": { "test_function": "tol_about", "test_input": {}, "tests": { "contains": [ ["root_taxon_name","Output doesn't contain root_taxon_name"], ["num_source_studies","Output doesn't contain num_source_studies"], ["taxonomy_version","Output doesn't contain taxonomy_version"], ["root_ott_id","Output doesn't contain root_ott_id"], ["num_tips","Output doesn't contain num_tips"] ] } } } rotl/vignettes/0000755000176200001440000000000013543637133013252 5ustar liggesusersrotl/vignettes/meta-analysis.Rmd0000644000176200001440000002351113543632562016470 0ustar liggesusers--- title: "Using the Open Tree synthesis in a comparative analysis" author: "David Winter" date: "`r Sys.Date()`" output: rmarkdown::html_vignette: css: vignette.css vignette: > %\VignetteIndexEntry{Using the Open Tree synthesis in a comparative analysis} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} %\VignetteEncoding{UTF-8} --- ## Phylogenetic Comparative Methods The development of phylogenetic comparative methods has made phylogenies and important source of data in fields as diverse as ecology, genomic and medicine. Comparative methods can be used to investigate patterns in the evolution of traits or the diversification of lineages. In other cases a phylogeny is treated as a "nuisance parameter", allowing with the autocorrelation created by the shared evolutionary history of the different species included to be controlled for. In many cases finding a tree that relates the species for which trait data are available is a rate-limiting step in such comparative analyses. Here we show how the synthetic tree provided by Open Tree of Life (and made available in R via `rotl`) can help to fill this gap. ## A phylogenetic meta-analysis To demonstrate the use of `rotl` in a comparative analysis, we will partially reproduce the results of [Rutkowska _et al_ 2014](https://doi.org/10.1111/jeb.12282). Very briefly, this study is a meta-analysis summarising the results of multiple studies testing for systematic differences in the size of eggs which contain male and female offspring. Such a difference might mean that birds invest more heavily in one sex than the other. Because this study involves data from 51 different species, Rutkowska _et al_ used a phylogenetic comparative approach to account for the shared evolutionary history among some of the studied-species. ### Gather the data If we are going to reproduce this analysis, we will first need to gather the data. Thankfully, the data is available as supplementary material from the publisher's website. We can collect the data from using `fulltext` (with the papers DOI as input) and read it into memory with `readxl::read_excel`: ```{r load-package} library(rotl) ``` ```{r egg_data} ## This should work, but Wiley has currently broken the URLs to access the ## SI. ## if (require(readxl) && require(fulltext)) { ## doi <- "10.1111/jeb.12282" ## xl_file <- try(ft_get_si(doi, 1, save.name="egg.xls"), silent = TRUE) ## egg_data <- read_excel(xl_file) ## } else { egg_data <- read.csv(system.file("extdata", "egg.csv", package = "rotl"), stringsAsFactors = FALSE ) ## } head(egg_data) ``` The most important variable in this dataset is `Zr`, which is a [normalized effect size](https://en.wikipedia.org/wiki/Fisher_transformation) for difference ,in size between eggs that contain males and females. Values close to zero come from studies that found the sex of an egg's inhabitant had little effect in its size, while large positive or negative values correspond to studies with substantial sex biases (towards males and females respectively). Since this is a meta-analysis we should produce the classic [funnel plot](https://en.wikipedia.org/wiki/Funnel_plot) with effects-size on the y-axis and precision (the inverse of the sample standard error) on the x-axis. Here we calculate precision from the sample variance (`Vzr`): ```{r eggs_in_a_funnel, fig.width=6, fig.height=3} plot(1 / sqrt(egg_data$VZr), egg_data$Zr, pch = 16, ylab = "Effect size (Zr)", xlab = "Precision (1/SE)", main = "Effect sizes for sex bias in egg size among 51 brid species" ) ``` In order to use this data later on we need to first convert it to a standard `data.frame`. We can also convert the `animal` column (the species names) to lower case, and remove the underscores in their names, which will make it easier to match names later on: ```{r, clean_eggs} egg_data <- as.data.frame(egg_data) ## Convert taxon names to lower case egg_data$animal <- tolower(egg_data$animal) ## Let's remove the underscores (_) from the taxon names egg_data$animal <- gsub("_", " ", egg_data$animal) ``` ### Find the species in OTT We can use the OTL synthesis tree to relate these species. To do so we first need to find Open Tree Taxonomy (OTT) IDs for each species. We can do that with the Taxonomic Name Resolution Service function `tnrs_match_names`: ```{r birds} taxa <- tnrs_match_names(unique(egg_data$animal), context = "Animals") head(taxa) ``` All of these species are in OTT, but a few of them go by different names in the Open Tree than we have in our data set. Because the tree `rotl` fetches will have Open Tree names, we need to create a named vector that maps the names we have for each species to the names Open Tree uses for them: ```{r bird_map} taxon_map <- structure(taxa$search_string, names = taxa$unique_name) ``` Now we can use this map to retrieve "data set names" from "OTT names": ```{r odd_duck} taxon_map["Anser caerulescens"] ``` ### Get a tree Now we can get the tree. There are really too many tips here to show nicely, so we will leave them out of this plot ```{r birds_in_a_tree, fig.width=5, fig.height=5, fig.align='center'} tr <- tol_induced_subtree(ott_id(taxa)[is_in_tree(ott_id(taxa))]) plot(tr, show.tip.label = FALSE) ``` There are a few things to note here. First, the tree has no branch lengths. At present this is true for the whole of the Open Tree synthetic tree. Some comparative methods require either branch lengths or an ultrametric tree. Before you can use one of those methods you will need to get a tree with branch lengths. You could try looking for published trees made available by the Open Tree with `studies_find_trees`. Alternatively, you could estimate branch lengths from the toplogy of a phylogeny returned by `tol_induced_subtree`, perhaps by downloading DNA sequences from the NCBI with `rentrez` or "hanging" the tree on nodes of known-age using penalized likelihood method in `ape::chronos`. In this case, we will use only the topology of the tree as input to our comparative analysis, so we can skip these steps. Second, the tip labels contain OTT IDs, which means they will not perfectly match the species names in our dataset or the taxon map that we created earlier: ```{r tip_lab} tr$tip.label[1:4] ``` Finally, the tree contains node labels for those nodes that match a higher taxonomic group, and empty character vectors (`""`) for all other nodes. Some comparative methods either do no expect node labels at all, or require all labeled nodes to have a unique name (meaning multiple "empty" labels will cause and error). We can deal with all these details easily. `rotl` provides the convenience function `strip_ott_ids` to remove the extra information from the tip labels. With the IDs removed, we can use our taxon map to replace the tip labels in the tree with the species names from dataset. ```{r clean_tips} otl_tips <- strip_ott_ids(tr$tip.label, remove_underscores = TRUE) tr$tip.label <- taxon_map[ otl_tips ] ``` Finally, we can remove the node labels by setting the `node.label` attribute of the tree to `NULL`. ```{r remove_nodes} tr$node.label <- NULL ``` ```{r match_species_tree} egg_data <- egg_data[egg_data$animal %in% tr$tip.label, ] ``` ### Perform the meta-analysis Now we have data and a tree, and we know the names in the tree match the ones in the data. It's time to do the comparative analysis. Rutkowska _et al_. used `MCMCglmm`, a Bayesian MCMC approach to fitting multi-level models,to perform their meta-analysis, and we will do the same. Of course, to properly analyse these data you would take some care in deciding on the appropriate priors to use and inspect the results carefully. In this case, we are really interested in using this as a demonstration, so we will just run a simple model. Specifically we sill fit a model where the only variable that might explain the values of `Zr` is the random factor `animal`, which corresponds to the phylogenetic relationships among species. We also provide `Zvr` as the measurement error variance, effectively adding extra weight to the results of more powerful studies. Here's how we specify and fit that model with `MCMCglmm`: ```{r model} set.seed(123) if (require(MCMCglmm, quietly = TRUE)) { pr <- list( R = list(V = 1, nu = 0.002), G = list(G1 = list(V = 1, nu = 0.002)) ) model <- MCMCglmm(Zr ~ 1, random = ~animal, pedigree = tr, mev = egg_data$VZr, prior = pr, data = egg_data, verbose = FALSE ) } else { model <- readRDS(file = system.file("extdata", "mcmcglmm_model.rds", package = "rotl")) } ``` Now that we have a result we can find out how much phylogenetic signal exists for sex-biased differences in egg-size. In a multi-level model we can use variance components to look at this, specifically the proportion of the total variance that can be explained by phylogeny is called the phylogenetic reliability, _H_. Let's calculate the _H_ for this model: ```{r PhyH} var_comps <- colMeans(model$VCV) var_comps["animal"] / sum(var_comps) ``` It appears there is almost no phylogenetic signal to the data. The relationships among species explain much less that one percent of the total variance in the data. If you were wondering, Rutkowska _et al_. report a similar result, even after adding more predictors to their model most of the variance in `Zr` was left unexplained. ## What other comparative methods can I use in R? Here we have demonstrated just one comparative analysis that you might do in R. There are an ever-growing number of packages that allow an ever-growing number of analysis to performed in R. Some "classics" like ancestral state reconstruction, phylogenetic independent contrasts and lineage through time plots are implemented in `ape`. Packages like `phytools`, `caper` and `diversitree` provide extensions to these methods. The [CRAN Phylogenetics Taskview](https://CRAN.R-project.org/view=Phylogenetics) gives a good idea of the diversity of packages and analyses that can be completed in R. rotl/vignettes/data_mashups.Rmd0000644000176200001440000002037113543632563016374 0ustar liggesusers--- title: "Connecting data to Open Tree trees" author: "David Winter" date: "`r Sys.Date()`" output: rmarkdown::html_vignette: css: vignette.css vignette: > %\VignetteIndexEntry{Connecting data to Open Tree trees} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} \usepackage[utf8]{inputenc} --- ## Combining data from OToL and other sources. One of the major goals of `rotl` is to help users combine data from other sources with the phylogenetic trees in the Open Tree database. This examples document describes some of the ways in which a user might connect data to trees from Open Tree. ## Get Open Tree IDs to match your data. Let's say you have a dataset where each row represents a measurement taken from one species, and your goal is to put these measurements in some phylogenetic context. Here's a small example: the best estimate of the mutation rate for a set of unicellular Eukaryotes along with some other property of those species which might explain the mutation rate: ```{r, data} csv_path <- system.file("extdata", "protist_mutation_rates.csv", package = "rotl") mu <- read.csv(csv_path, stringsAsFactors = FALSE) mu ``` If we want to get a tree for these species we need to start by finding the unique ID for each of these species in the Open Tree database. We can use the Taxonomic Name Resolution Service (`tnrs`) functions to do this. Before we do that we should see if any of the taxonomic contexts, which can be used to narrow a search and avoid conflicts between different codes, apply to our group of species: ```{r, context} library(rotl) tnrs_contexts() ``` Hmm, none of those groups contain all of our species. In this case we can search using the `All life` context and the function `tnrs_match_names`: ```{r, match} taxon_search <- tnrs_match_names(names = mu$species, context_name = "All life") knitr::kable(taxon_search) ``` Good, all of our species are known to Open Tree. Note, though, that one of the names is a synonym. _Saccharomyces pombe_ is older name for what is now called _Schizosaccharomyces pombe_. As the name suggests, the Taxonomic Name Resolution Service is designed to deal with these problems (and similar ones like misspellings), but it is always a good idea to check the results of `tnrs_match_names` closely to ensure the results are what you expect. In this case we have a good ID for each of our species so we can move on. Before we do that, let's ensure we can match up our original data to the Open Tree names and IDs by adding them to our `data.frame`: ```{r, munge} mu$ott_name <- unique_name(taxon_search) mu$ott_id <- taxon_search$ott_id ``` ## Find a tree with your taxa Now let's find a tree. There are two possible options here: we can search for published studies that include our taxa or we can use the 'synthetic tree' from Open Tree. We can try both approaches. ### Published trees Before we can search for published studies or trees, we should check out the list of properties we can use to perform such searches: ```{r, properties} studies_properties() ``` We have `ottIds` for our taxa, so let's use those IDs to search for trees that contain them. Starting with our first species _Tetrahymena thermophila_ we can use `studies_find_trees` to do this search. ```{r taxon_count} studies_find_trees(property = "ot:ottId", value = as.character(ott_id(taxon_search)[1])) ``` Well... that's not very promising. We can repeat that process for all of the IDs to see if the other species are better represented. ```{r, all_taxa_count} hits <- lapply(mu$ott_id, studies_find_trees, property = "ot:ottId", detailed = FALSE) sapply(hits, function(x) sum(x[["n_matched_trees"]])) ``` OK, most of our species are not in any of the published trees available. You can help fix this sort of problem by [making sure you submit your published trees to Open Tree](https://tree.opentreeoflife.org/curator). ### A part of the synthesis tree Thankfully, we can still use the complete Tree of Life made from the combined results of all of the published trees and taxonomies that go into Open Tree. The function `tol_induced_subtree` will fetch a tree relating a set of IDs. Using the default arguments you can get a tree object into your R session: ```{r subtree, fig.width=7, fig.height=4} ott_in_tree <- ott_id(taxon_search)[is_in_tree(ott_id(taxon_search))] tr <- tol_induced_subtree(ott_ids = ott_in_tree) plot(tr) ``` ### Connect your data to the tips of your tree Now we have a tree for of our species, how can we use the tree and the data together? The package `phylobase` provide an object class called `phylo4d`, which is designed to represent a phylogeny and data associated with its tips. In oder to get our tree and data into one of these objects we have to make sure the labels in the tree and in our data match exactly. That's not quite the case at the moment (tree labels have underscores and IDs appended): ```{r, match_names} mu$ott_name[1] tr$tip.label[4] ``` `rotl` provides a convienence function `strip_ott_ids` to deal with these. ```{r, sub} tr$tip.label <- strip_ott_ids(tr$tip.label, remove_underscores = TRUE) tr$tip.label %in% mu$ott_name ``` Ok, now the tips are together we can make a new dataset. The `phylo4d()` functions matches tip labels to the row names of a `data.frame`, so let's make a new dataset that contains just the relevant data and has row names to match the tree ```{r phylobase} library(phylobase) mu_numeric <- mu[, c("mu", "pop.size", "genome.size")] rownames(mu_numeric) <- mu$ott_name tree_data <- phylo4d(tr, mu_numeric) ``` And now we can plot the data and the tree together ```{r, fig.width=7, fig.height=5} plot(tree_data) ``` ## Find external data associated with studies, trees and taxa from Open Tree In the above example we looked for a tree that related species in another dataset. Now we will go the other way, and try to find data associated with Open Tree records in other databases. ### Get external data from a study Let's imagine you were interested in extending or reproducing the results of a published study. If that study is included in Open Tree you can find it via `studies_find_studies` or `studies_find_trees` and retrieve the published trees with `get_study`. `rotl` will also help you find external. The function `study_external_IDs` retrieves the DOI for a given study, and uses that to gather some more data: ```{r} extra_data <- try(study_external_IDs("pg_1980"), silent = TRUE) if (!inherits(extra_data, "try-error")) { extra_data } ``` Here the returned object contains an `external_data_url` (in this case a link to the study in Treebase), a pubmed ID for the paper and a vector IDs for the NCBI's nuleotide database. The packages `treebase` and `rentrez` provide functions to make use of these IDs within R. As an example, let's use `rentrez` to download the first two DNA seqences and print them. ```{r} library(rentrez) seqs <- try(entrez_fetch(db = "nucleotide", id = extra_data$nucleotide_ids[1:2], rettype = "fasta"), silent = TRUE) if (inherits(seqs, "try-error")) { cat("NCBI temporarily down.") } else { cat(seqs) } ``` You could further process these sequences in R with the function `read.dna` from `ape` or save them to disk by specifying a file name with `cat`. ### Find a OTT taxon in another taxonomic database It is also possible map an Open Tree taxon to a record in another taxonomic database. For instance, if we wanted to search for data about one of the tips of the sub-tree we fetched in the example above we could do so using `taxon_external_IDs`: ```{r} Tt_ids <- taxon_external_IDs(mu$ott_id[2]) Tt_ids ``` A user could then use `rgbif` to find locality records using the gbif ID or `rentrez` to get genetic or bibliometric data about from the NCBI's databases. ## What next The demonstration gets you to the point of visualizing your data in a phylogenetic context. But there's a lot more you do with this sort of data in R. For instance, you could use packages like `ape`, `caper`, `phytools` and `mcmcGLMM` to perform phylogenetic comparative analyses of your data. You could gather more data on your species using packages that connect to trait databases like `rfishbase`, `AntWeb` or `rnpn` which provides data from the US National Phenology Network. You could also use `rentrez` to find genetic data for each of your species, and use that data to generate branch lengths for the phylogeny. rotl/vignettes/rotl.Rmd0000644000176200001440000002552013543632564014705 0ustar liggesusers--- title: "How to use rotl?" author: "François Michonneau" date: "`r Sys.Date()`" output: rmarkdown::html_vignette: css: vignette.css vignette: > %\VignetteIndexEntry{How to use rotl?} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} \usepackage[utf8]{inputenc} --- `rotl` provides an interface to the Open Tree of Life (OTL) API and allows users to query the API, retrieve parts of the Tree of Life and integrate these parts with other R packages. The OTL API provides services to access: * the **Tree of Life** a.k.a. TOL (the synthetic tree): a single draft tree that is a combination of **the OTL taxonomy** and the **source trees** (studies) * the **Taxonomic name resolution services** a.k.a. TNRS: the methods for resolving taxonomic names to the internal identifiers used by the TOL and the GOL (the `ott ids`). * the **Taxonomy** a.k.a. OTT (for Open Tree Taxonomy): which represents the synthesis of the different taxonomies used as a backbone of the TOL when no studies are available. * the **Studies** containing the source trees used to build the TOL, and extracted from the scientific literature. In `rotl`, each of these services correspond to functions with different prefixes: | Service | `rotl` prefix | |---------------|---------------| | Tree of Life | `tol_` | | TNRS | `tnrs_` | | Taxonomy | `taxonomy_` | | Studies | `studies_` | `rotl` also provides a few other functions and methods that can be used to extract relevant information from the objects returned by these functions. ## Demonstration of a basic workflow The most common use for `rotl` is probably to start from a list of species and get the relevant parts of the tree for these species. This is a two step process: 1. the species names need to be matched to their `ott_id` (the Open Tree Taxonomy identifiers) using the Taxonomic name resolution services (TNRS) 1. these `ott_id` will then be used to retrieve the relevant parts of the Tree of Life. ### Step 1: Matching taxonomy to the `ott_id` Let's start by doing a search on a diverse group of taxa: a tree frog (genus _Hyla_), a fish (genus _Salmo_), a sea urchin (genus _Diadema_), and a nautilus (genus _Nautilus_). ```{r} library(rotl) taxa <- c("Hyla", "Salmo", "Diadema", "Nautilus") resolved_names <- tnrs_match_names(taxa) ``` It's always a good idea to check that the resolved names match what you intended: `r knitr::kable(resolved_names)` The column `unique_name` sometimes indicates the higher taxonomic level associated with the name. The column `number_matches` indicates the number of `ott_id` that corresponds to a given name. In this example, our search on _Diadema_ returns 2 matches, and the one returned by default is indeed the sea urchin that we want for our query. The argument `context_name` allows you to limit the taxonomic scope of your search. _Diadema_ is also the genus name of a fungus. To ensure that our search is limited to animal names, we could do: ```{r} resolved_names <- tnrs_match_names(taxa, context_name = "Animals") ``` If you are trying to build a tree with deeply divergent taxa that the argument `context_name` cannot fix, see "How to change the ott ids assigned to my taxa?" in the FAQ below. ### Step 2: Getting the tree corresponding to our taxa Now that we have the correct `ott_id` for our taxa, we can ask for the tree using the `tol_induced_subtree()` function. By default, the object returned by `tol_induced_subtree` is a phylo object (from the [ape](https://cran.r-project.org/package=ape) package), so we can plot it directly. ```{r, fig.width=7, fig.height=4} my_tree <- tol_induced_subtree(ott_ids = resolved_names$ott_id) plot(my_tree, no.margin = TRUE) ``` ## FAQ ### How to change the ott ids assigned to my taxa? If you realize that `tnrs_match_names` assigns the incorrect taxonomic group to your name (e.g., because of synonymy) and changing the `context_name` does not help, you can use the function `inspect`. This function takes the object resulting from `tnrs_match_names()`, and either the row number, the taxon name (you used in your search in lowercase), or the `ott_id` returned by the initial query. To illustrate this, let's re-use the previous query but this time pretending that we are interested in the fungus _Diadema_ and not the sea urchin: ```{r} taxa <- c("Hyla", "Salmo", "Diadema", "Nautilus") resolved_names <- tnrs_match_names(taxa) resolved_names inspect(resolved_names, taxon_name = "diadema") ``` In our case, we want the second row in this data frame to replace the information that initially matched for _Diadema_. We can now use the `update()` function, to change to the correct taxa (the fungus not the sea urchin): ```{r} resolved_names <- update(resolved_names, taxon_name = "diadema", new_row_number = 2 ) ## we could also have used the ott_id to replace this taxon: ## resolved_names <- update(resolved_names, taxon_name = "diadema", ## new_ott_id = 4930522) ``` And now our `resolved_names` data frame includes the taxon we want: `r knitr::kable(resolved_names)` ### How do I know that the taxa I'm asking for is the correct one? The function `taxonomy_taxon_info()` takes `ott_ids` as arguments and returns taxonomic information about the taxa. This output can be passed to some helpers functions to extract the relevant information. Let's illustrate this with our _Diadema_ example ```{r} diadema_info <- taxonomy_taxon_info(631176) tax_rank(diadema_info) synonyms(diadema_info) tax_name(diadema_info) ``` In some cases, it might also be useful to investigate the taxonomic tree descending from an `ott_id` to check that it's the correct taxon and to determine the species included in the Open Tree Taxonomy: ```{r} diadema_tax_tree <- taxonomy_subtree(631176) diadema_tax_tree ``` By default, this function return all taxa (including self, and internal) descending from this `ott_id` but it also possible to return `phylo` object. ### How do I get the tree for a particular taxonomic group? If you are looking to get the tree for a particular taxonomic group, you need to first identify it by its node id or ott id, and then use the `tol_subtree()` function: ```{r, fig.width=7, fig.height=4} mono_id <- tnrs_match_names("Monotremata") mono_tree <- tol_subtree(ott_id = ott_id(mono_id)) plot(mono_tree) ``` ### How do I find trees from studies focused on my favourite taxa? The function `studies_find_trees()` allows the user to search for studies matching a specific criteria. The function `studies_properties()` returns the list of properties that can be used in the search. ```{r} furry_studies <- studies_find_studies(property = "ot:focalCladeOTTTaxonName", value = "Mammalia") furry_ids <- furry_studies$study_ids ``` Now that we know the `study_id`, we can ask for the meta data information associated with this study: ```{r} furry_meta <- get_study_meta("pg_2550") get_publication(furry_meta) ## The citation for the source of the study get_tree_ids(furry_meta) ## This study has 10 trees associated with it candidate_for_synth(furry_meta) ## None of these trees are yet included in the OTL ``` Using `get_study("pg_2550")` would returns a `multiPhylo` object (default) with all the trees associated with this particular study, while `get_study_tree("pg_2550", "tree5513")` would return one of these trees. ### The tree returned by the API has duplicated tip labels, how can I work around it? You may encounter the following error message: ``` Error in rncl(file = file, ...) : Taxon number 39 (coded by the token Pratia angulata) has already been encountered in this tree. Duplication of taxa in a tree is prohibited. ``` This message occurs as duplicate labels are not allowed in the NEXUS format and it is stricly enforced by the part of the code used by `rotl` to import the trees in memory. If you use a version of `rotl` more recent than 0.4.1, this should not happen by default for the function `get_study_tree`. If it happens with another function, please [let us know](https://github.com/ropensci/rotl/issues). The easiest way to work around this is to save the tree in a file, and use APE to read it in memory: ```{r, eval=FALSE} get_study_tree( study_id = "pg_710", tree_id = "tree1277", tip_label = "ott_taxon_name", file = "/tmp/tree.tre", file_format = "newick" ) tr <- ape::read.tree(file = "/tmp/tree.tre") ``` ### How do I get the higher taxonomy for a given taxa? If you encounter a taxon name you are not familiar with, it might be useful to obtain its higher taxonomy to see where it fits in the tree of life. We can combine several taxonomy methods to extract this information easily. ```{r} giant_squid <- tnrs_match_names("Architeuthis") tax_lineage(taxonomy_taxon_info(ott_id(giant_squid), include_lineage = TRUE)) ``` ### Why are OTT IDs discovered with `rotl` missing from an induced subtree? Some taxonomic names that can be retrieved through the taxonomic name resolution service are not part of the Open Tree's synthesis tree. These are usually traditional higher-level taxa that have been found to be paraphyletic. For instance, if you wanted to fetch a tree relating the three birds that go into a [Turkducken](https://en.wikipedia.org/wiki/Turducken) as well as the pork used for stuffing, you might search for the turkey, duck, chicken, and pork genera: ```{r} turducken <- c("Meleagris", "Anas", "Gallus", "Sus") taxa <- tnrs_match_names(turducken, context = "Animals") taxa ``` We have the OTT ids for each genus, however, if we tried to get the induced subtree from these results, we would get an error: ```{r, error=TRUE} tr <- tol_induced_subtree(ott_id(taxa)) ``` As the error message suggests, some of the taxa are not found in the synthetic tree. This occurs for 2 main reasons: either the taxa is invalid, or it is part of a group that is not monophyletic in the synthetic tree. There are two ways to get around this issue: (1) removing the taxa that are not part of the Open Tree; (2) using the complete species name. #### Removing the taxa missing from the synthetic tree To help with this situation, `rotl` provides a way to identify the OTT ids that are not part of the synthetic tree. The function `is_in_tree()` takes the output of the `ott_id()` function and returns a vector of logical indicating whether the taxa are part of the synthetic tree. We can then use to only keep the taxa that appear in the synthetic tree: ```{r} in_tree <- is_in_tree(ott_id(taxa)) in_tree tr <- tol_induced_subtree(ott_id(taxa)[in_tree]) ``` #### Using the full taxonomic names The best way to avoid these problems is to specify complete species names (species being the lowest level of classification in the Open Tree taxonomy they are guaranteed to be monophyletic): ```{r, fig.width=7, fig.height=4} turducken_spp <- c("Meleagris gallopavo", "Anas platyrhynchos", "Gallus gallus", "Sus scrofa") taxa <- tnrs_match_names(turducken_spp, context = "Animals") tr <- tol_induced_subtree(ott_id(taxa)) plot(tr) ``` rotl/vignettes/vignette.css0000644000176200001440000000726612647504570015626 0ustar liggesusersbody { background-color: #fff; margin: 1em auto; max-width: 700px; overflow: visible; padding-left: 2em; padding-right: 2em; font-family: "Open Sans", "Helvetica Neue", Helvetica, Arial, sans-serif; font-size: 14px; line-height: 1.35; } #header { text-align: center; } #TOC { clear: both; margin: 0 0 10px 10px; padding: 4px; width: 400px; border: 1px solid #CCCCCC; border-radius: 5px; background-color: #f6f6f6; font-size: 13px; line-height: 1.3; } #TOC .toctitle { font-weight: bold; font-size: 15px; margin-left: 5px; } #TOC ul { padding-left: 40px; margin-left: -1.5em; margin-top: 5px; margin-bottom: 5px; } #TOC ul ul { margin-left: -2em; } #TOC li { line-height: 16px; } table { margin: 1em auto; border-width: 1px; border-color: #DDDDDD; border-style: outset; border-collapse: collapse; } table th { border-width: 2px; padding: 5px; border-style: inset; } table td { border-width: 1px; border-style: inset; line-height: 18px; padding: 5px 5px; } table, table th, table td { border-left-style: none; border-right-style: none; } table thead, table tr.even { background-color: #f7f7f7; } p { margin: 0.5em 0; } blockquote { background-color: #f6f6f6; padding: 0.25em 0.75em; } hr { border-style: solid; border: none; border-top: 1px solid #777; margin: 28px 0; } dl { margin-left: 0; } dl dd { margin-bottom: 13px; margin-left: 13px; } dl dt { font-weight: bold; } ul { margin-top: 0; } ul li { list-style: circle outside; } ul ul { margin-bottom: 0; } pre, code { background-color: #f7f7f7; border-radius: 3px; color: #333; white-space: pre-wrap; } pre { /*white-space: pre-wrap; /* Wrap long lines */ border-radius: 3px; margin: 5px 0px 10px 0px; padding: 10px; } pre:not([class]) { background-color: #f7f7f7; } code { font-family: Consolas, Monaco, 'Courier New', monospace; font-size: 85%; } p > code, li > code { padding: 2px 0px; } div.figure { text-align: center; } img { background-color: #FFFFFF; padding: 2px; border: 1px solid #DDDDDD; border-radius: 3px; border: 1px solid #CCCCCC; margin: 0 5px; } h1 { margin-top: 0; font-size: 35px; line-height: 40px; } h2 { border-bottom: 4px solid #f7f7f7; padding-top: 10px; padding-bottom: 2px; font-size: 145%; } h3 { border-bottom: 2px solid #f7f7f7; padding-top: 10px; font-size: 120%; } h4 { border-bottom: 1px solid #f7f7f7; margin-left: 8px; font-size: 105%; } h5, h6 { border-bottom: 1px solid #ccc; font-size: 105%; } a { color: #0033dd; text-decoration: none; } a:hover { color: #6666ff; } a:visited { color: #800080; } a:visited:hover { color: #BB00BB; } a[href^="http:"] { text-decoration: underline; } a[href^="https:"] { text-decoration: underline; } /* Class described in https://benjeffrey.com/posts/pandoc-syntax-highlighting-css Colours from https://gist.github.com/robsimmons/1172277 */ code > span.kw { color: #555; font-weight: bold; } /* Keyword */ code > span.dt { color: #902000; } /* DataType */ code > span.dv { color: #40a070; } /* DecVal (decimal values) */ code > span.bn { color: #d14; } /* BaseN */ code > span.fl { color: #d14; } /* Float */ code > span.ch { color: #d14; } /* Char */ code > span.st { color: #d14; } /* String */ code > span.co { color: #888888; font-style: italic; } /* Comment */ code > span.ot { color: #007020; } /* OtherToken */ code > span.al { color: #ff0000; font-weight: bold; } /* AlertToken */ code > span.fu { color: #900; font-weight: bold; } /* Function calls */ code > span.er { color: #a61717; background-color: #e3d2d2; } /* ErrorTok */ rotl/R/0000755000176200001440000000000013543637134011444 5ustar liggesusersrotl/R/methods.R0000644000176200001440000000625713543626747013254 0ustar liggesusers############################################################################ ## methods ## ############################################################################ ##' Methods for dealing with objects containing taxonomic information ##' (Taxonomy, TNRS endpoints) ##' ##' This is the page for the generic methods. See the help pages for ##' \code{\link{taxonomy_taxon_info}}, \code{\link{taxonomy_mrca}}, and ##' \code{\link{tnrs_match_names}} for more information. ##' ##' @title Methods for Taxonomy ##' @param tax an object returned by \code{\link{taxonomy_taxon_info}}, ##' \code{\link{taxonomy_mrca}}, or \code{\link{tnrs_match_names}} ##' @param ... additional arguments (see ##' \code{\link{tnrs_match_names}}) ##' @rdname taxonomy-methods ##' @export tax_rank <- function(tax, ...) { UseMethod("tax_rank") } ##' @export ##' @rdname taxonomy-methods ott_id <- function(tax, ...) { UseMethod("ott_id") } ##' @export ##' @rdname taxonomy-methods synonyms <- function(tax, ...) { UseMethod("synonyms") } ##' @export ##' @rdname taxonomy-methods tax_sources <- function(tax, ...) UseMethod("tax_sources") ##' @export ##' @rdname taxonomy-methods is_suppressed <- function(tax, ...) UseMethod("is_suppressed") ##' @export ##' @rdname taxonomy-methods unique_name <- function(tax, ...) UseMethod("unique_name") ##' @export ##' @rdname taxonomy-methods tax_name <- function(tax, ...) UseMethod("tax_name") ### flags ----------------------------------------------------------------------- ##' @export ##' @rdname match_names-methods flags <- function(tax, ...) UseMethod("flags") ### ##' Retrieve the detailed information for the list of studies used in ##' the Tree of Life. ##' ##' @title List of studies used in the Tree of Life ##' ##' @details This function takes the object resulting from ##' \code{tol_about(study_list = TRUE)}, \code{tol_mrca()}, ##' \code{tol_node_info()}, and returns a data frame listing the ##' \code{tree_id}, \code{study_id} and \code{git_sha} for the ##' studies currently included in the Tree of Life. ##' ##' @param tax a list containing a \code{source_id_map} slot. ##' @param ... additional arguments (currently unused) ##' ##' @return a data frame ##' @export source_list <- function(tax, ...) UseMethod("source_list") ##' Extract the lineage information (higher taxonomy) from an object ##' returned by \code{\link{taxonomy_taxon_info}}. ##' ##' The object passed to this function must have been created using ##' the argument \code{include_lineage=TRUE}. ##' ##' @title Lineage of a taxon ##' @param tax an object created by \code{\link{taxonomy_taxon_info}} ##' using the argument \code{include_lineage=TRUE}. ##' @param ... additional arguments (currently unused). ##' @return A list with one slot per taxon that contains a data frame ##' with 3 columns: the taxonomy rank, the name, and unique name ##' for all taxa included in the lineage of the taxon up to the ##' root of the tree. ##' @rdname tax_lineage ##' @export tax_lineage <- function(tax, ...) UseMethod("tax_lineage") ##' @export ##' @rdname tol_node_info tol_lineage <- function(tax, ...) UseMethod("tol_lineage") rotl/R/api-taxonomy.R0000644000176200001440000000446513543626726014232 0ustar liggesusers##' @importFrom httr content ## Summary information about the OpenTree Taxonomy (OTT) .taxonomy_about <- function(...) { res <- otl_POST(path = "/taxonomy/about", body = list(), ...) res } ##' @importFrom jsonlite unbox ##' @importFrom httr content ##' @importFrom assertthat is.flag ##' @importFrom assertthat assert_that ## Information about an OpenTree Taxonomy (OTT) taxon .taxonomy_taxon_info <- function(ott_id = NULL, include_children = FALSE, include_lineage = FALSE, include_terminal_descendants = FALSE, ...) { ott_id <- check_ott_ids(ott_id) if (length(ott_id) > 1) { stop("Must only supply one ", sQuote("ott_id"), " argument") } assertthat::assert_that(assertthat::is.flag(include_children)) assertthat::assert_that(assertthat::is.flag(include_lineage)) assertthat::assert_that(assertthat::is.flag(include_terminal_descendants)) q <- list( ott_id = jsonlite::unbox(ott_id), include_children = jsonlite::unbox(include_children), include_lineage = jsonlite::unbox(include_lineage), include_terminal_descendants = jsonlite::unbox(include_terminal_descendants) ) res <- otl_POST(path = "/taxonomy/taxon_info", body = q, ...) res } ##' @importFrom jsonlite unbox ##' @importFrom httr content ## Get a subtree from the OpenTree Taxonomy (OTT) taxonomic tree .taxonomy_subtree <- function(ott_id = NULL, label_format = NULL, ...) { ott_id <- check_ott_ids(ott_id) if (length(ott_id) > 1) { stop("Must only supply one ", sQuote("ott_id"), " argument") } q <- list(ott_id = jsonlite::unbox(ott_id)) if (!is.null(label_format)) { if (!check_label_format(label_format)) { stop( sQuote("label_format"), " must be one of: ", sQuote("name"), ", ", sQuote("id"), ", or ", sQuote("name_and_id") ) } q$label_format <- jsonlite::unbox(label_format) } res <- otl_POST(path = "/taxonomy/subtree", body = q, ...) res } ##' @importFrom httr content ## Get the most recent common ancestor (MRCA) from nodes in the OpenTree Taxonomy (OTT) .taxonomy_mrca <- function(ott_ids = NULL, ...) { ott_ids <- check_ott_ids(ott_ids) q <- list(ott_ids = ott_ids) res <- otl_POST(path = "/taxonomy/mrca", body = q, ...) res } rotl/R/match_names.R0000644000176200001440000003362113543626746014062 0ustar liggesusers## internal function that match the arguments provided to the correct ## row number in the data frame representing the Open Tree Taxonomy ## for a series of matched names. check_args_match_names <- function(response, row_number, taxon_name, ott_id) { orig_order <- attr(response, "original_order") if (is.null(orig_order)) { stop( sQuote(substitute(response)), " was not created using ", sQuote("tnrs_match_names") ) } if (missing(row_number) && missing(taxon_name) && missing(ott_id)) { stop( "You must specify one of ", sQuote("row_number"), sQuote("taxon_name"), " or ", sQuote("ott_id") ) } else if (!missing(row_number) && missing(taxon_name) && missing(ott_id)) { if (!is.numeric(row_number)) { stop(sQuote("row_number"), " must be a numeric.") } if (!all(row_number %in% orig_order)) { stop(sQuote("row_number"), " is not a valid row number.") } i <- orig_order[row_number] } else if (missing(row_number) && !missing(taxon_name) && missing(ott_id)) { if (!is.character(taxon_name)) { stop(sQuote("taxon_name"), " must be a character.") } i <- orig_order[match(tolower(taxon_name), response$search_string)] if (any(is.na(i))) { stop("Can't find ", taxon_name) } } else if (missing(row_number) && missing(taxon_name) && !missing(ott_id)) { if (!check_numeric(ott_id)) { stop(sQuote("ott_id"), " must look like a number.") } i <- orig_order[match(ott_id, response$ott_id)] if (any(is.na(i))) stop("Can't find ", ott_id) } else { stop( "You must use only one of ", sQuote("row_number"), sQuote("taxon_name"), " or ", sQuote("ott_id"), "." ) } if (length(i) > 1) { stop("You must supply a single element for each argument.") } i } match_row_number <- function(response, row_number, taxon_name, ott_id) { ## all the checks on the validity of the arguments are taken care ## by check_args_match_names() if (missing(row_number) && missing(taxon_name) && missing(ott_id)) { stop( "You must specify one of ", sQuote("row_number"), " ", sQuote("taxon_name"), " ", sQuote("ott_id") ) } else if (!missing(row_number) && (missing(taxon_name) && missing(ott_id))) { i <- row_number } else if (!missing(taxon_name) && (missing(row_number) && missing(ott_id))) { i <- match(tolower(taxon_name), response[["search_string"]]) } else if (!missing(ott_id) && (missing(row_number) && missing(taxon_name))) { i <- match(ott_id, response[["ott_id"]]) } else { stop( "You must use only one of ", sQuote("row_number"), " ", sQuote("taxon_name"), " ", sQuote("ott_id") ) } if (length(i) > 1) { stop("You must supply a single element for each argument.") } i } ##' Taxonomic names may have different meanings in different taxonomic ##' contexts, as the same genus name can be applied to animals and ##' plants for instance. Additionally, the meaning of a taxonomic name ##' may have change throughout its history, and may have referred to a ##' different taxon in the past. In such cases, a given names might ##' have multiple matches in the Open Tree Taxonomy. These functions ##' allow users to inspect (and update) alternative meaning of a given ##' name and its current taxonomic status according to the Open Tree ##' Taxonomy. ##' ##' To inspect alternative taxonomic meanings of a given name, you ##' need to provide the object resulting from a call to the ##' tnrs_match_names function, as well as one of either the row number ##' corresponding to the name in this object, the name itself (as used ##' in the original query), or the ott_id listed for this name. ##' ##' To update one of the name, you also need to provide the row number ##' in which the name to be replaced appear or its ott id. ##' ##' @title Inspect and Update alternative matches for a name returned ##' by tnrs_match_names ##' @param response an object generated by the ##' \code{\link{tnrs_match_names}} function ##' @param row_number the row number corresponding to the name to ##' inspect ##' @param taxon_name the taxon name corresponding to the name to ##' inspect ##' @param ott_id the ott id corresponding to the name to inspect ##' @param ... currently ignored ##' @return a data frame ##' @seealso \code{\link{tnrs_match_names}} ##' @examples ##' \dontrun{ ##' matched_names <- tnrs_match_names(c("holothuria", "diadema", "boletus")) ##' inspect(matched_names, taxon_name="diadema") ##' new_matched_names <- update(matched_names, taxon_name="diadema", ##' new_ott_id = 631176) ##' new_matched_names ##' } ##' @export ##' @rdname match_names inspect.match_names <- function(response, row_number, taxon_name, ott_id, ...) { i <- check_args_match_names(response, row_number, taxon_name, ott_id) j <- match_row_number(response, row_number, taxon_name, ott_id) if (attr(response, "has_original_match")[j]) { res <- attr(response, "original_response") summary_match <- build_summary_match(res, res_id = i, match_id = NULL, initial_creation = FALSE ) } else { summary_match <- response[j, ] } clean_tnrs_summary(summary_match) } ##' @export ##' @rdname match_names inspect <- function(response, ...) UseMethod("inspect") ##' @param object an object created by \code{\link{tnrs_match_names}} ##' @param new_row_number the row number in the output of ##' \code{\link{inspect}} to replace the taxa specified by ##' \code{row_number}, \code{taxon_name}, or \code{ott_id}. ##' @param new_ott_id the ott id of the taxon to replace the taxa ##' specified by \code{row_number}, \code{taxon_name}, or ##' \code{ott_id}. ##' @export ##' @rdname match_names ##' @importFrom stats update update.match_names <- function(object, row_number, taxon_name, ott_id, new_row_number, new_ott_id, ...) { response <- object i <- check_args_match_names(response, row_number, taxon_name, ott_id) j <- match_row_number(response, row_number, taxon_name, ott_id) res <- attr(response, "original_response") if (!attr(response, "has_original_match")[j]) { warning( "There is no match for this name, ", "so there is nothing to replace it with." ) return(response) } tmpRes <- res$results[[i]] if (missing(row_number)) { if (!missing(taxon_name)) { rnb <- match(tolower(taxon_name), response$search_string) } else if (!missing(ott_id)) { rnb <- match(ott_id, response$ott_id) } } else { rnb <- row_number } if (missing(new_row_number) && missing(new_ott_id)) { stop( "You must specify either ", sQuote("new_row_number"), " or ", sQuote("new_ott_id") ) } else if (!missing(new_row_number) && missing(new_ott_id)) { if (!new_row_number %in% seq_len(length(tmpRes$matches))) { stop(sQuote("new_row_number"), " is not a valid row number.") } j <- new_row_number } else if (missing(new_row_number) && !missing(new_ott_id)) { all_ott_id <- sapply( lapply( tmpRes[["matches"]], function(x) x[["taxon"]] ), function(x) .tax_ott_id(x) ) j <- match(new_ott_id, all_ott_id) if (any(is.na(j))) stop("Can't find ", new_ott_id) } else { stop( "You must use only one of ", sQuote("new_row_number"), " or ", sQuote("new_ott_id") ) } if (length(j) > 1) stop("You must supply a single element for each argument") summ_match <- summary_row_factory(res, res_id = i, match_id = j) response[rnb, ] <- summ_match attr(response, "match_id")[rnb] <- j clean_tnrs_summary(response) } ## Access the elements for a given match: ## is_synonym, score, nomenclature_code, is_approximate_match, taxon get_list_element <- function(response, i, list_name) { list_content <- lapply( response[["results"]][[i]][["matches"]], function(x) { x[[list_name]] } ) list_content } match_names_method_factory <- function(list_name) { function(tax, row_number, taxon_name, ott_id, ...) { response <- tax res <- attr(response, "original_response") no_args <- all(c( missing(row_number), missing(taxon_name), missing(ott_id) )) if (no_args) { res_i <- attr(response, "original_order")[attr(response, "has_original_match")] ret <- lapply(res_i, function(i) { get_list_element(res, i, list_name) }) names(ret) <- sapply(res_i, function(i) { get_list_element(res, i, "matched_name")[[1]] }) ## ret is already in the correct order so we can use a sequence ## to extract the correct element ret <- mapply(function(x, i) { ret[[x]][i] }, seq_along(ret), attr(response, "match_id")[attr(response, "has_original_match")]) if (all(sapply(ret, length) == 1)) { ret <- unlist(ret, use.names = TRUE) } } else { i <- check_args_match_names(response, row_number, taxon_name, ott_id) j <- match_row_number(response, row_number, taxon_name, ott_id) if (attr(response, "has_original_match")[j]) { ret <- get_list_element(res, i, list_name)[attr(response, "match_id")[j]] } else { ret <- list( ott_id = NA_character_, name = response[["search_string"]][j], unique_name = NA_character_, rank = NA_character_, tax_sources = NA_character_, flags = NA_character_, synonyms = NA_character_, is_suppressed = NA_character_ ) ret <- list(ret) } } ret } } match_names_taxon_method_factory <- function(.f) { function(tax, row_number, taxon_name, ott_id, ...) { extract_tax_list <- match_names_method_factory("taxon") tax_info <- extract_tax_list(tax, row_number = row_number, taxon_name = taxon_name, ott_id = ott_id ) res <- lapply(tax_info, function(x) .f(x)) names(res) <- vapply(tax_info, function(x) .tax_unique_name(x), character(1)) res <- add_otl_class(res, .f) res } } ##' \code{rotl} provides a collection of functions that allows users ##' to extract relevant information from an object generated by ##' \code{\link{tnrs_match_names}} function. ##' ##' These methods optionally accept one of the arguments ##' \code{row_number}, \code{taxon_name} or \code{ott_id} to retrieve ##' the corresponding information for one of the matches in the object ##' returned by the \code{\link{tnrs_match_names}} function. ##' ##' If these arguments are not provided, these methods can return ##' information for the matches currently listed in the object ##' returned by \code{\link{tnrs_match_names}}. ##' ##' @title \code{ott_id} and \code{flags} for taxonomic names matched ##' by \code{tnrs_match_names} ##' @param tax an object returned by \code{\link{tnrs_match_names}} ##' @param row_number the row number corresponding to the name for ##' which to list the synonyms ##' @param taxon_name the taxon name corresponding to the name for ##' which to list the synonyms ##' @param ott_id the ott id corresponding to the name for which to ##' list the synonyms ##' @param ... currently ignored ##' @return A list of the ott ids or flags for the taxonomic names ##' matched with \code{\link{tnrs_match_names}}, for either one or ##' all the names. ##' @examples ##' \dontrun{ ##' rsp <- tnrs_match_names(c("Diadema", "Tyrannosaurus")) ##' rsp$ott_id # ott id for match currently in use ##' ott_id(rsp) # similar as above but elements are named ##' ##' ## flags() is useful for instance to determine if a taxon is extinct ##' flags(rsp, taxon_name="Tyrannosaurus") ##' } ##' @export ##' @rdname match_names-methods ott_id.match_names <- match_names_taxon_method_factory(.tax_ott_id) ##' @export ##' @rdname match_names-methods flags.match_names <- match_names_taxon_method_factory(.tax_flags) ##' When querying the Taxonomic Name Resolution Services for a ##' particular taxonomic name, the API returns as possible matches all ##' names that include the queried name as a possible synonym. This ##' function allows you to explore other synonyms for an accepted ##' name, and allows you to determine why the name you queried is ##' returning an accepted synonym. ##' ##' To list synonyms for a given taxonomic name, you need to provide ##' the object resulting from a call to the ##' \code{\link{tnrs_match_names}} function, as well as one of either ##' the row number corresponding to the name in this object, the name ##' itself (as used in the original query), or the ott_id listed for ##' this name. Otherwise, the synonyms for all the currently matched ##' names are returned. ##' ##' @title List the synonyms for a given name ##' @param tax a data frame generated by the ##' \code{\link{tnrs_match_names}} function ##' @param row_number the row number corresponding to the name for ##' which to list the synonyms ##' @param taxon_name the taxon name corresponding to the name for ##' which to list the synonyms ##' @param ott_id the ott id corresponding to the name for which to ##' list the synonyms ##' @param ... currently ignored ##' @return a list whose elements are all synonym names (as vectors of ##' character) for the taxonomic names that match the query (the ##' names of the elements of the list). ##' @examples ##' \dontrun{ ##' echino <- tnrs_match_names(c("Diadema", "Acanthaster", "Fromia")) ##' ## These 3 calls are identical ##' synonyms(echino, taxon_name="Acanthaster") ##' synonyms(echino, row_number=2) ##' synonyms(echino, ott_id=337928) ##' } ##' @export synonyms.match_names <- match_names_taxon_method_factory(.tax_synonyms) ##' @export tax_sources.match_names <- match_names_taxon_method_factory(.tax_sources) ##' @export tax_rank.match_names <- match_names_taxon_method_factory(.tax_rank) ##' @export is_suppressed.match_names <- match_names_taxon_method_factory(.tax_is_suppressed) ##' @export unique_name.match_names <- match_names_taxon_method_factory(.tax_unique_name) ##' @export tax_name.match_names <- match_names_taxon_method_factory(.tax_name) rotl/R/api-tol.R0000644000176200001440000001076113543626732013143 0ustar liggesusers##' @importFrom jsonlite unbox ##' @importFrom httr content ##' @importFrom assertthat is.flag ## Summary information about the OpenTree Tree of Life .tol_about <- function(include_source_list = FALSE, ...) { if (!assertthat::is.flag(include_source_list)) { stop("Argument ", sQuote("include_ource_list"), " must be of class ", sQuote("logical")) } q <- list(include_source_list = jsonlite::unbox(include_source_list)) res <- otl_POST(path = "tree_of_life/about", body = q, ...) res } ##' @importFrom jsonlite unbox ##' @importFrom httr content ## Get summary information about a node in the OpenTree Tree of Life .tol_node_info <- function(ott_id = NULL, node_id = NULL, include_lineage = FALSE, ...) { if (!is.logical(include_lineage)) { stop("Argument \'include_lineage\' must be of class \"logical\"") } if (is.null(ott_id) && is.null(node_id)) { stop("Must provide either ", sQuote("ott_id"), " or ", sQuote("node_id")) } if (!is.null(ott_id) && !is.null(node_id)) { stop("Must provide either ", sQuote("ott_id"), " or ", sQuote("node_id"), ", not both.") } if (!is.null(ott_id)) { ott_id <- check_ott_ids(ott_id) if (length(ott_id) != 1) { stop("Please provide a single ", sQuote("ott_id"), call. = FALSE) } q <- list(ott_id = jsonlite::unbox(ott_id), include_lineage = jsonlite::unbox(include_lineage)) } else { if (!check_valid_node_id(node_id)) { stop("Argument ", sQuote("node_id"), " must look like \'ott123\' or \'mrcaott123ott456\'.") } q <- list(node_id = jsonlite::unbox(node_id), include_lineage = jsonlite::unbox(include_lineage)) } res <- otl_POST(path = "tree_of_life/node_info", body = q, ...) res } ##' @importFrom httr content ## Get the MRCA of a set of nodes .tol_mrca <- function(ott_ids = NULL, node_ids = NULL, ...) { if (is.null(ott_ids) && is.null(node_ids)) { stop("Must provide ", sQuote("ott_ids"), " or ", sQuote("node_ids"), " (or both).") } q <- list() if (!is.null(ott_ids)) { ott_ids <- check_ott_ids(ott_ids) q$ott_ids <- ott_ids } if (!is.null(node_ids)) { check_node_ids(node_ids) q$node_ids <- node_ids } res <- otl_POST(path = "tree_of_life/mrca", body = q, ...) res } # ignoring 'include_lineage' for subtree below. arguson only ##' @importFrom jsonlite unbox ##' @importFrom httr content ## Get a subtree from the OpenTree Tree of Life .tol_subtree <- function(ott_id = NULL, node_id = NULL, label_format = NULL, ...) { if (is.null(ott_id) && is.null(node_id)) { stop("Must provide either ", sQuote("ott_id"), " or ", sQuote("node_id")) } if (!is.null(ott_id) && !is.null(node_id)) { stop("Must provide either ", sQuote("ott_id"), " or ", sQuote("node_id"), ", not both.") } if (!is.null(ott_id)) { ott_id <- check_ott_ids(ott_id) if (length(ott_id) != 1) { stop("Please provide a single ", sQuote("ott_id")) } q <- list(ott_id = jsonlite::unbox(ott_id)) } else { if (!check_valid_node_id(node_id)) { stop("Argument ", sQuote("node_id"), " must look like \'ott123\' or \'mrcaott123ott456\'.") } q <- list(node_id = jsonlite::unbox(node_id)) } if (!is.null(label_format)) { if (!check_label_format(label_format)) { stop( sQuote("label_format"), " must be one of: ", sQuote("name"), ", ", sQuote("id"), ", or ", sQuote("name_and_id") ) } q$label_format <- jsonlite::unbox(label_format) } res <- otl_POST(path = "tree_of_life/subtree", body = q, ...) res } ##' @importFrom httr content ## Get an induced subtree from the OpenTree Tree of Life from a set of nodes .tol_induced_subtree <- function(ott_ids = NULL, node_ids = NULL, label_format = NULL, ...) { if (is.null(ott_ids) && is.null(node_ids)) { stop("Must provide ", sQuote("ott_ids"), " or ", sQuote("node_ids"), " (or both).") } q <- list() if (!is.null(label_format)) { if (!check_label_format(label_format)) { stop( sQuote("label_format"), " must be one of: ", sQuote("name"), ", ", sQuote("id"), ", or ", sQuote("name_and_id") ) } q$label_format <- jsonlite::unbox(label_format) } if (!is.null(ott_ids)) { ott_ids <- check_ott_ids(ott_ids) q$ott_ids <- ott_ids } if (!is.null(node_ids)) { check_node_ids(node_ids) q$node_ids <- node_ids } if ((length(ott_ids) + length(node_ids)) < 2) { stop("At least two valid ", sQuote("ott_ids"), " or ", sQuote("node_ids"), " must be provided.") } res <- otl_POST("tree_of_life/induced_subtree", body = q, ...) res } rotl/R/api-collections.R0000644000176200001440000000166613543626721014665 0ustar liggesusers##' @importFrom assertthat assert_that is.flag ## This endpoint currently returns JSON in XML with mime type as text/html .collection_find_collections <- function(property = NULL, value = NULL, verbose = FALSE, ...) { assertthat::assert_that(assertthat::is.flag(verbose)) req_body <- list() req_body$verbose <- verbose res <- otl_POST( path = "collections/find_collections", body = req_body, ... ) res } .collection_properties <- function(...) { req_body <- list() res <- otl_POST( path = "collections/properties", body = req_body, ... ) res } .get_collection <- function(owner_id = NULL, collection_name = NULL, ...) { assertthat::assert_that(assertthat::is.string(owner_id)) assertthat::assert_that(assertthat::is.string(collection_name)) req_body <- list() res <- otl_GET(path = paste("collections", owner_id, collection_name, sep = "/" ), ...) res } rotl/R/base.R0000644000176200001440000001227613543630257012510 0ustar liggesusersotl_url <- function(dev = FALSE) { if (dev) { "https://devapi.opentreeoflife.org" } else { "https://api.opentreeoflife.org" } } otl_version <- function(version) { if (missing(version)) { return("v3") } else { return(version) } } # Take a request object and return list (if JSON) or plain text (if another # type) ##' @importFrom httr content ##' @importFrom jsonlite fromJSON otl_parse <- function(req) { if (grepl("application/json", req[["headers"]][["content-type"]])) { return(jsonlite::fromJSON(httr::content(req, "text", encoding = "UTF-8"), simplifyVector = FALSE)) } txt <- httr::content(req, as = "text", encoding = "UTF-8") if (identical(txt, "")) { stop("No output to parse; check your query.", call. = FALSE) } txt } otl_check_error <- function(cont) { if (is.list(cont)) { if (exists("description", cont)) { if (exists("Error", cont$description)) { stop(paste("Error: ", cont$description$error, "\n", sep = "")) } else if (exists("message", cont)) { stop(paste("Message: ", cont$descrption$message, "\n", sep = "")) } } } } ## Check and parse result of query otl_check <- function(req) { if (!req$status_code < 400) { msg <- otl_parse(req) stop("HTTP failure: ", req$status_code, "\n", msg, call. = FALSE) } desc <- otl_parse(req) otl_check_error(desc) desc } ##' @importFrom httr GET otl_GET <- function(path, url = otl_url(...), otl_v = otl_version(...), ...) { req <- httr::GET(url, path = paste(otl_v, path, sep = "/"), ...) otl_check(req) } ##' @importFrom jsonlite toJSON ##' @importFrom httr POST otl_POST <- function(path, body, url = otl_url(...), otl_v = otl_version(...), ...) { stopifnot(is.list(body)) body_json <- ifelse(length(body), jsonlite::toJSON(body), "") req <- httr::POST(url, path = paste(otl_v, path, sep = "/"), body = body_json, ... ) otl_check(req) } otl_formats <- function(format) { switch(tolower(format), "nexus" = ".nex", "newick" = ".tre", "nexml" = ".nexml", "json" = ".json", "" ) # fall through is no extension = nex(j)son } ## Strip all characters except the ottId from a OpenTree label (internal or terminal) otl_ottid_from_label <- function(label) { return(as.numeric(gsub("(.+[ _]ott)([0-9]+)", "\\2", label))) } ##' @importFrom rncl read_newick_phylo phylo_from_otl <- function(res, dedup = FALSE) { if (is.list(res)) { if (!is.null(res$newick)) { tree <- res$newick } else if (!is.null(res$subtree)) { tree <- res$subtree } else { stop("Cannot find tree") } } else if (is.character(res)) { tree <- res } else { stop("I don't know how to deal with this format.") } if (grepl("\\(", tree)) { fnm <- tempfile() cat(tree, file = fnm) if (!dedup) { phy <- rncl::read_newick_phylo(fnm) } else { dedup_tr <- deduplicate_labels(fnm) phy <- rncl::read_newick_phylo(dedup_tr) unlink(dedup_tr) } unlink(fnm) } else { phy <- tree_to_labels(tree)$tip_label } return(phy) } nexml_from_otl <- function(res) { if (!requireNamespace("RNeXML", quietly = TRUE)) { stop("The RNeXML package is needed to use the nexml file format") } fnm <- tempfile() cat(res, file = fnm) phy <- RNeXML::nexml_read(x = fnm) unlink(fnm) phy } ## check if the argument provided looks like a number (can be coerced ## to integer/numeric). check_numeric <- function(x) { if (is.null(x)) { return(FALSE) } if (length(x) != 1) { stop("only 1 element should be provided") } if (!is.numeric(x)) { x <- as.character(x) if (any(is.na(x))) { return(FALSE) } return(grepl("^[0-9]+$", x)) } else { return(x %% 1 == 0) } } ## Check that ott_ids are not NULL, not NAs and look like numbers check_ott_ids <- function(ott_ids) { if (!is.null(ott_ids)) { if (inherits(ott_ids, "otl_ott_id")) { ## convert objects returned by ott_id method to a vector ott_ids <- unlist(ott_ids) } if (any(is.na(ott_ids))) { stop("NAs are not allowed") } if (!all(sapply(ott_ids, check_numeric))) { stop(sQuote("ott_ids"), " must look like numbers.") } } else { stop("You must supply some OTT ids.") } ott_ids } ## all nodes have a node_id (character, e.g. "ott12345" or "mrcaott123ott456") check_valid_node_id <- function(x) { if (length(x) != 1) { stop("only 1 element should be provided") } if (!is.character(x)) { return(FALSE) } if (grepl("^mrcaott\\d+ott\\d+", x) || grepl("^ott\\d+", x)) { return(TRUE) } else { return(FALSE) } } check_node_ids <- function(node_ids) { if (!is.null(node_ids)) { if (!is.character(node_ids)) { stop("Argument ", sQuote("node_ids"), " must be of type character.") } if (any(is.na(node_ids))) { stop("NAs are not allowed") } if (!all(sapply(node_ids, check_valid_node_id))) { stop(sQuote("node_ids"), " must look like \'ott123\' or \'mrcaott123ott456\'.") } } } # node labels for tree_of_life subtree and induced_subtree # might also be useful for taxonomy queries check_label_format <- function(x) { if (x %in% c("name", "id", "name_and_id")) { return(TRUE) } else { return(FALSE) } } rotl/R/tnrs.R0000644000176200001440000002577113543626766012602 0ustar liggesusers ##' Match taxonomic names to the Open Tree Taxonomy. ##' ##' Accepts one or more taxonomic names and returns information about ##' potential matches for these names to known taxa in the Open Tree ##' Taxonomy. ##' ##' This service uses taxonomic contexts to disambiguate homonyms and ##' misspelled names; a context may be specified using the ##' \code{context_name} argument. If no context is specified, then the ##' context will be inferred (i.e., the shallowest taxonomic context ##' that contains all unambiguous names in the input). Taxonomic ##' contexts are uncontested higher taxa that have been selected to ##' allow limits to be applied to the scope of TNRS searches ##' (e.g. 'match names only within flowering plants'). Once a context ##' has been identified (either user-specified or inferred), all taxon ##' name matches will performed only against taxa within that ##' context. For a list of available taxonomic contexts, see ##' \code{\link{tnrs_contexts}}. ##' ##' A name is considered unambiguous if it is not a synonym and has ##' only one exact match to any taxon name in the entire taxonomy. ##' ##' Several functions listed in the \sQuote{See also} section can be ##' used to inspect and manipulate the object generated by this ##' function. ##' ##' ##' @title Match names to the Open Tree Taxonomy ##' @param names taxon names to be queried. Currently limited to ##' 10,000 names for exact matches and 2,500 names for approximate ##' matches (character vector) ##' @param context_name name of the taxonomic context to be searched ##' (length-one character vector). Must match (case sensitive) one ##' of the values returned by \code{\link{tnrs_contexts}}. ##' @param do_approximate_matching A logical indicating whether or not ##' to perform approximate string (a.k.a. \dQuote{fuzzy}) ##' matching. Using \code{FALSE} will greatly improve ##' speed. Default, however, is \code{TRUE}. ##' @param ids A vector of ids to use for identifying names. These ##' will be assigned to each name in the names array. If ids is ##' provided, then ids and names must be identical in length. ##' @param include_suppressed Ordinarily, some quasi-taxa, such as ##' incertae sedis buckets and other non-OTUs, are suppressed from ##' TNRS results. If this parameter is true, these quasi-taxa are ##' allowed as possible TNRS results. ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return A data frame summarizing the results of the query. The ##' original query output is appended as an attribute to the ##' returned object (and can be obtained using \code{attr(object, ##' "original_response")}). ##' @seealso \code{\link{inspect.match_names}}, ##' \code{\link{update.match_names}}, ##' \code{\link{synonyms.match_names}}. ##' @examples \dontrun{ ##' deuterostomes <- tnrs_match_names(names=c("echinodermata", "xenacoelomorpha", ##' "chordata", "hemichordata")) ##' } ##' @importFrom stats setNames ##' @export tnrs_match_names <- function(names = NULL, context_name = NULL, do_approximate_matching = TRUE, ids = NULL, include_suppressed = FALSE, ...) { if (!is.null(context_name) && !context_name %in% unlist(tnrs_contexts(...))) { stop( "The ", sQuote("context_name"), " is not valid. Check possible values using tnrs_contexts()" ) } ## take care of duplicated names if (any(duplicated(tolower(names)))) { names <- tolower(names) warning("Some names were duplicated: ", paste(sQuote(names[duplicated(names)]), collapse = ", "), ".", call. = FALSE ) names <- unique(names) } res <- .tnrs_match_names( names = names, context_name = context_name, do_approximate_matching = do_approximate_matching, ids = ids, include_suppressed = include_suppressed, ... ) check_tnrs(res) match_ids <- lowest_ott_id(res) if (!identical(length(res[["results"]]), length(match_ids))) { stop( "The number of matches and the number of 'results' elements should", " be the same." ) } summary_match <- mapply( function(rid, mid) { build_summary_match(res, res_id = rid, match_id = mid, initial_creation = TRUE) }, seq_along(res[["results"]]), match_ids, SIMPLIFY = FALSE ) ## add taxon names with no maches summary_match <- add_unmatched_names(summary_match, res) summary_match <- do.call("rbind", summary_match) summary_match$search_string <- gsub("\\\\", "", summary_match$search_string) ## reorder to match original query match_ids <- c(match_ids, rep(NA_integer_, sum(is.na(summary_match$ott_id)))) ordr <- match(tolower(names), summary_match$search_string) stopifnot(identical(length(match_ids), length(ordr))) summary_match <- summary_match[ordr, ] match_ids <- match_ids[ordr] attr(summary_match, "original_order") <- as.numeric(rownames(summary_match)) rownames(summary_match) <- NULL attr(summary_match, "original_response") <- res attr(summary_match, "match_id") <- match_ids attr(summary_match, "has_original_match") <- !is.na(summary_match[["number_matches"]]) class(summary_match) <- c("match_names", "data.frame") clean_tnrs_summary(summary_match) } clean_tnrs_summary <- function(summary_match) { summary_match[["approximate_match"]] <- convert_to_logical(summary_match[["approximate_match"]]) summary_match[["is_synonym"]] <- convert_to_logical(summary_match[["is_synonym"]]) summary_match[["flags"]] <- convert_to_logical(summary_match[["flags"]]) summary_match[["ott_id"]] <- as.integer(summary_match[["ott_id"]]) summary_match[["number_matches"]] <- as.integer(summary_match[["number_matches"]]) summary_match } ##' @importFrom stats na.omit convert_to_logical <- function(x) { if (all(stats::na.omit(x) %in% c("TRUE", "FALSE"))) { x <- as.logical(x) } else { x } } check_tnrs <- function(req) { if (length(req$results) < 1) { stop("No matches for any of the provided taxa") } if (length(req[["unmatched_names"]]) > 0) { warning(paste(req$unmatched_names, collapse = ", "), " are not matched") } } tnrs_columns <- list( "search_string" = function(x) x[["search_string"]], "unique_name" = function(x) .tax_unique_name(x[["taxon"]]), "approximate_match" = function(x) x[["is_approximate_match"]], "ott_id" = function(x) .tax_ott_id(x[["taxon"]]), "is_synonym" = function(x) x[["is_synonym"]], "flags" = function(x) paste(.tax_flags(x[["taxon"]]), collapse = ", ") ) summary_row_factory <- function(res, res_id, match_id, columns = tnrs_columns) { res_address <- res[["results"]][[res_id]][["matches"]][[match_id]] ret <- sapply(columns, function(f) f(res_address)) n_match <- length(res[["results"]][[res_id]][["matches"]]) c(ret, number_matches = n_match) } build_summary_match <- function(res, res_id, match_id = NULL, initial_creation) { if (length(res_id) > 1 && (!is.null(match_id) && length(match_id) > 1)) { stop("Something is wrong. Please contact us.") } build_summary_row <- function(rid) { if (is.null(match_id)) { match_id <- seq_len(length(res[["results"]][[rid]][["matches"]])) } res <- lapply(match_id, function(mid) { summary_row_factory(res, rid, mid) }) if (identical(length(match_id), 1L)) { unlist(res) } else { res } } summary_row <- lapply(res_id, build_summary_row) if (identical(length(res_id), 1L)) { summary_row <- unlist(summary_row, recursive = FALSE) } ## Needed if only 1 row returned if (!inherits(summary_row, "list")) { summary_row <- list(summary_row) } summary_match <- do.call("rbind", summary_row) summary_match <- data.frame(summary_match, stringsAsFactors = FALSE) names(summary_match) <- c(names(tnrs_columns), "number_matches") summary_match } ##' @importFrom stats setNames build_empty_row <- function(x) { no_match_row <- stats::setNames( rep(NA, length(tnrs_columns) + 1), c(names(tnrs_columns), "number_matches") ) no_match_row[1] <- x no_match_row } add_unmatched_names <- function(summary_row, res) { ## Add potential unmatched names if (length(res[["unmatched_names"]])) { no_match <- lapply(res[["unmatched_names"]], build_empty_row) summary_row <- c(summary_row, no_match) } summary_row } lowest_ott_id <- function(rsp) { vapply(seq_along(rsp[["results"]]), function(x) { .r <- build_summary_match( res = rsp, res_id = x, match_id = NULL, initial_creation = TRUE ) .r <- .r[(!as.logical(.r[["is_synonym"]])) & .r[["flags"]] == "", ] if (nrow(.r) > 0) { which.min(.r[["ott_id"]]) } else { 1L } }, integer(1)) } ##' This function returns a list of pre-defined taxonomic contexts ##' (i.e. clades) which can be used to limit the scope of tnrs ##' queries. ##' ##' Taxonomic contexts are available to limit the scope of TNRS ##' searches. These contexts correspond to uncontested higher taxa ##' such as 'Animals' or 'Land plants'. This service returns a list ##' containing all available taxonomic context names, which may be ##' used as input (via the \code{context_name} argument in other ##' functions) to limit the search scope of other services including ##' \code{\link{tnrs_match_names}}. ##' @title TNRS contexts ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return Returns invisibly a list for each major clades (e.g., ##' animals, microbes, plants, fungi, life) whose elements ##' contains the possible contexts. ##' @export tnrs_contexts <- function(...) { res <- .tnrs_contexts(...) class(res) <- "tnrs_contexts" res } ##' @export print.tnrs_contexts <- function(x, ...) { cat("Possible contexts:\n") lapply(x, function(t) { res <- unlist(t) cat(" ", res[1], "\n") if (length(res) > 1) { lapply(seq(2, length(res), by = 5), function(l) { m <- ifelse(l + 5 <= length(res), l + 4, length(res)) cat(" ", paste(res[l:m], collapse = ", "), "\n") }) } }) } ##' Return a taxonomic context given a list of taxonomic names ##' ##' Find the least inclusive taxonomic context that includes all the ##' unambiguous names in the input set. Unambiguous names are names ##' with exact matches to non-homonym taxa. Ambiguous names (those ##' without exact matches to non-homonym taxa) are indicated in ##' results. ##' ##' @title Infer the taxonomic context from a list of names ##' @param names Vector of taxon names. ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return A list including the context name, the context ott id and ##' possibly the names in the query that have an ambiguous ##' taxonomic meaning in the query. ##' @examples ##' \dontrun{ ##' res <- tnrs_infer_context(names=c("Stellula calliope", "Struthio camelus")) ##' } ##' @export tnrs_infer_context <- function(names = NULL, ...) { res <- .tnrs_infer_context(names = names, ...) return(res) } rotl/R/studies-methods.R0000644000176200001440000000520313543626750014712 0ustar liggesusers ### list_trees ----------------------------------------------------------------- ##' List trees ids in objects returned by ##' \code{\link{studies_find_studies}} and ##' \code{\link{studies_find_trees}}. ##' ##' \code{list_trees} returns all trees associated with a particular ##' study when used on an object returned by ##' \code{\link{studies_find_studies}}, but only the trees that match ##' the search criteria when used on objects returned by ##' \code{\link{studies_find_trees}}. ##' ##' @param matched_studies an object created by ##' \code{studies_find_trees} or \code{studies_find_studies}. ##' @param study_id a \code{study_id} listed in the object returned by ##' \code{studies_find_trees} ##' @param ... Currently unused ##' @return \code{list_trees} returns a list of the tree_ids for each ##' study that match the requested criteria. If a \code{study_id} ##' is provided, then only the trees for this study are returned ##' as a vector. ##' @seealso \code{\link{studies_find_studies}} and ##' \code{\link{studies_find_trees}}. The help for these functions ##' have examples demonstrating the use of \code{list_trees}. ##' @export list_trees <- function(matched_studies, ...) UseMethod("list_trees") ##' @rdname list_trees ##' @export list_trees.matched_studies <- function(matched_studies, study_id, ...) { res <- attr(matched_studies, "found_trees") if (missing(study_id)) { res } else { if (is.na(match(study_id, names(res)))) { stop(sQuote(study_id), " isn't a valid id.") } else { res[[study_id]] } } } ##' @export ##' @rdname get_study_meta get_tree_ids <- function(sm) UseMethod("get_tree_ids") ##' @export ##' @rdname get_study_meta get_publication <- function(sm) UseMethod("get_publication") ##' @export ##' @rdname get_study_meta candidate_for_synth <- function(sm) UseMethod("candidate_for_synth") ##' @export ##' @rdname get_study_meta get_study_year <- function(sm) UseMethod("get_study_year") ##' @export ##' @rdname get_study_meta get_tree_ids.study_meta <- function(sm) { unlist(sm[["nexml"]][["treesById"]][[sm[["nexml"]][["^ot:treesElementOrder"]][[1]]]][["^ot:treeElementOrder"]]) } ##' @export ##' @rdname get_study_meta get_publication.study_meta <- function(sm) { pub <- sm[["nexml"]][["^ot:studyPublicationReference"]] attr(pub, "DOI") <- sm[["nexml"]][["^ot:studyPublication"]][["@href"]] pub } ##' @export ##' @rdname get_study_meta candidate_for_synth.study_meta <- function(sm) { unlist(sm[["nexml"]][["^ot:candidateTreeForSynthesis"]]) } ##' @export ##' @rdname get_study_meta get_study_year.study_meta <- function(sm) { sm[["nexml"]][["^ot:studyYear"]] } rotl/R/studies-utils.R0000644000176200001440000000472013543626751014413 0ustar liggesusers## Unexported function that generates a data frame summarizing the metadata. ## This function is used by both studies_find_studies and studies_find_trees, ## to generate the output when using the argument detailed=TRUE ##' @importFrom stats setNames summarize_meta <- function(study_ids) { fill <- function(x) { if (length(unlist(x))) { x } else { "" } } meta_raw <- lapply(study_ids, function(x) get_study_meta(x)) ## Extract the metadata meta <- lapply(meta_raw, function(m) { c( tree_ids = fill(list(get_tree_ids(m))), study_year = fill(get_study_year(m)), publication = fill(get_publication(m)), doi = fill(attr(get_publication(m), "DOI")), candidate = fill(list(candidate_for_synth(m))) ) }) ## Convert into a data frame dat <- lapply(meta, function(m) { c( n_trees = length(m[["tree_ids"]]), tree_ids = limit_trees(m[["tree_ids"]]), candidate = paste(m[["candidate"]], collapse = ", "), study_year = m[["study_year"]], title = fill(extract_title(m[["publication"]])), study_doi = m[["doi"]] ) }) dat <- do.call("rbind", dat) dat <- cbind(study_ids = study_ids, dat) rownames(dat) <- NULL dat <- data.frame(dat, stringsAsFactors = FALSE) ## Add list of found trees as attributes found_trees <- lapply(meta, function(m) { m[["tree_ids"]] }) found_trees <- stats::setNames(found_trees, study_ids) attr(dat, "found_trees") <- found_trees attr(dat, "metadata") <- meta_raw dat } ## Unexported function that attempts to extract title from the ## citation information associated with the study information. The ## function gets the element that follows what looks like a year in ## the string. ## pub_orig: the publication string extracted from the study metadata ## split_char: the character on which the bibliographic elements are ## separated with. (currently only deals with . and ,) extract_title <- function(pub_orig, split_char = "\\.") { pub <- unlist(strsplit(pub_orig, split = split_char)) pub <- gsub("^\\s|\\s$", "", pub) which_year <- grep("^\\d{4}[a-z]?$", pub) res <- pub[which_year + 1] if (length(res) > 0) { return(res) } else if (split_char == ",") { return(character(0)) } else { extract_title(pub_orig, ",") } } ## Unexported function that limit the display of tree_ids to the first ## 5 values. limit_trees <- function(x) { if (length(x) > 5) { x <- c(x[1:5], "...") } paste(x, collapse = ", ") } rotl/R/studies.R0000644000176200001440000005117313543626756013266 0ustar liggesusers##' Return the list of study properties that can be used to search ##' studies and trees used in the synthetic tree. ##' ##' The list returned has 2 elements \code{tree_properties} and ##' \code{studies_properties}. Each of these elements lists additional ##' arguments to customize the API request properties that can be used ##' to search for trees and studies that are contributing to the ##' synthetic tree. The definitions of these properties are available ##' from ##' \url{https://github.com/OpenTreeOfLife/phylesystem-api/wiki/NexSON} ##' ##' @title Properties of the Studies ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return A list of the study properties that can be used to find ##' studies and trees that are contributing to the synthetic tree. ##' @seealso \code{\link{studies_find_trees}} ##' @export ##' @examples ##' \dontrun{ ##' all_the_properties <- studies_properties() ##' unlist(all_the_properties$tree_properties) ##' } studies_properties <- function(...) { res <- .studies_properties(...) lapply(res, unlist) } ##' Return the identifiers of studies that match given properties ##' ##' @title Find a Study ##' @param exact Should exact matching be used? (logical, default ##' \code{FALSE}) ##' @param property The property to be searched on (character) ##' @param value The property value to be searched on (character) ##' @param detailed If \code{TRUE} (default), the function will return ##' a data frame that summarizes information about the study (see ##' \sQuote{Value}). Otherwise, it only returns the study ##' identifiers. ##' @param verbose Should the output include all metadata (logical ##' default \code{FALSE}) ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return If \code{detailed=TRUE}, the function returns a data frame ##' listing the study id (\code{study_ids}), the number of trees ##' associated with this study (\code{n_trees}), the tree ids (at ##' most 5) associated with the studies (\code{tree_ids}), the ##' tree id that is a candidate for the synthetic tree if any ##' (\code{candidate}), the year of publication of the study ##' (\code{study_year}), the title of the publication for the ##' study (\code{title}), and the DOI (Digital Object Identifier) ##' for the study (\code{study_doi}). ##' ##' If \code{detailed=FALSE}, the function returns a data frame ##' with a single column containing the study identifiers. ##' @seealso \code{\link{studies_properties}} which lists properties ##' against which the studies can be ##' searched. \code{\link{list_trees}} that returns a list for all ##' tree ids associated with a study. ##' @export ##' @examples ##' \dontrun{ ##' ## To match a study for which the identifier is already known ##' one_study <- studies_find_studies(property="ot:studyId", value="pg_719") ##' list_trees(one_study) ##' ##' ## To find studies pertaining to Mammals ##' mammals <- studies_find_studies(property="ot:focalCladeOTTTaxonName", ##' value="mammalia") ##' ## To extract the tree identifiers for each of the studies ##' list_trees(mammals) ##' ## ... or for a given study ##' list_trees(mammals, "ot_308") ##' ##' ## Just the identifiers without other information about the studies ##' mammals <- studies_find_studies(property="ot:focalCladeOTTTaxonName", ##' value="mammalia", detailed=FALSE) ##' } studies_find_studies <- function(property = NULL, value = NULL, verbose = FALSE, exact = FALSE, detailed = TRUE, ...) { .res <- .studies_find_studies( property = property, value = value, verbose = verbose, exact = exact, ... ) res <- vapply( .res[["matched_studies"]], function(x) x[["ot:studyId"]], character(1) ) if (detailed) { dat <- summarize_meta(res) } else { meta_raw <- .res dat <- data.frame(study_ids = res, stringsAsFactors = FALSE) attr(dat, "found_trees") <- paste( "If you want to get a list of the", "trees associated with the studies,", "use", sQuote("detailed = TRUE") ) class(dat) <- c("study_ids", class(dat)) attr(dat, "metadata") <- meta_raw } class(dat) <- c("matched_studies", class(dat)) dat } ##' @export print.study_ids <- function(x, ...) { print(format(x), ...) } ##' Return a list of studies for which trees match a given set of ##' properties ##' ##' The list of possible values to be used as values for the argument ##' \code{property} can be found using the function ##' \code{\link{studies_properties}}. ##' ##' @title Find Trees ##' @param property The property to be searched on (character) ##' @param value The property-value to be searched on (character) ##' @param verbose Should the output include all metadata? (logical, ##' default \code{FALSE}) ##' @param exact Should exact matching be used for the value? ##' (logical, default \code{FALSE}) ##' @param detailed Should a detailed report be provided? If ##' \code{TRUE} (default), the output will include metadata about ##' the study that include trees matching the property. Otherwise, ##' only information about the trees will be provided. ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return A data frame that summarizes the trees found (and their ##' associated studies) for the requested criteria. If a study has ##' more than 5 trees, the \code{tree_ids} of the first ones will ##' be shown, followed by \code{...} to indicate that more are ##' present. ##' ##' If \code{detailed=FALSE}, the data frame will include the ##' study ids of the study (\code{study_ids}), the number of trees ##' in this study that match the search criteria ##' (\code{n_matched_trees}), the tree ids that match the search ##' criteria (\code{match_tree_ids}). ##' ##' If \code{detailed=TRUE}, in addition of the fields listed ##' above, the data frame will also contain the total number of ##' trees associated with the study (\code{n_trees}), all the tree ##' ids associated with the study (\code{tree_ids}), the tree id ##' that is a potential candidate for inclusion in the synthetic ##' tree (if any) (\code{candidate}), the year the study was ##' published (\code{study_year}), the title of the study ##' (\code{title}), the DOI for the study (\code{study_doi}). ##' ##' @seealso \code{\link{studies_properties}} which lists properties ##' the studies can be searched on. \code{\link{list_trees}} for ##' listing the trees that match the query. ##' @export ##' @importFrom stats setNames ##' @examples ##' \dontrun{ ##' res <- studies_find_trees(property="ot:ottTaxonName", value="Drosophilia", ##' detailed=FALSE) ##' ## summary of the trees and associated studies that match this criterion ##' res ##' ## With metadata about the studies (default) ##' res <- studies_find_trees(property="ot:ottTaxonName", value="Drosophilia", ##' detailed=TRUE) ##' ## The list of trees for each study that match the search criteria ##' list_trees(res) ##' ## the trees for a given study ##' list_trees(res, study_id = "pg_2769") ##' } studies_find_trees <- function(property = NULL, value = NULL, verbose = FALSE, exact = FALSE, detailed = TRUE, ...) { .res <- .studies_find_trees( property = property, value = value, verbose = verbose, exact = exact, ... ) study_ids <- vapply( .res[["matched_studies"]], function(x) x[["ot:studyId"]], character(1) ) n_matched_trees <- vapply( .res[["matched_studies"]], function(x) length(x[["matched_trees"]]), numeric(1) ) match_tree_ids <- lapply( .res[["matched_studies"]], function(x) { sapply( x[["matched_trees"]], function(y) y[["nexson_id"]] ) } ) # this one doesn't return all of the treeids. confusing, bc trees are what is wanted # tree_str <- vapply(match_tree_ids, limit_trees, character(1)) tree_str <- sapply(match_tree_ids, function(x) paste(x, collapse = ", ")) res <- data.frame(study_ids, n_matched_trees, match_tree_ids = tree_str, stringsAsFactors = FALSE ) if (detailed) { meta <- summarize_meta(study_ids) # the next bit seems really slow (JWB) res <- merge(meta, res) attr(res, "metadata") <- attr(meta, "metadata") } else { attr(res, "metadata") <- .res } attr(res, "found_trees") <- stats::setNames(match_tree_ids, study_ids) class(res) <- c("matched_studies", class(res)) res } ##' Returns the trees associated with a given study ##' ##' If \code{file_format} is missing, the function returns an object ##' of the class \code{phylo} from the \code{\link[ape]{ape}} package ##' (default), or an object of the class \code{nexml} from the ##' \code{RNeXML} package. ##' ##' Otherwise \code{file_format} can be either \code{newick}, ##' \code{nexus}, \code{nexml} or \code{json}, and the function will ##' generate a file of the selected format. In this case, a file name ##' needs to be provided using the argument \code{file}. If a file ##' with the same name already exists, it will be silently ##' overwritten. ##' ##' @title Get all the trees associated with a particular study ##' @param study_id the study ID for the study of interest (character) ##' @param object_format the class of the object the query should ##' return (either \code{phylo} or \code{nexml}). Ignored if ##' \code{file_format} is specified. ##' @param file_format the format of the file to be generated ##' (\code{newick}, \code{nexus}, \code{nexml} or \code{json}). ##' @param file the file name where the output of the function will be ##' saved. ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return if \code{file_format} is missing, an object of class ##' \code{phylo} or \code{nexml}, otherwise a logical indicating ##' whether the file was successfully created. ##' @seealso \code{\link{get_study_meta}} ##' @export ##' @importFrom jsonlite toJSON ##' @examples ##' \dontrun{ ##' that_one_study <- get_study(study_id="pg_719", object_format="phylo") ##' if (require(RNeXML)) { ## if RNeXML is installed get the object directly ##' nexml_study <- get_study(study_id="pg_719", object_format="nexml") ##' } else { ## otherwise write it to a file ##' get_study(study_id="pg_719", file_format="nexml", file=tempfile(fileext=".nexml")) ##' } ##' } get_study <- function(study_id = NULL, object_format = c("phylo", "nexml"), file_format, file, ...) { object_format <- match.arg(object_format) if (!missing(file)) { if (!missing(file_format)) { file_format <- match.arg(file_format, c("newick", "nexus", "nexml", "json")) res <- .get_study(study_id, format = file_format) unlink(file) if (identical(file_format, "json")) { cat(jsonlite::toJSON(res), file = file) } else { cat(res, file = file) } return(invisible(file.exists(file))) } else { stop(sQuote("file_format"), " must be specified.") } } else if (identical(object_format, "phylo")) { file_format <- "newick" res <- .get_study(study_id = study_id, format = file_format, ...) res <- phylo_from_otl(res) } else if (identical(object_format, "nexml")) { file_format <- "nexml" res <- .get_study(study_id = study_id, format = file_format, ...) res <- nexml_from_otl(res) } else { stop("Something is very wrong. Contact us.") } res } ##' Returns a specific tree from within a study ##' ##' @title Study Tree ##' @param study_id the identifier of a study (character) ##' @param tree_id the identifier of a tree within the study ##' @param object_format the class of the object to be returned ##' (default and currently only possible value \code{phylo} from ##' the \code{\link[ape]{ape}} package). ##' @param tip_label the format of the tip ##' labels. \dQuote{\code{original_label}} (default) returns the ##' original labels as provided in the study, ##' \dQuote{\code{ott_id}} labels are replaced by their ott IDs, ##' \dQuote{\code{ott_taxon_name}} labels are replaced by their ##' Open Tree Taxonomy taxon name. ##' @param file_format the format of the file to be generated ##' (\code{newick} default, \code{nexus}, or \code{json}). ##' @param file the file name where the output of the function will be ##' saved. ##' @param deduplicate logical (default \code{TRUE}). If the tree ##' returned by the study contains duplicated taxon names, should they ##' be made unique? It is normally illegal for NEXUS/Newick tree ##' strings to contain duplicated tip names. This is a workaround to ##' circumvent this requirement. If \code{TRUE}, duplicated tip labels ##' will be appended \code{_1}, \code{_2}, etc. ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return if \code{file_format} is missing, an object of class ##' \code{phylo}, otherwise a logical indicating whether the file ##' was successfully created. ##' @export ##' @importFrom jsonlite toJSON ##' @examples ##' \dontrun{ ##' tree <- get_study_tree(study_id="pg_1144", tree_id="tree2324") ##' ##' ## comparison of the first few tip labels depending on the options used ##' head(get_study_tree(study_id="pg_1144", tree_id="tree2324", tip_label="original_label")$tip.label) ##' head(get_study_tree(study_id="pg_1144", tree_id="tree2324", tip_label="ott_id")$tip.label) ##' head(get_study_tree(study_id="pg_1144", tree_id="tree2324", tip_label="ott_taxon_name")$tip.label) ##' } get_study_tree <- function(study_id = NULL, tree_id = NULL, object_format = c("phylo"), tip_label = c("original_label", "ott_id", "ott_taxon_name"), file_format, file, deduplicate = TRUE, ...) { object_format <- match.arg(object_format) tip_label <- match.arg(tip_label) tip_label <- switch(tip_label, original_labels = "ot:originallabel", ott_id = "ot:ottid", ott_taxon_name = "ot:otttaxonname" ) if (!missing(file)) { if (!missing(file_format)) { file_format <- match.arg(file_format, c("newick", "nexus", "json")) if (missing(file)) stop("You must specify a file to write your output") res <- .get_study_tree( study_id = study_id, tree_id = tree_id, format = file_format, tip_label = tip_label, ... ) unlink(file) if (identical(file_format, "json")) { cat(jsonlite::toJSON(res), file = file) } else { cat(res, file = file) } return(invisible(file.exists(file))) } else { stop(sQuote("file_format"), " must be specified.") } } else if (identical(object_format, "phylo")) { file_format <- "newick" res <- .get_study_tree( study_id = study_id, tree_id = tree_id, format = file_format, tip_label = tip_label, ... ) res <- phylo_from_otl(res, dedup = deduplicate) } else { stop("Something is very wrong. Contact us.") } res } ##' Retrieve metadata about a study in the Open Tree of Life datastore. ##' ##' \code{get_study_meta} returns a long list of attributes for the ##' studies that are contributing to the synthetic tree. To help with ##' the extraction of relevant information from this list, several ##' helper functions exists: \itemize{ ##' ##' \item {get_tree_ids} { The identifiers of the trees ##' associated with the study } ##' ##' \item {get_publication} { The citation information of the ##' publication for the study. The DOI (or URL) for the study is ##' available as an attribute to the returned object (i.e., ##' \code{attr(object, "DOI")} ) }. ##' ##' \item {candidate_for_synth} { The identifier of the tree(s) from ##' the study used in the synthetic tree. This is a subset of the ##' result of \code{get_tree_ids}. ##' ##' \item {get_study_year} { The year of publication of the study. } ##' ##' } ##' } ##' ##' @title Study Metadata ##' @param study_id the study identifier (character) ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @param sm an object created by \code{get_study_meta} ##' @return named-list containing the metadata associated with the ##' study requested ##' @export ##' @examples ##' \dontrun{ ##' req <- get_study_meta("pg_719") ##' get_tree_ids(req) ##' candidate_for_synth(req) ##' get_publication(req) ##' get_study_year(req) ##' } get_study_meta <- function(study_id, ...) { res <- .get_study_meta(study_id = study_id, ...) class(res) <- "study_meta" attr(res, "study_id") <- study_id res } ##' @export print.study_meta <- function(x, ...) { cat("Metadata for OToL study ", attr(x, "study_id"), ". Contents:\n", sep = "") cat(paste0(" $nexml$", names(x$nexml)), sep = "\n") } ##' Retrieve subtree from a specific tree in the Open Tree of Life data store ##' ##' @title Study Subtree ##' @param study_id the study identifier (character) ##' @param tree_id the tree identifier (character) ##' @param object_format the class of the object returned by the ##' function (default, and currently only possibility \code{phylo} ##' from the \code{\link[ape]{ape}} package) ##' @param tip_label the format of the tip ##' labels. \dQuote{\code{original_label}} (default) returns the ##' original labels as provided in the study, ##' \dQuote{\code{ott_id}} labels are replaced by their ott IDs, ##' \dQuote{\code{ott_taxon_name}} labels are replaced by their ##' Open Tree Taxonomy taxon name. ##' @param file_format character, the file format to use to save the ##' results of the query (possible values, \sQuote{newick} or ##' \sQuote{nexus}). ##' @param file character, the path and file name where the output ##' should be written. ##' @param deduplicate logical (default \code{TRUE}). If the tree ##' returned by the study contains duplicated taxon names, should ##' they be made unique? It is normally illegal for NEXUS/Newick ##' tree strings to contain duplicated tip names. This is a ##' workaround to circumvent this requirement. If \code{TRUE}, ##' duplicated tip labels will be appended \code{_1}, \code{_2}, ##' etc. ##' @param subtree_id, either a node id that specifies a subtree or ##' \dQuote{ingroup} which returns the ingroup for this subtree. ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @export ##' @examples ##' \dontrun{ ##' small_tr <- get_study_subtree(study_id="pg_1144", tree_id="tree5800", subtree_id="node991044") ##' ingroup <- get_study_subtree(study_id="pg_1144", tree_id="tree5800", subtree_id="ingroup") ##' nexus_file <- tempfile(fileext=".nex") ##' get_study_subtree(study_id="pg_1144", tree_id="tree5800", subtree_id="ingroup", file=nexus_file, ##' file_format="nexus") ##' } get_study_subtree <- function(study_id, tree_id, subtree_id, object_format = c("phylo"), tip_label = c("original_label", "ott_id", "ott_taxon_name"), file_format, file, deduplicate = TRUE, ...) { object_format <- match.arg(object_format) tip_label <- match.arg(tip_label) tip_label <- switch(tip_label, original_labels = "ot:originallabel", ott_id = "ot:ottid", ott_taxon_name = "ot:otttaxonname" ) if (!missing(file)) { if (!missing(file_format)) { if (missing(file)) stop("You must specify a file to write your output") file_format <- match.arg(file_format, c("newick", "nexus")) res <- .get_study_subtree( study_id = study_id, tree_id = tree_id, subtree_id = subtree_id, format = file_format, tip_label = tip_label, ... ) unlink(file) cat(res, file = file) return(invisible(file.exists(file))) } else { stop(sQuote("file_format"), " must be specified.") } } else if (identical(object_format, "phylo")) { file_format <- "newick" res <- .get_study_subtree( study_id = study_id, tree_id = tree_id, subtree_id = subtree_id, format = file_format, tip_label = tip_label, ... ) res <- phylo_from_otl(res, dedup = deduplicate) ## NeXML should be possible for both object_format and file_format but it seems there ## is something wrong with the server at this time (FM - 2015-06-07) ## } else if (identical(object_format, "nexml")) { ## file_format <- "nexml" ## res <- .get_study_subtree(study_id, tree_id, subtree_id, format=file_format) ## res <- nexml_from_otl(res) } else { stop("Something is very wrong. Contact us.") } res } rotl/R/api-tnrs.R0000644000176200001440000000444113543626727013335 0ustar liggesusers##' @importFrom jsonlite unbox ##' @importFrom httr content ##' @importFrom assertthat is.string is.flag ## Match taxon names .tnrs_match_names <- function(names = NULL, context_name = NULL, do_approximate_matching = TRUE, ids = NULL, include_suppressed = FALSE, ...) { if (is.null(names)) { stop("You must supply a ", sQuote("names"), " argument") } else if (!is.character(names)) { stop( "Argument ", sQuote("names"), " must be of class ", sQuote("character") ) } if (!is.null(ids)) { if (length(ids) != length(names)) { stop( "Arguments ", sQuote("ids"), " and ", sQuote("names"), " must be of the same length" ) } else if (!is.character(ids)) { stop( "Argument ", sQuote("ids"), " must be of class ", sQuote("character") ) } } if (!assertthat::is.flag(do_approximate_matching)) { stop( "Argument ", sQuote("do_approximate_matching"), " must be of class ", sQuote("logical") ) } if (!assertthat::is.flag(include_suppressed)) { stop( "Argument ", sQuote("include_deprecated"), " must be of class ", sQuote("logical") ) } if (!is.null(context_name)) { if (!assertthat::is.string(context_name)) { stop( "Argument ", sQuote("context_name"), " must be of class ", sQuote("character") ) } context_name <- jsonlite::unbox(context_name) } q <- list( names = names, context_name = context_name, do_approximate_matching = jsonlite::unbox(do_approximate_matching), ids = ids, include_suppressed = jsonlite::unbox(include_suppressed) ) toKeep <- sapply(q, is.null) q <- q[!toKeep] res <- otl_POST("tnrs/match_names", body = q, ...) res } ##' @importFrom httr content ## Get OpenTree TNRS contexts .tnrs_contexts <- function(...) { res <- otl_POST("tnrs/contexts", body = list(), ...) res } ## Infer taxonomic context from a set of names .tnrs_infer_context <- function(names = NULL, ...) { if (is.null(names)) { stop("Must supply a \'names\' argument") } else if (!is.character(names)) { stop("Argument \'names\' must be of class \"character\"") } q <- list(names = names) res <- otl_POST("tnrs/infer_context", body = q, ...) res } rotl/R/api-studies.R0000644000176200001440000001356713543626725014036 0ustar liggesusers##' @importFrom jsonlite unbox ##' @importFrom httr content ## Return a list of studies from the OpenTree docstore that match a given properties .studies_find_studies <- function(property = NULL, value = NULL, verbose = FALSE, exact = FALSE, ...) { if (!is.logical(verbose)) stop("Argument \'verbose\' should be logical") if (!is.logical(exact)) stop("Argument \'exact\' should be logical") req_body <- list() if (!is.null(property)) { if (!is.character(property)) { stop("Argument \'property\' must be of class \"character\"") } req_body$property <- jsonlite::unbox(property) } else { stop("Must supply a \'property\' argument") } if (!is.null(value)) { if (!is.character(value)) { if (check_numeric(value)) { value <- as.character(value) } else { stop("Argument \'value\' must be of class \"character\"") } } req_body$value <- jsonlite::unbox(value) } else { stop("Must supply a \'value\' argument") } req_body$verbose <- jsonlite::unbox(verbose) req_body$exact <- jsonlite::unbox(exact) res <- otl_POST( path = "studies/find_studies/", body = req_body, ... ) res } ##' @importFrom jsonlite unbox ##' @importFrom httr content ## Return a list of trees from the OpenTree docstore that match a given properties .studies_find_trees <- function(property = NULL, value = NULL, verbose = FALSE, exact = FALSE, ...) { if (!is.logical(verbose)) { stop("Argument \'verbose\' must be of class \"logical\"") } if (!is.logical(exact)) { stop("Argument \'exact\' must be of class \"logical\"") } req_body <- list() if (!is.null(property)) { if (!is.character(property)) { stop("Argument \'property\' must be of class \"character\"") } req_body$property <- jsonlite::unbox(property) } else { stop("Must supply a \'property\' argument") } if (!is.null(value)) { if (!is.character(value)) { if (check_numeric(value)) { value <- as.character(value) } else { stop("Argument \'value\' must be of class \"character\"") } } req_body$value <- jsonlite::unbox(value) } else { stop("Must supply a \'value\' argument") } res <- otl_POST( path = "studies/find_trees", body = c( req_body, verbose = jsonlite::unbox(verbose), exact = jsonlite::unbox(exact) ), ... ) res } ##' @importFrom httr content ## Return a list of properties that can be used to search studies and trees .studies_properties <- function() { res <- otl_POST(path = "studies/properties/", body = list()) res } ##' @importFrom httr content ## Get a study from the OpenTree docstore .get_study <- function(study_id = NULL, format = c("", "nexus", "newick", "nexml", "json"), ...) { if (is.null(study_id)) { stop("Must supply a \'study_id\' argument") } else if (!is.character(study_id)) { if (check_numeric(study_id)) { study_id <- as.character(study_id) } else { stop("Argument \'study_id\' must be of class \"character\"") } } format <- match.arg(format) res <- otl_GET( path = paste("study", paste0(study_id, otl_formats(format)), sep = "/" ), ... ) res } ##' @importFrom httr content ## Get a tree in a study from the OpenTree docstore .get_study_tree <- function(study_id = NULL, tree_id = NULL, format = c("json", "newick", "nexus"), tip_label = c("ot:originallabel", "ot:ottid", "ot:otttaxonname"), ...) { if (is.null(study_id)) { stop("Must supply a \'study_id\' argument") } else if (!is.character(study_id)) { stop("Argument \'study_id\' must be of class \"character\"") } if (is.null(tree_id)) { stop("Must supply a \'tree\' argument") } else if (!is.character(tree_id)) { stop("Argument \'tree\' must be of class \"character\"") } format <- match.arg(format) tip_label <- match.arg(tip_label) tip_label <- paste0("/?tip_label=", tip_label) tree_file <- paste0(tree_id, otl_formats(format), tip_label) res <- otl_GET(path = paste("study", study_id, "tree", tree_file, sep = "/"), ...) res } ##' @importFrom httr content .get_study_meta <- function(study_id, ...) { otl_GET(path = paste("study", study_id, "meta", sep = "/"), ...) } ##' @importFrom httr content .get_study_subtree <- function(study_id, tree_id, subtree_id, format = c("newick", "nexus", "nexml"), tip_label = c("ot:originallabel", "ot:ottid", "ot:otttaxonname"), ...) { if (is.null(study_id)) { stop("Must supply a \'study_id\' argument") } else if (!is.character(study_id)) { stop("Argument \'study_id\' must be of class \"character\"") } if (is.null(tree_id)) { stop("Must supply a \'tree\' argument") } else if (!is.character(tree_id)) { stop("Argument \'tree\' must be of class \"character\"") } if (is.null(subtree_id)) { stop("Must supply a \'subtree\' argument") } else if (!is.character(subtree_id)) { stop("Argument \'subtree\' must be of class \"character\"") } format <- match.arg(format) format <- otl_formats(format) tip_label <- match.arg(tip_label) url_stem <- paste("study", study_id, "subtree", paste0(tree_id, format), sep = "/") res <- otl_GET(path = paste0(url_stem, "?subtree_id=", subtree_id, "&tip_label=", tip_label), ...) res } ### Let's not worry about those for now, as their results could be ### obtained using get_study_tree get_study_otu <- function(study_id, otu = NULL, ...) { otl_GET(path = paste("study", study_id, "otu", otu, sep = "/"), ...) } get_study_otus <- function(study_id, otus, ...) { otl_GET(path = paste("study", study_id, "otu", otus, sep = "/"), ...) } get_study_otumap <- function(study_id, ...) { otl_GET(path = paste("study", study_id, "otumap", sep = "/")) } rotl/R/deduplicate_labels.R0000644000176200001440000000256213543626736015407 0ustar liggesusers## Create a vector (character) that contains the NEWICK tree strings ## found in a file parse_newick <- function(file) { trs <- readLines(file, warn = FALSE) trs <- strsplit(trs, split = ";") trs <- sapply(trs, function(x) gsub("^\\s+|\\s+$", "", x)) trs <- unlist(trs) trs <- gsub("\\s", "_", trs) trs <- trs[nchar(trs) > 0] trs } ## Internal function to be used by `deduplicate_labels` that: ## 1. identify duplicated labels ## 2. make them unique ## 3. replace the duplicated labels by their unique counterparts dedup_lbl <- function(tr_str) { tr_lbl <- tree_to_labels(tr_str, remove_quotes = TRUE)$tip_label tr_lbl_unq <- make.unique(tr_lbl, sep = "_") if (!identical(tr_lbl, tr_lbl_unq)) { for (i in seq_along(tr_lbl)) { tr_str <- sub( paste0("([\\(|,]\\'?)\\Q", tr_lbl[i], "\\E(\\'?[:|\\)|,])"), paste0("\\1", tr_lbl_unq[i], "\\2"), tr_str ) } warning("Some tip labels were duplicated and have been modified: ", paste(tr_lbl[duplicated(tr_lbl)], collapse = ", "), call. = FALSE ) } paste0(tr_str, ";") } ## Main function: takes a file with potentially duplicated tip labels ## and reate a new file with unique labels deduplicate_labels <- function(file) { tr_strs <- parse_newick(file) tr_dedup <- sapply(tr_strs, dedup_lbl) tmp_tr <- tempfile() cat(tr_dedup, file = tmp_tr, sep = "\n") tmp_tr } rotl/R/tol.R0000644000176200001440000006105313543603272012366 0ustar liggesusers .source_list <- function(tax, ...) { if (!exists("source_id_map", tax)) { ## it should only be missing with tol_about when using ## include_source_list=FALSE stop( "Make sure that your object has been created using ", sQuote("tol_about(include_source_list = TRUE)") ) } tt <- lapply(tax[["source_id_map"]], function(x) { c(x[["study_id"]], x[["tree_id"]], x[["git_sha"]]) }) tt <- do.call("rbind", tt) setNames( as.data.frame(tt, stringsAsFactors = FALSE), c("study_id", "tree_id", "git_sha") ) } ##' Basic information about the Open Tree of Life (the synthetic tree) ##' ##' @title Information about the Tree of Life ##' ##' @details Summary information about the current draft tree of life, ##' including information about the list of trees and the taxonomy ##' used to build it. The object returned by \code{tol_about} can ##' be passed to the taxonomy methods (\code{tax_name()}, ##' \code{tax_rank()}, \code{tax_sources()}, \code{ott_id}), to ##' extract relevant taxonomic information for the root of the ##' synthetic tree. ##' ##' @param include_source_list Logical (default = ##' \code{FALSE}). Return an ordered list of source trees. ##' @param tax an object created with a call to \code{tol_about}. ##' @param ... additional arguments to customize the API call (see ##' \code{\link{rotl}} for more information). ##' ##' @return An invisible list of synthetic tree summary statistics: ##' ##' \itemize{ ##' ##' \item {date_created} {String. The creation date of the tree.} ##' ##' \item {num_source_studies} {Integer. The number of studies ##' (publications)used as sources.} ##' ##' \item {num_source_trees} {The number of trees used as sources ##' (may be >1 tree per study).} ##' ##' \item {taxonomy_version} {The Open Tree Taxonomy version used ##' as a source.} ##' ##' \item {filtered_flags} {List. Taxa with these taxonomy flags were ##' not used in construction of the tree.} ##' ##' \item {root} {List. Describes the root node:} ##' \itemize{ ##' \item {node_id} {String. The canonical identifier of the node.} ##' ##' \item {num_tips} {Numeric. The number of descendent tips.} ##' ##' \item {taxon} {A list of taxonomic properties:} ##' \itemize{ ##' \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ott_id).} ##' ##' \item {name} {String. The taxonomic name of the queried node.} ##' ##' \item {unique_name} {String. The string that uniquely ##' identifies the taxon in OTT.} ##' ##' \item {rank} {String. The taxonomic rank of the taxon in OTT.} ##' ##' \item {tax_sources} {List. A list of identifiers for taxonomic ##' sources, such as other taxonomies, that define taxa judged ##' equivalent to this taxon.} ##' } ##' } ##' ##' \item {source_list} {List. Present only if ##' \code{include_source_list} is \code{TRUE}. The sourceid ##' ordering is the precedence order for synthesis, with ##' relationships from earlier trees in the list having priority ##' over those from later trees in the list. See ##' \code{source_id_map} below for study details.} ##' ##' \item {source_id_map} {Named list of lists. Present only if ##' \code{include_source_list} is \code{TRUE}. Names correspond to ##' the \sQuote{sourceids} used in \code{source_list} ##' above. Source trees will have the following properties:} ##' ##' \itemize{ ##' \item {git_sha} {String. The git SHA identifying a particular source ##' version.} #' ##' \item {tree_id} {String. The tree id associated with the study id used.} ##' ##' \item {study_id} {String. The study identifier. Will typically include ##' a prefix ("pg_" or "ot_").} ##' } ##' ##' \item {synth_id} {The unique string for this version of the tree.} ##' } ##' @seealso \code{\link{source_list}} to explore the list of studies ##' used in the synthetic tree (see example). ##' ##' @examples ##' \dontrun{ ##' res <- tol_about() ##' tax_sources(res) ##' ott_id(res) ##' studies <- source_list(tol_about(include_source_list=TRUE))} ##' @rdname tol_about ##' @export tol_about <- function(include_source_list = FALSE, ...) { res <- .tol_about(include_source_list = include_source_list, ...) class(res) <- c("tol_summary", class(res)) res } ##' @export print.tol_summary <- function(x, ...) { cat("\nOpenTree Synthetic Tree of Life.\n\n") cat("Tree version: ", x$synth_id, "\n", sep = "") cat("Taxonomy version: ", x$taxonomy, "\n", sep = "") cat("Constructed on: ", x$date_created, "\n", sep = "") cat("Number of terminal taxa: ", x$root$num_tips, "\n", sep = "") cat("Number of source trees: ", x$num_source_trees, "\n", sep = "") cat("Number of source studies: ", x$num_source_studies, "\n", sep = "") cat("Source list present: ", ifelse(exists("source_list", x), "true", "false"), "\n", sep = "") cat("Root taxon: ", x$root$taxon$name, "\n", sep = "") cat("Root ott_id: ", x$root$taxon$ott_id, "\n", sep = "") cat("Root node_id: ", x$root$node_id, "\n", sep = "") } tol_about_method_factory <- function(.f) { function(tax, ...) { res <- list(.f(tax[["root"]][["taxon"]])) names(res) <- .tax_unique_name(tax[["root"]][["taxon"]]) res <- add_otl_class(res, .f) res } } ##' @export ##' @rdname tol_about tax_rank.tol_summary <- tol_about_method_factory(.tax_rank) ##' @export ##' @rdname tol_about tax_sources.tol_summary <- tol_about_method_factory(.tax_sources) ##' @export ##' @rdname tol_about unique_name.tol_summary <- tol_about_method_factory(.tax_unique_name) ##' @export ##' @rdname tol_about tax_name.tol_summary <- tol_about_method_factory(.tax_name) ##' @export ##' @rdname tol_about ott_id.tol_summary <- tol_about_method_factory(.tax_ott_id) ##' @export ##' @rdname source_list source_list.tol_summary <- .source_list ##' Most Recent Common Ancestor for a set of nodes ##' ##' @title MRCA of taxa from the synthetic tree ##' ##' @details Get the MRCA of a set of nodes on the current synthetic ##' tree. Accepts any combination of node ids and ott ids as ##' input. Returns information about the most recent common ##' ancestor (MRCA) node as well as the most recent taxonomic ##' ancestor (MRTA) node (the closest taxonomic node to the MRCA ##' node in the synthetic tree; the MRCA and MRTA may be the same ##' node). If they are the same, the taxonomic information will be ##' in the \code{mrca} slot, otherwise they will be in the ##' \code{nearest_taxon} slot of the list. If any of the specified ##' nodes is not in the synthetic tree an error will be returned. ##' ##' Taxonomic methods (\code{tax_sources()}, \code{ott_id()}, ##' \code{unique_name()}, ...) are available on the objects ##' returned by \code{tol_mrca()}. If the MRCA node is MRTA, the ##' name of the object returned by these methods will start with ##' \sQuote{ott}, otherwise it will start with \sQuote{mrca}. ##' ##' @param ott_ids Numeric vector. The ott ids for which the MRCA is desired. ##' @param node_ids Character vector. The node ids for which the MRCA is desired. ##' @param tax an object returned by \code{tol_mrca()}. ##' @param ... additional arguments to customize the API call (see ##' \code{\link{rotl}} for more information). ##' ##' @return An invisible list of the MRCA node properties: ##' ##' \itemize{ ##' ##' \item {mrca} {List of node properties.} ##' ##' \itemize{ ##' \item {node_id} {String. The canonical identifier of the node.} ##' ##' \item {num_tips} {Numeric. The number of descendent tips.} ##' ##' \item {taxon} {A list of taxonomic properties. Only returned if ##' the queried node is a taxon. (If the node is not a taxon, a ##' \code{nearest_taxon} list is returned (see below)).} ##' ##' \itemize{ ##' \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ottID).} ##' ##' \item {name} {String. The taxonomic name of the queried node.} ##' ##' \item {unique_name} {String. The string that uniquely ##' identifies the taxon in OTT.} ##' ##' \item {rank} {String. The taxonomic rank of the taxon in OTT.} ##' ##' \item {tax_sources} {List. A list of identifiers for taxonomic ##' sources, such as other taxonomies, that define taxa judged ##' equivalent to this taxon.} ##' } ##' ##' The following properties list support/conflict for the node across ##' synthesis source trees. All properties involve sourceid keys and ##' nodeid values (see \code{source_id_map} below) Not all properties are ##' are present for every node. ##' ##' \item {partial_path_of} {List. The edge below this synthetic tree node ##' is compatible with the edge below each of these input tree nodes (one ##' per tree). Each returned element is reported as sourceid:nodeid.} ##' ##' \item {supported_by} {List. Input tree nodes (one per tree) that support ##' this synthetic tree node. Each returned element is reported as ##' sourceid:nodeid.} ##' ##' \item {terminal} {List. Input tree nodes (one per tree) that are equivalent ##' to this synthetic tree node (via an exact mapping, or the input tree ##' terminal may be the only terminal descended from this synthetic tree node. ##' Each returned element is reported as sourceid:nodeid.} ##' ##' \item {conflicts_with} {Named list of lists. Names correspond to ##' sourceid keys. Each list contains input tree node ids (one or more per tree) ##' that conflict with this synthetic node.} ##' } ##' ##' \item {nearest_taxon} {A list of taxonomic properties of the nearest rootward ##' taxon node to the MRCA node. Only returned if the MRCA node is a not taxon ##' (otherwise the \code{taxon} list above is returned).} ##' ##' \itemize{ ##' \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ottID).} ##' ##' \item {name} {String. The taxonomic name of the queried node.} ##' ##' \item {unique_name} {String. The string that uniquely ##' identifies the taxon in OTT.} ##' ##' \item {rank} {String. The taxonomic rank of the taxon in OTT.} ##' ##' \item {tax_sources} {List. A list of identifiers for taxonomic ##' sources, such as other taxonomies, that define taxa judged ##' equivalent to this taxon.} ##' } ##' ##' \item {source_id_map} {Named list of lists. Names correspond to the ##' sourceid keys used in the support/conflict properties of the \code{mrca} ##' list above. Source trees will have the following properties:} ##' ##' \itemize{ ##' \item {git_sha} {The git SHA identifying a particular source ##' version.} ##' ##' \item {tree_id} {The tree id associated with the study id used.} ##' ##' \item {study_id} {The study identifier. Will typically include ##' a prefix ("pg_" or "ot_").} ##' } ##' The only sourceid that does not correspond to a source tree is the taxonomy, ##' which will have the name "ott"+`taxonomy_version`, and the value is the ##' ott_id of the taxon in that taxonomy version. "Taxonomy" will only ever ##' appear in \code{supported_by}. ##' ##' } ##' ##' @examples ##' \dontrun{ ##' birds_mrca <- tol_mrca(ott_ids=c(412129, 119214)) ##' ott_id(birds_mrca) ##' tax_sources(birds_mrca) ##' } ##' @rdname tol_mrca ##' @export tol_mrca <- function(ott_ids = NULL, node_ids = NULL, ...) { res <- .tol_mrca(ott_ids = ott_ids, node_ids = node_ids, ...) class(res) <- c("tol_mrca", class(res)) return(res) } ##' @export print.tol_mrca <- function(x, ...) { cat("\nOpenTree MRCA node.\n\n") cat("Node id: ", x$mrca$node_id, "\n", sep = "") cat("Number of terminal descendants: ", x$mrca$num_tips, "\n", sep = "") if (is_taxon(x[["mrca"]][["taxon"]])) { cat("Is taxon: TRUE\n") cat("Name: ", x$mrca$taxon$name, "\n", sep = "") cat("ott id: ", x$mrca$taxon$ott_id, "\n", sep = "") } else { cat("Is taxon: FALSE\n") cat("Nearest taxon:\n") cat(" Name: ", x$nearest_taxon$name, "\n", sep = "") cat(" ott id: ", x$nearest_taxon$ott_id, "\n", sep = "") } } tol_mrca_method_factory <- function(.f) { function(tax, ...) { if (is_taxon(tax[["mrca"]][["taxon"]])) { res <- list(.f(tax[["mrca"]][["taxon"]])) names(res) <- .tax_unique_name(tax[["mrca"]][["taxon"]]) attr(res, "taxon_type") <- "mrca" } else { res <- list(.f(tax[["nearest_taxon"]])) names(res) <- .tax_unique_name(tax[["nearest_taxon"]]) attr(res, "taxon_type") <- "nearest_taxon" } res <- add_otl_class(res, .f) res } } ##' @export ##' @rdname tol_mrca tax_sources.tol_mrca <- tol_mrca_method_factory(.tax_sources) ##' @export ##' @rdname tol_mrca unique_name.tol_mrca <- tol_mrca_method_factory(.tax_unique_name) ##' @export ##' @rdname tol_mrca tax_name.tol_mrca <- tol_mrca_method_factory(.tax_name) ##' @export ##' @rdname tol_mrca tax_rank.tol_mrca <- tol_mrca_method_factory(.tax_rank) ##' @export ##' @rdname tol_mrca ott_id.tol_mrca <- tol_mrca_method_factory(.tax_ott_id) ##' @export ##' @rdname tol_mrca source_list.tol_mrca <- .source_list ##' Extract a subtree from the synthetic tree from an Open Tree node id. ##' ##' @title Extract a subtree from the synthetic tree ##' ##' @details Given a node, return the subtree of the synthetic tree descended ##' from that node. The start node may be specified using either a node id ##' or an ott id, but not both. If the specified node is not in the ##' synthetic tree an error will be returned. There is a size limit of ##' 25000 tips for this method. ##' ##' @param ott_id Numeric. The ott id of the node in the tree that should ##' serve as the root of the tree returned. ##' @param node_id Character. The node id of the node in the tree that should ##' serve as the root of the tree returned. ##' @param label_format Character. Defines the label type; one of ##' \dQuote{\code{name}}, \dQuote{\code{id}}, or ##' \dQuote{\code{name_and_id}} (the default). ##' @param file If specified, the function will write the subtree to a ##' file in newick format. ##' @param ... additional arguments to customize the API call (see ##' \code{\link{rotl}} for more information). ##' ##' @return If no value is specified to the \code{file} argument ##' (default), a phylogenetic tree of class \code{phylo}. ##' Otherwise, the function returns invisibly a logical indicating ##' whether the file was successfully created. ##' ##' @examples ##' \dontrun{ ##' res <- tol_subtree(ott_id=241841)} ##' @export tol_subtree <- function(ott_id = NULL, node_id = NULL, label_format = NULL, file, ...) { res <- .tol_subtree( ott_id = ott_id, node_id = node_id, label_format = label_format, ... ) if (!missing(file)) { unlink(file) cat(res$newick, file = file) return(invisible(file.exists(file))) } else { phy <- phylo_from_otl(res) return(phy) } } ##' Return the induced subtree on the synthetic tree that relates a list of nodes. ##' ##' @title Subtree from the Open Tree of Life ##' ##' @details Return a tree with tips corresponding to the nodes identified in ##' the input set that is consistent with the topology of the current ##' synthetic tree. This tree is equivalent to the minimal subtree ##' induced on the draft tree by the set of identified nodes. ##' ##' @param ott_ids Numeric vector. OTT ids indicating nodes to be used as tips ##' in the induced tree. ##' @param node_ids Character vector. Node ids indicating nodes to be used as ##' tips in the induced tree. ##' @param label_format Character. Defines the label type; one of ##' \dQuote{\code{name}}, \dQuote{\code{id}}, or \dQuote{\code{name_and_id}} ##' (the default). ##' @param file If specified, the function will write the subtree to a file in ##' newick format. ##' @param ... additional arguments to customize the API call (see ##' \code{\link{rotl}} for more information). ##' ##' @return If no value is specified to the \code{file} argument ##' (default), a phylogenetic tree of class \code{phylo}. ##' ##' Otherwise, the function returns invisibly a logical indicating ##' whether the file was successfully created. ##' ##' Note that the tree returned when specifying a file name with the ##' \code{file} argument is the \dQuote{raw} Newick string returned by Open ##' Tree of Life. This string contains singleton nodes, and therefore will ##' be different from the tree returned as a \code{phylo} object which will ##' not contain these singleton nodes. ##' ##' @examples ##' \dontrun{ ##' ## Result as a `phylo` object ##' res <- tol_induced_subtree(ott_ids = c(292466, 267845, 316878, 102710)) ##' ##' ## Raw Newick string from Open Tree of Life ##' tree_file <- tempfile(fileext = ".tre") ##' tol_induced_subtree(ott_ids = c(292466, 267845, 316878, 102710), ##' file=tree_file) ##' ##' } ##' @export tol_induced_subtree <- function(ott_ids = NULL, node_ids = NULL, label_format = NULL, file, ...) { res <- .tol_induced_subtree( ott_ids = ott_ids, node_ids = node_ids, label_format = label_format, ... ) if (!missing(file)) { unlink(file) cat(res$newick, file = file) return(file.exists(file)) } else { phy <- phylo_from_otl(res) return(phy) } } ##' Strip OTT ids from tip labels ##' @param tip_labels a character vector containing tip labels (most ##' likely the \code{tip.label} element from a tree returned by ##' \code{\link{tol_induced_subtree}} ##' @param remove_underscores logical (defaults to FALSE). If set to ##' TRUE underscores in tip labels are converted to spaces ##' @return A character vector containing the contents of ##' \code{tip_labels} with any OTT ids removed. ##' ##' @examples ##' \dontrun{ ##' genera <- c("Perdix", "Setophaga", "Cinclus", "Struthio") ##' tr <- tol_induced_subtree(ott_ids=c(102710, 285198, 267845, 292466)) ##' tr$tip.label %in% genera ##' tr$tip.label <- strip_ott_ids(tr$tip.label) ##' tr$tip.label %in% genera ##' } ##' @export strip_ott_ids <- function(tip_labels, remove_underscores = FALSE) { stripped <- sub("_ott\\d+$", "", tip_labels) if (remove_underscores) { return(gsub("_", " ", stripped)) } stripped } ##' Get summary information about a node in the synthetic tree ##' ##' @title Node info ##' ##' @details Returns summary information about a node in the graph. The ##' node of interest may be specified using either a node id or an ##' taxon id, but not both. If the specified node or OTT id is not ##' in the graph, an error will be returned. ##' ##' If the argument \code{include_lineage=TRUE} is used, you can ##' use \code{tax_lineage()} or \code{tol_lineage} to return the ##' taxonomic information or the node information for all the ##' ancestors to this node, down to the root of the tree. ##' ##' ##' @param ott_id Numeric. The OpenTree taxonomic identifier. ##' @param node_id Character. The OpenTree node identifier. ##' @param include_lineage Logical (default = FALSE). Whether to return the ##' lineage of the node from the synthetic tree. ##' @param ... additional arguments to customize the API call (see ##' ?rotl for more information) ##' ##' @return \code{tol_node_info} returns an invisible list of summary ##' information about the queried node: ##' ##' \itemize{ ##' ##' \item {node_id} {String. The canonical identifier of the node.} ##' ##' \item {num_tips} {Numeric. The number of descendent tips.} ##' ##' \item {partial_path_of} {List. The edge below this synthetic tree node ##' is compatible with the edge below each of these input tree nodes (one ##' per tree). Each returned element is reported as sourceid:nodeid.} ##' ##' \item {query} { The node id that resolved to this node. This can differ ##' from the node_id field if the query id is not canonical. } ##' ##' \item {taxon} {A list of taxonomic properties. Only returned if ##' the queried node is a taxon. Each source has:} ##' ##' \itemize{ ##' \item {ott_id} {Numeric. The OpenTree Taxonomy ID (ottID).} ##' ##' \item {name} {String. The taxonomic name of the queried node.} ##' ##' \item {unique_name} {String. The string that uniquely ##' identifies the taxon in OTT.} ##' ##' \item {rank} {String. The taxonomic rank of the taxon in OTT.} ##' ##' \item {tax_sources} {List. A list of identifiers for taxonomic ##' sources, such as other taxonomies, that define taxa judged ##' equivalent to this taxon.} ##' } ##' ##' The following properties list support/conflict for the node across ##' synthesis source trees. All properties involve sourceid keys and ##' nodeid values (see \code{source_id_map} below). ##' ##' \item {supported_by} {List. Input tree nodes (one per tree) that support ##' this synthetic tree node. Each returned element is reported as ##' sourceid:nodeid.} ##' ##' \item {terminal} {List. Input tree nodes (one per tree) that are ##' equivalent to this synthetic tree node (via an exact mapping, or the ##' input tree terminal may be the only terminal descended from this ##' synthetic tree node. Each returned element is reported as ##' sourceid:nodeid.} ##' ##' \item {conflicts_with} {Named list of lists. Names correspond to ##' sourceid keys. Each list contains input tree node ids (one or more per ##' tree) that conflict with this synthetic node.} ##' } ##' ##' \code{tol_lineage} and \code{tax_lineage} return data ##' frames. \code{tol_lineage} indicate for each ancestor its ##' node identifier, the number of tips descending from that ##' node, and whether it corresponds to a taxonomic level. ##' ##' @examples ##' \dontrun{ ##' birds <- tol_node_info(ott_id=81461, include_lineage=TRUE) ##' source_list(birds) ##' tax_rank(birds) ##' ott_id(birds) ##' tax_lineage(birds) ##' tol_lineage(birds)} ##' @export tol_node_info <- function(ott_id = NULL, node_id = NULL, include_lineage = FALSE, ...) { res <- .tol_node_info( ott_id = ott_id, node_id = node_id, include_lineage = include_lineage, ... ) class(res) <- c("tol_node", class(res)) return(res) } tol_node_method_factory <- function(.f) { function(tax, ...) { if (exists("taxon", tax)) { res <- setNames( list(.f(tax[["taxon"]])), .tax_unique_name(tax[["taxon"]]) ) } else if (exists("node_id", tax)) { res <- setNames(tax[["node_id"]], tax[["node_id"]]) } else { res <- NA } res <- add_otl_class(res, .f) res } } ##' @export print.tol_node <- function(x, ...) { cat("\nOpenTree node.\n\n") cat("Node id: ", x$node_id, "\n", sep = "") cat("Number of terminal descendants: ", x$num_tips, "\n", sep = "") if (is_taxon(x[["taxon"]])) { cat("Is taxon: TRUE\n") cat("Name: ", x$taxon$name, "\n", sep = "") cat("Rank: ", x$taxon$rank, "\n", sep = "") cat("ott id: ", x$taxon$ott_id, "\n", sep = "") } else { cat("Is taxon: FALSE\n") } } ##' @export ##' @param tax an object returned by \code{tol_node_info}. ##' @rdname tol_node_info tax_rank.tol_node <- tol_node_method_factory(.tax_rank) ##' @export ##' @rdname tol_node_info tax_sources.tol_node <- tol_node_method_factory(.tax_sources) ##' @export ##' @rdname tol_node_info unique_name.tol_node <- tol_node_method_factory(.tax_unique_name) ##' @export ##' @rdname tol_node_info tax_name.tol_node <- tol_node_method_factory(.tax_name) ##' @export ##' @rdname tol_node_info ott_id.tol_node <- tol_node_method_factory(.tax_ott_id) ##' @export ##' @rdname tol_node_info source_list.tol_node <- .source_list ##' @export ##' @rdname tol_node_info tax_lineage.tol_node <- function(tax, ...) { check_lineage(tax) lg <- lapply(tax[["lineage"]], function(x) { if (exists("taxon", x)) { build_lineage(x[["taxon"]]) } else { NULL } }) lg <- do.call("rbind", lg) as.data.frame(lg, stringsAsFactors = FALSE) } ##' @export ##' @rdname tol_node_info tol_lineage.tol_node <- function(tax, ...) { check_lineage(tax) lg <- lapply(tax[["lineage"]], function(x) { c( "node_id" = x[["node_id"]], "num_tips" = x[["num_tips"]], "is_taxon" = exists("taxon", x) ) }) lg <- do.call("rbind", lg) as.data.frame(lg, stringsAsFactors = FALSE) } rotl/R/taxonomy.R0000644000176200001440000002456713543626762013470 0ustar liggesusers##' Summary information about the Open Tree Taxonomy (OTT) ##' ##' Return metadata and information about the taxonomy ##' itself. Currently, the available metadata is fairly sparse, but ##' includes (at least) the version, and the location from which the ##' complete taxonomy source files can be downloaded. ##' ##' @title Information about the Open Tree Taxonomy ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return A list with the following properties: ##' \itemize{ ##' ##' \item {weburl} {String. The release page for this version ##' of the taxonomy.} ##' ##' \item {author} {String. The author string.} ##' ##' \item {name} {String. The name of the taxonomy.} ##' ##' \item {source} {String. The full identifying information for ##' this version of the taxonomy.} ##' ##' \item {version} {String. The version number of the taxonomy.} ##' } ##' @examples ##' \dontrun{ ##' taxonomy_about() ##' } ##' @export taxonomy_about <- function(...) { res <- .taxonomy_about(...) return(res) } ##' Information about taxa. ##' ##' Given a vector of ott ids, \code{taxonomy_taxon_info} returns ##' information about the specified taxa. ##' ##' The functions \code{tax_rank}, \code{tax_name}, and ##' \code{synonyms} can extract this information from an object ##' created by the \code{taxonomy_taxon_info()}. ##' ##' @title Taxon information ##' @param ott_ids the ott ids of the taxon of interest (numeric or ##' character containing only numbers) ##' @param include_children whether to include information about all ##' the children of this taxon. Default \code{FALSE}. ##' @param include_lineage whether to include information about all ##' the higher level taxa that include the \code{ott_ids}. ##' Default \code{FALSE}. ##' @param include_terminal_descendants whether to include the list of ##' terminal \code{ott_ids} contained in the \code{ott_ids} ##' provided. ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @param tax an object generated by the \code{taxonomy_taxon_info} ##' function ##' @return \code{taxonomy_taxon_info} returns a list detailing ##' information about the taxa. \code{tax_rank} and ##' \code{tax_name} return a vector. \code{synonyms} returns a ##' list whose elements are the synonyms for each of the ##' \code{ott_id} requested. ##' ##' @seealso \code{\link{tnrs_match_names}} to obtain \code{ott_id} ##' from a taxonomic name. ##' @examples ##' \dontrun{ ##' req <- taxonomy_taxon_info(ott_id=515698) ##' tax_rank(req) ##' tax_name(req) ##' synonyms(req) ##' } ##' @export taxonomy_taxon_info <- function(ott_ids, include_children = FALSE, include_lineage = FALSE, include_terminal_descendants = FALSE, ...) { res <- lapply(ott_ids, function(x) { .taxonomy_taxon_info( ott_id = x, include_children = include_children, include_lineage = include_lineage, include_terminal_descendants = include_terminal_descendants, ... ) }) names(res) <- ott_ids class(res) <- "taxon_info" return(res) } ##' Given an ott id, return the inclusive taxonomic subtree descended ##' from the specified taxon. ##' ##' If the output of this function is exported to a file, the only ##' possible value for the \code{output_format} argument is ##' \dQuote{\code{newick}}. If the file provided already exists, it ##' will be silently overwritten. ##' ##' @title Taxonomy subtree ##' @param ott_id The ott id of the taxon of interest. ##' @param output_format the format of the object to be returned. See ##' the \sQuote{Return} section. ##' @param label_format Character. Defines the label type; one of ##' \dQuote{\code{name}}, \dQuote{\code{id}}, or ##' \dQuote{\code{name_and_id}} (the default). ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @param file the file name where to save the output of the ##' function. Ignored unless \code{output_format} is set to ##' \dQuote{\code{phylo}}. ##' @return If the \code{file} argument is missing: \itemize{ ##' ##' \item{\dQuote{\code{taxa}}} { a list of the taxa names ##' (species) in slot \code{tip_label}, and higher-level taxonomy ##' (e.g., families, genera) in slot \code{edge_label}, descending ##' from the taxa corresponding to the \code{ott_id} provided. } ##' ##' \item{\dQuote{\code{newick}}} { a character vector containing ##' the newick formatted string corresponding to the taxonomic ##' subtree for the \code{ott_id} provided. } ##' ##' \item{\dQuote{\code{phylo}}} { an object of the class ##' \code{phylo} from the \code{\link[ape]{ape}} package. } ##' ##' \item{\dQuote{\code{raw}}} { the direct output from the API, ##' i.e., a list with an element named \sQuote{newick} that ##' contains the subtree as a newick formatted string. } ##' ##' } ##' ##' If a \code{file} argument is provided (and ##' \code{output_format} is set to \dQuote{\code{phylo}}), a ##' logical indicating whether the file was successfully created. ##' ##' @examples ##' \dontrun{ ##' req <- taxonomy_subtree(ott_id=515698) ##' plot(taxonomy_subtree(ott_id=515698, output_format="phylo")) ##' } ##' @export taxonomy_subtree <- function(ott_id = NULL, output_format = c("taxa", "newick", "phylo", "raw"), label_format = NULL, file, ...) { output_format <- match.arg(output_format) res <- .taxonomy_subtree(ott_id = ott_id, label_format = label_format, ...) if (!missing(file) && !identical(output_format, "newick")) { warning( sQuote("file"), " argument is ignored, you can only write newick tree strings to a file." ) } if (identical(output_format, "raw")) { return(res) } else if (identical(output_format, "newick")) { res <- res$newick if (!missing(file)) { unlink(file) cat(res, file = file) invisible(return(file.exists(file))) } } else if (identical(output_format, "phylo")) { res <- phylo_from_otl(res) } else { ## in all other cases use tree_to_labels res <- tree_to_labels(res) } return(res) } ##' Taxonomic Least Inclusive Common Ancestor (MRCA) ##' ##' Given a set of OTT ids, get the taxon that is the most recent common ##' ancestor (the MRCA) of all the identified taxa. ##' ##' @title Taxonomic MRCA ##' @param ott_ids a vector of ott ids for the taxa whose MRCA is to ##' be found (numeric). ##' @param tax an object generated by the \code{taxonomy_mrca} ##' function ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return \itemize{ ##' ##' \item{\code{taxonomy_mrca}} { returns a list about the ##' taxonomic information relating to the MRCA for the ott_ids ##' provided. } ##' ##' \item{\code{tax_rank}} { returns a character vector of the ##' taxonomic rank for the MRCA. } ##' ##' \item{\code{tax_name}} { returns a character vector the ##' Open Tree Taxonomy name for the MRCA. } ##' ##' \item{\code{ott_id}} { returns a numeric vector of the ott id ##' for the MRCA. } ##' ##' } ##' @examples ##' \dontrun{ ##' req <- taxonomy_mrca(ott_ids=c(515698,590452,643717)) ##' tax_rank(req) ##' tax_name(req) ##' ott_id(req) ##' } ##' @export taxonomy_mrca <- function(ott_ids = NULL, ...) { res <- .taxonomy_mrca(ott_ids = ott_ids, ...) class(res) <- c("taxon_mrca", class(res)) return(res) } ### methods for taxonomy_taxon_info --------------------------------------------- taxon_info_method_factory <- function(.f) { function(tax, ...) { res <- lapply(tax, .f) names(res) <- vapply(tax, .tax_unique_name, character(1)) res <- add_otl_class(res, .f) res } } ##' @export ##' @rdname taxonomy_taxon_info tax_rank.taxon_info <- taxon_info_method_factory(.tax_rank) ##' @export ##' @rdname taxonomy_taxon_info tax_name.taxon_info <- taxon_info_method_factory(.tax_name) ##' @export ##' @rdname taxonomy_taxon_info unique_name.taxon_info <- taxon_info_method_factory(.tax_unique_name) ##' @export ##' @rdname taxonomy_taxon_info synonyms.taxon_info <- taxon_info_method_factory(.tax_synonyms) ##' @export ##' @rdname taxonomy_taxon_info ott_id.taxon_info <- taxon_info_method_factory(.tax_ott_id) ##' @export ##' @rdname taxonomy_taxon_info tax_sources.taxon_info <- taxon_info_method_factory(.tax_sources) ##' @export ##' @rdname taxonomy_taxon_info is_suppressed.taxon_info <- taxon_info_method_factory(.tax_is_suppressed) ##' @export ##' @rdname taxonomy_taxon_info flags.taxon_info <- taxon_info_method_factory(.tax_flags) ### methods for taxonomy_mrca --------------------------------------------------- taxon_mrca_method_factory <- function(.f) { function(tax, ...) { res <- list(.f(tax[["mrca"]])) names(res) <- .tax_unique_name(tax[["mrca"]]) res <- add_otl_class(res, .f) res } } ##' @export ##' @rdname taxonomy_mrca tax_rank.taxon_mrca <- taxon_mrca_method_factory(.tax_rank) ##' @export ##' @rdname taxonomy_mrca tax_name.taxon_mrca <- taxon_mrca_method_factory(.tax_name) ##' @export ##' @rdname taxonomy_mrca ott_id.taxon_mrca <- taxon_mrca_method_factory(.tax_ott_id) ##' @export ##' @rdname taxonomy_mrca unique_name.taxon_mrca <- taxon_mrca_method_factory(.tax_unique_name) ##' @export ##' @rdname taxonomy_mrca tax_sources.taxon_mrca <- taxon_mrca_method_factory(.tax_sources) ##' @export ##' @rdname taxonomy_mrca flags.taxon_mrca <- taxon_mrca_method_factory(.tax_flags) ##' @export ##' @rdname taxonomy_mrca is_suppressed.taxon_mrca <- taxon_mrca_method_factory(.tax_is_suppressed) ### method for extracting higher taxonomy from taxonomy_taxon_info calls ------- get_lineage <- function(tax) { check_lineage(tax) lg <- lapply(tax[["lineage"]], build_lineage) lg <- do.call("rbind", lg) as.data.frame(lg, stringsAsFactors = FALSE) } build_lineage <- function(x) { c( "rank" = .tax_rank(x), "name" = .tax_name(x), "unique_name" = .tax_unique_name(x), "ott_id" = .tax_ott_id(x) ) } check_lineage <- function(tax) { if (!exists("lineage", tax)) { stop( "The object needs to be created using ", sQuote("include_lineage=TRUE") ) } } ##' @export ##' @rdname tax_lineage tax_lineage.taxon_info <- function(tax, ...) { lapply(tax, get_lineage) } rotl/R/external_data.R0000644000176200001440000001150613543626740014406 0ustar liggesusers##' Get external identifiers for data associated with an Open Tree study ##' ##' Data associated with studies contributing to the Open Tree synthesis may ##' be available from other databases. In particular, trees and alignments ##' may be available from treebase and DNA sequences and bibliographic ##' information associated with a given study may be available from the NCBI. ##' This function retrieves that information for a given study. ##' ##' @param study_id An open tree study ID ##' @return A study_external_data object (which inherits from a list) which ##' contains some of the following. ##' @return doi, character, the DOI for the paper describing this study ##' @return external_data_url, character, a URL to an external data repository ##' (e.g. a treebase entry) if one exists. ##' @return pubmed_id character, the unique ID for this study in the NCBI's pubmed database ##' @return popset_ids character, vector of IDs for the NCBI's popset database ##' @return nucleotide_ids character, vector of IDs for the NCBI's nucleotide database ##' @seealso studies_find_studies (used to discover study IDs) ##' @importFrom httr parse_url ##' @importFrom rentrez entrez_search ##' @importFrom rentrez entrez_link ##' @examples ##' \dontrun{ ##' flies <- studies_find_studies(property="ot:focalCladeOTTTaxonName", value="Drosophilidae") ##' study_external_IDs(flies[2,]$study_ids) ##' } ##' @export study_external_IDs <- function(study_id) { meta <- get_study_meta(study_id) data_deposit <- meta[["nexml"]][["^ot:dataDeposit"]][["@href"]] url <- attr(get_publication(meta), "DOI") doi <- parse_url(url)$path pmid <- get_pmid(doi, study_id) res <- list( doi = doi, pubmed_id = pmid, external_data_url = data_deposit ) if (!is.null(pmid)) { res$popset_ids <- entrez_link(dbfrom = "pubmed", db = "popset", id = pmid)[["links"]][["pubmed_popset"]] res$nucleotide_ids <- entrez_link(dbfrom = "pubmed", db = "nuccore", id = pmid)[["links"]][["pubmed_nuccore"]] } structure(res, class = c("study_external_data", "list"), id = study_id) } ##' Get external identifiers for data associated with an Open Tree taxon ##' ##' The Open Tree taxonomy is a synthesis of multiple reference taxonomies. This ##' function retrieves identifiers to external taxonomic records that have ##' contributed the rank, position and definition of a given Open Tree taxon. ##' ##' @param taxon_id An open tree study ID ##' @return a data.frame in which each row represents a unique record in an ##' external database. The column "source" provides and abbreviated name for the ##' database, and "id" the unique ID for the record. ##' @seealso tnrs_matchnames, which can be used to search for taxa by name. ##' @seealso taxonomy_taxon, for more information about a given taxon. ##' @examples ##' \dontrun{ ##' gibbon_IDs <- taxon_external_IDs(712902) ##' } ##' @export taxon_external_IDs <- function(taxon_id) { taxon_info <- taxonomy_taxon_info(taxon_id) srcs <- taxon_info[[1]][["tax_sources"]] res <- do.call(rbind.data.frame, strsplit(unlist(srcs), ":")) names(res) <- c("source", "id") res } #' @export print.study_external_data <- function(x, ...) { cat("External data identifiers for study", attr(x, "study_id"), "\n") cat(" $doi: ", x[["doi"]], "\n") if (!is.null(x$pubmed_id)) { cat(" $pubmed_id: ", x[["pubmed_id"]], "\n") } if (!is.null(x$popset_ids)) { cat(" $popset_ids: vector of", length(x[["popset_ids"]]), "IDs \n") } if (!is.null(x$nucleotide_ids)) { cat(" $nucleotide_ids: vector of", length(x[["nucleotide_ids"]]), "IDs\n") } if (nchar(x[["external_data_url"]]) > 0) { cat(" $external_data_url", x[["external_data_url"]], "\n") } cat("\n") } ## Maybe include these functions to get summary information about a ## set of linked sequences? # summarize_nucleotide_data <- function(id_vector){ # summs <- entrez_summary(db="nuccore", id=id_vector) # interesting <- extract_from_esummary(summs, c("uid", "title", "slen", "organism", "completeness"), simplify=FALSE) # do.call(rbind.data.frame, interesting) # } # # summarize_popset_data <- function(id_vector){ # summs <- entrez_summary(db="popset", id=id_vector) # interesting <- extract_from_esummary(summs, c("uid", "title"), simplify=FALSE) # do.call(rbind.data.frame, interesting) # } # # Un-exported function to convert doi->pmid. Also takes study_id as an argument in # order to provide a helpful error message when 0 or >1 pmids are returned. get_pmid <- function(doi, study_id) { pubmed_search <- entrez_search(db = "pubmed", term = paste0(doi, "[DOI]")) if (length(pubmed_search$ids) == 0) { warning("Could not find PMID for study'", study_id, "', skipping NCBI data") return(NULL) } if (length(pubmed_search$ids) > 1) { warning("Found more than one PMID matching study'", study_id, "', skipping NCBI data") return(NULL) } pubmed_search$ids } rotl/R/tree_to_labels.R0000644000176200001440000000265513543626775014573 0ustar liggesusers## Function to extract tip and edge labels from newick formatted strings ## useful when the tree is too small to be read in by ape/rncl. ## tr needs to be a newick formatted tree string ## - missing tips are removed (OK for OTL as it won't happen) tree_to_labels <- function(tr, remove_quotes = TRUE) { n_right <- unlist(gregexpr("\\)", tr)) n_left <- unlist(gregexpr("\\(", tr)) if (n_right[1] == -1) n_right <- 0 else n_right <- length(n_right) if (n_left[1] == -1) n_left <- 0 else n_left <- length(n_left) if (!identical(n_right, n_left)) { stop("invalid newick string, numbers of ( and ) don't match") } ## remove white spaces tr <- gsub("\\s+", "", tr) ## remove branch lengths tr <- gsub(":[0-9]+(\\.[0-9]+)?", "", tr) ## TODO?: remove comments if (n_right < 1) { ## if only 1 tip tip_lbl <- gsub(";$", "", tr) edge_lbl <- character(0) } else { ## extract edge labels edge_lbl <- unlist(strsplit(tr, ")")) edge_lbl <- grep("^[^\\(]", edge_lbl, value = T) edge_lbl <- gsub("(,|;).*$", "", edge_lbl) edge_lbl <- edge_lbl[nzchar(edge_lbl)] ## extract tips tip_lbl <- unlist(strsplit(tr, ",")) tip_lbl <- gsub("^\\(*", "", tip_lbl) tip_lbl <- gsub("\\).*$", "", tip_lbl) tip_lbl <- tip_lbl[nzchar(tip_lbl)] } if (remove_quotes) { tip_lbl <- gsub("^(\\\"|\\\')(.+)(\\\'|\\\")$", "\\2", tip_lbl) } list(tip_label = tip_lbl, edge_label = edge_lbl) } rotl/R/tax_utils.R0000644000176200001440000000413713543626757013621 0ustar liggesusers## all extended-taxon-descriptors have: ## - ott_id ## - name ## - rank ## - unique_name ## - tax_sources ## and they may have ## - flags ## - synonyms ## - is_suppressed ## builds the functions to access the content of the taxon descriptors. ## slot: the name of the list element we need to access ## flatten: if the list element is a list, make it a vector ## optional: is the slot found in all taxon descriptors or only in some tax_access_factory <- function(slot, flatten, optional) { function(tax) { if ((!exists(slot, tax))) { if (optional) { warning("This object doesn't have ", sQuote(slot), call. = FALSE) return(NULL) } else { stop("Invalid taxon object", call. = FALSE) } } else { if (flatten) { unlist(tax[[slot]]) } else { tax[[slot]] } } } } .tax_ott_id <- tax_access_factory("ott_id", flatten = FALSE, optional = FALSE) .tax_name <- tax_access_factory("name", flatten = FALSE, optional = FALSE) .tax_rank <- tax_access_factory("rank", flatten = FALSE, optional = FALSE) .tax_sources <- tax_access_factory("tax_sources", flatten = TRUE, optional = FALSE ) .tax_unique_name <- tax_access_factory("unique_name", flatten = FALSE, optional = FALSE ) ## optional .tax_flags <- tax_access_factory("flags", flatten = TRUE, optional = TRUE) .tax_is_suppressed <- tax_access_factory("is_suppressed", flatten = FALSE, optional = TRUE ) .tax_synonyms <- tax_access_factory("synonyms", flatten = TRUE, optional = TRUE) ## Does the slot element represent a taxon? is_taxon <- function(slot) { if (all(c( "ott_id", "name", "rank", "tax_sources", "unique_name" ) %in% names(slot))) { TRUE } else { FALSE } } ### adds a class to the objects returned by the methods add_otl_class <- function(res, .f) { ## we need a prefix to avoid class name conflict ## apparently the class "name" already exists class(res) <- c( paste0("otl_", as.list(environment(.f))[["slot"]]), class(res) ) res } ##' @export `[.otl_ott_id` <- function(x, i, ...) { r <- NextMethod() class(r) <- class(x) r } rotl/R/is_in_tree.R0000644000176200001440000000421513543626740013712 0ustar liggesusers##' Some valid taxonomic names do not occur in the Synthetic ##' Tree. This convenience function allows you to check whether a ##' given Open Tree Taxonomy identifier (OTT id) is in the tree. A taxonomic ##' name may not occur in the synthetic tree because (1) it is an ##' extinct or invalid taxon, or (2) it is part of a group that is not ##' monophyletic in the tree. ##' ##' @title Check that OTT ids occur in the Synthetic Tree ##' @param ott_ids a vector of Open Tree Taxonomy identifiers ##' @param ... additional arguments to customize the API request (see ##' \code{\link{rotl}} package documentation). ##' @return A named logical vector. \code{TRUE} indicates that the OTT ##' id is in the synthetic tree, and \code{FALSE} that it is not. ##' @examples ##' \dontrun{ ##' plant_families <- c("Asteraceae", "Solanaceae", "Poaceae", "Amaranthaceae", ##' "Zamiaceae", "Araceae", "Juncaceae") ##' matched_names <- tnrs_match_names(plant_families) ##' ## This fails because some ott ids are not in the tree ##' ## plant_tree <- tol_induced_subtree(ott_id(matched_names)) ##' ## So let's check which ones are actually in the tree first: ##' in_tree <- is_in_tree(ott_id(matched_names)) ##' ## This now works: ##' plant_tree <- tol_induced_subtree(ott_id(matched_names)[in_tree]) ##' } ##' ##' @export is_in_tree <- function(ott_ids, ...) UseMethod("is_in_tree") ##' @export is_in_tree.otl_ott_id <- function(ott_ids, ...) { in_tree <- vapply(ott_ids, function(ottid) { test <- try(tol_node_info(ottid, ...), silent = TRUE) if (inherits(test, "try-error")) { if (grepl("was not found", test) && grepl(paste0("'ott", ottid, "'"), test)) { } else { warning("something seems off, check your internet connection?") } return(FALSE) } else { ott_id(test)[[1]] == ottid } }, logical(1), USE.NAMES = TRUE) in_tree } ##' @export is_in_tree.default <- function(ott_ids, ...) { chk_ids <- vapply(ott_ids, check_numeric, logical(1)) if (all(chk_ids)) { is_in_tree.otl_ott_id(ott_ids) } else { stop("Invalid format for ott_ids (they should look like numbers)") } } rotl/R/rotl-package.R0000644000176200001440000000374113057544607014147 0ustar liggesusers##' An Interface to the Open Tree of Life API ##' ##' The Open Tree of Life is an NSF funded project that is generating ##' an online, comprehensive phylogenetic tree for 1.8 million ##' species. \code{rotl} provides an interface that allows you to ##' query and retrieve the parts of the tree of life that is of ##' interest to you. ##' ##' \code{rotl} provides function to most of the end points the API ##' provides. The documentation of the API is available at: ##' \url{https://github.com/OpenTreeOfLife/opentree/wiki/Open-Tree-of-Life-APIs} ##' ##' @section Customizing API calls: ##' ##' All functions that use API end points can take 2 arguments to ##' customize the API call and are passed as \code{...} arguments. ##' ##' \itemize{ ##' ##' \item{ \code{otl_v} } { This argument controls which version ##' of the API your call is using. The default value for this ##' argument is a call to the non-exported function ##' \code{otl_version()} which returns the current version of the ##' Open Tree of Life APIs (v2).} ##' ##' \item{ \code{dev_url} } { This argument controls whether to use ##' the development version of the API. By default, \code{dev_url} ##' is set to \code{FALSE}, using \code{dev_url = TRUE} in your ##' function calls will use the development version.} ##' ##' } ##' ##' For example, to use the development version of the API, you ##' could use: \code{tnrs_match_names("anas", dev_url=TRUE)} ##' ##' Additional arguments can also be passed to the ##' \code{\link[httr]{GET}} and \code{\link[httr]{POST}} methods. ##' ##' ##' @section Acknowledgments: ##' ##' This package was started during the Open Tree of Life ##' \href{http://blog.opentreeoflife.org/2014/06/11/apply-for-tree-for-all-a-hackathon-to-access-opentree-resources/}{Hackathon} ##' organized by OpenTree, the NESCent Hackathon Interoperability ##' Phylogenetic group, and Arbor. ##' ##' @name rotl ##' @docType package ##' @import ape NULL rotl/NEWS.md0000644000176200001440000001363113543633766012354 0ustar liggesusers## rotl 3.0.10 * Small fixes following updates to the Open Tree of Life API (no visible change for users). * Updated documentation to reflect new value in output of `tol_node_info()`. ## rotl 3.0.9 * Small fixes following updates to the Open Tree of Life API. ## rotl 3.0.7 * Minor update to vignette to address change to TNRS endpoint (underscores can't be included in the taxon names anymore). ## rotl 3.0.6 * Minor update to address warnings seen on CRAN. ## rotl 3.0.5 ### New features * The data types in the data frame returned by `tnrs_match_names` are consistent, and remain the same even after using `update()`. ### Other changes * Small internal changes that reflect changes in the data structures returned by the API. ## rotl 3.0.4 ### New features * To improve stability of results across releases of the Open Tree Taxonomy, the TNRS match with the lowest OTT id is returned instead of the first one in case a name is shared across multiple domains (related to #88) * A warning is issued when users attempt to use TNRS on duplicated names. ### Other changes * Fix typos and workaround broken API to retrieve supplementary materials in vignette. ## rotl 3.0.3 ### New features * The function `get_study_subtree` gains the argument `tip_label` to control the formatting of the tip labels, #90, reported by @bomeara * The new function `is_in_tree` takes a list of OTT ids (i.e., the output of `ott_id()`), and returns a vector of logical indiicating whether they are included in the synthetic tree (workaround #31). ### Bug fixes * The function `get_study_subtree` ignored the argument `subtree_id`, #89 reported by @bomeara ### Other chaanges * `citation("rotl")` now includes the reference to the Open Tree of Life publication. * The "How to use rotl?" vignette was updated to document the behavior of v3 of the OTL API which returns an HTTP error code 400 when the request for induced subtree includes taxa that are not in the synthetic tree (fix #84) ## rotl 3.0.1 * Fix tests and vignette to reflect changes accompanying release 6.1 of the synthetic tree * Add section in vignette "How to use rotl?" about how to get the higher taxonomy from a given taxon. * Add `CITATION` file with MEE manuscript information (#82) ## rotl 3.0.0 * `rotl` now interacts with v3.0 of the Open Tree of Life APIs. The documentation has been updated to reflect the associated changes. More information about the v3.0 of the Open Tree of Life APIs can be found [on their wiki](https://github.com/OpenTreeOfLife/germinator/wiki/Open-Tree-of-Life-Web-APIs). ### New features * New methods: `tax_sources`, `is_suppressed`, `tax_rank`, `unique_name`, `name`, `ott_id`, for objects returned by `tnrs_match_names()`, `taxonomy_taxon_info()`, `taxonomy_taxon_mrca()`, `tol_node_info()`, `tol_about()`, and `tol_mrca()`. Each of these methods have their own class. * New method `tax_lineage()` to extract the higher taxonomy from an object returned by `taxonomy_taxon_info()` (initally suggested by Matt Pennell, #57). * New method `tol_lineage()` to extract the nodes towards the root of the tree. * New print methods for `tol_node_info()` and `tol_mrca()`. * New functions `study_external_IDs()` and `taxon_external_IDs()` that return the external identifiers for a study and associated trees (e.g., DOI, TreeBase ID); and the identifiers of taxon names in taxonomic databases. The vignette "Data mashup" includes an example on how to use it. * The function `strip_ott_id()` gains the argument `remove_underscores` to remove underscores from tips in trees returned by OTL. ### Changes * Rename method `ott_taxon_name()` to `tax_name()` for consistency. * Rename method `synth_sources()` and `study_list()` to `source_list()`. * Refactor how result of query is checked and parsed (invisible to the user). ### Bug fixes * Fix bug in `studies_find_studies()`, the arguments `verbose` and `exact` were ignored. * The argument `only_current` has been dropped for the methods associated with objects returned by `tnrs_match_names()` * The print method for `tnrs_context()` duplicated some names. * `inspect()`, `update()` and `synonyms()` methods for `tnrs_match_names()` did not work if the query included unmatched taxa. ## rotl 0.5.0 * New vignette: `meta-analysis` * Added arguments `include_lineage` and `list_terminal_descendants` to `taxonomy_taxon()` * Improve warning and format of the result if one of the taxa requested doesn't match anything `tnrs_match_names`. * In the data frame returned by `tnrs_match_names`, the columns `approximate_match`, `is_synonym` and `is_deprecated` are now `logical` (instead of `character`) [issue #54] * New utility function `strip_ott_ids` removes OTT id information from a character vector, making it easier to match tip labels in trees returned by `tol_induced_subtree` to taxonomic names in other data sources. This function can also remove underscores from the taxon names. * New method `list_trees` returns a list of tree ids associated with studies. The function takes the output of `studies_find_studies` or `studies_find_trees`. * `studies_find_studies` and `studies_find_trees` gain argument `detailed` (default set to `TRUE`), that produces a data frame summarizing information (title of the study, year of publication, DOI, ids of associated trees, ...) about the studies matching the search criteria. * `get_study_tree` gains argument `deduplicate`. When `TRUE`, if the tree returned for a given study contains duplicated tip labels, they will be made unique before being parsed by NCL by appending a suffix (`_1`, `_2`, `_3`, etc.). (#46, reported by @bomeara) * New method `get_study_year` for objects of class `study_meta` that returns the year of publication of the study. * A more robust approach is used by `get_tree_ids` to identify the tree ids in the metadata returned by the API ## rotl 0.4.1 * Initial CRAN release on July, 24th 2015 rotl/MD50000644000176200001440000001162313543642072011553 0ustar liggesusers78ba5b0a1190acda6fd2f0b198141994 *DESCRIPTION 41ba68f62ff5f58f05f96a0dbd08b282 *LICENSE 8b9aef5916e67fe581c88a9bf2546712 *NAMESPACE f4aa4c6a5722535840be916ac80e2fc3 *NEWS.md ac483808e5b69aaaae252003f97e707d *R/api-collections.R 86061c453d64643efc0cbe908effd59d *R/api-studies.R 5f45dcb56bcf4230784c3cdaf8563fbc *R/api-taxonomy.R a6f1238a035c77f6669d93deea9aa2bd *R/api-tnrs.R 034e07143f57ac320d6704a96ca00899 *R/api-tol.R 2f5edd9ab9c39611ad7c52f57869102d *R/base.R 58ac44eb552c57b7b5ad996a340864f9 *R/deduplicate_labels.R c282a05519f66d3c1cb9bf86041e6202 *R/external_data.R 0606c16b6ddaac8e75772c87909d38b5 *R/is_in_tree.R 3878617ce289c163bb45f85f12b1e47c *R/match_names.R 9b6e56ea7e296aadd1c89c6ee15fa01a *R/methods.R 39c9b5a62e0eb9af93ef8c24e65eb761 *R/rotl-package.R de7acd61a314eb507424e45d12d6a4ba *R/studies-methods.R 451a2522c0cbdb4b560dd2801c289112 *R/studies-utils.R 4e146e6edb471e4cb3324b00f7dd521f *R/studies.R d89b501ece90eab10dd2fb8d7232caa3 *R/tax_utils.R 69b78f6e4074938bbf7a972fa23bbe53 *R/taxonomy.R d27906112f453f3f87ef0cb7d20df96e *R/tnrs.R 2d2215f88bd8a91d25e5299d24c24f44 *R/tol.R ad3ff267fb90ff6fd2dff89df96ce91d *R/tree_to_labels.R 1dc5b0e066843fab66ae3c908416ef5b *README.md 9252cdf199ebacefa0ab228cc2c09669 *build/vignette.rds 7692403dbe5797a06e9b38cd8d0ea3a3 *inst/CITATION f32294fe3c0918b942117022a3e1c174 *inst/doc/data_mashups.R 5c225fbf55593b9b1de4f27752d5c63b *inst/doc/data_mashups.Rmd 99e3cc03ce6bbe0412378a17ba15d606 *inst/doc/data_mashups.html 96ad58dceb69cc9ee442642d2c15388b *inst/doc/meta-analysis.R fd6fcba0debf851cb5f63b2a564131fd *inst/doc/meta-analysis.Rmd c8843250c78729599127fc936c02727c *inst/doc/meta-analysis.html 1eeabea32c4dbec78a9625c9f415a901 *inst/doc/rotl.R 828d152e5c611aeffec469ad5d93a677 *inst/doc/rotl.Rmd a2b5fe611dbe57074d5fd1e3bbf69526 *inst/doc/rotl.html 09d93b49b2b38f2495761ea86e134006 *inst/extdata/egg.csv d27a70b4799cd0a916da68498ce7c206 *inst/extdata/mcmcglmm_model.rds 5e5eb20ee387ba7192c62e629a3383f2 *inst/extdata/protist_mutation_rates.csv 059403771f006cdcb499b0eb9803eff9 *man/get_study.Rd 090bee51a46d9f478adf42c5ea2bc97d *man/get_study_meta.Rd 8ca5a9c9e9eec7d3651c21be70ef3750 *man/get_study_subtree.Rd 450fb82ec7068043a0c8bf2d0598bfa2 *man/get_study_tree.Rd 7376b3c8fbc5c5d83c06e9c2756fbb35 *man/is_in_tree.Rd aa63caf24823e451167f689f3ba9ee48 *man/list_trees.Rd e0386442684f2019f009dbd9dc75b9b3 *man/match_names-methods.Rd 86f892122bec47b0709f53c7478c55ab *man/match_names.Rd 35a35962e97907ddd889b4ff7c8e0257 *man/rotl.Rd ea8938c2220f0b358930fbaa9b9af738 *man/source_list.Rd 216476335bfc2e2662b67e1f074d12d2 *man/strip_ott_ids.Rd 23971a71f7542c37d227907fa53a6cb2 *man/studies_find_studies.Rd b703f1c5e9b47cfebf1714be973a6909 *man/studies_find_trees.Rd b52b8d1f1701bf1d7d1b4549d56ccc90 *man/studies_properties.Rd 53b91ea154206361b51b7009446151d5 *man/study_external_IDs.Rd ed749cd0a9f5e22fe03fbf6ad5b62f43 *man/synonyms.match_names.Rd ccb54bd7485bddbe4ee59b4e117a0b21 *man/tax_lineage.Rd db9ed55536b7db87701316de1e5d4493 *man/taxon_external_IDs.Rd 5f58b0e589b08000432acb5656fc2be2 *man/taxonomy-methods.Rd 3e0efd88ff66012d6eadaea7c5606aa4 *man/taxonomy_about.Rd 5fa0e3a349e2d596e24ce621c567497b *man/taxonomy_mrca.Rd e0eca3484f5a290bab377661b280f2d3 *man/taxonomy_subtree.Rd d50ea7664ac97dc3be5e5406b123237c *man/taxonomy_taxon_info.Rd c01395cc8ca421b4e607c110fd714a53 *man/tnrs_contexts.Rd a16c0de937a7de364fbff3a7e1581c44 *man/tnrs_infer_context.Rd 43788c7c376c8a2aef592de35a4f0e85 *man/tnrs_match_names.Rd 0399a2876a415a962c1c35f52ad418b6 *man/tol_about.Rd e03f7ad6f93233aec8d33d2c2ad413b1 *man/tol_induced_subtree.Rd 6e882e1e9c3b69dbddbcafd5ea08ddcc *man/tol_mrca.Rd d9e8fe104c6e576fd8df0354de21fb16 *man/tol_node_info.Rd ca675fcf48a69da215dd88bf3a6a8c0b *man/tol_subtree.Rd 2e5f11fd503ac9afd3daeada3fec43ec *tests/test-all.R 8ed001a0b57c171971944b65477c91a8 *tests/testthat/test-API.R 847fbfea80d45a1a998d6c16eda0502a *tests/testthat/test-api-studies.R dbdaeaa0e8aac809ed49ae0ca436ad77 *tests/testthat/test-api-taxonomy.R 02e21c42744195ba63bcaaefc86c5375 *tests/testthat/test-api-tnrs.R 9bf4fff54c13e1931a77faa40c9e32fe *tests/testthat/test-api-tol.R eefbe86daadd328ef5837146060dce9d *tests/testthat/test-base.R b6b8b458e2e877cd627dedbfb6f7da67 *tests/testthat/test-deduplicate_labels.R edeafd20624754a030aea18c87a31a3e *tests/testthat/test-external.R 9ac25fde1acf26f1c3aaf3d1a830974f *tests/testthat/test-match_names.R 0c807fdb420f96c40bc09a5d561c5b2d *tests/testthat/test-studies.R 09d6355d715a26f75158621b4f920b15 *tests/testthat/test-taxonomy.R 588776fb7f4c891cd0f131d497293b15 *tests/testthat/test-tnrs.R f4167dc0933dbc3ef1406a2f3f5e3339 *tests/testthat/test-tol.R 538d0e358c91e50b80fd1cc51233ffea *tests/testthat/test-tree_to_labels.R fb4b19651907e0fdb26e6f4c0581af83 *tests/tree_of_life.json 5c225fbf55593b9b1de4f27752d5c63b *vignettes/data_mashups.Rmd fd6fcba0debf851cb5f63b2a564131fd *vignettes/meta-analysis.Rmd 828d152e5c611aeffec469ad5d93a677 *vignettes/rotl.Rmd da8cb33974fa673158fea8ccf2d8bbac *vignettes/vignette.css rotl/inst/0000755000176200001440000000000013543637133012217 5ustar liggesusersrotl/inst/doc/0000755000176200001440000000000013543637133012764 5ustar liggesusersrotl/inst/doc/meta-analysis.Rmd0000644000176200001440000002351113543632562016202 0ustar liggesusers--- title: "Using the Open Tree synthesis in a comparative analysis" author: "David Winter" date: "`r Sys.Date()`" output: rmarkdown::html_vignette: css: vignette.css vignette: > %\VignetteIndexEntry{Using the Open Tree synthesis in a comparative analysis} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} %\VignetteEncoding{UTF-8} --- ## Phylogenetic Comparative Methods The development of phylogenetic comparative methods has made phylogenies and important source of data in fields as diverse as ecology, genomic and medicine. Comparative methods can be used to investigate patterns in the evolution of traits or the diversification of lineages. In other cases a phylogeny is treated as a "nuisance parameter", allowing with the autocorrelation created by the shared evolutionary history of the different species included to be controlled for. In many cases finding a tree that relates the species for which trait data are available is a rate-limiting step in such comparative analyses. Here we show how the synthetic tree provided by Open Tree of Life (and made available in R via `rotl`) can help to fill this gap. ## A phylogenetic meta-analysis To demonstrate the use of `rotl` in a comparative analysis, we will partially reproduce the results of [Rutkowska _et al_ 2014](https://doi.org/10.1111/jeb.12282). Very briefly, this study is a meta-analysis summarising the results of multiple studies testing for systematic differences in the size of eggs which contain male and female offspring. Such a difference might mean that birds invest more heavily in one sex than the other. Because this study involves data from 51 different species, Rutkowska _et al_ used a phylogenetic comparative approach to account for the shared evolutionary history among some of the studied-species. ### Gather the data If we are going to reproduce this analysis, we will first need to gather the data. Thankfully, the data is available as supplementary material from the publisher's website. We can collect the data from using `fulltext` (with the papers DOI as input) and read it into memory with `readxl::read_excel`: ```{r load-package} library(rotl) ``` ```{r egg_data} ## This should work, but Wiley has currently broken the URLs to access the ## SI. ## if (require(readxl) && require(fulltext)) { ## doi <- "10.1111/jeb.12282" ## xl_file <- try(ft_get_si(doi, 1, save.name="egg.xls"), silent = TRUE) ## egg_data <- read_excel(xl_file) ## } else { egg_data <- read.csv(system.file("extdata", "egg.csv", package = "rotl"), stringsAsFactors = FALSE ) ## } head(egg_data) ``` The most important variable in this dataset is `Zr`, which is a [normalized effect size](https://en.wikipedia.org/wiki/Fisher_transformation) for difference ,in size between eggs that contain males and females. Values close to zero come from studies that found the sex of an egg's inhabitant had little effect in its size, while large positive or negative values correspond to studies with substantial sex biases (towards males and females respectively). Since this is a meta-analysis we should produce the classic [funnel plot](https://en.wikipedia.org/wiki/Funnel_plot) with effects-size on the y-axis and precision (the inverse of the sample standard error) on the x-axis. Here we calculate precision from the sample variance (`Vzr`): ```{r eggs_in_a_funnel, fig.width=6, fig.height=3} plot(1 / sqrt(egg_data$VZr), egg_data$Zr, pch = 16, ylab = "Effect size (Zr)", xlab = "Precision (1/SE)", main = "Effect sizes for sex bias in egg size among 51 brid species" ) ``` In order to use this data later on we need to first convert it to a standard `data.frame`. We can also convert the `animal` column (the species names) to lower case, and remove the underscores in their names, which will make it easier to match names later on: ```{r, clean_eggs} egg_data <- as.data.frame(egg_data) ## Convert taxon names to lower case egg_data$animal <- tolower(egg_data$animal) ## Let's remove the underscores (_) from the taxon names egg_data$animal <- gsub("_", " ", egg_data$animal) ``` ### Find the species in OTT We can use the OTL synthesis tree to relate these species. To do so we first need to find Open Tree Taxonomy (OTT) IDs for each species. We can do that with the Taxonomic Name Resolution Service function `tnrs_match_names`: ```{r birds} taxa <- tnrs_match_names(unique(egg_data$animal), context = "Animals") head(taxa) ``` All of these species are in OTT, but a few of them go by different names in the Open Tree than we have in our data set. Because the tree `rotl` fetches will have Open Tree names, we need to create a named vector that maps the names we have for each species to the names Open Tree uses for them: ```{r bird_map} taxon_map <- structure(taxa$search_string, names = taxa$unique_name) ``` Now we can use this map to retrieve "data set names" from "OTT names": ```{r odd_duck} taxon_map["Anser caerulescens"] ``` ### Get a tree Now we can get the tree. There are really too many tips here to show nicely, so we will leave them out of this plot ```{r birds_in_a_tree, fig.width=5, fig.height=5, fig.align='center'} tr <- tol_induced_subtree(ott_id(taxa)[is_in_tree(ott_id(taxa))]) plot(tr, show.tip.label = FALSE) ``` There are a few things to note here. First, the tree has no branch lengths. At present this is true for the whole of the Open Tree synthetic tree. Some comparative methods require either branch lengths or an ultrametric tree. Before you can use one of those methods you will need to get a tree with branch lengths. You could try looking for published trees made available by the Open Tree with `studies_find_trees`. Alternatively, you could estimate branch lengths from the toplogy of a phylogeny returned by `tol_induced_subtree`, perhaps by downloading DNA sequences from the NCBI with `rentrez` or "hanging" the tree on nodes of known-age using penalized likelihood method in `ape::chronos`. In this case, we will use only the topology of the tree as input to our comparative analysis, so we can skip these steps. Second, the tip labels contain OTT IDs, which means they will not perfectly match the species names in our dataset or the taxon map that we created earlier: ```{r tip_lab} tr$tip.label[1:4] ``` Finally, the tree contains node labels for those nodes that match a higher taxonomic group, and empty character vectors (`""`) for all other nodes. Some comparative methods either do no expect node labels at all, or require all labeled nodes to have a unique name (meaning multiple "empty" labels will cause and error). We can deal with all these details easily. `rotl` provides the convenience function `strip_ott_ids` to remove the extra information from the tip labels. With the IDs removed, we can use our taxon map to replace the tip labels in the tree with the species names from dataset. ```{r clean_tips} otl_tips <- strip_ott_ids(tr$tip.label, remove_underscores = TRUE) tr$tip.label <- taxon_map[ otl_tips ] ``` Finally, we can remove the node labels by setting the `node.label` attribute of the tree to `NULL`. ```{r remove_nodes} tr$node.label <- NULL ``` ```{r match_species_tree} egg_data <- egg_data[egg_data$animal %in% tr$tip.label, ] ``` ### Perform the meta-analysis Now we have data and a tree, and we know the names in the tree match the ones in the data. It's time to do the comparative analysis. Rutkowska _et al_. used `MCMCglmm`, a Bayesian MCMC approach to fitting multi-level models,to perform their meta-analysis, and we will do the same. Of course, to properly analyse these data you would take some care in deciding on the appropriate priors to use and inspect the results carefully. In this case, we are really interested in using this as a demonstration, so we will just run a simple model. Specifically we sill fit a model where the only variable that might explain the values of `Zr` is the random factor `animal`, which corresponds to the phylogenetic relationships among species. We also provide `Zvr` as the measurement error variance, effectively adding extra weight to the results of more powerful studies. Here's how we specify and fit that model with `MCMCglmm`: ```{r model} set.seed(123) if (require(MCMCglmm, quietly = TRUE)) { pr <- list( R = list(V = 1, nu = 0.002), G = list(G1 = list(V = 1, nu = 0.002)) ) model <- MCMCglmm(Zr ~ 1, random = ~animal, pedigree = tr, mev = egg_data$VZr, prior = pr, data = egg_data, verbose = FALSE ) } else { model <- readRDS(file = system.file("extdata", "mcmcglmm_model.rds", package = "rotl")) } ``` Now that we have a result we can find out how much phylogenetic signal exists for sex-biased differences in egg-size. In a multi-level model we can use variance components to look at this, specifically the proportion of the total variance that can be explained by phylogeny is called the phylogenetic reliability, _H_. Let's calculate the _H_ for this model: ```{r PhyH} var_comps <- colMeans(model$VCV) var_comps["animal"] / sum(var_comps) ``` It appears there is almost no phylogenetic signal to the data. The relationships among species explain much less that one percent of the total variance in the data. If you were wondering, Rutkowska _et al_. report a similar result, even after adding more predictors to their model most of the variance in `Zr` was left unexplained. ## What other comparative methods can I use in R? Here we have demonstrated just one comparative analysis that you might do in R. There are an ever-growing number of packages that allow an ever-growing number of analysis to performed in R. Some "classics" like ancestral state reconstruction, phylogenetic independent contrasts and lineage through time plots are implemented in `ape`. Packages like `phytools`, `caper` and `diversitree` provide extensions to these methods. The [CRAN Phylogenetics Taskview](https://CRAN.R-project.org/view=Phylogenetics) gives a good idea of the diversity of packages and analyses that can be completed in R. rotl/inst/doc/data_mashups.Rmd0000644000176200001440000002037113543632563016106 0ustar liggesusers--- title: "Connecting data to Open Tree trees" author: "David Winter" date: "`r Sys.Date()`" output: rmarkdown::html_vignette: css: vignette.css vignette: > %\VignetteIndexEntry{Connecting data to Open Tree trees} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} \usepackage[utf8]{inputenc} --- ## Combining data from OToL and other sources. One of the major goals of `rotl` is to help users combine data from other sources with the phylogenetic trees in the Open Tree database. This examples document describes some of the ways in which a user might connect data to trees from Open Tree. ## Get Open Tree IDs to match your data. Let's say you have a dataset where each row represents a measurement taken from one species, and your goal is to put these measurements in some phylogenetic context. Here's a small example: the best estimate of the mutation rate for a set of unicellular Eukaryotes along with some other property of those species which might explain the mutation rate: ```{r, data} csv_path <- system.file("extdata", "protist_mutation_rates.csv", package = "rotl") mu <- read.csv(csv_path, stringsAsFactors = FALSE) mu ``` If we want to get a tree for these species we need to start by finding the unique ID for each of these species in the Open Tree database. We can use the Taxonomic Name Resolution Service (`tnrs`) functions to do this. Before we do that we should see if any of the taxonomic contexts, which can be used to narrow a search and avoid conflicts between different codes, apply to our group of species: ```{r, context} library(rotl) tnrs_contexts() ``` Hmm, none of those groups contain all of our species. In this case we can search using the `All life` context and the function `tnrs_match_names`: ```{r, match} taxon_search <- tnrs_match_names(names = mu$species, context_name = "All life") knitr::kable(taxon_search) ``` Good, all of our species are known to Open Tree. Note, though, that one of the names is a synonym. _Saccharomyces pombe_ is older name for what is now called _Schizosaccharomyces pombe_. As the name suggests, the Taxonomic Name Resolution Service is designed to deal with these problems (and similar ones like misspellings), but it is always a good idea to check the results of `tnrs_match_names` closely to ensure the results are what you expect. In this case we have a good ID for each of our species so we can move on. Before we do that, let's ensure we can match up our original data to the Open Tree names and IDs by adding them to our `data.frame`: ```{r, munge} mu$ott_name <- unique_name(taxon_search) mu$ott_id <- taxon_search$ott_id ``` ## Find a tree with your taxa Now let's find a tree. There are two possible options here: we can search for published studies that include our taxa or we can use the 'synthetic tree' from Open Tree. We can try both approaches. ### Published trees Before we can search for published studies or trees, we should check out the list of properties we can use to perform such searches: ```{r, properties} studies_properties() ``` We have `ottIds` for our taxa, so let's use those IDs to search for trees that contain them. Starting with our first species _Tetrahymena thermophila_ we can use `studies_find_trees` to do this search. ```{r taxon_count} studies_find_trees(property = "ot:ottId", value = as.character(ott_id(taxon_search)[1])) ``` Well... that's not very promising. We can repeat that process for all of the IDs to see if the other species are better represented. ```{r, all_taxa_count} hits <- lapply(mu$ott_id, studies_find_trees, property = "ot:ottId", detailed = FALSE) sapply(hits, function(x) sum(x[["n_matched_trees"]])) ``` OK, most of our species are not in any of the published trees available. You can help fix this sort of problem by [making sure you submit your published trees to Open Tree](https://tree.opentreeoflife.org/curator). ### A part of the synthesis tree Thankfully, we can still use the complete Tree of Life made from the combined results of all of the published trees and taxonomies that go into Open Tree. The function `tol_induced_subtree` will fetch a tree relating a set of IDs. Using the default arguments you can get a tree object into your R session: ```{r subtree, fig.width=7, fig.height=4} ott_in_tree <- ott_id(taxon_search)[is_in_tree(ott_id(taxon_search))] tr <- tol_induced_subtree(ott_ids = ott_in_tree) plot(tr) ``` ### Connect your data to the tips of your tree Now we have a tree for of our species, how can we use the tree and the data together? The package `phylobase` provide an object class called `phylo4d`, which is designed to represent a phylogeny and data associated with its tips. In oder to get our tree and data into one of these objects we have to make sure the labels in the tree and in our data match exactly. That's not quite the case at the moment (tree labels have underscores and IDs appended): ```{r, match_names} mu$ott_name[1] tr$tip.label[4] ``` `rotl` provides a convienence function `strip_ott_ids` to deal with these. ```{r, sub} tr$tip.label <- strip_ott_ids(tr$tip.label, remove_underscores = TRUE) tr$tip.label %in% mu$ott_name ``` Ok, now the tips are together we can make a new dataset. The `phylo4d()` functions matches tip labels to the row names of a `data.frame`, so let's make a new dataset that contains just the relevant data and has row names to match the tree ```{r phylobase} library(phylobase) mu_numeric <- mu[, c("mu", "pop.size", "genome.size")] rownames(mu_numeric) <- mu$ott_name tree_data <- phylo4d(tr, mu_numeric) ``` And now we can plot the data and the tree together ```{r, fig.width=7, fig.height=5} plot(tree_data) ``` ## Find external data associated with studies, trees and taxa from Open Tree In the above example we looked for a tree that related species in another dataset. Now we will go the other way, and try to find data associated with Open Tree records in other databases. ### Get external data from a study Let's imagine you were interested in extending or reproducing the results of a published study. If that study is included in Open Tree you can find it via `studies_find_studies` or `studies_find_trees` and retrieve the published trees with `get_study`. `rotl` will also help you find external. The function `study_external_IDs` retrieves the DOI for a given study, and uses that to gather some more data: ```{r} extra_data <- try(study_external_IDs("pg_1980"), silent = TRUE) if (!inherits(extra_data, "try-error")) { extra_data } ``` Here the returned object contains an `external_data_url` (in this case a link to the study in Treebase), a pubmed ID for the paper and a vector IDs for the NCBI's nuleotide database. The packages `treebase` and `rentrez` provide functions to make use of these IDs within R. As an example, let's use `rentrez` to download the first two DNA seqences and print them. ```{r} library(rentrez) seqs <- try(entrez_fetch(db = "nucleotide", id = extra_data$nucleotide_ids[1:2], rettype = "fasta"), silent = TRUE) if (inherits(seqs, "try-error")) { cat("NCBI temporarily down.") } else { cat(seqs) } ``` You could further process these sequences in R with the function `read.dna` from `ape` or save them to disk by specifying a file name with `cat`. ### Find a OTT taxon in another taxonomic database It is also possible map an Open Tree taxon to a record in another taxonomic database. For instance, if we wanted to search for data about one of the tips of the sub-tree we fetched in the example above we could do so using `taxon_external_IDs`: ```{r} Tt_ids <- taxon_external_IDs(mu$ott_id[2]) Tt_ids ``` A user could then use `rgbif` to find locality records using the gbif ID or `rentrez` to get genetic or bibliometric data about from the NCBI's databases. ## What next The demonstration gets you to the point of visualizing your data in a phylogenetic context. But there's a lot more you do with this sort of data in R. For instance, you could use packages like `ape`, `caper`, `phytools` and `mcmcGLMM` to perform phylogenetic comparative analyses of your data. You could gather more data on your species using packages that connect to trait databases like `rfishbase`, `AntWeb` or `rnpn` which provides data from the US National Phenology Network. You could also use `rentrez` to find genetic data for each of your species, and use that data to generate branch lengths for the phylogeny. rotl/inst/doc/data_mashups.R0000644000176200001440000000501413543637105015557 0ustar liggesusers## ---- data--------------------------------------------------------------- csv_path <- system.file("extdata", "protist_mutation_rates.csv", package = "rotl") mu <- read.csv(csv_path, stringsAsFactors = FALSE) mu ## ---- context------------------------------------------------------------ library(rotl) tnrs_contexts() ## ---- match-------------------------------------------------------------- taxon_search <- tnrs_match_names(names = mu$species, context_name = "All life") knitr::kable(taxon_search) ## ---- munge-------------------------------------------------------------- mu$ott_name <- unique_name(taxon_search) mu$ott_id <- taxon_search$ott_id ## ---- properties--------------------------------------------------------- studies_properties() ## ----taxon_count--------------------------------------------------------- studies_find_trees(property = "ot:ottId", value = as.character(ott_id(taxon_search)[1])) ## ---- all_taxa_count----------------------------------------------------- hits <- lapply(mu$ott_id, studies_find_trees, property = "ot:ottId", detailed = FALSE) sapply(hits, function(x) sum(x[["n_matched_trees"]])) ## ----subtree, fig.width=7, fig.height=4--------------------------------- ott_in_tree <- ott_id(taxon_search)[is_in_tree(ott_id(taxon_search))] tr <- tol_induced_subtree(ott_ids = ott_in_tree) plot(tr) ## ---- match_names-------------------------------------------------------- mu$ott_name[1] tr$tip.label[4] ## ---- sub---------------------------------------------------------------- tr$tip.label <- strip_ott_ids(tr$tip.label, remove_underscores = TRUE) tr$tip.label %in% mu$ott_name ## ----phylobase----------------------------------------------------------- library(phylobase) mu_numeric <- mu[, c("mu", "pop.size", "genome.size")] rownames(mu_numeric) <- mu$ott_name tree_data <- phylo4d(tr, mu_numeric) ## ---- fig.width=7, fig.height=5----------------------------------------- plot(tree_data) ## ------------------------------------------------------------------------ extra_data <- try(study_external_IDs("pg_1980"), silent = TRUE) if (!inherits(extra_data, "try-error")) { extra_data } ## ------------------------------------------------------------------------ library(rentrez) seqs <- try(entrez_fetch(db = "nucleotide", id = extra_data$nucleotide_ids[1:2], rettype = "fasta"), silent = TRUE) if (inherits(seqs, "try-error")) { cat("NCBI temporarily down.") } else { cat(seqs) } ## ------------------------------------------------------------------------ Tt_ids <- taxon_external_IDs(mu$ott_id[2]) Tt_ids rotl/inst/doc/meta-analysis.R0000644000176200001440000000546013543637122015661 0ustar liggesusers## ----load-package-------------------------------------------------------- library(rotl) ## ----egg_data------------------------------------------------------------ ## This should work, but Wiley has currently broken the URLs to access the ## SI. ## if (require(readxl) && require(fulltext)) { ## doi <- "10.1111/jeb.12282" ## xl_file <- try(ft_get_si(doi, 1, save.name="egg.xls"), silent = TRUE) ## egg_data <- read_excel(xl_file) ## } else { egg_data <- read.csv(system.file("extdata", "egg.csv", package = "rotl"), stringsAsFactors = FALSE ) ## } head(egg_data) ## ----eggs_in_a_funnel, fig.width=6, fig.height=3------------------------- plot(1 / sqrt(egg_data$VZr), egg_data$Zr, pch = 16, ylab = "Effect size (Zr)", xlab = "Precision (1/SE)", main = "Effect sizes for sex bias in egg size among 51 brid species" ) ## ---- clean_eggs--------------------------------------------------------- egg_data <- as.data.frame(egg_data) ## Convert taxon names to lower case egg_data$animal <- tolower(egg_data$animal) ## Let's remove the underscores (_) from the taxon names egg_data$animal <- gsub("_", " ", egg_data$animal) ## ----birds--------------------------------------------------------------- taxa <- tnrs_match_names(unique(egg_data$animal), context = "Animals") head(taxa) ## ----bird_map------------------------------------------------------------ taxon_map <- structure(taxa$search_string, names = taxa$unique_name) ## ----odd_duck------------------------------------------------------------ taxon_map["Anser caerulescens"] ## ----birds_in_a_tree, fig.width=5, fig.height=5, fig.align='center'------ tr <- tol_induced_subtree(ott_id(taxa)[is_in_tree(ott_id(taxa))]) plot(tr, show.tip.label = FALSE) ## ----tip_lab------------------------------------------------------------- tr$tip.label[1:4] ## ----clean_tips---------------------------------------------------------- otl_tips <- strip_ott_ids(tr$tip.label, remove_underscores = TRUE) tr$tip.label <- taxon_map[ otl_tips ] ## ----remove_nodes-------------------------------------------------------- tr$node.label <- NULL ## ----match_species_tree-------------------------------------------------- egg_data <- egg_data[egg_data$animal %in% tr$tip.label, ] ## ----model--------------------------------------------------------------- set.seed(123) if (require(MCMCglmm, quietly = TRUE)) { pr <- list( R = list(V = 1, nu = 0.002), G = list(G1 = list(V = 1, nu = 0.002)) ) model <- MCMCglmm(Zr ~ 1, random = ~animal, pedigree = tr, mev = egg_data$VZr, prior = pr, data = egg_data, verbose = FALSE ) } else { model <- readRDS(file = system.file("extdata", "mcmcglmm_model.rds", package = "rotl")) } ## ----PhyH---------------------------------------------------------------- var_comps <- colMeans(model$VCV) var_comps["animal"] / sum(var_comps) rotl/inst/doc/rotl.Rmd0000644000176200001440000002552013543632564014417 0ustar liggesusers--- title: "How to use rotl?" author: "François Michonneau" date: "`r Sys.Date()`" output: rmarkdown::html_vignette: css: vignette.css vignette: > %\VignetteIndexEntry{How to use rotl?} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} \usepackage[utf8]{inputenc} --- `rotl` provides an interface to the Open Tree of Life (OTL) API and allows users to query the API, retrieve parts of the Tree of Life and integrate these parts with other R packages. The OTL API provides services to access: * the **Tree of Life** a.k.a. TOL (the synthetic tree): a single draft tree that is a combination of **the OTL taxonomy** and the **source trees** (studies) * the **Taxonomic name resolution services** a.k.a. TNRS: the methods for resolving taxonomic names to the internal identifiers used by the TOL and the GOL (the `ott ids`). * the **Taxonomy** a.k.a. OTT (for Open Tree Taxonomy): which represents the synthesis of the different taxonomies used as a backbone of the TOL when no studies are available. * the **Studies** containing the source trees used to build the TOL, and extracted from the scientific literature. In `rotl`, each of these services correspond to functions with different prefixes: | Service | `rotl` prefix | |---------------|---------------| | Tree of Life | `tol_` | | TNRS | `tnrs_` | | Taxonomy | `taxonomy_` | | Studies | `studies_` | `rotl` also provides a few other functions and methods that can be used to extract relevant information from the objects returned by these functions. ## Demonstration of a basic workflow The most common use for `rotl` is probably to start from a list of species and get the relevant parts of the tree for these species. This is a two step process: 1. the species names need to be matched to their `ott_id` (the Open Tree Taxonomy identifiers) using the Taxonomic name resolution services (TNRS) 1. these `ott_id` will then be used to retrieve the relevant parts of the Tree of Life. ### Step 1: Matching taxonomy to the `ott_id` Let's start by doing a search on a diverse group of taxa: a tree frog (genus _Hyla_), a fish (genus _Salmo_), a sea urchin (genus _Diadema_), and a nautilus (genus _Nautilus_). ```{r} library(rotl) taxa <- c("Hyla", "Salmo", "Diadema", "Nautilus") resolved_names <- tnrs_match_names(taxa) ``` It's always a good idea to check that the resolved names match what you intended: `r knitr::kable(resolved_names)` The column `unique_name` sometimes indicates the higher taxonomic level associated with the name. The column `number_matches` indicates the number of `ott_id` that corresponds to a given name. In this example, our search on _Diadema_ returns 2 matches, and the one returned by default is indeed the sea urchin that we want for our query. The argument `context_name` allows you to limit the taxonomic scope of your search. _Diadema_ is also the genus name of a fungus. To ensure that our search is limited to animal names, we could do: ```{r} resolved_names <- tnrs_match_names(taxa, context_name = "Animals") ``` If you are trying to build a tree with deeply divergent taxa that the argument `context_name` cannot fix, see "How to change the ott ids assigned to my taxa?" in the FAQ below. ### Step 2: Getting the tree corresponding to our taxa Now that we have the correct `ott_id` for our taxa, we can ask for the tree using the `tol_induced_subtree()` function. By default, the object returned by `tol_induced_subtree` is a phylo object (from the [ape](https://cran.r-project.org/package=ape) package), so we can plot it directly. ```{r, fig.width=7, fig.height=4} my_tree <- tol_induced_subtree(ott_ids = resolved_names$ott_id) plot(my_tree, no.margin = TRUE) ``` ## FAQ ### How to change the ott ids assigned to my taxa? If you realize that `tnrs_match_names` assigns the incorrect taxonomic group to your name (e.g., because of synonymy) and changing the `context_name` does not help, you can use the function `inspect`. This function takes the object resulting from `tnrs_match_names()`, and either the row number, the taxon name (you used in your search in lowercase), or the `ott_id` returned by the initial query. To illustrate this, let's re-use the previous query but this time pretending that we are interested in the fungus _Diadema_ and not the sea urchin: ```{r} taxa <- c("Hyla", "Salmo", "Diadema", "Nautilus") resolved_names <- tnrs_match_names(taxa) resolved_names inspect(resolved_names, taxon_name = "diadema") ``` In our case, we want the second row in this data frame to replace the information that initially matched for _Diadema_. We can now use the `update()` function, to change to the correct taxa (the fungus not the sea urchin): ```{r} resolved_names <- update(resolved_names, taxon_name = "diadema", new_row_number = 2 ) ## we could also have used the ott_id to replace this taxon: ## resolved_names <- update(resolved_names, taxon_name = "diadema", ## new_ott_id = 4930522) ``` And now our `resolved_names` data frame includes the taxon we want: `r knitr::kable(resolved_names)` ### How do I know that the taxa I'm asking for is the correct one? The function `taxonomy_taxon_info()` takes `ott_ids` as arguments and returns taxonomic information about the taxa. This output can be passed to some helpers functions to extract the relevant information. Let's illustrate this with our _Diadema_ example ```{r} diadema_info <- taxonomy_taxon_info(631176) tax_rank(diadema_info) synonyms(diadema_info) tax_name(diadema_info) ``` In some cases, it might also be useful to investigate the taxonomic tree descending from an `ott_id` to check that it's the correct taxon and to determine the species included in the Open Tree Taxonomy: ```{r} diadema_tax_tree <- taxonomy_subtree(631176) diadema_tax_tree ``` By default, this function return all taxa (including self, and internal) descending from this `ott_id` but it also possible to return `phylo` object. ### How do I get the tree for a particular taxonomic group? If you are looking to get the tree for a particular taxonomic group, you need to first identify it by its node id or ott id, and then use the `tol_subtree()` function: ```{r, fig.width=7, fig.height=4} mono_id <- tnrs_match_names("Monotremata") mono_tree <- tol_subtree(ott_id = ott_id(mono_id)) plot(mono_tree) ``` ### How do I find trees from studies focused on my favourite taxa? The function `studies_find_trees()` allows the user to search for studies matching a specific criteria. The function `studies_properties()` returns the list of properties that can be used in the search. ```{r} furry_studies <- studies_find_studies(property = "ot:focalCladeOTTTaxonName", value = "Mammalia") furry_ids <- furry_studies$study_ids ``` Now that we know the `study_id`, we can ask for the meta data information associated with this study: ```{r} furry_meta <- get_study_meta("pg_2550") get_publication(furry_meta) ## The citation for the source of the study get_tree_ids(furry_meta) ## This study has 10 trees associated with it candidate_for_synth(furry_meta) ## None of these trees are yet included in the OTL ``` Using `get_study("pg_2550")` would returns a `multiPhylo` object (default) with all the trees associated with this particular study, while `get_study_tree("pg_2550", "tree5513")` would return one of these trees. ### The tree returned by the API has duplicated tip labels, how can I work around it? You may encounter the following error message: ``` Error in rncl(file = file, ...) : Taxon number 39 (coded by the token Pratia angulata) has already been encountered in this tree. Duplication of taxa in a tree is prohibited. ``` This message occurs as duplicate labels are not allowed in the NEXUS format and it is stricly enforced by the part of the code used by `rotl` to import the trees in memory. If you use a version of `rotl` more recent than 0.4.1, this should not happen by default for the function `get_study_tree`. If it happens with another function, please [let us know](https://github.com/ropensci/rotl/issues). The easiest way to work around this is to save the tree in a file, and use APE to read it in memory: ```{r, eval=FALSE} get_study_tree( study_id = "pg_710", tree_id = "tree1277", tip_label = "ott_taxon_name", file = "/tmp/tree.tre", file_format = "newick" ) tr <- ape::read.tree(file = "/tmp/tree.tre") ``` ### How do I get the higher taxonomy for a given taxa? If you encounter a taxon name you are not familiar with, it might be useful to obtain its higher taxonomy to see where it fits in the tree of life. We can combine several taxonomy methods to extract this information easily. ```{r} giant_squid <- tnrs_match_names("Architeuthis") tax_lineage(taxonomy_taxon_info(ott_id(giant_squid), include_lineage = TRUE)) ``` ### Why are OTT IDs discovered with `rotl` missing from an induced subtree? Some taxonomic names that can be retrieved through the taxonomic name resolution service are not part of the Open Tree's synthesis tree. These are usually traditional higher-level taxa that have been found to be paraphyletic. For instance, if you wanted to fetch a tree relating the three birds that go into a [Turkducken](https://en.wikipedia.org/wiki/Turducken) as well as the pork used for stuffing, you might search for the turkey, duck, chicken, and pork genera: ```{r} turducken <- c("Meleagris", "Anas", "Gallus", "Sus") taxa <- tnrs_match_names(turducken, context = "Animals") taxa ``` We have the OTT ids for each genus, however, if we tried to get the induced subtree from these results, we would get an error: ```{r, error=TRUE} tr <- tol_induced_subtree(ott_id(taxa)) ``` As the error message suggests, some of the taxa are not found in the synthetic tree. This occurs for 2 main reasons: either the taxa is invalid, or it is part of a group that is not monophyletic in the synthetic tree. There are two ways to get around this issue: (1) removing the taxa that are not part of the Open Tree; (2) using the complete species name. #### Removing the taxa missing from the synthetic tree To help with this situation, `rotl` provides a way to identify the OTT ids that are not part of the synthetic tree. The function `is_in_tree()` takes the output of the `ott_id()` function and returns a vector of logical indicating whether the taxa are part of the synthetic tree. We can then use to only keep the taxa that appear in the synthetic tree: ```{r} in_tree <- is_in_tree(ott_id(taxa)) in_tree tr <- tol_induced_subtree(ott_id(taxa)[in_tree]) ``` #### Using the full taxonomic names The best way to avoid these problems is to specify complete species names (species being the lowest level of classification in the Open Tree taxonomy they are guaranteed to be monophyletic): ```{r, fig.width=7, fig.height=4} turducken_spp <- c("Meleagris gallopavo", "Anas platyrhynchos", "Gallus gallus", "Sus scrofa") taxa <- tnrs_match_names(turducken_spp, context = "Animals") tr <- tol_induced_subtree(ott_id(taxa)) plot(tr) ``` rotl/inst/doc/rotl.html0000644000176200001440000021600513543637133014636 0ustar liggesusers How to use rotl?

How to use rotl?

François Michonneau

2019-09-28

rotl provides an interface to the Open Tree of Life (OTL) API and allows users to query the API, retrieve parts of the Tree of Life and integrate these parts with other R packages.

The OTL API provides services to access:

  • the Tree of Life a.k.a. TOL (the synthetic tree): a single draft tree that is a combination of the OTL taxonomy and the source trees (studies)
  • the Taxonomic name resolution services a.k.a. TNRS: the methods for resolving taxonomic names to the internal identifiers used by the TOL and the GOL (the ott ids).
  • the Taxonomy a.k.a. OTT (for Open Tree Taxonomy): which represents the synthesis of the different taxonomies used as a backbone of the TOL when no studies are available.
  • the Studies containing the source trees used to build the TOL, and extracted from the scientific literature.

In rotl, each of these services correspond to functions with different prefixes:

Service rotl prefix
Tree of Life tol_
TNRS tnrs_
Taxonomy taxonomy_
Studies studies_

rotl also provides a few other functions and methods that can be used to extract relevant information from the objects returned by these functions.

Demonstration of a basic workflow

The most common use for rotl is probably to start from a list of species and get the relevant parts of the tree for these species. This is a two step process:

  1. the species names need to be matched to their ott_id (the Open Tree Taxonomy identifiers) using the Taxonomic name resolution services (TNRS)
  2. these ott_id will then be used to retrieve the relevant parts of the Tree of Life.

Step 1: Matching taxonomy to the ott_id

Let’s start by doing a search on a diverse group of taxa: a tree frog (genus Hyla), a fish (genus Salmo), a sea urchin (genus Diadema), and a nautilus (genus Nautilus).

It’s always a good idea to check that the resolved names match what you intended:

search_string unique_name approximate_match ott_id is_synonym flags number_matches
hyla Hyla FALSE 1062216 FALSE 1
salmo Salmo FALSE 982359 FALSE 1
diadema Diadema (genus in Holozoa) FALSE 631176 FALSE 5
nautilus Nautilus FALSE 616358 FALSE 1

The column unique_name sometimes indicates the higher taxonomic level associated with the name. The column number_matches indicates the number of ott_id that corresponds to a given name. In this example, our search on Diadema returns 2 matches, and the one returned by default is indeed the sea urchin that we want for our query. The argument context_name allows you to limit the taxonomic scope of your search. Diadema is also the genus name of a fungus. To ensure that our search is limited to animal names, we could do:

If you are trying to build a tree with deeply divergent taxa that the argument context_name cannot fix, see “How to change the ott ids assigned to my taxa?” in the FAQ below.

Step 2: Getting the tree corresponding to our taxa

Now that we have the correct ott_id for our taxa, we can ask for the tree using the tol_induced_subtree() function. By default, the object returned by tol_induced_subtree is a phylo object (from the ape package), so we can plot it directly.

## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes
## with labels: Protostomia ott189832, mrcaott24ott6612, Lophotrochozoa
## ott155737, mrcaott24ott56, mrcaott56ott5497, Mollusca ott802117,
## mrcaott56ott1881, mrcaott1881ott102410, Cephalopoda ott7368, Nautiloidea
## ott854446, Nautilida ott854452, Nautilidae ott616361, Chordata ott125642,
## mrcaott42ott658, Craniata (subphylum in Deuterostomia) ott947318,
## Vertebrata (subphylum in Opisthokonta) ott801601, Gnathostomata (superclass
## in phylum Chordata) ott278114, Teleostomi ott114656, Sarcopterygii
## ott458402, Dipnotetrapodomorpha ott4940726, Tetrapoda ott229562, Amphibia
## ott544595, Batrachia ott471197, Anura (order in Opisthokonta) ott991547,
## mrcaott114ott3129, mrcaott114ott37876, mrcaott114ott18818, Neobatrachia
## ott535804, mrcaott114ott309463, mrcaott114ott177, mrcaott177ott7464,
## mrcaott177ott2199, mrcaott177ott29310, mrcaott177ott1321, Hylidae
## ott535782, mrcaott177ott17126, mrcaott177ott22852, mrcaott177ott2732,
## mrcaott2732ott3289, mrcaott3289ott40328, mrcaott3289ott173489,
## mrcaott3289ott110534, mrcaott3289ott489758, mrcaott3289ott59160,
## Actinopterygii ott773483, Actinopteri ott285821, Neopterygii
## ott471203, Teleostei ott212201, Osteoglossocephalai ott5506109,
## Clupeocephala ott285819, Euteleosteomorpha ott5517919, mrcaott274ott392,
## mrcaott274ott595, Protacanthopterygii ott1024043, mrcaott274ott3887,
## mrcaott3887ott9371, Salmoniformes ott216171, Salmonidae ott739933,
## mrcaott3887ott28511, Salmoninae ott936925, mrcaott360ott10516,
## Echinodermata ott451020, Eleutherozoa ott317277, Echinozoa ott669475,
## Echinoidea ott669472, Diadematacea ott631171, Diadematoida ott631174,
## Diadematidae ott631173

FAQ

How to change the ott ids assigned to my taxa?

If you realize that tnrs_match_names assigns the incorrect taxonomic group to your name (e.g., because of synonymy) and changing the context_name does not help, you can use the function inspect. This function takes the object resulting from tnrs_match_names(), and either the row number, the taxon name (you used in your search in lowercase), or the ott_id returned by the initial query.

To illustrate this, let’s re-use the previous query but this time pretending that we are interested in the fungus Diadema and not the sea urchin:

##   search_string                unique_name approximate_match  ott_id
## 1          hyla                       Hyla             FALSE 1062216
## 2         salmo                      Salmo             FALSE  982359
## 3       diadema Diadema (genus in Holozoa)             FALSE  631176
## 4      nautilus                   Nautilus             FALSE  616358
##   is_synonym flags number_matches
## 1      FALSE                    1
## 2      FALSE                    1
## 3      FALSE                    5
## 4      FALSE                    1
##   search_string                       unique_name approximate_match
## 1       diadema    Diadema (genus in Nucletmycea)             FALSE
## 2       diadema        Diadema (genus in Holozoa)             FALSE
## 3       diadema Garrettia (genus in Opisthokonta)             FALSE
## 4       diadema                       Diademoides             FALSE
## 5       diadema                        Hypolimnas             FALSE
##    ott_id is_synonym          flags number_matches
## 1 4930522      FALSE                             5
## 2  631176      FALSE                             5
## 3 6356093       TRUE                             5
## 4 4024672       TRUE SIBLING_HIGHER              5
## 5  643831       TRUE                             5

In our case, we want the second row in this data frame to replace the information that initially matched for Diadema. We can now use the update() function, to change to the correct taxa (the fungus not the sea urchin):

And now our resolved_names data frame includes the taxon we want:

search_string unique_name approximate_match ott_id is_synonym flags number_matches
hyla Hyla FALSE 1062216 FALSE 1
salmo Salmo FALSE 982359 FALSE 1
diadema Diadema (genus in Holozoa) FALSE 631176 FALSE 5
nautilus Nautilus FALSE 616358 FALSE 1

How do I know that the taxa I’m asking for is the correct one?

The function taxonomy_taxon_info() takes ott_ids as arguments and returns taxonomic information about the taxa. This output can be passed to some helpers functions to extract the relevant information. Let’s illustrate this with our Diadema example

## $`Diadema (genus in Holozoa)`
## [1] "genus"
## 
## attr(,"class")
## [1] "otl_rank" "list"
## $`Diadema (genus in Holozoa)`
## [1] "Centrechinus"           "Centrechinus (Diadema)"
## [3] "Cidaris (Diadema)"      "Diamema"               
## 
## attr(,"class")
## [1] "otl_synonyms" "list"
## $`Diadema (genus in Holozoa)`
## [1] "Diadema"
## 
## attr(,"class")
## [1] "otl_name" "list"

In some cases, it might also be useful to investigate the taxonomic tree descending from an ott_id to check that it’s the correct taxon and to determine the species included in the Open Tree Taxonomy:

## $tip_label
##  [1] "Diadema_sp._seto17_ott587478"            
##  [2] "Diadema_sp._DSM1_ott219999"              
##  [3] "Diadema_paucispinum_ott312263"           
##  [4] "Diadema_mexicanum_ott639130"             
##  [5] "Diadema_sp._dsm5_ott587480"              
##  [6] "Diadema_sp._DSM8_ott587486"              
##  [7] "Diadema_sp._DSM2_ott587483"              
##  [8] "Diadema_sp._DSM6_ott771059"              
##  [9] "Diadema_sp._DSM7_ott587487"              
## [10] "Diadema_sp._seto18_ott66623"             
## [11] "Diadema_sp._seto16_ott312262"            
## [12] "Diadema_sp._seto9_ott587485"             
## [13] "Diadema_sp._seto38_ott66625"             
## [14] "Diadema_setosum_ott631175"               
## [15] "Diadema_sp._seto19_ott66624"             
## [16] "Diadema_sp._DJN9_ott66626"               
## [17] "Diademasp.CS-2014ott5502179"             
## [18] "Diadema_savignyi_ott395692"              
## [19] "Diadema_sp._SETO15_ott587479"            
## [20] "Diadema_palmeri_ott836860"               
## [21] "Diadema_sp._seto35_ott66618"             
## [22] "Diadema_sp._DSM4_ott587481"              
## [23] "Diadema_sp._DSM3_ott587482"              
## [24] "Diadema_antillarum_antillarum_ott4147370"
## [25] "Diadema_antillarum_scensionis_ott220009" 
## [26] "Diadema_africanum_ott4147369"            
## [27] "Diadema_sp._seto10_ott587484"            
## [28] "Diadema_vetus_ott5725747"                
## [29] "Diadema_principeana_ott5725746"          
## [30] "Diadema_ascensionis_ott4950423"          
## [31] "Diadema_lobatum_ott4950422"              
## [32] "Diadema_pseudodiadema_ott4950421"        
## [33] "Diadema_africana_ott5502180"             
## 
## $edge_label
## [1] "Diadema_antillarum_ott1022356" "'Diadema(genusinHolozoa"      
## [3] "ott631176'"

By default, this function return all taxa (including self, and internal) descending from this ott_id but it also possible to return phylo object.

How do I get the tree for a particular taxonomic group?

If you are looking to get the tree for a particular taxonomic group, you need to first identify it by its node id or ott id, and then use the tol_subtree() function:

## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes
## with labels: Tachyglossus ott16047, Tachyglossus aculeatus ott16038,
## Ornithorhynchidae ott344066, Ornithorhynchus ott962391

How do I find trees from studies focused on my favourite taxa?

The function studies_find_trees() allows the user to search for studies matching a specific criteria. The function studies_properties() returns the list of properties that can be used in the search.

Now that we know the study_id, we can ask for the meta data information associated with this study:

## [1] "O'Leary, Maureen A., Marc Allard, Michael J. Novacek, Jin Meng, and John Gatesy. 2004. \"Building the mammalian sector of the tree of life: Combining different data and a discussion of divergence times for placental mammals.\" In: Cracraft J., & Donoghue M., eds. Assembling the Tree of Life. pp. 490-516. Oxford, United Kingdom, Oxford University Press."
## attr(,"DOI")
## [1] ""
##  [1] "tree5513" "tree5515" "tree5516" "tree5517" "tree5518" "tree5519"
##  [7] "tree5520" "tree5521" "tree5522" "tree5523"
## NULL

Using get_study("pg_2550") would returns a multiPhylo object (default) with all the trees associated with this particular study, while get_study_tree("pg_2550", "tree5513") would return one of these trees.

The tree returned by the API has duplicated tip labels, how can I work around it?

You may encounter the following error message:

Error in rncl(file = file, ...) : Taxon number 39 (coded by the token Pratia
angulata) has already been encountered in this tree. Duplication of taxa in a
tree is prohibited.

This message occurs as duplicate labels are not allowed in the NEXUS format and it is stricly enforced by the part of the code used by rotl to import the trees in memory.

If you use a version of rotl more recent than 0.4.1, this should not happen by default for the function get_study_tree. If it happens with another function, please let us know.

The easiest way to work around this is to save the tree in a file, and use APE to read it in memory:

How do I get the higher taxonomy for a given taxa?

If you encounter a taxon name you are not familiar with, it might be useful to obtain its higher taxonomy to see where it fits in the tree of life. We can combine several taxonomy methods to extract this information easily.

## $`564394`
##          rank               name        unique_name  ott_id
## 1      family     Architeuthidae     Architeuthidae  564393
## 2    suborder          Oegopsina          Oegopsina   43352
## 3       order           Teuthida           Teuthida  380472
## 4  superorder     Decapodiformes     Decapodiformes  854107
## 5  infraclass       Neocoleoidea       Neocoleoidea  329546
## 6    subclass          Coleoidea          Coleoidea    7371
## 7       class        Cephalopoda        Cephalopoda    7368
## 8      phylum           Mollusca           Mollusca  802117
## 9     no rank     Lophotrochozoa     Lophotrochozoa  155737
## 10    no rank        Protostomia        Protostomia  189832
## 11    no rank          Bilateria          Bilateria  117569
## 12    no rank          Eumetazoa          Eumetazoa  641038
## 13    kingdom            Metazoa            Metazoa  691846
## 14    no rank            Holozoa            Holozoa 5246131
## 15    no rank       Opisthokonta       Opisthokonta  332573
## 16     domain          Eukaryota          Eukaryota  304358
## 17    no rank cellular organisms cellular organisms   93302
## 18    no rank               life               life  805080

Why are OTT IDs discovered with rotl missing from an induced subtree?

Some taxonomic names that can be retrieved through the taxonomic name resolution service are not part of the Open Tree’s synthesis tree. These are usually traditional higher-level taxa that have been found to be paraphyletic.

For instance, if you wanted to fetch a tree relating the three birds that go into a Turkducken as well as the pork used for stuffing, you might search for the turkey, duck, chicken, and pork genera:

##   search_string unique_name approximate_match ott_id is_synonym flags
## 1     meleagris   Meleagris             FALSE 446481      FALSE      
## 2          anas        Anas             FALSE 765185      FALSE      
## 3        gallus      Gallus             FALSE 153562      FALSE      
## 4           sus         Sus             FALSE 730021      FALSE      
##   number_matches
## 1              2
## 2              1
## 3              3
## 4              1

We have the OTT ids for each genus, however, if we tried to get the induced subtree from these results, we would get an error:

## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes
## with labels: Mammalia ott244265, Theria (subclass in Deuterostomia)
## ott229558, Eutheria (in Deuterostomia) ott683263, Boreoeutheria ott5334778,
## Laurasiatheria ott392223, mrcaott1548ott4697, mrcaott1548ott6790,
## mrcaott1548ott3021, Cetartiodactyla ott622916, mrcaott1548ott21987,
## Suina ott916745, Suidae ott730008, Sauropsida ott639642, Sauria (order in
## Opisthokonta) ott329823, Archelosauria ott4947372, Archosauria ott335588,
## Dinosauria ott90215, Coelurosauria ott664351, Theropoda ott664350,
## Saurischia ott90223, Aves ott81461, Neognathae ott241846, Galliformes
## ott837585, mrcaott4765ott75785, mrcaott4765ott104461, mrcaott4765ott151684,
## mrcaott4765ott54193, mrcaott4765ott49319, mrcaott4765ott415487,
## mrcaott4765ott51354, mrcaott4765ott53700, mrcaott4765ott446490,
## Meleagridinae ott781250, mrcaott49310ott102705, mrcaott49310ott51349,
## mrcaott49310ott153554, mrcaott153554ott867027, Anseriformes ott241841,
## mrcaott30843ott714464, Anatidae ott765193, mrcaott30843ott75874,
## mrcaott30843ott962771, mrcaott30843ott145504, mrcaott30843ott30847,
## mrcaott30843ott196654, mrcaott30843ott30845

As the error message suggests, some of the taxa are not found in the synthetic tree. This occurs for 2 main reasons: either the taxa is invalid, or it is part of a group that is not monophyletic in the synthetic tree. There are two ways to get around this issue: (1) removing the taxa that are not part of the Open Tree; (2) using the complete species name.

Removing the taxa missing from the synthetic tree

To help with this situation, rotl provides a way to identify the OTT ids that are not part of the synthetic tree. The function is_in_tree() takes the output of the ott_id() function and returns a vector of logical indicating whether the taxa are part of the synthetic tree. We can then use to only keep the taxa that appear in the synthetic tree:

## Meleagris      Anas    Gallus       Sus 
##      TRUE     FALSE      TRUE      TRUE
## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes
## with labels: Mammalia ott244265, Theria (subclass in Deuterostomia)
## ott229558, Eutheria (in Deuterostomia) ott683263, Boreoeutheria ott5334778,
## Laurasiatheria ott392223, mrcaott1548ott4697, mrcaott1548ott6790,
## mrcaott1548ott3021, Cetartiodactyla ott622916, mrcaott1548ott21987,
## Suina ott916745, Suidae ott730008, Sauropsida ott639642, Sauria (order
## in Opisthokonta) ott329823, Archelosauria ott4947372, Archosauria
## ott335588, Dinosauria ott90215, Coelurosauria ott664351, Theropoda
## ott664350, Saurischia ott90223, Aves ott81461, Neognathae ott241846,
## Galloanserae ott5839486, Galliformes ott837585, mrcaott4765ott75785,
## mrcaott4765ott104461, mrcaott4765ott151684, mrcaott4765ott54193,
## mrcaott4765ott49319, mrcaott4765ott415487, mrcaott4765ott51354,
## mrcaott4765ott53700, mrcaott4765ott446490, Meleagridinae ott781250,
## mrcaott49310ott102705, mrcaott49310ott51349, mrcaott49310ott153554,
## mrcaott153554ott867027

Using the full taxonomic names

The best way to avoid these problems is to specify complete species names (species being the lowest level of classification in the Open Tree taxonomy they are guaranteed to be monophyletic):

## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes
## with labels: Mammalia ott244265, Theria (subclass in Deuterostomia)
## ott229558, Eutheria (in Deuterostomia) ott683263, Boreoeutheria ott5334778,
## Laurasiatheria ott392223, mrcaott1548ott4697, mrcaott1548ott6790,
## mrcaott1548ott3021, Cetartiodactyla ott622916, mrcaott1548ott21987, Suina
## ott916745, Suidae ott730008, Sus ott730021, Sauropsida ott639642, Sauria
## (order in Opisthokonta) ott329823, Archelosauria ott4947372, Archosauria
## ott335588, Dinosauria ott90215, Coelurosauria ott664351, Theropoda
## ott664350, Saurischia ott90223, Aves ott81461, Neognathae ott241846,
## Galliformes ott837585, mrcaott4765ott75785, mrcaott4765ott104461,
## mrcaott4765ott151684, mrcaott4765ott54193, mrcaott4765ott49319,
## mrcaott4765ott415487, mrcaott4765ott51354, mrcaott4765ott53700,
## mrcaott4765ott446490, Meleagridinae ott781250, Meleagris ott446481,
## mrcaott49310ott102705, mrcaott49310ott51349, mrcaott49310ott153554,
## mrcaott153554ott867027, Gallus ott153562, mrcaott153554ott153572,
## mrcaott153572ott240568, Anseriformes ott241841, mrcaott30843ott714464,
## Anatidae ott765193, mrcaott30843ott75874, mrcaott30843ott962771,
## mrcaott30843ott145504, mrcaott30843ott30847, mrcaott30843ott196654,
## mrcaott30843ott30845, mrcaott30845ott30850, mrcaott30850ott82420,
## mrcaott30850ott82414, mrcaott30850ott30858, mrcaott30850ott30855,
## mrcaott30850ott604172, mrcaott30850ott82410, mrcaott82410ott339494,
## mrcaott82410ott604175, mrcaott82410ott604182, mrcaott82410ott190881

rotl/inst/doc/meta-analysis.html0000644000176200001440000015044413543637122016427 0ustar liggesusers Using the Open Tree synthesis in a comparative analysis

Using the Open Tree synthesis in a comparative analysis

David Winter

2019-09-28

Phylogenetic Comparative Methods

The development of phylogenetic comparative methods has made phylogenies and important source of data in fields as diverse as ecology, genomic and medicine. Comparative methods can be used to investigate patterns in the evolution of traits or the diversification of lineages. In other cases a phylogeny is treated as a “nuisance parameter”, allowing with the autocorrelation created by the shared evolutionary history of the different species included to be controlled for.

In many cases finding a tree that relates the species for which trait data are available is a rate-limiting step in such comparative analyses. Here we show how the synthetic tree provided by Open Tree of Life (and made available in R via rotl) can help to fill this gap.

A phylogenetic meta-analysis

To demonstrate the use of rotl in a comparative analysis, we will partially reproduce the results of Rutkowska et al 2014. Very briefly, this study is a meta-analysis summarising the results of multiple studies testing for systematic differences in the size of eggs which contain male and female offspring. Such a difference might mean that birds invest more heavily in one sex than the other.

Because this study involves data from 51 different species, Rutkowska et al used a phylogenetic comparative approach to account for the shared evolutionary history among some of the studied-species.

Gather the data

If we are going to reproduce this analysis, we will first need to gather the data. Thankfully, the data is available as supplementary material from the publisher’s website. We can collect the data from using fulltext (with the papers DOI as input) and read it into memory with readxl::read_excel:

##                   animal                   Spp       Lndim Measure Neggs
## 1 Zonotrichia_leucophrys White-crowned sparrow 0.000000000  volume   294
## 2      Passer_domesticus         House sparrow 0.009407469  volume   149
## 3        Serinus_canaria                Canary 0.000000000  volume    52
## 4          Turdus_merula    European blackbird 0.021189299  volume    82
## 5    Agelaius_phoeniceus  Red-winged blackbird 0.218316086  volume   394
## 6    Quiscalus_mexicanus  Great-tailed grackle 0.281894985    mass   822
##   Nclutches        ESr Type         StudyID Year        D        EN
## 1        73 0.14004594 stat        Mead1987 1987 3.421918  85.91673
## 2        31 0.11175203 stat     Cordero2000 2000 4.045161  36.83413
## 3        21 0.49679140 stat     Leitner2006 2006 2.180952  23.84279
## 4        54 0.38598540 stat     Martyka2010 2010 1.414815  57.95812
## 5       106 0.07410136  raw Weatherhead1985 1985 3.173585 124.14982
## 6       205 0.05178834  raw     Teather1989 1989 3.407805 241.21099
##           Zr         VZr
## 1 0.14097244 0.012060292
## 2 0.11222075 0.029555954
## 3 0.54503712 0.047978211
## 4 0.40707397 0.018195675
## 5 0.07423744 0.008254242
## 6 0.05183471 0.004197959

The most important variable in this dataset is Zr, which is a normalized effect size for difference ,in size between eggs that contain males and females. Values close to zero come from studies that found the sex of an egg’s inhabitant had little effect in its size, while large positive or negative values correspond to studies with substantial sex biases (towards males and females respectively). Since this is a meta-analysis we should produce the classic funnel plot with effects-size on the y-axis and precision (the inverse of the sample standard error) on the x-axis. Here we calculate precision from the sample variance (Vzr):

In order to use this data later on we need to first convert it to a standard data.frame. We can also convert the animal column (the species names) to lower case, and remove the underscores in their names, which will make it easier to match names later on:

Find the species in OTT

We can use the OTL synthesis tree to relate these species. To do so we first need to find Open Tree Taxonomy (OTT) IDs for each species. We can do that with the Taxonomic Name Resolution Service function tnrs_match_names:

##            search_string            unique_name approximate_match ott_id
## 1 zonotrichia leucophrys Zonotrichia leucophrys             FALSE 265553
## 2      passer domesticus      Passer domesticus             FALSE 745175
## 3        serinus canaria        Serinus canaria             FALSE 464865
## 4          turdus merula          Turdus merula             FALSE 568572
## 5    agelaius phoeniceus    Agelaius phoeniceus             FALSE 226605
## 6    quiscalus mexicanus    Quiscalus mexicanus             FALSE 743411
##   is_synonym          flags number_matches
## 1      FALSE                             1
## 2      FALSE                             1
## 3      FALSE SIBLING_HIGHER              1
## 4      FALSE                             1
## 5      FALSE                             1
## 6      FALSE                             1

All of these species are in OTT, but a few of them go by different names in the Open Tree than we have in our data set. Because the tree rotl fetches will have Open Tree names, we need to create a named vector that maps the names we have for each species to the names Open Tree uses for them:

Now we can use this map to retrieve “data set names” from “OTT names”:

##  Anser caerulescens 
## "chen caerulescens"

Get a tree

Now we can get the tree. There are really too many tips here to show nicely, so we will leave them out of this plot

## Warning in collapse_singles(tr, show_progress): Dropping singleton nodes
## with labels: mrcaott246ott5481, mrcaott246ott7145, mrcaott246ott928360,
## mrcaott246ott1858, mrcaott246ott2907, mrcaott246ott3600042,
## mrcaott246ott7113, Passeriformes ott1041547, mrcaott246ott3212,
## mrcaott246ott428578, mrcaott246ott44866, mrcaott246ott5929,
## mrcaott246ott32658, mrcaott246ott22325, mrcaott246ott176461,
## mrcaott246ott10351, mrcaott246ott5934, mrcaott246ott1566,
## mrcaott1566ott3598440, mrcaott1566ott496009, mrcaott1566ott35326,
## mrcaott1566ott32651, mrcaott1566ott20498, mrcaott1566ott22300,
## mrcaott22300ott35350, mrcaott22300ott547548, mrcaott22300ott909199,
## mrcaott22300ott67150, mrcaott22300ott130294, mrcaott22300ott3598245,
## mrcaott22300ott416087, mrcaott22300ott629342, mrcaott22300ott416089,
## mrcaott22300ott107840, mrcaott113980ott364210, mrcaott364210ott3598839,
## mrcaott364210ott5341363, mrcaott19467ott431648, mrcaott19467ott252687,
## mrcaott19467ott482248, mrcaott19467ott401023, mrcaott19467ott233446,
## mrcaott19467ott168078, mrcaott19467ott1046624, mrcaott19467ott161293,
## mrcaott19467ott46396, mrcaott46396ott46398, mrcaott46398ott168083,
## mrcaott168083ott431676, mrcaott2175ott968664, mrcaott2175ott259082,
## mrcaott2175ott59905, mrcaott2175ott2224, mrcaott2224ott366470,
## mrcaott3364ott73828, mrcaott3364ott4083, mrcaott4083ott35042,
## mrcaott4083ott370807, mrcaott4083ott11712, mrcaott4083ott52094,
## mrcaott4083ott95949, Erythrura ott465905, mrcaott24017ott389884,
## mrcaott24017ott24025, mrcaott24025ott596770, mrcaott24025ott453058,
## mrcaott24025ott141501, mrcaott141501ott966119, mrcaott141501ott865472,
## mrcaott141501ott389883, mrcaott105913ott311555, mrcaott311555ott1082386,
## mrcaott311555ott445491, Taeniopygia ott708325, mrcaott4088ott95302,
## mrcaott4088ott8371, mrcaott4088ott5616, mrcaott5616ott28339,
## mrcaott5616ott6023, mrcaott6023ott243614, mrcaott6023ott101225,
## mrcaott6023ott125079, mrcaott125079ott463026, mrcaott125079ott765405,
## Zonotrichia (genus in domain Eukaryota) ott789032, mrcaott125079ott265547,
## mrcaott125079ott265554, mrcaott5620ott254662, mrcaott5620ott29804,
## mrcaott29804ott449580, mrcaott29804ott449562, mrcaott29804ott86894,
## mrcaott29804ott93045, mrcaott93045ott264496, mrcaott264496ott264500,
## mrcaott264500ott3597163, mrcaott264500ott283668, Quiscalus ott743410,
## mrcaott283673ott673386, mrcaott283673ott741944, mrcaott283673ott735243,
## mrcaott213448ott213452, mrcaott213448ott1009279, mrcaott213448ott213451,
## mrcaott213454ott430627, mrcaott430627ott498751, mrcaott430627ott617797,
## mrcaott430627ott3597159, mrcaott99175ott364331, Xanthocephalus ott364336,
## mrcaott6366ott28332, mrcaott6366ott88283, mrcaott6366ott341465,
## mrcaott6366ott157599, mrcaott6366ott178457, mrcaott6366ott28346,
## mrcaott6366ott238142, mrcaott6366ott6375, mrcaott6375ott119724,
## mrcaott6375ott238137, mrcaott238137ott328909, mrcaott238137ott464865,
## Haemorhous ott3601758, mrcaott9416ott840030, mrcaott9416ott96147,
## mrcaott9416ott407760, Passer ott515158, mrcaott9416ott407769,
## mrcaott9416ott25628, mrcaott9416ott407764, mrcaott9416ott68955,
## mrcaott9416ott73636, mrcaott1488ott72472, mrcaott1488ott63797,
## mrcaott1488ott62251, mrcaott1488ott110316, mrcaott1488ott5819,
## mrcaott1488ott44217, mrcaott1488ott16185, Hirundinidae ott897681,
## mrcaott16185ott67916, mrcaott67916ott67921, mrcaott67916ott119537,
## mrcaott67916ott67920, Delichon ott922719, mrcaott107463ott353520,
## mrcaott107463ott177058, mrcaott107463ott107476, mrcaott107476ott326781,
## mrcaott107476ott337752, mrcaott337752ott865537, mrcaott337752ott337762,
## mrcaott2375ott73144, mrcaott2375ott71358, mrcaott2375ott814750,
## mrcaott2375ott24855, mrcaott24855ott61147, Cyanistes ott73150,
## mrcaott123763ott258794, mrcaott4820ott409116, mrcaott4820ott17162,
## mrcaott4820ott20998, mrcaott4820ott20989, mrcaott4820ott58860,
## mrcaott4820ott23690, mrcaott4820ott20996, mrcaott4820ott11462,
## mrcaott4820ott140440, mrcaott4820ott197505, mrcaott4820ott75978,
## mrcaott4820ott11315, mrcaott4820ott5933, mrcaott5933ott60465,
## mrcaott5933ott25637, mrcaott25637ott199843, mrcaott25637ott473431,
## mrcaott25637ott686166, mrcaott25637ott111993, mrcaott25637ott183621,
## mrcaott183621ott501241, mrcaott501241ott3598010, mrcaott501241ott597018,
## mrcaott686165ott686168, mrcaott60456ott662804, mrcaott60456ott75990,
## Pica ott776480, Falconidae ott212186, mrcaott47588ott225286,
## mrcaott47588ott748842, mrcaott47588ott201377, mrcaott201377ott773020,
## mrcaott179290ott352521, mrcaott179290ott624976, mrcaott179290ott624973,
## mrcaott179290ott624974, mrcaott179290ott432111, mrcaott5272ott92263,
## mrcaott5272ott24121, Scolopacidae ott887699, mrcaott24121ott217797,
## mrcaott24121ott45306, mrcaott24121ott654830, mrcaott24121ott214779,
## mrcaott24121ott651066, mrcaott651066ott1090732, mrcaott7639ott306220,
## mrcaott7639ott57833, mrcaott7639ott383929, mrcaott7639ott279504,
## mrcaott7639ott47401, mrcaott7639ott341047, mrcaott7639ott234666,
## mrcaott7639ott966608, mrcaott7639ott285543, Sterna ott16767,
## mrcaott285543ott341030, mrcaott285543ott738509, mrcaott285543ott966606,
## mrcaott285543ott966604, mrcaott22965ott738512, mrcaott22965ott80679,
## mrcaott22965ott5859768, mrcaott22965ott154126, mrcaott22965ott241571,
## mrcaott22965ott282132, mrcaott22965ott414141, mrcaott22965ott704174,
## mrcaott22965ott704175, mrcaott22965ott324050, mrcaott22965ott353849,
## mrcaott22965ott75913, mrcaott75913ott335736, mrcaott335737ott450107,
## mrcaott425206ott887691, mrcaott425206ott515355, mrcaott119599ott993041,
## mrcaott119599ott509055, mrcaott416082ott4947414, mrcaott147723ott219032,
## Stercorariidae ott168297, Stercorarius ott742632, mrcaott742640ott742641,
## mrcaott57823ott57827, mrcaott57823ott242771, mrcaott57823ott112937,
## mrcaott112937ott129402, mrcaott112937ott341980, mrcaott112937ott112941,
## mrcaott112941ott112948, mrcaott112948ott5341357, mrcaott112948ott242776,
## mrcaott242776ott313115, mrcaott242776ott704464, mrcaott242776ott331994,
## mrcaott331994ott413796, mrcaott9830ott86672, mrcaott9830ott90560,
## mrcaott9830ott324158, mrcaott9830ott55044, mrcaott9830ott285638,
## mrcaott9830ott117726, Sulidae ott452462, mrcaott403772ott429615,
## Sula ott160486, mrcaott429615ott5859716, mrcaott429615ott827441,
## mrcaott429615ott1030312, Procellariiformes ott452461, mrcaott18206ott31011,
## mrcaott31011ott71459, Diomedeidae ott85277, mrcaott71459ott320282,
## Phoebastria ott941509, mrcaott320282ott320284, Sphenisciformes ott494366,
## mrcaott60413ott60417, mrcaott60413ott429618, Eudyptes ott494364,
## mrcaott82219ott116946, mrcaott116946ott219197, mrcaott134466ott494361,
## Pygoscelis ott494365, mrcaott134466ott783352, mrcaott5021ott198671,
## mrcaott5021ott75792, Cuculiformes ott212171, mrcaott75792ott212172,
## mrcaott75792ott3601282, mrcaott75792ott119216, mrcaott119216ott212175,
## mrcaott119216ott169265, mrcaott169265ott550039, mrcaott169265ott462546,
## mrcaott462546ott626955, mrcaott462546ott549514, mrcaott549514ott3596314,
## mrcaott549514ott3596309, mrcaott549514ott550040, mrcaott549514ott3596308,
## mrcaott549514ott3596307, mrcaott549514ott3596306, mrcaott549514ott792626,
## mrcaott17146ott57819, Columbiformes ott363030, mrcaott17146ott45505,
## mrcaott45505ott50388, mrcaott45505ott506098, mrcaott45505ott51607,
## mrcaott51607ott277822, mrcaott51607ott67614, mrcaott51607ott244134,
## Columba ott938415, mrcaott51607ott277817, mrcaott277817ott320359,
## mrcaott320359ott493986, mrcaott320359ott767317, mrcaott320359ott921832,
## mrcaott320359ott938416, Galliformes ott837585, mrcaott4765ott75785,
## mrcaott4765ott104461, mrcaott4765ott151684, mrcaott4765ott54193,
## mrcaott4765ott49319, mrcaott4765ott415487, mrcaott4765ott51354,
## mrcaott4765ott446490, Tetraoninae ott999677, mrcaott4765ott55929,
## mrcaott4765ott539045, mrcaott4765ott234824, Centrocercus ott728081,
## mrcaott53700ott572162, mrcaott53700ott466627, mrcaott53700ott309383,
## mrcaott53700ott102722, mrcaott102722ott137547, Phasianus ott102718,
## mrcaott49310ott102705, mrcaott49310ott153554, mrcaott153554ott867027,
## Gallus ott153562, mrcaott153554ott153572, mrcaott153572ott240568,
## mrcaott51349ott727334, mrcaott51349ott453575, Pavo ott453587,
## Anseriformes ott241841, Anatidae ott765193, mrcaott30843ott962771,
## mrcaott30843ott145504, mrcaott30843ott30847, mrcaott30843ott196654,
## mrcaott30843ott30845, mrcaott30843ott88385, mrcaott30843ott140301,
## mrcaott30843ott552052, mrcaott30843ott423364, mrcaott30843ott693332,
## mrcaott693332ott693335, mrcaott69333

There are a few things to note here. First, the tree has no branch lengths. At present this is true for the whole of the Open Tree synthetic tree. Some comparative methods require either branch lengths or an ultrametric tree. Before you can use one of those methods you will need to get a tree with branch lengths. You could try looking for published trees made available by the Open Tree with studies_find_trees. Alternatively, you could estimate branch lengths from the toplogy of a phylogeny returned by tol_induced_subtree, perhaps by downloading DNA sequences from the NCBI with rentrez or “hanging” the tree on nodes of known-age using penalized likelihood method in ape::chronos. In this case, we will use only the topology of the tree as input to our comparative analysis, so we can skip these steps.

Second, the tip labels contain OTT IDs, which means they will not perfectly match the species names in our dataset or the taxon map that we created earlier:

## [1] "Ficedula_albicollis_ott107840" "Luscinia_svecica_ott274225"   
## [3] "Turdus_merula_ott568572"       "Sturnus_unicolor_ott366470"

Finally, the tree contains node labels for those nodes that match a higher taxonomic group, and empty character vectors ("") for all other nodes. Some comparative methods either do no expect node labels at all, or require all labeled nodes to have a unique name (meaning multiple “empty” labels will cause and error).

We can deal with all these details easily. rotl provides the convenience function strip_ott_ids to remove the extra information from the tip labels. With the IDs removed, we can use our taxon map to replace the tip labels in the tree with the species names from dataset.

Finally, we can remove the node labels by setting the node.label attribute of the tree to NULL.

Perform the meta-analysis

Now we have data and a tree, and we know the names in the tree match the ones in the data. It’s time to do the comparative analysis. Rutkowska et al. used MCMCglmm, a Bayesian MCMC approach to fitting multi-level models,to perform their meta-analysis, and we will do the same. Of course, to properly analyse these data you would take some care in deciding on the appropriate priors to use and inspect the results carefully. In this case, we are really interested in using this as a demonstration, so we will just run a simple model.

Specifically we sill fit a model where the only variable that might explain the values of Zr is the random factor animal, which corresponds to the phylogenetic relationships among species. We also provide Zvr as the measurement error variance, effectively adding extra weight to the results of more powerful studies. Here’s how we specify and fit that model with MCMCglmm:

## 
## Attaching package: 'ape'
## The following object is masked from 'package:phylobase':
## 
##     edges
## Warning in inverseA(pedigree = pedigree, scale = scale, nodes = nodes): no
## branch lengths: compute.brlen from ape has been used

Now that we have a result we can find out how much phylogenetic signal exists for sex-biased differences in egg-size. In a multi-level model we can use variance components to look at this, specifically the proportion of the total variance that can be explained by phylogeny is called the phylogenetic reliability, H. Let’s calculate the H for this model:

##      animal 
## 0.002953389

It appears there is almost no phylogenetic signal to the data. The relationships among species explain much less that one percent of the total variance in the data. If you were wondering, Rutkowska et al. report a similar result, even after adding more predictors to their model most of the variance in Zr was left unexplained.

What other comparative methods can I use in R?

Here we have demonstrated just one comparative analysis that you might do in R. There are an ever-growing number of packages that allow an ever-growing number of analysis to performed in R. Some “classics” like ancestral state reconstruction, phylogenetic independent contrasts and lineage through time plots are implemented in ape. Packages like phytools, caper and diversitree provide extensions to these methods. The CRAN Phylogenetics Taskview gives a good idea of the diversity of packages and analyses that can be completed in R.

rotl/inst/doc/data_mashups.html0000644000176200001440000023566013543637105016336 0ustar liggesusers Connecting data to Open Tree trees

Connecting data to Open Tree trees

David Winter

2019-09-28

Combining data from OToL and other sources.

One of the major goals of rotl is to help users combine data from other sources with the phylogenetic trees in the Open Tree database. This examples document describes some of the ways in which a user might connect data to trees from Open Tree.

Get Open Tree IDs to match your data.

Let’s say you have a dataset where each row represents a measurement taken from one species, and your goal is to put these measurements in some phylogenetic context. Here’s a small example: the best estimate of the mutation rate for a set of unicellular Eukaryotes along with some other property of those species which might explain the mutation rate:

##                     species       mu pop.size genome.size
## 1   Tetrahymena thermophila 7.61e-12 1.12e+08    1.04e+08
## 2    Paramecium tetraurelia 1.94e-11 1.24e+08    7.20e+07
## 3 Chlamydomonas reinhardtii 2.08e-10 1.00e+08    1.12e+08
## 4  Dictyostelium discoideum 2.90e-11 7.40e+06    3.40e+07
## 5  Saccharomyces cerevisiae 3.30e-10 1.00e+08    1.25e+08
## 6       Saccharomyces pombe 2.00e-10 1.00e+07    1.25e+08

If we want to get a tree for these species we need to start by finding the unique ID for each of these species in the Open Tree database. We can use the Taxonomic Name Resolution Service (tnrs) functions to do this. Before we do that we should see if any of the taxonomic contexts, which can be used to narrow a search and avoid conflicts between different codes, apply to our group of species:

## Registered S3 method overwritten by 'lookup':
##   method         from
##   print.function base
## Possible contexts:
##    Animals 
##       Birds, Tetrapods, Mammals, Amphibians, Vertebrates 
##       Arthropods, Molluscs, Nematodes, Platyhelminthes, Annelids 
##       Cnidarians, Arachnids, Insects 
##    Bacteria 
##       SAR group, Archaea, Excavata, Amoebozoa, Centrohelida 
##       Haptophyta, Apusozoa, Diatoms, Ciliates, Forams 
##    Fungi 
##       Basidiomycetes, Ascomycetes 
##    Land plants 
##       Hornworts, Mosses, Liverworts, Vascular plants, Club mosses 
##       Ferns, Seed plants, Flowering plants, Monocots, Eudicots 
##       Rosids, Asterids, Asterales, Asteraceae, Aster 
##       Symphyotrichum, Campanulaceae, Lobelia 
##    All life

Hmm, none of those groups contain all of our species. In this case we can search using the All life context and the function tnrs_match_names:

search_string unique_name approximate_match ott_id is_synonym flags number_matches
tetrahymena thermophila Tetrahymena thermophila FALSE 180195 FALSE SIBLING_HIGHER 1
paramecium tetraurelia Paramecium tetraurelia FALSE 568130 FALSE 1
chlamydomonas reinhardtii Chlamydomonas reinhardtii FALSE 33153 FALSE 1
dictyostelium discoideum Dictyostelium discoideum FALSE 160850 FALSE 1
saccharomyces cerevisiae Saccharomyces cerevisiae FALSE 356221 FALSE 1
saccharomyces pombe Schizosaccharomyces pombe FALSE 990004 TRUE 1

Good, all of our species are known to Open Tree. Note, though, that one of the names is a synonym. Saccharomyces pombe is older name for what is now called Schizosaccharomyces pombe. As the name suggests, the Taxonomic Name Resolution Service is designed to deal with these problems (and similar ones like misspellings), but it is always a good idea to check the results of tnrs_match_names closely to ensure the results are what you expect.

In this case we have a good ID for each of our species so we can move on. Before we do that, let’s ensure we can match up our original data to the Open Tree names and IDs by adding them to our data.frame:

Find a tree with your taxa

Now let’s find a tree. There are two possible options here: we can search for published studies that include our taxa or we can use the ‘synthetic tree’ from Open Tree. We can try both approaches.

Published trees

Before we can search for published studies or trees, we should check out the list of properties we can use to perform such searches:

## $study_properties
##  [1] "ot:studyPublicationReference" "ot:curatorName"              
##  [3] "ot:studyYear"                 "ot:focalClade"               
##  [5] "ot:focalCladeOTTTaxonName"    "ot:dataDeposit"              
##  [7] "ot:studyPublication"          "ot:tag"                      
##  [9] "ot:studyId"                   "ntrees"                      
## [11] "treebaseId"                  
## 
## $tree_properties
##  [1] "ot:treebaseOTUId"           "ot:nodeLabelMode"          
##  [3] "ot:originalLabel"           "oti_tree_id"               
##  [5] "ot:inferenceMethod"         "ot:tag"                    
##  [7] "ot:treebaseTreeId"          "ot:comment"                
##  [9] "ot:branchLengthDescription" "ot:treeModified"           
## [11] "ot:branchLengthTimeUnits"   "ot:branchLengthMode"       
## [13] "ot:treeLastEdited"          "ot:nodeLabelDescription"   
## [15] "ot:ottId"                   "ot:ottTaxonName"           
## [17] "ot:studyId"                 "ntips"

We have ottIds for our taxa, so let’s use those IDs to search for trees that contain them. Starting with our first species Tetrahymena thermophila we can use studies_find_trees to do this search.

##    study_ids n_trees                                              tree_ids
## 1    ot_1044       1                                                 tree1
## 2    ot_1662       8                tree1, tree2, tree3, tree4, tree5, ...
## 3     ot_560       3                             Tr80090, Tr80091, Tr80092
## 4     ot_575       3                                   tree1, tree2, tree3
## 5     ot_650       1                                                 tree1
## 6     ot_651       1                                                 tree2
## 7     ot_705       1                                               Tr93612
## 8     ot_760       2                                           g0n0, tree1
## 9     ot_762       2                                          tree2, tree3
## 10     ot_89       2                                        Tr1003, Tr1004
## 11     ot_91       2                                      Tr46259, Tr46258
## 12     ot_96       2                                          tree1, tree2
## 13     ot_97       9                tree1, tree2, tree3, tree4, tree5, ...
## 14   pg_1272       1                                              tree2564
## 15   pg_1913       1                                              tree3903
## 16    pg_236       1                                              tree6285
## 17    pg_237       7       tree99, tree100, tree101, tree102, tree103, ...
## 18   pg_2412       4                tree5089, tree5090, tree5091, tree6403
## 19   pg_2435      24 tree5147, tree5148, tree5149, tree5150, tree5151, ...
## 20   pg_2533       6 tree5451, tree5452, tree5453, tree5454, tree5455, ...
## 21   pg_2618       2                                    tree6129, tree6130
## 22   pg_2702       3                          tree6272, tree6273, tree6274
## 23   pg_2762       3                          tree6384, tree6385, tree6386
## 24   pg_2924       1                                              tree6755
## 25    pg_301       2                                     tree205, tree5482
## 26    pg_310       3                             tree259, tree260, tree261
## 27    pg_315       1                                               tree266
## 28    pg_316       3                             tree267, tree268, tree269
## 29    pg_317       1                                               tree270
## 30    pg_424       1                                               tree532
## 31    pg_427       5          tree535, tree536, tree537, tree538, tree5574
## 32    pg_435       1                                              tree5995
## 33    pg_650       1                                              tree1147
## 34    pg_652       2                                    tree1152, tree5628
## 35    pg_655       1                                              tree1157
##                                                        candidate
## 1                                                               
## 2                                                               
## 3                                                        Tr80090
## 4                                                          tree3
## 5                                                          tree1
## 6                                                          tree2
## 7                                                        Tr93612
## 8                                                           g0n0
## 9                                                          tree3
## 10                                                              
## 11                                                              
## 12                                                         tree1
## 13 tree1, tree2, tree3, tree4, tree5, tree6, tree7, tree8, tree9
## 14                                                              
## 15                                                              
## 16                                                              
## 17                                                              
## 18                                                              
## 19                                                              
## 20                                                              
## 21                                                      tree6130
## 22                                                      tree6274
## 23                                                              
## 24                                                      tree6755
## 25                                                              
## 26                                                              
## 27                                                              
## 28                                                              
## 29                                                              
## 30                                                       tree532
## 31                                                              
## 32                                                      tree5995
## 33                                                      tree1147
## 34                                                              
## 35                                                              
##    study_year
## 1        2017
## 2        2017
## 3        2014
## 4        2007
## 5        2015
## 6        2010
## 7        2015
## 8        2013
## 9        2012
## 10       2007
## 11       2012
## 12       2014
## 13       2011
## 14       2009
## 15       2000
## 16       2000
## 17       2005
## 18       1999
## 19       2010
## 20       2010
## 21       2011
## 22       2014
## 23       2014
## 24       2014
## 25       2006
## 26       2011
## 27       2010
## 28       2012
## 29       2012
## 30       2010
## 31       2005
## 32       2008
## 33       2010
## 34       2012
## 35       2010
##                                                                                                                                                                                  title
## 1                         Eggshell palaeogenomics: Palaeognath evolutionary history revealed through ancient nuclear and mitochondrial DNA from Madagascan elephant bird (Aepyornis sp
## 2                                                                                                        'Ultraconserved elements resolve the phylogeny of potoos (Aves: Nyctibiidae)'
## 3                            'Phylogenetic Relationships and Morphological Character Evolution of Photosynthetic Euglenids (Excavata) Inferred from Taxon-rich Analyses of Five Genes'
## 4                                                                                                                                                                                     
## 5                                                                                                      The evolution of annelids reveals two adaptive routes to the interstitial realm
## 6                                                                                                      'Molecular phylogenetics and biogeography of Pollicipes (Crustacea: Cirripedia)
## 7                                            ' A DNA barcoding approach for identification of hidden diversity in Parmeliaceae (Ascomycota): P armelia sensu stricto as a case study '
## 8   'Phylogenetic relationships of the South American ground beetle subgenus <i>Chilioperyphus</i> Jeannel (Coleoptera: Carabidae: Trechinae: Bembidiini: <i>Bembidion</i> Latreille)'
## 9                                                                       'Phylogeny of Bembidion and related ground beetles (Coleoptera: Carabidae: Trechinae: Bembidiini: Bembidiina)'
## 10                                                                                                           Erysiphe abbreviata on cherry bark oak?morphology, phylogeny and taxonomy
## 11                                                                                        Taxonomic revisions of morphologically similar species from two euglenoid genera: Euglena (E
## 12 Phylogeny and taxonomy of sculpins, sandfishes, and snailfishes (Perciformes: Cottoidei) with comments on the phylogenetic significance of their early-life-history specializations
## 13                   'Multigene phylogenetic analyses including diverse radiolarian species support the “Retaria” hypothesis — The sister relationship of Radiolaria and Foraminifera'
## 14                                                                                                                                                                                    
## 15                                                                                                 Molecular phylogeny of Coriaria, with special emphasis on the disjunct distribution
## 16                                                                                                           Phylogeny of basal angiosperms: analyses of five genes from three genomes
## 17                                                                                    Phylogenetic analysis of basal angiosperms based on nine plastid mitochondrial and nuclear genes
## 18                                                                                                       Trochophore concepts: Evolution of larvae in polychaetes and other spiralians
## 19                                                                                                                                                                                    
## 20                                                     Species delimitation using a combined coalescent and information theoretic approach: An example from North American Myotis bats
## 21                                                      'Ultrastructure and LSU rDNA-based Phylogeny of Peridinium lomnickii and Description of Chimonodinium gen. nov. (Dinophyceae)'
## 22                                                                            Resolving deep lineage divergences in core corvoid passerine birds supports a proto-Papuan island origin
## 23                                                         Genome sequencing and comparative analysis of three Chlamydia pecorum strains associated with different pathogenic outcomes
## 24                                                                                                A comprehensive multilocus assessment of sparrow (Aves: Passerellidae) relationships
## 25                                                                                                                                                  Perspectives in the new Russulales
## 26                                                                                                                                                        Subulatomonas tetraspora nov
## 27                                                                                                      Molecular phylogenetics and taxonomy of the genus Thysanocarpus (Brassicaceae)
## 28                                                                                                                                                                                    
## 29                                                                                                                                                                                    
## 30                                                             Combining historical biogeography with niche modeling in the Caprifolium clade of Lonicera (Caprifoliaceae, Dipsacales)
## 31                                                                                                                                                                                    
## 32                                                                                                   Strong mitochondrial DNA support for a Cretaceous origin of modern avian lineages
## 33                                                                                                        Biogeography of Cedrela (Meliaceae, Sapindales) in Central and South America
## 34                                                                                                                                                           Annulatascus aquatorba sp
## 35                                                Tracing the Temporal and Spatial Origins of Island Endemics in the Mediterranean Region: A Case Study from the Citrus Family (Ruta L
##                                               study_doi n_matched_trees
## 1         http://dx.doi.org/10.1016/j.ympev.2017.01.005               1
## 2                   http://dx.doi.org/10.1111/jav.01313               1
## 3                   http://dx.doi.org/10.1111/jeu.12192               1
## 4    http://dx.doi.org/10.1111/j.1096-3642.2007.00306.x               1
## 5           http://dx.doi.org/10.1016/j.cub.2015.06.007               1
## 6         http://dx.doi.org/10.1016/j.jembe.2010.04.024               1
## 7                   http://dx.doi.org/10.1111/boj.12358               1
## 8           http://dx.doi.org/10.11646/zootaxa.3636.4.3               1
## 9         http://dx.doi.org/10.1016/j.ympev.2012.01.015               1
## 10         http://dx.doi.org/10.3852/mycologia.99.5.655               1
## 11   http://dx.doi.org/10.1111/j.1529-8817.2012.01140.x               2
## 12        http://dx.doi.org/10.1016/j.ympev.2014.06.028               2
## 13     http://dx.doi.org/10.1016/j.marmicro.2011.06.007               5
## 14   http://dx.doi.org/10.1111/j.1558-5646.2008.00567.x               1
## 15             http://dx.doi.org/10.1006/mpev.1999.0672               1
## 16                     http://dx.doi.org/10.1086/317584               1
## 17                     http://dx.doi.org/10.1086/431800               1
## 18 http://dx.doi.org/10.1111/j.1095-8312.1999.tb01920.x               2
## 19           http://dx.doi.org/10.1186/1471-2148-10-234               1
## 20              http://dx.doi.org/10.1093/sysbio/syq024               2
## 21       http://dx.doi.org/10.1016/j.protis.2011.03.003               1
## 22        http://dx.doi.org/10.1016/j.ympev.2013.09.027               1
## 23            http://dx.doi.org/10.1186/1471-2164-15-23               1
## 24        http://dx.doi.org/10.1016/j.ympev.2014.04.025               1
## 25         http://dx.doi.org/10.3852/mycologia.98.6.960               2
## 26       http://dx.doi.org/10.1016/j.protis.2011.05.002               1
## 27         http://dx.doi.org/10.1600/036364410792495926               1
## 28                                                                    2
## 29                                                                    1
## 30              http://dx.doi.org/10.1093/sysbio/syq011               1
## 31        http://dx.doi.org/10.3852/mycologia.97.5.1140               3
## 32              http://dx.doi.org/10.1186/1741-7007-6-6               1
## 33                http://dx.doi.org/10.3732/ajb.0900229               1
## 34                     http://dx.doi.org/10.3852/11-238               2
## 35              http://dx.doi.org/10.1093/sysbio/syq046               1
##                  match_tree_ids
## 1                          NULL
## 2                          NULL
## 3                          NULL
## 4                          NULL
## 5                          NULL
## 6                          NULL
## 7                          NULL
## 8                          NULL
## 9                          NULL
## 10                         NULL
## 11                   NULL, NULL
## 12                   NULL, NULL
## 13 NULL, NULL, NULL, NULL, NULL
## 14                         NULL
## 15                         NULL
## 16                         NULL
## 17                         NULL
## 18                   NULL, NULL
## 19                         NULL
## 20                   NULL, NULL
## 21                         NULL
## 22                         NULL
## 23                         NULL
## 24                         NULL
## 25                   NULL, NULL
## 26                         NULL
## 27                         NULL
## 28                   NULL, NULL
## 29                         NULL
## 30                         NULL
## 31             NULL, NULL, NULL
## 32                         NULL
## 33                         NULL
## 34                   NULL, NULL
## 35                         NULL

Well… that’s not very promising. We can repeat that process for all of the IDs to see if the other species are better represented.

## [1]  48  51 128  70  17  87

OK, most of our species are not in any of the published trees available. You can help fix this sort of problem by making sure you submit your published trees to Open Tree.

A part of the synthesis tree

Thankfully, we can still use the complete Tree of Life made from the combined results of all of the published trees and taxonomies that go into Open Tree. The function tol_induced_subtree will fetch a tree relating a set of IDs.

Using the default arguments you can get a tree object into your R session:

## Warning in collapse_singles(tr, show_progress): Dropping singleton
## nodes with labels: mrcaott2ott276, mrcaott2ott142555, mrcaott2ott3043,
## mrcaott2ott7623, Chloroplastida ott361838, Chlorophyta ott979501,
## mrcaott185ott23323, mrcaott185ott599, mrcaott1427ott25671,
## mrcaott1427ott1544, mrcaott1544ott15345, mrcaott1544ott1795,
## mrcaott9389ott365252, mrcaott9389ott23557, mrcaott23557ott527099,
## mrcaott149ott902, SAR ott5246039, Alveolata ott266751, Ciliophora (phylum
## in subkingdom SAR) ott302424, Intramacronucleata ott340382, Conthreep
## ott5248773, Peniculia ott5257364, Paramecium (genus in subkingdom SAR)
## ott568126, Hymenostomatia ott5257367, Tetrahymena ott47284, Amoebozoa
## ott1064655, mrcaott3973ott5765, mrcaott3973ott26103, mrcaott26103ott273110,
## mrcaott26103ott229626, Dictyostelia ott835575, Dictyostelium ott999665,
## Opisthokonta ott332573, Nucletmycea ott5246132, Fungi ott352914,
## mrcaott48ott3465, mrcaott48ott67172, mrcaott48ott1423, mrcaott48ott4814,
## h2007-2 ott5576447, h2007-1 ott5584405, Dikarya ott656316,
## mrcaott48ott1053, Saccharomycetales ott5976840, Saccharomycetaceae
## ott989994, Saccharomyces ott908546, Taphrinomycotina ott656312,
## Schizosaccharomycetes ott921286, Schizosaccharomycetidae ott5670481,
## Schizosaccharomycetales ott508517, Schizosaccharomycetaceae ott990009,
## Schizosaccharomyces ott990008

Connect your data to the tips of your tree

Now we have a tree for of our species, how can we use the tree and the data together?

The package phylobase provide an object class called phylo4d, which is designed to represent a phylogeny and data associated with its tips. In oder to get our tree and data into one of these objects we have to make sure the labels in the tree and in our data match exactly. That’s not quite the case at the moment (tree labels have underscores and IDs appended):

## $`Tetrahymena thermophila`
## [1] "Tetrahymena thermophila"
## [1] "Dictyostelium_discoideum_ott160850"

rotl provides a convienence function strip_ott_ids to deal with these.

## [1] TRUE TRUE TRUE TRUE TRUE TRUE

Ok, now the tips are together we can make a new dataset. The phylo4d() functions matches tip labels to the row names of a data.frame, so let’s make a new dataset that contains just the relevant data and has row names to match the tree

And now we can plot the data and the tree together

Find external data associated with studies, trees and taxa from Open Tree

In the above example we looked for a tree that related species in another dataset. Now we will go the other way, and try to find data associated with Open Tree records in other databases.

Get external data from a study

Let’s imagine you were interested in extending or reproducing the results of a published study. If that study is included in Open Tree you can find it via studies_find_studies or studies_find_trees and retrieve the published trees with get_study. rotl will also help you find external. The function study_external_IDs retrieves the DOI for a given study, and uses that to gather some more data:

## External data identifiers for study 
##  $doi:  10.1016/j.ympev.2006.04.016 
##  $pubmed_id:  16762568 
##  $nucleotide_ids: vector of 58 IDs
##  $external_data_url http://purl.org/phylo/treebase/phylows/study/TB2:S1575

Here the returned object contains an external_data_url (in this case a link to the study in Treebase), a pubmed ID for the paper and a vector IDs for the NCBI’s nuleotide database. The packages treebase and rentrez provide functions to make use of these IDs within R.

As an example, let’s use rentrez to download the first two DNA seqences and print them.

## >AM181011.1 Plectroninia neocaledoniense partial 28S rRNA gene, specimen voucher G316300 (Queensland Museum)
## GCTAGCAAGCGCGTCGGTGGTTCAGCCGGCTGGTCTCGTCGAGTTGTCGGTGTGCGGATCCGAACGGACC
## GCGGCCGATGGCGTCGGCGGGCAAGCTGTGGTGCACTCTGTCGGCGTGCGCGTCAGCGTCGGTTTCGGCC
## GGACGACGAGGCGCTCGGGGAAGGTAGCTGGACCGGTCTTCGGTGCAGTGTTATAGCCCTGGGCCGCTGG
## GTTCGGCGTTTGGGACCGAGGAGAGAGATGATCGCTGCAGCGCCTGTCTCCCTCTCGAGGGGGGCTAGCC
## AGCCGCTGTTTGGGTGGCGTCACTGGCGGAGGACTGCACGCAGTGCTTCGCCGGTGGTCGTGTCCAGGCG
## GGCGGTGTGGGTATAGAGGCGCTTAGGACGCTGGCGTCCAAATGGCCGTGCGCGACCCGTCTTGAAACAC
## GGACCAAGGAGTCTAGCATGTGCGCGAGTCTTAGGGTGTGGAAGCCCTCGGGCGCAATGAAAGTGAAGGG
## CCGTCGTCTCTCGGGGCTGCGGTGTGAGGTGAGAGCCGTCGCCGTCGGGTGGCGGTGCATCATCGGCCGG
## TCCATCCTGCTCTCAGGAGGATCTGCGCAAGAGCGTGTTTGCTGGGACCCGAAAGATGGTGAACTATGCC
## TGAATAGGGTGAAGCCAGAGGAAACTCTGGTGGAGGCTCGTAGCGGTTCTGACGTGCAAATCGATCGTCA
## AATTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGG
## ATAGCTGGAACTCGTCTTGACACAGTTTTATCAGGTAAAGCGAATGATTAGAGGTCTTGGGGGTGAAACA
## CCCTCAACCTATTCTCAAACTTTAAATAGGTAAGAAGCGCGACTTGCTCAATTGAAGTGGCGCGCAGTGA
## ATGTGAGTTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGAACGCTCGGTTA
## AGGTGCCCAAGTCGACGCTCATCAGACCCCAGAAAAGGTGTTGGTCGATATAGACAGCAGGACGGTGGCC
## ATGGAAGTCGGAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCTGAAAATGGAT
## GGCGCTCAAGCGTCGCACCTATACCGAGCCGTCGTGGTAAATGCCAGGCCACGACGAGTAGGAGGGCGCG
## GTGGTCGTGACGCAGCCCTTGGCGCGAGCCTGGGCGAAACGGCCTCCGGTGCAGATCTTGGTGGTAGTAG
## CAAATATTCAAATGAGAGCTTTGAAGACCGAAGTGGAGAAAGGTTCCATGTGAACAGCAGTTGGACATGG
## GTTAGTCGATCCTAAGAGATAGGGAAGTTCCGTGTGAAAGTGCGCAATGCGCTTCTGTGCTGCGCGCCTC
## CTATCGAAAGGGAATCGGGTTAATATTCCCGAACCGGAAGGCGGATATCTCTGGCTCTCGGGTCAGGAGC
## GGCAACGCAAGCGTACTGCGAGACGTCGGCGGGGGCTCCGGGAAGAGTTGTCTTTTCTTTTTAACGCAGT
## CGCCATCCCTGGAATCGGTTTGCCCGGAGATAGGGTTGGCTGGCTCGGTAAAGCAGCACACTTCATGTGC
## TGTCCGGTGCGCTCTCGACGGCCCTTGAAAATCGCAGGTGTGCATCGATTCTCGCATCCGGTCGTACTCA
## TAACCGCATCAGGTCTCCAAGGT
## 
## >AM181010.1 Eilhardia schulzei partial 28S rRNA gene, specimen voucher G316071 (Queensland Museum)
## GCTAGTAATGTACGTTGGTGGTTCAGCCGGCTAGTCTTGTCGAGTCGTCGTGTGGTGGATCCGACTGGAC
## CGTCCGCGGTGGTGTCGGCGGGCGAGCTGTGGTGCACTCTACGGACGTGCGCGTCAGCGTCGGTTCTCGA
## TGGGCGATAAGGTGCGTGGGGGAAGGTGGCTCGGTCCTTGGGAACTGAGTGTTACAGACCCTGGTGCTGG
## GCTCGTCGTGGGACCGAGGAGAGAGAGAGATGATCGCTGCGGCACCTGCCCCGTTGTCATTTTTCGGGGC
## TAGCCAGCCGTTTGTCAGGTGTGCGTCGGACGTTGAGGACTGCACGCAGTGCTGGACGTGGAGGCGTGAT
## CTGATGGCGGTGTGGGCATTAGAGGTGCCTAGGACGCTGGCGTCCAAATGGCCGTGCGCGACCCGTCTTG
## AAACACGGACCAAGGAGTCTAACATGTGCGCGAGTCTTAGGGTGTGCAAGCCCTCGGGCGCAATGAAAGT
## GAAGGCTCGGCGGCGCTAGTCGAGCTGAGGTGAGAGCCGTGGCCGTTGCATGTGGCGGCGGCGGCGCATC
## ATCGGCCGGTCCATCCTGCTCTCAGGGGGATCCGAGCAAGAGCGTATTTGTTGGGACCCGAAAGATGGTG
## AACTATGCCTGAATAGGGTGAAGCCAGAGGAAACTCTGGTGGAGGCTCGTAGCGATTCTGACGTGCAAAT
## CGATCGTCAAATTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTT
## TCCCTCAGGATAGCTGGAGCTCTTGGACACAGTTTTATCAGGTAAAGCGAATGATCAGAGGTCTTGGGGG
## TGAAACACCCTCAACCTATTCTCAAACTTTAAATCGGTAAGAAGCGCGACTTGCTGAATTGAAGCCGCGC
## GCAAGCAATGTGAGTTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGAACGC
## TGGGTTAAGGTGCCAAAGTCGACGCTCATCAGACCCCAGAAAAGGTGTTGGTTGATATAGACAGCAGGAC
## GATGGCCATGGAAGTCGGAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCTGAA
## AATGGATGGCGCTCAAGCGTCGCACCTATACCGGGCCGTCGTCGCAAATGCCAGGCGACGACGAGTAGGA
## GGGCGCAGTGGTCGTCATGCAGCCCTTGGCGTGAGCCTGGGTCAAACGGCCTCTGGTGCAGATCTTGGTG
## GTAGTAGCAAATATTCAAATGAGAGCTTTGAAGACCGAAGTGGAGAAAGGTTCCATGTGAACAGCAGTTG
## GACATGGGTTAGTCGATCCTAAGTGATAGGGGAGCTCCGTATGAAAGTGCGCAATCGGCCCTGCTTGTGT
## CGCCTTGCGCCACCTATCGAAAGGGAATCGGGTTAATATTCCCGAACCGGAAGGCGGATTTTCTCTGGCT
## CTCGGGTCAGGAGCGGCAACGCTAGCGAACCGCGAGACGTCGGCGGGGGCTCCGGGAAGAGTTGTCTTTT
## CTTTTTAACGCAGTCGCCATCCCTGGAATCGGTTTGCCCGGAGATAGGGTTGGCTGGCTCGGTAAAGCAG
## CACACTTCATGTGCTGTCCGGTGCGCTCTCGACGGCCCTTGAAAATCGCGGCGAGTGTAGTCTGATTTTC
## GCATCCGTTCGTACTCATAACCGCATCAGGTCTCCAAGGT

You could further process these sequences in R with the function read.dna from ape or save them to disk by specifying a file name with cat.

Find a OTT taxon in another taxonomic database

It is also possible map an Open Tree taxon to a record in another taxonomic database. For instance, if we wanted to search for data about one of the tips of the sub-tree we fetched in the example above we could do so using taxon_external_IDs:

##   source       id
## 1  silva AY102613
## 2   ncbi     5888
## 3   gbif  7415807

A user could then use rgbif to find locality records using the gbif ID or rentrez to get genetic or bibliometric data about from the NCBI’s databases.

What next

The demonstration gets you to the point of visualizing your data in a phylogenetic context. But there’s a lot more you do with this sort of data in R. For instance, you could use packages like ape, caper, phytools and mcmcGLMM to perform phylogenetic comparative analyses of your data. You could gather more data on your species using packages that connect to trait databases like rfishbase, AntWeb or rnpn which provides data from the US National Phenology Network. You could also use rentrez to find genetic data for each of your species, and use that data to generate branch lengths for the phylogeny.

rotl/inst/doc/rotl.R0000644000176200001440000000650413543637133014074 0ustar liggesusers## ------------------------------------------------------------------------ library(rotl) taxa <- c("Hyla", "Salmo", "Diadema", "Nautilus") resolved_names <- tnrs_match_names(taxa) ## ------------------------------------------------------------------------ resolved_names <- tnrs_match_names(taxa, context_name = "Animals") ## ---- fig.width=7, fig.height=4------------------------------------------ my_tree <- tol_induced_subtree(ott_ids = resolved_names$ott_id) plot(my_tree, no.margin = TRUE) ## ------------------------------------------------------------------------ taxa <- c("Hyla", "Salmo", "Diadema", "Nautilus") resolved_names <- tnrs_match_names(taxa) resolved_names inspect(resolved_names, taxon_name = "diadema") ## ------------------------------------------------------------------------ resolved_names <- update(resolved_names, taxon_name = "diadema", new_row_number = 2 ) ## we could also have used the ott_id to replace this taxon: ## resolved_names <- update(resolved_names, taxon_name = "diadema", ## new_ott_id = 4930522) ## ------------------------------------------------------------------------ diadema_info <- taxonomy_taxon_info(631176) tax_rank(diadema_info) synonyms(diadema_info) tax_name(diadema_info) ## ------------------------------------------------------------------------ diadema_tax_tree <- taxonomy_subtree(631176) diadema_tax_tree ## ---- fig.width=7, fig.height=4------------------------------------------ mono_id <- tnrs_match_names("Monotremata") mono_tree <- tol_subtree(ott_id = ott_id(mono_id)) plot(mono_tree) ## ------------------------------------------------------------------------ furry_studies <- studies_find_studies(property = "ot:focalCladeOTTTaxonName", value = "Mammalia") furry_ids <- furry_studies$study_ids ## ------------------------------------------------------------------------ furry_meta <- get_study_meta("pg_2550") get_publication(furry_meta) ## The citation for the source of the study get_tree_ids(furry_meta) ## This study has 10 trees associated with it candidate_for_synth(furry_meta) ## None of these trees are yet included in the OTL ## ---- eval=FALSE--------------------------------------------------------- # get_study_tree( # study_id = "pg_710", tree_id = "tree1277", # tip_label = "ott_taxon_name", file = "/tmp/tree.tre", # file_format = "newick" # ) # tr <- ape::read.tree(file = "/tmp/tree.tre") ## ------------------------------------------------------------------------ giant_squid <- tnrs_match_names("Architeuthis") tax_lineage(taxonomy_taxon_info(ott_id(giant_squid), include_lineage = TRUE)) ## ------------------------------------------------------------------------ turducken <- c("Meleagris", "Anas", "Gallus", "Sus") taxa <- tnrs_match_names(turducken, context = "Animals") taxa ## ---- error=TRUE--------------------------------------------------------- tr <- tol_induced_subtree(ott_id(taxa)) ## ------------------------------------------------------------------------ in_tree <- is_in_tree(ott_id(taxa)) in_tree tr <- tol_induced_subtree(ott_id(taxa)[in_tree]) ## ---- fig.width=7, fig.height=4------------------------------------------ turducken_spp <- c("Meleagris gallopavo", "Anas platyrhynchos", "Gallus gallus", "Sus scrofa") taxa <- tnrs_match_names(turducken_spp, context = "Animals") tr <- tol_induced_subtree(ott_id(taxa)) plot(tr) rotl/inst/extdata/0000755000176200001440000000000013260441704013642 5ustar liggesusersrotl/inst/extdata/egg.csv0000644000176200001440000002111512706456642015134 0ustar liggesusersanimal,Spp,Lndim,Measure,Neggs,Nclutches,ESr,Type,StudyID,Year,D,EN,Zr,VZr Zonotrichia_leucophrys,White-crowned sparrow,0,volume,294,73,0.140045943,stat,Mead1987,1987,3.421917808,85.91673339,0.140972438,0.012060292 Passer_domesticus,House sparrow,0.009407469,volume,149,31,0.11175203,stat,Cordero2000,2000,4.04516129,36.83413078,0.112220753,0.029555954 Serinus_canaria,Canary,0,volume,52,21,0.4967914,stat,Leitner2006,2006,2.180952381,23.84279476,0.545037117,0.047978211 Turdus_merula,European blackbird,0.021189299,volume,82,54,0.3859854,stat,Martyka2010,2010,1.414814815,57.95811518,0.40707397,0.018195675 Agelaius_phoeniceus,Red-winged blackbird,0.218316086,volume,394,106,0.07410136,raw,Weatherhead1985,1985,3.173584906,124.1498216,0.074237439,0.008254242 Quiscalus_mexicanus,Great-tailed grackle,0.281894985,mass,822,205,0.051788336,raw,Teather1989,1989,3.407804878,241.2109934,0.05183471,0.004197959 Taeniopygia_guttata,Zebra finch,-0.010812869,mass,116,24,-0.05636213,stat,Rutkowska2005,2005,4.066666667,28.52459016,-0.056421926,0.039177906 Taeniopygia_guttata,Zebra finch,-0.010812869,mass,90,20,0,stat,Rutkowska2002,2002,3.8,23.68421053,0,0.048346056 Vanellus_vanellus,Northern lapwing,-0.029825984,volume,114,32,0.03014961,stat,Lislevand2005,2005,3.05,37.37704918,0.03015875,0.029089175 Philomachus_pugnax,Ruff,0.22184875,volume,120,30,0.03462025,stat,Thuman2003,2003,3.4,35.29411765,0.034634091,0.030965392 Luscinia_svecica,Bluethroat,0,volume,102,18,-0.1468127,stat,Lifjeld2005,2005,4.733333333,21.54929577,-0.147881353,0.053910402 Sturnus_unicolor,Spotless starling,0.025305865,mass,153,34,-0.133824538,stat,Cordero2001,2001,3.8,40.26315789,-0.134632122,0.026836158 Branta_canadensis,Canada goose,0.061028185,mass,242,44,-0.006674089,stat,Leblanc1987,1987,4.6,52.60869565,-0.006674188,0.020157756 Falco_tinnunculus,Eurasian kestrel,-0.080479586,mass,132,33,-0.1910071,stat,Martinez-Padilla2007,2007,3.4,38.82352941,-0.193382195,0.027914614 Falco_tinnunculus,Eurasian kestrel,-0.080479586,mass,108,28,0.2165249,stat,Blanco2003,2003,3.285714286,32.86956522,0.220007175,0.033478894 Larus_michahellis,Yellow-legged gull,0.091409863,mass,1068,669,-0.06718163,stat,Rubolini2009,2009,1.477130045,723.0236794,-0.067282976,0.001388843 Cincloramphus_cruralis,Brown songlark,0.363356588,mass,44,17,0.1439293,stat,Isaksson2010,2010,2.270588235,19.37823834,0.144935702,0.061056628 Pavo_cristatus,Peafowl,0.119205592,mass,3313,205,0.005428755,stat,Petrie2001,2001,13.12878049,252.3463625,0.005428808,0.004010486 Parus_caeruleus,Blue tit,0.010299957,mass,192,21,0.07261821,stat,Cichon2003,2003,7.514285714,25.5513308,0.072746264,0.044343281 Larus_argentatus,Herring gull,0.049687784,mass,79,30,0.1160999,stat,Bogdanova2006,2006,2.306666667,34.24855491,0.116625804,0.03200148 Larus_fuscus,Lesser black-backed gull,0.064503231,mass,60,22,0.124354,stat,Bogdanova2005,2005,2.381818182,25.19083969,0.125001014,0.045063639 Corvus_monedula,Jackdaw,0.041392685,mass,226,70,0.2033713,stat,Arnold2003,2003,2.782857143,81.21149897,0.206246808,0.012785844 Carpodacus_mexicanus,House finch,0.002809678,volume,378,84,-0.075561895,raw,Badyaev2006,2006,3.8,99.47368421,-0.075706199,0.010365521 Carpodacus_mexicanus,House finch,0,volume,304,64,-0.072529696,raw,Badyaev2006,2006,4,76,-0.072657281,0.01369863 Sterna_hirundo,Common Tern,0.008600172,volume,427,158,0,raw,Fletcher2004,2004,2.362025316,180.7770632,0,0.005625023 Lonchura_striata,Bengalese finch,-0.021189299,mass,116,34,0.09239892,stat,Soma2007,2007,2.929411765,39.59839357,0.092663229,0.027323604 Molothrus_bonariensis,Ring-billed gull,0.078874433,mass,90,30,-0.000377536,stat,Chin2012,2012,2.6,34.61538462,-0.000377536,0.03163017 Pica_pica,Magpie,0.063358906,volume,43,8,-0.036738337,raw,Slagsvold1992,1992,4.5,9.555555556,-0.036754879,0.152542373 Corvus_corone,Hooded crow,0.049218023,volume,103,31,0.073794034,raw,Slagsvold1992,1992,2.858064516,36.03837472,0.073928423,0.030267833 Taeniopygia_guttata,Zebra finch,-0.010812869,mass,133,22,-0.03994883,stat,Pariser2012,2012,5.036363636,26.40794224,-0.039970102,0.042720543 Delichon_urbicum,House martin,0,mass,90,35,0.03076685,stat,Gil2006,2006,2.257142857,39.87341772,0.030776563,0.027119808 Xanthocephalus_xanthocephalus,Yellow-headed blackbird,0.247321812,mass,90,23,-0.088294337,raw,Richter1983,1983,3.330434783,27.02349869,-0.088524861,0.04162591 Larus_delawarensis,Ring-billed gull,0.06069784,mass,110,37,0.053696485,raw,Meathrel1987,1987,2.578378378,42.66247379,0.053748182,0.025212749 Cincloramphus_cruralis,Brown songlark,0.363356588,volume,95,40,-0.3293106,stat,Magrath2003,2003,2.1,45.23809524,-0.342054801,0.02367531 Larus_ridibundus,Black-headed gull,0,mass,60,20,0.1391671,stat,Groothuis2006,2006,2.6,23.07692308,0.140076126,0.049808429 Anseranas_semipalmata,Magpie goose,0.125672077,mass,60,16,-0.110406595,raw,Whitehead1990,1990,3.2,18.75,-0.11085851,0.063492063 Sterna_hirundo,Common Tern,0,volume,108,40,0.073872636,raw,Gonzalez-Solis2005,2005,2.36,45.76271186,0.074007456,0.023384859 Falco_tinnunculus,Eurasian kestrel,-0.080479586,mass,80,16,0.097815848,raw,Wu2010,2010,4.2,19.04761905,0.098129617,0.06231454 Larus_delawarensis,Shiny cowbird,0.035472318,volume,90,90,-0.07294093,stat,Tuero2012,2012,1,90,-0.073070702,0.011494253 Pygoscelis_antarcticus,Chinstrap penguin,0.058509856,volume,264,132,0.03094903,stat,Fargallo2006,2006,1.8,146.6666667,0.030958917,0.006960557 Phoebastria_irrorata,Waved albatross,0.091157684,volume,224,224,-0.088469783,stat,Awkerman2007,2007,1,224,-0.088701688,0.004524887 Passer_domesticus,House sparrow,0.009407469,volume,77,19,0.05470045,stat,Wetzel2012,2012,3.442105263,22.37003058,0.054755105,0.051626145 Sula_nebouxii,Blue-footed booby,-0.147287056,mass,76,56,-0.2611557,stat,D'Alba2007,2007,1.285714286,59.11111111,-0.267348297,0.017821782 Stercorarius_parasiticus,Parasitic jaeger,-0.063477845,volume,534,267,0.1397023,stat,Janssen2006,2006,1.8,296.6666667,0.140621937,0.003405221 Ficedula_albicollis,Collared flycatcher,0.013679697,volume,1162,198,0.04804496,stat,Bowers2013,2013,4.894949495,237.3875361,0.048081979,0.004266438 Sterna_dougallii,Roseate tern,0,mass,440,146,-0.062868359,raw,Szczys2005,2005,2.610958904,168.5204617,-0.062951384,0.006041549 Centrocercus_urophasianus,Greater sage-grouse,0.261995252,volume,146,20,0.06614164,stat,Atamian2010,2010,6.04,24.17218543,0.066238344,0.04723178 Phasianus_colchicus,Ring-necked pheasant,0.140492874,mass,106,15,0.4531655,stat,Rubolini2007,2007,5.853333333,18.10933941,0.488676681,0.06618423 Taeniopygia_guttata,Zebra finch,-0.010812869,mass,43,15,0,raw,Clotfelter1996,1996,2.493333333,17.2459893,0,0.070195195 Larus_fuscus,Lesser black-backed gull,-0.010812869,volume,304,101,-0.00990453,raw,Bradbury1999,1999,2.607920792,116.5679575,-0.009904854,0.008805301 Sturnus_vulgaris,European starling,0.01616166,mass,354,69,0.04996099,stat,Love2011,2011,4.304347826,82.24242424,0.050002622,0.012619503 Erythrura_gouldiae,Gouldian finch,0,volume,1473,324,-0.019559388,stat,Pryke2009,2009,3.837037037,383.8899614,-0.019561883,0.00262543 Larus_ridibundus,Black-headed gull,0,volume,147,49,0.05453834,stat,Lezalova2005,2005,2.6,56.53846154,0.05459251,0.018678161 Aythya_ferina,Common pochard,0,volume,185,26,0.1957707,stat,Lezalova2013a,2014,5.892307692,31.39686684,0.198330883,0.035215153 Aythya_fuligula,Tufted duck,0.026629385,volume,46,7,-0.04923335,stat,Lezalova2013b,2014,5.457142857,8.429319372,-0.049273187,0.184185149 Aythya_affinis,Lesser scaup,0.031791834,volume,38,5,-0.143657133,raw,Dawson1996,1996,6.28,6.050955414,-0.144657788,0.32776618 Chen_caerulescens,Lesser snow goose,0.037500891,mass,85,22,-0.089455106,raw,Ankney1980,1980,3.290909091,25.82872928,-0.089694871,0.043804453 Falco_sparverius,American kestrels,-0.036212173,volume,170,34,0.093153037,raw,Anderson1997,1997,4.2,40.47619048,0.093423893,0.026683609 Columba_livia,Domestic pigeon,0,mass,63,16,0.3301501,stat,Pike2005,2005,3.35,18.80597015,0.342996707,0.063267233 Zonotrichia_leucophrys,White-crowned sparrow,0,mass,38,11,0.06348392,stat,Bonier2007,2007,2.963636364,12.82208589,0.063569411,0.101811368 Quiscalus_major,Boat-tailed grackle,0.268544242,mass,122,41,-0.056059589,raw,Bancroft1984,1984,2.580487805,47.2778828,-0.056118426,0.022584639 Cuculus_canorus,Common cuckoo,0.042879996,volume,71,38,0.1527316,stat,Fossoy2012,2012,1.694736842,41.89440994,0.153936091,0.025710636 Eudyptes_chrysocome,Rockhopper penguin,0.037301411,mass,213,194,0.1191936,stat,Poisbleau2010,2010,1.078350515,197.5239006,0.119762927,0.005140756 Larus_michahellis,Yellow-legged gull,0.091409863,volume,124,48,-0.003408011,stat,Perez2006,2006,2.266666667,54.70588235,-0.003408024,0.019340159 Gallus_gallus,Red Junglefowl,0.080943092,volume,220,71,-0.08467843,stat,Parker2005,2005,2.678873239,82.12407992,-0.084881699,0.012638378 rotl/inst/extdata/mcmcglmm_model.rds0000644000176200001440000036167213260441704017347 0ustar liggesuserswTK0dEQ1'@ADsa`f␣$9 $Yr+EE@%**`FQy}]wkU=l0FCCf+-[Z6(_;)_of@,]44ݷd+I֋+r)0-Q`=lz ]eܝ:726. w{ ֋֧(ZΊ?tn d^*>I ؕс3-|jGUʾ'^ O"k+5#s=cG?P`SRl:_6[_ZG(XrVӃK)n5TwQ i9,U9Ⰾ?IvgoDn6/9O0XEs5&Yx]~RP&];?W؄6ENƗqo1SY])0WRzNf%]9M]w: ۗ@Ie{O֛/=Z1|}Di6x F'zvnF= kј> ְۣ֊OG=j ݷb` 6 ugܿsۗrpb _oG8oZu]44ƹgr1r!> $lcG՛kuI_xgFqVX`iL {_N;r?mt?u1{VsTa'ZmDyW0:۰>5`<~/B71:A=y:ۗ\yC>~*0 gUOr;[0Qm 1:/19P, ?5|FT~@S^ݡA0v켊W*:U.l=PW qq%DNr oNׁZJKl F7i%GA n^^F[j az*tcy8cS`d05EbxQr rIۗi--KOF6zр+W7կȵ)>|2e^ͧѭQ Ql1Je2WSA.:o]91a4AǨs: w!lNuan)W~q` _Qn46̉Ȯԁ`뷅Ks0?h4F1YLwb\Q*ݺ|>\hƗ39:q>S- &׽huLL<BY[ 5>Lqa~owwx'&_JIꡜx'ckbrEX1}λUW|lΞgTWF1@wP*uݝ9U ΘߘzR(@s2(361?)vť[Lە\7[++Ҍ)^^58c/nJ5ε2jj3ܹQ~1+Y?莐/b~[0ڨk|g?ga[M0= کZhbvI+R͊]N`ߊW\mUkYj|JcDF) ë́mձO1~s$s 2LQdJsY 6lfg1: Eؼ = 5F_0xk 96L?q:!K_L) Pޠ ӭ !&gO( ?u5NcMW=z/ `,`qʴs)o+0}p~n09'/inm[;ƇC]U',%d4TJ}fl=~,CPf+4^d5Fk<?bqhԭX!bz*ۊѻ}!ޛ\Ͽb&.%c}z6<|r3j{1}]Cw0Y`L#HL?Yob$ !,]{Mpbzo~znYT 363[+X<'x KgV^owfRvw75#?RFKӧ7lrlFyԛRc6l`/cr%P˾X<`z0S<1z).b8?I?l$5Nc 819qTxz=Q jQ^lW0:{b`)U,/ݢr*͉=s:hbu#4@cw2:(Jbv{O+E ؾ+0(q3/zu-[5^(sS Lo~Cg6nOË|&'b80$j>cy$tSx/5ɚ併nCS'߭K Os]cZ}IBv^?K "}P~K{{e7XlF 69w9=V%y2Ժcڂع] ܰsmRS祈ScX<%T\a_kdٽ˟Ӱщ"ard eL8lo_ 0UV?ubo-F8fujaEdbxnڢJikiwҊX5ľ| QW1YMb~dÏwm,cz7\V>oU B>R@[rbe> Ңyy#X$5~3qT}~7G68( !Y lgOZBP/|[ZaSb7~몛7ϔ+G8gsm v +_Imر,޻s{ob'zk!Unp*݅<$q1aX]]| 6_λod?u{0-\~~%=扒P̞!I`~S-P.vٛ_L+ܬO{%bv@3RHL1vn+LNw 1zv,Ob%(& ?SHo);̮Bw6X#T: X=IeOQ$f~ON73/sj5V$Sт/*8Հ<n&Å*q|k.>#Q%,8>qRO:&j5; /J*6cNVU{ "!R*AɳGf_=!D'Fk3Tb }ց՛F1ؾYQF`Qބ[;Lb >u*@mwqy`0m:ZZ_a}f[o)q鵬$sϋ?PvfIz /hڋwr2gUkO՝ʡlT9ύ%`~~Ss9L?٤X=/):;ď\懂c7aN٘$N5c9Zl={@} VL-0XǻiXSSrj1_ p ש/}q]1af"; j1̔S+71~]i vj, %6_ SSM~ǁZ]Kxk:0ZE_; 3F+>QMi8"qZф cqyL/e T=;彩vPT$/ zVQyׂ/NO0f=iUY,0D)c)菭HFo@!)Ib9lC3?ϔI3T^Ӌyj5£90ʫR?1snmeOULzfҴi̞iB/va e 7I}\{#$_Ϋ?y;K̺;{0rߛ,8j[9yj\'ѯyH7 j]pcT;eIۭ1B\&3v);Y\Qw-4t4, 뎰ݭԥDAqrc]3ۿhRv7/5&/GIMch$ x-#2 M\G%v3"`Ş`{cv@یxϻh86 >c&Iޫy@a~! Χ:AA@*|8 \'vz!cEs,wƤumn^˧]%a9C Q&be#qFScWgι}ZXJ\ 'v$څI`:_%N6SU@+P4H(ʮqdFZ| ݢ - ܝr}قG\0cp '8@VsVR=ӟ9ZBSq8AH+ +#`L=bA&Bdn٠߸05pxǁvˋO@;FJ~Rfi'|mzܶ?(^ /+;Ӛ;\׃GC߹Ӱ}7D{7Z-qB?pMyHʳpBEygJ3~v,zی7l(3TrP h6z U XU/uw}IK 4u2qM”sk[7/5ӧ8ՆA)h G٠ڬ7T4#H"z@`鮿qiX]1 0l՟$Zr_qePK XZv47|\7WrЄc`k'!2rxcdZY6g6*~STTޛ{A}Fwi ^?{'{edZna'ݲ\6㬴49Oа Li&iW{q4W/TClCnq+vxo p>f+LdCvЃGQuM):q6busL`Ζ mM;T>3fN̽{N~3YA@|Wvsҩ Ì!V R=RA|U0 v%ObOTft&i3`Z-u,%/JֳFb/UFL. hLY;r)8 ?OKxkHVxD6$q\GZ2^RV Ǹ ޺/PZC!`yյ^P8i 8gAY}QWq/h3feBpyO+G \`[*HGk@_`* {p2='pdJ"}T MjJgTn}bL"gٲKTSfGiIu헒n[Yu=ACt0CeaT6UR Ι|Wu@qi!aNE u s0Q᭾ȓUc!p:(Iw]fU5ȂCy]/TU]8yvH>@Y}+zÐ(y\eIN/BEP~ֽqdD[aP)Lvm<{Q~e!1YO$s)}Uf(kIO05 5Rg'ƙl1DڗK-JCQyKx">0 ;Ͻ u&ͫŮdyTU7|q ΚmgGaL5Yϸ%MgwK+O f?>,d6fy;aoqsbh+@%S_vȒb_Y\,Ϻ3q~ Ok-0 *h 긾?Ҏ7R:_} K\샏:"Iٗ"I ހ6vIU;k X%^#ɒ!Lˀƛ"uJ~wۦ.ɩ_lTA?ϠE*C 1rYoA]Fq>9WX[hL<@pT'@n l۞Mzޕyn m"ƃ0 ,]^'Dvw,&kӝw8\.TRޥoq{V9Xͧ 𥶔8U<}b6,]%EE3{׍/ˀ%' =ޭ.[e=|"ŞFrߙsd;Z '_qKwIצ *zW1EP3YˡNܝǠU7;䜑Y= v+Ig]7(u뉯냠N97(v7^O FVNrp!\}hMU.fhܣH٠=QWuR5|Hp5f?i'u1 PF'Hlr %%):RO׃/>6 uƉ9kvޕ' .5T&]Gc+ 8gn4̑W@?̄3o ĔRoeJE/ JF\pL(uԆX_'6AHG|NwҖ,R'}Ucd_"\F +WCU@j0𨁌+H166@]w7J]E>76([/yp\bnݺ~b+hjf\_P {;0-.nf2+ت F?;U%q3O{asx, &ZgFapjzq'h0$9?}c۟A:GgJĶksnr>nIص2nqW쑁ɟ xapC;^KoIV|Fϗ8ƨv2vm{l r%QZsgYs~>w$\XG/K҂dН22܏μ_=. /#oAVLqX6 RWϊl&:i$qT&h25H=Z&-ʠu60r|v$D~FҔ'77`_'N('g3ҥ*p|k)q>N,Hus^ ̔'z5Y5WP1=)g ѮF]'BN ~{9l|r9~2^[H;GF S~;vzOpۜṷNi l jRm~g'\p';ұIOtp叹#!(V{Ƹ $~Z<;q 圿# )nۜt\̶`Ӥ,qf "KTC#rRaCZ2`KmgOoz TL.*iOFRj5'n`| S7rM勎ε?Q)e7|Z fDwMm|׭Ag7寥-٠/B} j4Jo  >^D)T^Z^*+/k xgP&>uv°&`&lޛwׄA0bLhZ9AkdvOp11\9Ь8>8r p9%`6 t?X 緹.:3(栵v|W+դ[<@+0Li]Z>2'Ur@\g6ٟ70 ;놵dHxlxgXQEV)[YoxKEh{Y ^ ?e/ q/7y9:ci|.< 6?u7׉ !ꟚNxm8O@n!@ yBH@40f&]VI8 {y'r\_L؄vn~p8gXw\Lbޞ;ڶΠS'4~ -xҋ[=um^cd= s\UWuQp1?Zh\ۃ.9.dfS<ډXD(jd؉N1U}x:+\y?lG=0z ^W._2c^VlDɭ`@6YTV'rτ7}@mȍF %?MGY@wWL7o@?=\'OЪUz?c-< VUuV: Mj"g6H6E%ЪN1.L1y@aU A W Y H 8}e`Q_?xb^!]L-`ww0T޽1 2O~rm9Ppg#m<?-u}@+ulhN%rˣ޷Wk ~UYo6X⭕I) ]Or yg\&e}wqm֔[:Y[[cx'EB r8OC`gxs<+GX-0~4+Xm 0I?_{kEgX4Yv"I*񷺓4 j:t[ v~7jIf8:''ڴb #mhИg ί ;1'w~{ s4_rnX6; 99ZNi2, kӀO`}ed3 XT>CR l[B }ސ |Z!4+n6Â0G\iȾ\Ӂn&z^|;) &߽=3}^Z9peϫ>v-k O&g(y|GXq> ҧ/[l`Zc3#~k~TO/Eh18{-99%^rQXsl, ޼:K}sO[lwy}*g`p6D ky ,H%#Tʎ ykZ`\&>;^}03ߣOף1?#Z pSO?AKwxwڿlv06ͪl2r0k5T<HgZiE\ . tyǀ̩m+5@蕿r-mK8 P /=XdEіn+~0%*t_.2;BL_䁉ŏk{is t?с@}`#?Y"y'#/zK sW/Se?l=K>dR%ZKU8ҏ@wwH;0`^j(oz d]RE\)(ʢ;σܵC}O@߀ʭC ]fjPA lW^pÍ &C\POX!וC0޳Q6(ɉY^0 L /ʧ9ZSysott td}oɨg]pٻyfff/D8w:L}\Pug^Wo_mQ1mnx^-yO<Ie' NظTtfN<Af}`s&alLNp8ѱSe~^dxPK?3e3S^a|p!-"iqC/|K|7Ǹ&-tvj2g[1)&anPK6 |.iYI;mkƍ) =0"*&}wk=w9<g <ꠠQt0pxDAir䅪Ǎx9^lffG\.]zTTVL<S7l=OsP̆'4ZQ=y{[>~m~|nz%5TBXo4xv\2=`cV']uÉb[0P= h }h;ϥ;̭v ٛ5,τ8Ur^hC+>u@Žzlvϧk+tG傤ws`ykp:V&ܫCG w/02e.>;EHc*`Yp<^ubc_ &@h|\3|֫`ޫy qhlg1kji* Xi%К`$r&*VN{4XZzLwTl̓{{;Kx'c@p75Ci6NYP\|kΊf@>(ݘ){@-y`kXQPP)iV\݉,EpmI h5ۋ'AW0"b ѐY-{ײt D ۅ)֓[>.L$r@A&ϵ{܁`Is+^?l:`8¶|D`#BӂI2.#[*HP]֯/kW"Ԉ̢w\ y8 w[0;rɽ 0fYצtAtu/Eoe`M`KfPk'pc&pHrW i^[ COU@7d7q2)g:܏Qqla Aˏ*-[wVp]+񓞪 x) H`z3➹h0=q XGW]~0DufYNnHHoov'ĸgL~D،?# 3A^CE ީF'5پ/œq'f Z@9y$|)g]->17[OCBICGP-8>zuc2#&N9s]-a.́|G:1 E?_A٦;t/T N/ؠ`on?߲ A{,3DSp8tR߃nFPP$x 4o,p:h9:2e?Ӟ/u# o*f/,WFv/?(T \ ҡ3*3B{t+ǥ4pp%WO? 6<) 9@j!|}w>_:W{,A|"\$?jL7nng.S)(_tD~C++{q\ YJoٗ)LǏ̝FD?eu44KNxqP 9&˝.l!'Y 4CJ>`!O]|[FħkU8dh$[p+ҕ:Ifk.VR/T(yǐq{F?8ez:V?7|~lqs+ܠp6< V :sKTT?v'u@QJhz%Pqt+YqiEƽU `hrP73@ Ԕ iʡഩO9|1$ J~jYE/l-EO `[pSY;Lz0~W& C`맘]0wL*vi-CŴ2@ުYh %8 N*2F}w"~ێ,ޮ= `6LW1x:p3gA{a7n DpRο_?(N Ɤ/J|c0Z_8۴L[l;!}bMc>L{Gȏ{ڐ p>.GRj^՗Dwv JGσGt(|Aiïգ3(OV`.;IvmҽCw>`򞺾c<}!:/뗙냷IIq _|>vIl| GR"xi%"C 栫 b;wQЙSp ^j<(u\y0OLBݧ}jyZ_]Xц`$|,M„s@OɷHydcaiu{q>\ޢ ,+h`%I'8k(="*YSrW5Z a ca;^6.uVW$bc`źқ^ UUvf0;erQ/h:JH *> :ocuk9ȅ׾~;DWW& 籠{+t: b7Xy1x:FlKu] s FWO? `>r*j<^pVy8 O?sxUF{9_cNk'p0r&ptE"*Nw{E?ooIɻ;y)G3UID .Z,qM v  (Qj&g3E}cSQ]5;>36 W^D;>z昈2нti )}dl!X g;qg̔7%Q;fpv쥫|@|64znF򃷣`4qnI ҇c K[,]/{Td!zlӫ KbF55ǭQVb΃u&_AnHoæG8=R.% idʓ\:Ģy4e &{~гe?bv( `LJnIoU"x1llom)8 `RЪ9yu%K0rA o'C~b N.I@n5 ^t?,`wϪ;]H׽`_ x 7 i{`ksp&ٻ( v:^)Aсz $(}v:B0\[t8)Wx oˤk@u{gmm6\V2@cL0Y͡CJ{`ҷr +3ˀS-0gt_ ±#Q-uw-Cp׾*q)k?:CɱRpx2(ʟ-Ð8:i+no٤_[} VN$G+8=y/V+=Hn"K6io=_2_a$8:z8Xǯgs$:;9)?&_[-Ml5v oA&&N[&,/1vUoZ,oә9o7íddN|Ba :]'KaeIG_"7?ۺNp?(3_iz=5wٕ_Bi_CK[ioDdm6>|6VVg{[oq;{mt2"?*{ZBvvM"rQ1qmq.d) [S"k(U_{ЌlR:ϸ(hF/ɡk7VY+Gc/?3!7M""{sr3ȩ_Kι񇓈%uEE3mD{gFc"䕳QmǑLv:dAC.d{pn|=_)#e^ߣYwy\rpm4cz{76J ;msu-8Dd9~~GB؏"j^Ȫzl͙$y} O i^sKWo}re%Cγs]Ƈ79("?'K&C:}N6.FU½9O ;VCݮcՈH`&; !rY,A =ds#Zvr>̫\n 4'o!7keNInUOt3m)GIUb2ȩ4ȎuͭZd}Kc$riF(φLr<)t;=u8n^@κ?ՑELّӾʕE7 9)3m>nw>rc?{UOٗ]%ؑpy6rz;pKrl>3o$ї%]D@Ρ%="j?p$r: Hur;9{wI#ghH>2l{ZPMoD|ܔb7gvZ:':W4!')]suy4)\a1iQ@s]~Ⱥ!aF&dG.+/W|ov!1I`DӴObڝߗ}~$伮ٞ92V\Yi%d{$tl8ZlGcl"$ @}[߮R%7_1]Fzy2f^D]ōb4D#+>̥>`Rm,N G^B'F|)stU+"|,ˋN+"+=7{#[FDN2r;p?"ޞa?H:1>+<v>>vt7/^Gڟ*yY&UTzҳExr&O+W@d١D*dOw1^ َ n'E/F6۝[mW,)=IP~O+m(FK9AbȾh,oõkW"RJAS9:o׵ dg"Kq0k\o.߭ 1nψ4R*H"MLٰƇ^8Y)y2Og"Gg5DJ5-e>wܤYE.oc"fA&8ovzyeZ0r6l*$la{Ad5 q~d!Ǧ1$*~!Gd$Dzwr"wX49"<` r,?^8Bʵb2" 7% 1';ȲVA%D%`B m +Yl\/6Jw!';cSsxk4rvWOo OForډ{iUKPAS&_<ꟄƟw%iOrܵT2OcQ89kD1c"$ /\ZC[nVaFՎ]DdO Fv;n B٥ۈu~{dw/@_F&|Uc3ӰD$%V<r%92DWisYA൪^y9S_C$|R8 f)3-C^7:!+hH+Sdnvc^>"Rz) 9U:- r>eDDY-59)K+MOφT!2%-lzFE18dEnR_~4"Mv#|]0d`Ǘ<_¸?Vݾ /H_2C}el=w!+BMdvxO }g`6"zLf  VsYWM}l>٧92?Fɟo|˖;3s!/ַ*vm̢ѭ @NZ=޿4͇KIqDDx9cAW!{"fZWsMQׇ>O" 9g?lg,i~7ii nXs:"V$C %UQ~+]x@SDӈ|9$_ nO.DBݪt#(;d"~ tl"_4bȱRVt&rү}9\Oq;j " xkp.r#Oꉏht!©X%d_BD=囥 W~k9Ӿ rX'H}\s.!{vXauJ?YXY%ln^ވ9NU&nb[Oy4Yg>4ҥR?-7ӞK*"{" bl+."+لLm+v=DiR"m:bP-f9jŐ-뼦9;w'rm@Os"/e|;DgC.#vJJ5X_=skYK OS/}i\Gv T)r&VҫB?IaC}i3r7]S2,ĹFȡ8i9}A"Uol/ȵ;D6:*(|S)^-4suUdj.r9N h8V"p}O/(>/IQEv'?|a_ǝ5A:KK/i#]h9"4ԷP!>m9w~$:!S>cW/wϡ(GoWo-!bZ#sP+ƭAzRJ_H,rIL${|@.N[@d?O6fqk*/̦ԅڤK&xJ}Z; ~>5P0rZ~mi_8OW?咞!y-[搣|ݪ+V*#rQ6jioz ")2ړ_!nUEJ\r.6Y*<"{#} ]"wbENiόܚ1oG]3rTYu^D+1Y]Pr&(ѵA~4yM)uQ6|JZf2g#ȁo\G }[0E"ݪ]e#GITGgKCEbNĽm.e+u'"yڽcAv 792 9SJZ.CBD+xdy[Q?%p_؟N߬!PB4v]8˂H ,¼7)bj!ܕ}WYD:?7^pnLģ=Ŕ(4+|{mm?0^GY_a<<{!wcJU18*KD[V?#F`k_m=x<.w}D6R)G|-\‘/veDWNs@N )}=g>u#&7qN#r[ ^];%{!ڛ?ۆ?XʧlzA`Rdǘ7Gj@\/i0rSuY7J-7ȴ)'eO"O2_Xˣ_}ӾöpNoEl Qi;gٳA; &sJSBM_Fܭ'(}{֟²|\.irg Ժ_5N˿^jlD"%NS7!EJ]kg3Oȶ-kc3i ,}gz~!q{~'~/D^A/>ZXe}wQQm] "0 ':%oD!W#Cr[@.gv+H@+?Dg~l5*wxVD(dENӚbGd&7[s5-_En:cvG!r m{eT&"^Q*A 󂈤3>{'3<ݠ &x揻C_쨽r Mꦕ\!Bx'r=]rXnԕ{JN"AJ0Õ}{JSȵ(mPr:.'"CJ:#Gmk?Ƚl*tuADzm5:D6ܫr0)"vG߾M>MKkKSF/?)#  ]yZƆ7>2* 2+Ț{[- d(/m.Ej_nݓ&nl>?Z[rt") Δ"ֳ4˿xvE֏τ=ۄL@SC_!nfH! r؃ܵ5["׫B*r9ؤDϸ2[^ٸIh! M4|퉣˔:u"D;^\l|y HNH|uXUOZ9tri%fYdTrk?CFBbD]F]ey-^d:$~'=,hI>yLktwSlLj$ϟyDsГS9x&##g Ϟ]_̓DnX\Gȸ1䞅f 3ȯN2!ی=\Agd_x| r*o&ЀFv|}~aAKNc d}ݭGH/cK0~i[bkGg_~998z_.0!MCyEXߒ)5I>Dt/<9Jv! /-)"h>xd ҹ߿2jE5K֡˔g`sdsRS8SRr ?k;3 )G=kybs)ep ȾrWu~ꀼrR/ ?NUrg&rH:DRc ;8+?j 7+/ͭBcNmn"ϔ3{P꬈s}7XJ=sxۨ9TKqZ|8SidlһqR9*_zC~QȎq"{(EwGi&5a<gJ-r- ٿKzAO_[ニ[{>#[5_ىȞN{M|SZˡT_9fGڡL6DbWeMmFd#dC㸽q I 3A D"V<0A&Zӭe#_DZ%f↥MnJ=me=Q\Gy|e|eFBNG#R㲗FQ'|rٞ2n9f1!B}Kw|ͩyJ:}=rr U=0d%\)vMz9d''RчODS E9{1 r %Ƈ.Y{d.SBx/Os<;w=2EiqSzȣǯG<(c$ wOE]Npɽwad<ul,.Dc;sA:G(,sw+"gP7޽tף9sJdv)& nk3:"):SLn\9.F "!սQ .0rY89ʊ/1!w; wm—[*Ŝqz~9rr@J+ѷWD\)+AR\.&\Գ_+ltw#”{dJ@l\? 7o<\}K n8N\W@1du^[ 8͛.2Awި,uKv#0;[dH$mnPaoFV GAq`&h)r q`\:LlNHw9 w ?h Y88y(Kq#֊0c`*TZGӮcr ῿n"A3;W R!@}eɬo-]Jp]y6g'FXmreUؒ[sc*=.|<) h[d&hFsuD0]W@dS(;-#>=+\Alݿ;@5++L @FR{5 Iʢ {@3qnxK 7 :+v?Xgs<{cKvgrYIpRGL "j0NIGX! LtZk07jGoHJf@P\4l {᪯? 'WdϨ55/nւ #AKZ: ^ǃJAB.l::Dl8'9v Zt@$=5&<|>>gu=Fut=!ҀX%CЁSתBiD8:/}* ӃkDrcFט!p(eMQ2 t!,7>xUx5g-G|MOO =kum`y(xOv0 T "v<Ҁ1!<HHW+`cbtV}FS pz .U,2@܃e>,?㯮ώҶlzrY(ZN(s^˒+ӼY޾{< M~w`pek,e<= +SqC`?)}}MK :wdʼnӝ\较[K[o)(K+aHq?f:Qpq+۪ ^AFi`o\s?*Ӿ󵔧z(ŁF0rG|6HE;\ѱ'@Vk|^m`c`eǮ4/+@k{#v<4{c vu/6r[}eg)m嫅kbJqxnQ{l 6~ǃ>#`7sv Xܑ|{Apr6ofm<:쳔 ckǨ_kE]K&oBsB:[ٳG}BήgyJ c˦{-fWeS`6G`>! 0Uo)|XSӹc:.hdJAͻ3BA-d? tp6 <`vjQ?lDuK o"~G>~tF(iL]O]]`5x;9|V5HrFds8RtoRto`y F }>Ǔcr {57/TG>!6{XWeCN/ ~hΖИBNMK)# ^C_2SqnYtY`,f&L-{)z_Om}* ]kB/AgoHmtDes'( Pd{]IL<ُAWܫ`T$,"?s_1bv!ĀClc7vjL`vt_}#97O \rΖDpвy:rv]g+iކpz w? S5 ;t:H2\Ŀ[E!S/[ f λXd*s Zg3AKh*'hI[ydse,A@Gl:XU 2AO8Nyu?=HO,Moދes`gZszH{:;bhF%NgY~B)SI_yV@hsC o_;8l\9xf׎Eb:4MtPQJ-Fa^ vbqwNo\b`6iifӝ`TN6‘B3@aYr~픟q`+FPrp460 d#(SU`)QD5}p`]t,57.냖:x޵2V`duPKn58\_ j) _ˎFKJp pMcw:DF.olWK7KwF[XOX~ *\@{3^c=H.MxX`s,=\L?[f]6cv=c$ p*O7΀ŕj~m-\=q^L~峃rzк3 򾮕]c)E'V#>1Zr"S nu)sْAir*glIw\&+ю=yx]P:t!st:*Tj?Gj= !ծQ`vI }*? rN\D*s&ڬC.{EHߘ ,~Kc1́[^?L%URt}xZ}NtYuLIjw\ɜQML_-O:;I,[vIJr(-bRҭ}+뵮'hn`,B_J*A93H8~00T8;5@)(.R~&*y@j w0:)ưQϽCqY0vU%ˬYp1Ծ%gius δܗ 6֏-ӏ1X糇|rt2l;e[rb\(8OƁ:[XMqq䏼Xe \vr? m_å%7np]3b! )ԟ+σ[Ę0-XNY(NS 0$"U$X)}b֗6Оr N>{z>pf0 S5w2/_ 癛`t<7x=*ܺU<9޳s v/"/]J20?LZܠkE xP}'XZ}NtmH-G:OɋqcC`R2 /7qຍ^86 W}& o/sy)pբ? ^\J'j ';y"5k|yRo2?L>%P(Ժ7hK4: !nEUB@lTCww7KBB-P DQEw{}9s{0>~0kA͒8[_s?M×7$w?j:ؘHcY9BG9mENiȁ屏~f|OX]1n!N6ZGTB/D}FqO3juFa-)7 ԫuN/Q8}='{"ڠڗYSZvLgwSOh %YQI5 r u筛@*7 5$ə6^&drL`rܝ`7( p3jbC{ݔiZt? ^ R-jxw){$W_̔v:(FZaBw3 s]EtM}+j2mԖikHblƯ: U|bIv~r`׭2P>3<sꆥ+Op/չǐ+=ʽ ͝P'۵:+N.`~̞a+hЛk.|y+5,/ 6C>Z6O~~M-#^~U7s< [eh@≔L%r]grr4w^Q5bLWCXpx+ !E8G5^ϛgJxh+)&y٠\ *Q񎄀0m| &|&s6{nWhY}4v< 'u@LY+B;51 wBg;8!v_@ژBmqW3:Phݍ\W9y2FFo=5x+4֭-ZZe3<*dAWHk0޶{_Yg*JT?[n9N 8`٣vITq;+kŞ[s%! \` Nm{ef\ }iGQdK868>$:l *]$dV_J߅> hTYmrf/*!&d݅%Ձ~k6gJ8( INs\?j=Ya#$\Ib}8wdVv> Cêh̆ݣQfGrƇoI91XyMQY\>4s"|Ǚ%90RzA^7݃nTP4,xowv,c/ß)z{ yvP>'$vV8 մ€e˵s pe^4V rwfIb#ؗ: ) M AF߾Q{}F~"eStRE{*˧vN!sRr( 3W|kʓ0[8vBn?[kle}I|#ܬ 악OGU[10{m;;27+vٙkj4l-^|B>]2Vk[a^_ S}ּWP욱f>{Y$4ؘyQw7@E{3G\ "%eKz6SE |}'#SzKlSύUzmaLm!J</hL^ Ȁ8co/BnsK;:~u $d:ʛ0iȈ q&}#t S _i [ç[0t SţbcY0鱫o CrB ?tLUaD>[+`Fu8Pl dM(a A"&0u?_6B7וR tl!n /(r}xM;_ϨRkG6#vAsN_L]3wJJdkv:9"sU,f[vOls=\nq)sybY6X5E)#9q@sM&/)Q}tÍnPuM{s?\}o mZ^s攳 QIdEBG>O}s퀪\y 9njsgs3O8^P9*|OH.Br+w<DEQ)2GC *o tn`aRl dE09ng'שv |n􄯝ͭRwqtt8+P~ Y!2clvCB$ψw4Ezi4ewH0 s%뾃~%~yGGr)|~ cl xw7E4w+LL[AQ30s| L$|W~G>w+f@G>9kݺf10CmMve;8iݵnMH$2tC}Lro,s t݁CX4R'uuS8*fx \wzw͇ߛ\Y(j>/؉ML9KL6=gryNb3#wBs?5>:HC#zR?qLF"37 eOF^N`IVߴiX&8ۑ쯔???? hν5D8Ԅ AO{_48L˝XfXut tlٝ%Cx*l VLx&3<8}ӐդS=B]{a3H RrJUߵO}^2>*Ii?dpwG}74{w T¦?/d~>=fܫ.5g-W~K ÌbU',Hr[J>gh5|6rZ|Z޳~wk+%M WXaLx2} W5k%Ɨ?y4(3 O}C o1}z`[ZYЩ+'ʒ_ 7].ac)_nX^BhLbq/5랣;zZ9Fa~bU>z;s%w-a6^Ő /Ea?[z v";V>kma[qhky-xsW?^onX$oL]ҙ*'Pvt 3 +y H >wZ!k`y򽛃E 1@EuzB:B9 qL}\W`w@] tNEleM+(m{듩,Э6Ȯn3пe5\l=92&jBB(aNTT}Vҹ* .o=)cں[ƤsMQ;n=Rs4_䞆DTy~](tXZṀz* Ck&܌ #I*W|׍Vv!h? z'\G@-L~O6|86g,0;w2]w欳$С0[e*g-ѯ[2g;R&6՞Ui\|7h0|W5|&vy9M"<;[3Å+D%9iŠI):sڻigx"SQ)G~t!+ZzS|VQ& n"ofA!φ`7͞= ?/E_@񃝍N˫ GI¬W.W /72UgIut~^W ~aVhKֿ$=ޚb*"[SbSjXƚdAWݖˁ2 U`_68v힁Oס|{ #L_ۉ*-#kHAZ3Btawl*t9$#/O{NW /Zp}xa~Xo6AKၰ)]L`??XgrJab̹$;4-tn.< 3+W좱Lf ~7niylIH0 ? 7ܯ i?5u ,h+~eAtVK USas$~wca#n?x#-w^Uc7Щ4r{|OkUߞ%T? ;((% T=&b; %Uzd d۝ׁ?s;9 Q⁶iLٷR6bu^u)іs(iʐ3ޡ˔bx VmǢ7@W%#IGcò6 ,`\z(M7=FlT)ۯ;Pb m֫__w&\&uwl0]7>w>s)4mU;ˉ X[tSkO_H\G8FuYaWk:fl/rh6XMmpQZ7ig9kcR&7F'ۿ&M,ث~hhBgn >9EzUʡwa]x$t]7B[OW>H͢hfꔘGnhb67В{C7,^- Cyd:Y ĝ(+iG)HW:R.?b0eV~U+=,xG]gUAp{vu]8׬>] &zW?DgYB L‘U @PLYz”+yfݿ=Hf9s<\,!YQ絣\۫h`qN,bm daj:$DHB~Py64Yiy EDNUC' )>EjG1öai|^EնdГTO1n9b),v&؍dG7:ߓ.>Z\n CcCGah:^T 0Qc|z/>ٵNh* mEGtz6 :;N{Ar';?pF}<46A\:o$_rlyn %T 嬓V)Li; yXƈ.u]ɬ=i:7 -'אָ|d#xڇi쇓AKv-rwvaSpXᯔK:mӁ!5?=zq jia1:K{Sf@roqù(g=h&׫yZuPx/۶$=b.x + T^+cA*.Hf]'Ԝ›D5B־!eSOӧ=,CkA\K %:ܰ|2,% =Ydx&IMP .!s-Ϟ-c'r+&:$|}ɽ{J0p )e"3ef?`w (V2%6݆SД*[k%Y`k5"H^@ܗuƭ0X3t3 lk1|g*NӫC>{!2ꥇ~UP inX< O5|nkR^O3UU//j}zпewl1Tk`*&Ôq]7(7 '#w審 ظ<^롗IN:9|r: `9娰]'nmn32>ꇂѮvF5`6TP 碀1ϫcZkaqj]J ~8E.N|қg_0^t|w$)]ütP~^,{g*ŷOh/{-}J>>HYԇ!v+:؉6F^?zF`IM{R\7җMӀs-@Tbnɯ7rd}^r kZ*3ˆW9WzVs5L͛*_TN*Lt]0߶ 7QT&\XNÍm*f_=dѩԟMiB[mIiˬ,2<|whʡqIMm]54IPo ' %Ǽ 3[|,|i5mKSmzB +<=a6s)w1mFO݃_7~ټQ} skYsL̸psDsB%pիqߨӕv~XjPdlwFkM,aFQ-'g%s37怍jOFvWf'!wʞB/e͚k߅дf:5!`Ck &XH>b>6 N?#8`G 5pYh{voxZK~0Mz';U[UpԑX ,`Rr4?&ʱC6P=ShǕvh m%Y`enF"%V! yjq6qCPKS3t/76C݋39?|'A$ӄH?:yǚxbϿZB*ȧ¿m,ݞ놎7.Ӷ= -f?/"|KykCoiIK8R#[ykCEU 2q+{݄?%R{$|=H}*`{\N1=X>W`Mۯ8 { {ͽ }>}-W?OF#O| Zוy b]ѵ%Ysb^[(vƈPh/ !K,KGhWWEo/DzLaL`3Y+[\'d}+gvK?~CӟjY i#w-~ z: },w]/C=ת%_ ,Ams3Wj}-ms>q̂XWEO 1t:#M(~S?ߤk[H<'2G ^ ~/ ,x[d{O%JdNߔzđoFÞa]:K t > E,vGrz}#EtL{vͯ,3BOEOw`N2F9b^W$wt8%!e kJEFUJ>0*#S5 h{<^C˩+d<߼rcPNB=oZDFD^J+{AvD\y4oSDA3"~m\n[KY{#k iy"/!kh@|HWl)$k9Pq'Akaj݄\c} q0t3s ͔4z5A|g |6x}9";q~ϳvWTl  Kw;_Uv;gs5?= BB]B'wnk"4bJ-*I/k ~JYެ|"A'\7r\=MȕRD{~[OT<m W[y= (tvIMxNWнK5%1rWyj |{ NSSE_@4o/DiKyV* Y+Dvb'-W.}ORve%{k'$es^+4 ۮw+/g#0׹OaWN99KqhW$]Eʊ!gKCxb~|JKO'eIy7;| ڕV\ '{)^~MJ4f&)|e"Do k:UT'sg65Dr<|B_EѼK󝄼M)|tkť;$螋%~3z]f!\8*ZBŽD%.R֯F}_Co;l/(o%j;Nb] s)vBPz[U M=ۈ:f Q7ҷd;v*ꔌaǺ(z/{ .B.JUx^$z& ?vr+i4(Nidq"ϫ)ĺڃ$+Cdyˆ:%i^ix'{ǟH_d {G?n*(ٿXqǖ۰D0:rJo;xbR=q>h?KŽ)uaii63zq_5!_H`};71//9^tOI>U =םH_1~]ae>IlDՉrgn z<.X_=in/ļRKySV~ {[knIOAJmF*Zս|9I1„݌u?hq=} KkK0Z#_ AM|CSt>+ǏRZ rwߜ %Kף :DI$8BKl, 5e(fb"oe,#V*o; ui׈LBJl :aDtJ֧ԕ%Sh r~>N_$ @E)W¸"˧l'⡣qN@ms0R .o\Yn~f?ooz=B$byFS`qS_[-/y&E%ìch_}8^no5}%UcR7?*AkOR^Wm'O["9W\ TS荷N՜7(3u/&]BȟU#JR7 1_Oߍ2g΄:%0b؂_2tDQ(cNgDjzJlZ$uձ޳d'Ns+mQox PAguY捿&lw"E3T$;iKzbT{9%2Io|O9hHNt!k'o@ 8)AOZ8gt]GN?@W0iΙLڔ/ؑ=gX`x_U!೹&Q?M_v&za/5{,qIsM+A'"޻2/'kEnQSz'bFi!) 3&겮+oZDS밭ߢ!/Bu;mUM|t{'J+ {$^$/%%>[45}nHdLEDڕrրrp T W2ov_ +!_hJ~z'1Fa'JR]yN[L7-a;{@&xŽ&:!D=iOs8B9g^$tѳ&Qn yyJo'BM A7t*j?Ϳkt|o/qC_3O_㚬yIXX&Q1 I#DŲb^&odR0(9N_yh{d%JXYaG;E_ 0}>K7?'D٥GKGԛݺ8ue=:Hy?~C2luw^!ihuBKe$^5`F4($Fكfs/%D<GuIѿz{ic4ļGKTEkvSR8Z&VW*ѾbPS,;1?=[KV?=L'|Mc'Xl12B鸈ya=P٥{NǼ?'z 1r?PLS B XNϹɖDžzbDQ꧔J/b]ٹ`Jsqǔ\i#Dك3&3¾f, Lv hr>Wp&i?Xl\ A8_בSX(~͞R$$nN!=دŦgNqWQ!1DT5 3eOe;Fx.E襜w37O>e_ćN,JMsqy.`J=~io~V~E"N"S/Z6jm!+ G览#{c?1+Vr#^t0fMy]xFo5)'ud`(6ʷ x_$]f%ӿ'ZEnSB- )rv-%. ֙:v*KϞ$Y3M _Fͽ3\{)_RAKH<+ A'qk2E#j-oLz{#6 Du3,~d9TPcDKjGS }o&ۥ[{xi&mճA]A3S4 > lS uM!|IcAqb{S$O$AqXʵߟs"3kS!XVװ'Իm%~"I{&fʀOsyaO=of ,ѽ:s0 A/K!ڡU &c}Чm^sWb[X9/=u:le~ӉܹwbδGE9/R914_&b0h$U>(LVGD&3HgCUz+Ž85^"B,S(eN(|fdv~9)}ԟ γ,m80o` y]s-5{]Q4Ty"!L%IBQh>SS ^ܾۡ;cϥUkabe ׸Pږf?:av 5<Ԟpɸ#>wF81h$t;^L D /x@9ϫ7U­e>y#"lJ}]xVy5eš5ڝ쟰yˌꕘ„9Qo[< Z[0^l;E&oT',|R`@.W¯>pVfE>;y?_`g1k&Mɽ&raRz`WhR߱'4_O>O| \3_-@l1/VL$SVH~MO>qVw.A{xs wxފ25cn1oHw\t1)+Xw}:73-O7R5堛0kp=~n7ٔ M*OAtEsؚz gg÷ܝ>vc;tnbL4~W@5Jcz:=IT9w7KyjKegGkcv_.,0XZg=7|iiIZ< Su5} aKAXӵ8%X{!۵teO=_k9| ~vz@^SE;xI8"6w>Qg^] d:!vSwd}j0KRڵM۠|ۼ9M[3áktM(.e3x3YAX-,7'hZO3K_ΉA(Ujosh ~xZeRL`{-o]vO(.,5mo7}9ƷS&;g;eܦ`#xE١6F@J!w>tx@ݰMsȻM}{A aV^ h"<~|k 8_G[*9$eݲa$Tb L"%2 %Pwf_ %;.<&R,) =_576@#hmi89O&ʝdemx$` U\DGðBD_q!zK#$'Ll#j7<&[˜q›& >^ɹn :a(hAW$R[В(lzhCZ-QIz![렪t}~sL$=<W|o6_{Yhπxq\\_!a'ib*wz$@-iv4r놏''mP0cL"\Pֿzc)~Vz7Dƅ-V_9>CxYpް{I\iX9nkV]Mtj8 Zf(UsCUcS]`Z=A rچc&P1anպZqXFM}V/yj?`-[idy} Ka8$= =4Pi02iM ȩ MZ>f6ek>_uX gt.>v֨);7iڷ Ŕƿ^}!PL ||TzlS\h#@yԨw_ 2D4Y[iyďa*pj6;(^] 0f&n.bcy{vG/~7(ނUjrާSx6;-P(wS)ӏl)*+/5<̿v;# eJ+䔕yJXBu?HAv1eS8F'f@rH簗SsVHJ3ݡayн'a))xL˗j=6%^`vK b!]&_ob07Tp8ڝδޑ G& ܐQg=" k\/8 1*'a~P+&:|؄7_Z6>]p}˻8h3GmW~_#Θ i֪1t<̲xaɺM-Q0Gcafynd@_Kzr=A6{dORи**ޒ$\伨 W'>Y A۳jU\[CӎHVϟgfnэ?'Jshӕ>yfy<|M'bt`Ӓ>= WmIo@;%$^\lY?AFv&RGz;$mTSƤBdHbU[gpI̲5@"GM4-~ywt z1+~ \Ůa7HLq㇚%[Kq>40~//)BoH$ 7ٿ> -tj1+ rrj݋005c`qcB" Q3y%Um<ڏʽ^t6/9nfՄߍ*]k[:GS oW>%^֣p6;{OZEеA/糦^ 6̳͉& a9J;rZKگ !j[75TnU4kI3ll-˙M6 %;oP\g( iĆ)Ӧ~ZRjNjH)t~Qk.dMHg溊@wWe8& -֐($t 6&_u@2'mWds[e |x h NBHk/dr$V3$.3הŦe{~`-$ f%ù9\-|ngx2 KW ^ƫs!VVz{#@;ODku-W6\d= .1 =WxH6s"%53c/yG,ˬqXCT73Fbt$ʱI/u ~is)Ήaoq: lO]I00<jl|P- ;Ѡ7c/\]V8jX_8m|:0l<"K3ZIEٍGPoxR'ʊ\)K>hjԯ!P 9AWhBpj~7 (0hy™P9W,TStMAG5{Ia#n.^U `|.3hLL@mݠ0x~j|MY5Ìw8MR{4 ^-dj({BV6GHd͉ބuP̴lηvX_:=fMn[nlMNW^<^ݦ慣8oޏv.B+بg),ޱ0W`6R<|~hxO.闓p K 2= Wvh9kbn12vpBv&g1_x^p})ks;b"hbb\^BFXT'Ѿ}=gpu6r>ѷ:d{7k&9Vh[[J3:D^5gx/TȺJam}³U$߷r\g1/pjųGhw "W.׊=9 !J^C@OչDžʞ'͸%~OҬȢ߷q,mq(|Htx|U\绀I޵~Ȉ m}zg3Шسk_TCP!p-LG Kӫ05mϊ<=plQ-򝆡x z&FH.2V @?qлC;Ȭj=}Uј Gfpߒïsc\9ӯD}hu7)!?EB`qu_j39.K%s`41n-e~ iX1Y>(^z 9?/R80αʅ|oOm9Hpi}˖kʼ&iD#I -u0;'0 3eaSF/u% E#Re4}"[q Dʦ.P 18|2U*}O2-BP<(g֔'`p6~8_JFY+ Vb`"wvdnW6X 3  3h޿Z|d=V?ȽX;4yյϯ65c 8h}!̝Hh1J6o@gP-6VEJjˬ\8 my_Rn> 8`pM1>9- ,{b8B~2EyʶwVh.̬ FZ=J-qЕz|..=W@NG,9ئ *۔Ø^C094xz^&e)Иq_ܶBwt+HȬu:2n7anӐ9. RLFڧdu* vAU?9zA1OCa GzDz}a6cWzZ@Xg ::ϝüйU}V %7`qbو^A1WQ& EM`1ҿmn+)R1B^Q vG+՛LwpQ3-df~mFx-x>4TtrD?YO$,-zr> Slk9, GSFryҺW=yCB %$ۈhrLDLbp1xB>Y,1T5B^${.Wĸu,.-R-Z9kz>Dðn?H|zM_R=ݠ|~ޏy7]YHvJŗ;k`xĺQxn 3_ ._O.shY/O5&xE%~P\8hT 4!pq(2V8g* Z?٭@j[MS9ϴ$Z❅lQNźL֘ ڗ@Ft'\$CAi>! }G`֓;m=Y !Йep?ZFͼ >s 0{_#P}ߒ&d)g<`SɊ|Ui;U >st^s9jfp(^Z磢g`澛@*I:,#}W"̀ؕ'.}Dsֺu#baښnwpҮ?Vk vv< zI"d:twpY0[)eهhN:-^#!p3Uͬ >x:F:! ftӡn8>D*? # YK߸W X_6R;?oRa'c#~%h>cɎI?K9pO%;х7^S.4ȧxj!?MQk,}V?o7VQ`}^#Esl7lz^;fνG,~k|uFͣ~☌Efo::t)ק,ǡ2$iӰLp#m _)T ????({k-p ;ipYq';dCͰ@5.?;KOw >:T3Lgxx"Ї=4OR0Bmam~,\\?j"sLһD`:﫽yeOOGnt̝JrZv^>",C_Ԧ-=w-BXXyH4fvjB{p5R561!XQ8es1@34\wbJР Ku}8j hٹ`B(!~O6ڝޞaTT6߰>-fܢI}1 /|7'z☦̲OjaO.aijJe/>C!~hn9chQjv7C7I{j};L\ս:hawL:6!q֤n>rHى*x%a=^WV'<삫>Pw㺦h ҟm!VvO { Z?yBJ d'd{C0ի SeiFhpj_.,T}56 E.N;6>Bk~'aVsz6JaP/yAmeZT:=xswThj~$μg} q!7I7z8f:*k ƿ7* k&@5e| T&X>zo. i\%pl4ME'^_K8}zJW!]܍jRZRyrCxmղ:<"[-’nħluAF:GEs,F߅2B+hGݹ^?_z>>sV'x(we/&; S":2 !0V{x /z+Cļk>, ?f568פx / 7A!N/R 8×T@*29hf͗K7g)yڎ-8.j,˂kSC/0X,X wfW|$mNX2R0%$-}Цk lgWJnWNØ4dfkJ/AhQg@޲c"7 $Ny jSWN%l7ov]_S܆qڽ21kZ_j=G!v9T ǫs-~|8WvGJZl$!fG^ ~2wDv:} v„Ջ6Z:.~ݰHjA3U:O`ƵfVl |ᄅBׄ ~{7@jcJ*ʅu~{Osl ?^c*!OʚWP*a6-'SY[m]g*Wkz8seMՄP,!hsU\hz=SO08u>>I'皢Pwzh~= ĩ»P谼(dǟ @/3U9vMAFXyr!T//: B(h/tO* [Пlpl N/% XϽ?a2v*udX56(uox?;|3K_a¯j3XMs/Exv^.g 'Vj5JrӄrSt wHES0,w-CVݵyrҳO*XK[|اn1Љ&4L/ADb2B x_orߛ={$~_hՋʱ˅;!W:⏒5Y!\[;^8nd| Β<b{;A⵭}/vݭIB{Y5T &Ej8CŦ԰`5p-oe@`lq0-?=Ic.h JۮVyyhx5}@z*GvdG[ǽ4=ܻ-:>nfS9iB#Y Zת=&K|vRaQP0J> {TM`3DcvJLJ>p^g ;(0nwJsmӘ:سo8[m `XSN-`QҔ!g5 Caa)~ڎEoJF s?@mɇemhY,1ʹP-Oo~yЖ U'yb >R s)gGBq_/UX~QZ'a.;i! ت{aheh0(F8޵ ߾,Iۆg^V,o >"qpHqv96Yx>8 G0U^9@S<`L{ư[wf|>CcUG2{7K T%P']? /2 O}z d)ۡɧS_w?"۲W7$KLLj xlaɻnr}xa?ϥ]}R?ifxNXճ[F9t0\>BǫYߟơC|ub.cPX)38lGCu$_l7`5 F(oh@sL$LoI=O8/L.YWЄΆ}r 8Cs(>Ihtobz}E;Ѐ)10^z,l+o%1nY[YPu4;QVӎRԗ4uK]`<7[C W`?5t{S{X$^CϜvpxY}Bm3v%AMj~ϲA#d/MQ?ҳ."|O_U1)[WF7; ={7'_4r0 x~5Yr ,C2>kGW*1XX۲zx CugIvbg>P0ʡ#L!\AbeqgV7Sg5]`StG{DT![V-F,BODى~Tꛀב4[jBqpb ܕ#UaKnф@aNQI+0MU{*K'=BiPaZˣeٔS3pH?nGH$qۜ1ׅ`[~I;.FR O70O*f@|+NX鲭x Yay1On Z[<^rBuy.ԳW\;jGbC l"}X4.;xh?o aחp瑋0;yPnVGIQ]x yy @EqUV".ShYK/`6YSYs-TijӺA,{b|~.fNFS`"OI[hl#cD]mq0Ϟ[4~{n 2-nvX_ 5 {1,nCsĖ#8FBˏBvsiۃ˦=SM`SEԁ1d+_:Fba4a-Lb s\D۶G{g[z N2J/&.-Շا `yP,wo 9 )P嬓j[hM>~n9L8lh%Yebeb,.#]>q["Ah۸KWW g\.Џ!fw g}k;0i5\u& c_ FDFBJC$.һ.A]Ww irptfG.Lfއf.'\j=^P 9 Nma/JJm`X|Q>E*FAVz~וa*MÙg(S;7ν .xl,5:p\Zsp.Hq/$rbaE6lOgWi$gŽ͞0ȢAӂ{נO/d7[~ ߂Lh~|KAY'Rd Bw~A?]0뺒Y-{Ӻ/tn[NY_nGe'>`os[2 º˙?X==_) tڦBk~zx: 6[>ctMb>̀ |, Qzа#MWU$Α*͝'½<^mI{&\ @VW Ӈǜ"U\"N8[197j܅F?}C qlO{YւV>KK*ua99eX<{Kz ܳJsRMN%EÓ$`W͛`%zX\BZ=[N':@EWLtHWz{a9t`Sm=SFEa3g-̌4@APLe.Jl "xs)U, ,K.`?jD9>,q/)/[a[ffx~ 5xIG |״c&,TW|BfeKAܰx$kܼ >g5(zg@ m_\_k b.X%T(>Α7L79%n)JoQoNFT_SAqwy: 4C/ust?juwsQa",NF$ #zgdBe͕}]9](\ՍkmEc&WǴTgq]"7RݿVae9 88HzSy#0\Yf0TFo?o=T;_2?<[\G}}9 mǩC"VtnY?mrm Z)k/.n/_-C[nq4>.#1_gw}ozbioUgrݯ^A7zk&a㵙7}/t/U ;`'gU輻a(ȹm[  d?nꅣ`wJMPm1h U.zdKɢS?`ӄ %\ӖYYdzy9NEC㒚ۺjhP-h7ϑAN:0V^Jۏygg7Y(rk(`$>QoWy{lRJcیnyf־,qrI/F0k=zKW'KQQ+0Yw?\N})_x+ؚ"ךY2Ìvգ[nOθK@/Y%fhot;3'=0<OCt=_05k׈ E +B;iȣu j [mC)L|||m~GDq^m,k.<Ჲ=QhT2 'a"|Nt=/\w #{&U7Xå hR LclzủЎ+ڽ>J݌pE*HKlC|Ameㆠg^nmgr~deOIҧ ~U5ktAÏ5a 7<#_UO=ۜY=#Q 5598/+o\m{Z _EʭmՋdv W~ |TKByIzU +`cd?{ C}<7_q.{`9)BGS|<wSGSjvsqup<:`n_46nzwإ_YOrru70 1?KiW#B Kk(`mG?o&#io?LӺ"wk_ۺF?y%A& 2$eX?Jߧ7b]_&2ps1u_ħ'd`c_-F'W+GSS߿=j^[7&MFt{(onQBzKBսzM%\Kr)w%HGHIґz*H)5wͅG?$ٝ۩iL=6)Nϑ'$Ѓ?F+|vlyէn>i$]y'vCrc$z{gG6_Gb'ohҫZZFF|28MI;IoJxgDlCI-)߼E].<I]E(đH@ոlY[]ދjR8d8BR@5=8n_~8 lPUс>h݁k]Iz=-Qf<:;2#f-I~殺xYL/ղq6 Nu/$xyƁ ?#ge|oؑؿJIbkp󝊓wAv!c7:$0p݅$&#IkE-8Sm%RڵyYmNE~OO׏$*vó$i촣+Sܻ=$J֠gWAU$vE?q[%$Ʊ13bGt~B"Uۏ?gIVܻ"Hg[n :լH}ڌ5 xRČ0}Ě^ooHgڞגaP5.78 /i˺؇L;qԧϢ kA]]*i4/%.ƝG )q],L]yLyb_yLGM)M2o=:ِ$h9I>_RH\[:G6U0#~S8Iz9tF0yCC$9B_)$bVܢҞ 05>IsgoC+O>-r4ugb{|pުڹH}ؼ1$njߋ뷉]_bK.7aCYC^ʼn kbHزn "ζ>=I-ԱwH_], ]K{ } q78yvp3W&J-~]7mGQ{EkO?]:GR"FO $Żl'Iߴx'HW '_.*==Db_ P(pd鳢۾V^#qc?XDOkm:c"g;t|Qxg#tLtNoDt?-C ^[ͬkMzuО3|A-8H\ΎOHJе?ퟪ\(G뼑U JvXcG=i+[H-AF]?$n$1olǍ~m%q%|K$aIzؾOHl !1="](}k\$?'R o-REZ}oG6RfpP귆_&Of;`r8Cbr-|[ZuwJ& ckD%һOiW-X8⚭iޠg5o䲈Iɼ:LhOUwe'o<|ڐT]nԈL_yƶ#ĵ֭>! kkNp/IO**ҩ-ܭH\v4~»$i/k95'LyI l\@}{Վ$nh}%\Hu7?/&'r?"Il58Vv%u6Dxp?#Sԙå_'e kO"qKľ%_MёYL3s+Ú}>^ӥ$U' L}I|;G% sĹzRA{f{=TFw~JsOIR>Z UfK8|@6?6YDb暗km!ǟUEuC<,! ?q^.K'6<5EnvgskzV㖑Վ{~+N5;BHj7yw퀮Dھ$NV*$P{7&o -?(ITjX}ZܡILӍMG~V$0̆ItڼHt &#)%%kp5/cߦIuIJB;~Lle $o\q⮴죔oMbPΙW+N%F.jF&֪4kIb3M I3.5FҾň{1$?r5yqgZ•$n=y ?ן3cgY>1q-Z8E];rg\muz|t#E8״A<ou){lrĥr8wyR6>$7n9$/INO-B={F$qUI*y>PFס6M2I£wHkL:8kjI t ]|h,]rKZW%ĔWއr~-arOXwp 8wsW"m󇭏8ObVܜNWۧbPs.$a#Z~]8hZczq[;C$}hmľ*MHaqW_\ };I;==2V'Z}?CV)v"꫼nd_~GfU`m2ṭr$َ7?ӎwSr~B7Hb&sڨĶύGe'ΉHclep%>#{I 'Ms}BJW)}dYI폛 6]~4m&=sYevpպEx.$(48s}4 .w\t }=yB/XYhPJ$ϢV:e$I`{plLo}mEq$1[7AxَbSyHLV^=Mv3[XCmM[̆刼yWD\WݮI:I"w`qMΐ߫]͸?y[ƔxQ ljt2IiG7I2=?7ҷ&Iμ W=GE.+G~$i}ސĹeZĔ$~ƢeiRzĝ$ar"ɱi1({q$i|HGRӤW/x]mI>Z}D?s擾7ZZ$b1Jϻē&aycٵgv?]u"EIOf.?Il wq{/YlμA!49d"q kx`r{4=6u7샪oFhWNˉߩ)Wݫdž/uˁwe9I_-QN|b7i7$ǯH9C\3칾ܷiweb;Qcně5s{Gv1ϐ]E ΢HWy6]7 ݃bS1~~|dBW6$5R=75?*OwhO/0n<犖HT}$ܡ}c~dz$` O6nΝ^FzéuIL? ?qI$viP߶^BFTGԪLmZkv(6`Ï%J4% f]@jQlWbW4 [z&L&aU/0Sjw=ıʥq*_m~ZZڑu 髞vq#է??& >)Tʇ!݇ ͺ׮(t go}RNMc4Ԇ7~ԓ7)3I}/q?н$iЂ $$gMO"K6$xg +{p$et4k1n|i^t?3|ۭ+%}ni}I\?G=ޙ2SQ}R ˟\IR Kqu.I?vy%q oG\Շ\d7IoTxӞ>W5ˋHLϖ"OlE;jRg,\eG7Fw-I#ao|-zO\1:2er۬kzb%Ս3_u\vmL=kzyBb{iWI̮ѷ[Ώ%}Pboә=k:>!Eʽ{$UZ]s;2F6| e[gZ᧷] |ɒ{SخΤoXoNC\ƍZ ӲQ5-}z\ĭ%w7$ ZC󶹾8jL^Uգ`~ ;qyP\{ %I79IRg=UhzES~M $H&$qEH#s?b9/US~zJz $w{oޕ-ϖۓ[;k&*a̪c #Ihpd"-O#3f}7ȳǔ?nG IŕR˒=<8m/Ǔ[7O#I?:}6q!8+${o|$5m'sHʎ"NAbގ8Ǡ$!:x7KWIl*OK{.G/>!''a$vֽCAh5z'boy ڢNSώBbWVZTha<$&?,0̵K7'1K2uitrbg~]$yywq I6Db6~{֕k+y[&q#}UOv}=xCff︞W' -߿0ILjVwsI$y. 5&Χ7*Hѧ0N:8v$nc\3ˇ0~I\p*!k}H㫥]Ir ;V#իǽ~W׏դI~f}~qI #'nj' w0:4qvtEdY<'gYC7~Ie$QWsOg0JY{}!urjIrw/T?KLo+ze3?F-v _]x~|MZ9_K^&bwƝHަ I\늖Pk{n%nf#b PP%/;a$dh9d#ypѫ{$mFLIb $i:%qۯ!:.1lfmDctľ,y?ǎ=H;,,FbWL̇H,bZxǁo$k\p$I^F|ֿF\>ju)$o7~Ŀ9jƅIR\+HRoЃN֘C%QcnqGgNM쫛^xvmqf I_ӤQtMt+tm2҅OWmhI+1׶X^3$1%č|-<?kˍF?߾_$)O[;ߊ_F</:./Hl?*7.ȞvH^kx gwQ~w Uz~ȫ,t`tTc%zWD>O L!0E` Lq0%aJ) SLy͊0`*T S :05`jԂ S&  SL}0 a  OU8.&C%́=E$+dhaÚbKe2TnOԩYG ɸ5g܆f܆e܆g͸q[S[r_Gr"7KC%ap}]}=ɽ!C$H "7Do!C%J *7ToPC%J &7Lo0a$I &7\op%SJKGcsUU8U3;\+Ƥ9b-d4lę!6>5md1"ɉLZJT-wݤm1 m^!خ66khJ56ePѶM-dmi[FJFҶmj:Mm6mh;Ma1*miHIm0˴m?mSi&+?bfbe_ʼzUKmo凷?& LSf0aZi L[v0a:t LWn0az6;0b| VhKL!)cӓQh{39bݱdsg,?4[DWUF>֖q:;=Ev iMq%ВC#9t1Nw?v:l!K،EH(YcQiv#EdSC?jk,mfgF3-=v+͆P4#ǝ1H(1;FʔTm[3}ݞ)mn<[B vw#֩,1^X{4foC^#kn)CEeRCmW=ٙb nu{k ۚj~V|SQtoΔ()р_(nnZ.T&Ȝ4wQd 1-ԨT[eMN(b$b]rP&P;om+C1VT:QgšjQ2.=]A[ l62ʻRKtv s.Bul]El]YXIHN; IXN³wR7{'w}d!٧nH}d!٧nH}d!٧95gSל}ꚳO]sk>u٧95g٧nh}f٧nh}f٧nh}ea٧nX}ea٧nX}e٧nx}g٧nxo (gZs/n)UwUL;0ȳfQ~[__߸1)M~_k#kpWc~% wYC YQ\MN~]/?޹閙3Nl- óuM~ex4Ҭzrf؏VaA-RLGڌ؂τiOטvm?1ЉJ;7|~[ ng64߫XD=C{ԆEikh6;Uƴc#łW<Oڟ h\[&sxH™]սί]bno;ľW#~˞-|ʉS_*W*Jh0%hsDbDB#j鼛G5Dn5˭rk.֕[ɭbA/^GaQ {+uz "|!(_"|!(_"|!(gVϬY>"|fE̊3+gVϬ_"|*_"|*_"|)_"|a)_"|a)_"|+_"|z9S9WӳMYWJUR$*[⌼/{Eyo0#g佄 Fc){r^E8#a1FF܋ԗ܋=b佖F{_p'B:= ˉ܋z1j!]E f佢Lr/g2zNތ'Ցܫj#8;>-8OUa2{Qg\ݩdz1{s⽨SEIEe-kmW6h2A-+,2E-kbWZ6_^ie +- b9W JZ&צBҼ^iҼo)ɧj#ɯrB򭜐w4iIvgy!O$䙘_<"䕘/Մ !/H6X{y4,"ı7j TWHo^HB . Eu^[Tgh 3fT0`|f0`6l C` f?Aas$i30?3/0Wa7`n܆?a e| 3f4XOa>3f 4/` 3Z2fB0KaìY -:F.Ed5&Jb3;+!Sd,hgp傪WNp%q2_N&ΜL*r+2/W  zdr)r"E 2 ( $ura b1}25 oI)P T#edrEzrfĿ,ӓ+'d-4+*Tohx#|?}jh]tD#t(tԎjZkYY\^<]70+E·1H"@KܥKEQrɻrfq^K2Y/\^t#.’.E(z)dk{z2LHF2!ґ..ůdi-Eq(n>-݄Z|o܈rj^\ ג-H7X"f|kq붌|kͯ}=7U"-)GJFhyo<d,%ZV0y.様'Mb(ӡF pTt#ݼn=o|6`1> ] FE6TTC4_1>Q ](FE5t,b|UOD#.2-хbbCo](v⯋pOm;>ҝ\^++gL, YTZ5|D}^r^<}Ks iА LIjƾnYArw*>=A.~=;g=_+ԇl)-G>}:xYOMX.*י}z+ܿ,yXzԪN_>E>WkiYopr~}K:}}׫>}`K#yǧPsQ?S~e5<3@7t,/[zQ)T_KgfI=iiP˶Kr=۾/W;QϳΡI?(”7+W62R> }Q)Ӌva2:Nc,v,hWz$vhdžv>h*|PYIwKvz`BܩBBقV\ACIC1KN$fbXܝB1q'*JA;bWܑ/QGv8Ď( 6:]qE o72FT@fI#dLn!c2c Yd/fN1 1ZI2JEƔ2dL1YD3qrT[^銥m.wSuxkz*s9a;FQ%ﺩ Pt"u=5Q}]@pL6֔XQMl8";smh^>+5lte}[?D6FC%֫xף?~64hi6%gM'%ݯ{ag4zd SRsnV/L̳7f2:h`|BƧ. f[bQ%:΀Ng| t,ll{V*g|t;-̾)ӭR2ƧNZd̞-ZƧ.Φnd| һwvlc2fY\lƷ=>&aƷ]QƷe1?ݺ۾GƷYƷ9ƷƷ%ƷeƷƷ5ƷuƷMƷoo;oo˯oۯ?__`O6`_R?wK0 {w0&n IWwva߻en[a߻ۈ * jWWWWWW[eWWWWW*T:0_U_d {F0***U_U_U_U_U_U_U_It***OVWWWP*******  V/}> Y,g? Yς,gsvl^8l~ H,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? ƴ/Yς,g[Ӊς,g? Yς;=?ς,g? Yς,g? Yς{ Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g? Yς,g?r.5W5W5W5W5W5W5W5W5W5W5Z9jjjjjjjjjjjjjjjjjjjjj𯎤7jjjjjjDǛ0_ݕ`_aE5x0׀ ׀ ׀ ׀ ׀ ׀ ׀ ׀ 1 ׀ ׀ ׀ ׀ ׀ ׀ ׀ ׀ O0_5_5_5_5_5, P"׀ ׀Mg:;Ce_5_5_5_5_C5N ׀ ׀ ׀ ׀ $Ykkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkw5_5_5_5_5_5_5_5_5_5_5_5_5_5_5_5_5_5_5_5_C_ -ׂ-kkkkkkkkkkkkkkkkkkkkkkkkkkkkkkkk`ZZڶt. ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂ-ׂK4?9ρs s?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρsZSAka?TH9ρs?9ρsC `?9٨s?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρs?9ρOħ:::Kׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁׁ׽____zzzzzzzzzzzzzzzzzzzzzzzzzzzzzH___mf ׃=wj!0__________G5C`?Uڌ Оn CUat2ooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooooo¾FoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFoFo0ҧk&o&o&o&o&oc77777777777777777777777777777777777777777777777777777777777777777777777777777777777777.S}vUYmn-*S{< @ry sy (ȃy&GA(39 ?GAQ)yϼKm`M|'^}2g s9C!ΐ?gȟ3 s9C!ΐ?g>I62'ӷG9b\N#-5*5鶉̽t^sg DtsupĭhVDd W<ۣ: DVס݊0U]d'ϒt$ͫ,mM?|qƇ76gAՑf+S}'xi~AߊNǷy'?.jOt.@'3߿#GcUTWN-@ѩ6w?[ADV\ʹoDS0sAoΧҹV:Jf|,SdyV:ja|t.ΟZ:JB+i]/:JJ0*/Qi).ϱ7׺Vs>{vz~{_ziG.hs0ac%q%hל7yVD}fm.㄰M5kmyikz]_.{vg@Ž[iYKϦ}>gh_CNT=r?aIÏyv_]훞QƳr'ǔLc?{[#zNy(3bڶ*a*QzP_ȥT@% TZM+P D !=3llɩu{,J-aRKRWj'}:e:2[&;N&luez2,,!" K,,!" K,,!b, Y,,fYX̲ea1b, K,,* K,,aG]Ge:h=h>*A󩾃X.g24o||_D(AʃSă4/?Y>*A2||p|ă棔' G)||(A壔͋ϕ G)4{|yyz|8z|T}/248h>JyмM8h>*A.AQO{|T惒@d>^<灎 px{3C3F~|'̋G)O08a>w| QN?t¼h( .k?gT QO`sD:`>{|T3 Ő_YcҜT0S{=V#iyƭT!IHMiڬdkLR-P-F#fMf'moELlH`D=&!GAd"NLtJymœ41;iȅ`;9ghbN D[8Xm<ٿF-y$Ә&opF6k 4\-lndiCEhKOZŬ2OE:SPwAjéroS Ԉ''˽Z]v[hcc2L HՍUxVDH56@ɛ7oIV l9/ ZH<++؅KG)owk?xъ(_"+-54y3Z,X='Zm6"m,j144\9k TF xCIEץF+MZ[\HTTMYg^v0VPp+}.ˬ#dˉƟئ.q4bc%ݫtU_" /1gUl_ۜb,ؙUM[=$IJp\@U*0 F?nRԘQ\ޠ=?'D> g{/י\;?he_s-/\(l/MSjJ]OE4|>xX'E+۰5ȵʏ[zV?N~wF>^)U|1'N߅+]|~[77uů(o1vѢ9US><^.w+Yy|byiۧ{gа֋c5~0sGvؼtI]?S'-dhy7)ڛ\s{B\sǢowgr ~XwŪ/\v?ݰb˓ T.hҹ~'d6M_[eu~}CO__Ϳ^S:G𨤚λѹC:oGtFjNg|T4aj7E5j3^32DSC5q5};F5 E7gG5 3ݥVWc6M?ѾYZ|#ˣگ`tΐjҺ姌'Rj.|jRf|*A(狻WO++8$:HH-OkN/EPmM U ! iA1Iw @ [IR*dPMtW9U4ڻt ׶ o^ɉ# ˟^n{~vW/ƄYzRZ?n[jx^{´H϶US3[2;u\q?*7lgUȑݽoOn6~um~6Sw6Ģi7qӳV ?Iݝz[]לU=sخ?j%홗FME>+3Ϻ/ҫlz_~܏jzNHnv?Nϖ}s_}cv_ޕϳziĖVk׸Iu,\q?Tz7UY۶K;>_8gA=+V0]]_y{oߘƟc0D gXcE̳Li_ew[ڷ}yՋTEag{} y]1gӝ&g*^O^z*y9xNJ+k?~{nzDqeC?r:/j&}ݯ_9X8-quXcmngH|͞氹H7&YCj%7ycl{41҄ܝӒSkz(Jr&Y. )V%ڒ$Ѩ 1lͰ kwԱSMNNx&%WTkRj!I c[nxmNK3>pJRU鍛?~(WdwD 3EG=A9r+:y~qu uBӼO,`.-om%HӦLKHJ;bJot &#:#cR%uO䈡K,ÚM牝dsJt %K~ilR9"9ZVVGj!͍΃b fM[GZįLvْ)Ynklt{ EQ/<5tpLIjK^rg"K|FxWp=*?%O[–+WƔjk l撥q΃߱=ͶٵaD,떗8*􆅆Z o=:`Jҏ4^Yqo-_$Kؙ<}Ҥ*֙U߅<=iYGZO&,>t]eq)w8➥ M2G{溥~3tnvT;4qέw KiU [mhV-KYXs՝-  =D9XCCK.~cii6s9ZX0~KGbU{GnC}ϣv`%YGxM\ciicN涸G/^櫎qKfYlAj={TZ%WKUyq噋[ޭ31QUeś-5|Ҧɭv{Ao=YSK2Rx/ʝtZ4iҖm}_-Q|E47볽%aoիWCˈo]e?rMW3#o|%%~ggvsCM1}oKg[qPվqU6 %_TV g 5*QfHO}|BŦKn{G6Ji3oΈT\r|xѵ5e3^<\ov'^?gPM~~|1rr ?-~ ?cWo|gÏ7ӏ;e?~[ݫ }ơmWFh!?Ӈ3+|#C>Zb{ݣ}\'DoOҤo}hi5w=Wj!njw?D}xW5{Wty$?G!}=ǟ~ ~Aʨ%gtI)2~޺oSSOy5E˓J}ŧXǽyCYq?JցǾh˩r 7W^$qIr3eG5o_r]^b$&Os=ϯQ;ﰇ_<u=K/w]v.?3/I%۞_oo~mgoأx5]<Ů~0׳xR&-mZ޶%=k?ogٟՊhظGYوlv6 p?OMʳz+ Oc=l]2f*<[ g#>f[<}ⶼag;.~m -n*Y*voyV~5Huk+[}_=N.ђAm/[_8?zVp^N/4顙7{xɨc>M;9adn%..#~_r=t=4tagݟowk~'M?ʟ0fkUƳt_>} KO .In(Z{lȸ'$TE%U J%T`B%U`B%j0a-V!W&e_+~Q֯8FY(We_I+~P֯BYB(We_ +~O֯>Y'Wd_ɓ+x~N֯:YB'WdC~#Gߏ0a~?~#Gߏp~?~{m] {=k5CIˆJ %Jtys9]^.Lw5/gf0:6N`+>$^ߵ_Ufoo{%RhZ\W0o1cJmONGϣFksw1+UslR~/<֣gط3FLj+Zs_{ G/:yngY .NMɸ5g܆f܆e܆g͸q[S[r_Gr"7KC%ap}]}=ɽ!C$H "7Do!C%J *7ToPC%J &7Lo0a$I &7\op%SwtKqnwA&5C e-bOMpb/q3h3jE[Z8#uss9Or"|fE̊3+gVϬYPEB U/TPEB U/TPEB S/L0E S/L0E S/LpE W/\pEDuAU~ XH= 0ykiOWHNm_'mŎmk3FvhL;@BDhN})(dth#OfƘ6;4Ў ):AnѠ ?$Ў miC/vh XЎNcΏC8棘Y埘w2^G4ļR۝Qoǜ 8N{tGut,GotFitlցEHt;#.ڗ%ՓmK zѣ_t{>0Vh:v3t[c:O3-6)o{b' /NGIzR=?"y ^x0Z=o燌~ ! /O513sgxYxߪR]=aH@C= 0<ú 0PB($PB($PB($PB($PB($Ṕbd#s(F@129Ṕbd@1 @1 @1 #01mEo&:m%8$#D/V<[%:׭VJpSފ8M ug\dy߇'>d}\A1 ΃?űp׊Y'&+ϊCȸw"8@N,Y#WD>qrbY~ũrbg}W1'F=Qs)ĹB%&sי+&{42+ {/;?m8$^8N BV Ns2\wٜbW} t}Wp'&@V݉:N @c _*N+x;OHԾ*z5+Yօ9[ٺEx.f^.ĎBSvNd$${'을f$,{';z;>uCOݐS7$ >uCOݐS7$ >uCOݐSל}ꚳO]sk>u٧95gSל}ꚳOS74 >uCOS74 >uCOS74 >uòOݰS7, >uòOݰS7, >uòOS7< >uóOS7kAG亥TrV%0;A EmMJbC~}r[+Ԛ7}]:]ݢ]wTؗ4=f*wmh6CgM~Gq5];otO+z[f{:?3.>׉7~H>%ʙa?Zx#O-?KM2 o j3:c ?=7_c۵*C'*ew4?ek&?]{O;T3'`g]Rw9ՐٹzfU)1?8m `kdOo9!Z AfwHo6ݪ\0ꥬR7*ԣlHh~[_vKgMcq~eN˯r7Ÿ)w2_<8zl/LN._vo1g~b-gQyٰ_Wv ^0]4o9U|qKB!M!Pe\XсmϜ)]g|W2Bt9s9s=Mr4r4r4r4r4rsU~f)]O-٘#~i/18^xle->Os_`5%v}@[L:n1}=A{TE)EpJݨn24w.tW5&VX'jgKE_ Ւҡ/\i׹Qu'H̐2/3 9g9{wWZޑ#&T-PQo-.Iu%!bW7Mp=Ւ)kJo{#I%3:0pI.G|j;=&--ۢUs8cm5X'O*/EX{jZMm'ޚ)@4(5}[+\s-7%Ú\3/Li1i.tU R>kEWrP|?O(MTo\1bxZkxqmYSR5uE_tyu^_}gnP,z8;*&y_k(lw+ MFVG3|`}0!OF~pE4ܱkDL}U&&:3pŽ:55)ZMGL<g@[ZT=:=Y|j @)92bl~x$ 50d|]e A~?u@LH0(M D]X.3%Ѝɱih6: /pjs85[t"mGH6>dy@GH>QwI ^Pu% 8_>2yIKL/xȦx:FF+'c!}/PUTT4̯9Y!1{ ̱sGvʇԾʍ}+sN^)oG+([F[||=D{RFIscE$'cR(b{*"kPHn*7:a.@utMrеTE uʍZ A{t}ۂs:*h.ecN^@4 ~RUw0ut2]LEwJUZB{*2}ĞtaV"X+] Jj~Z:_NdKz9Z^Ndv9z]NPdKs9ٚ\Ndo9ٺ[NdKl9ZNdh9YNpdKe9YN8da9:XN|dK^9ZWN5oխZ֚7zւXZ y/]-BZZ꯬R-AYK-YD b jמ4(զAY,3 b}iW.,hEiKI 5Z<ŪтX.Z u_@4wAY, p-hP@X?eZ+BY,|Yx1g@8e|@6sZ'JBZ/Z'j̼a斯 :Qt 4[?H[8Sm\$"ũMiڬdkLR-Qdg3kYjYxdS/&QIQP;;-=8qzSz\polnC洊e:iȅ`\4Rx3_!jmKy(5ёLL6tă$ᩮ?^68?M1*F/_zֈrt(*fɗ (ҙz0 =F(k<,J2S#ڞ,kkwm^) (320/ )V7*WY!l&+'oD%qZY^H9wc`p$h"`.ݭ=D+*T|Ԉs:hhbhHcX鱲\9k TF xCIEץF+MZ[\HTTMYg^v0VPp+}.ˬ#dˉƟئ.q4bc%ݫtU_" /1gUl_# 4vfUB+)6;9c.B&/*?PJGy+ ,IRcFyW{sG{`3b_g^s-4mtȃ~}ϙ poho;7Mʯ)u=?xr:,apl|"ײޓO+?n1YA:-xMWǜ|^#:¯*wjEwl$ a1w[pߓFvTM_{_߭de~mN1BZ/Ï9b+~%'uLgcϛ?ݤho~vs s3gtܕZk7a?}bpٵvÊ-O*ݼ&G{BiӤXUV?d ko ]9hz en5~M3ҧ`rŕ0Y8:33jŪHE%TN uF kw TtE7K׆aSm}"1C6'ld|34ntn1vK %x3/6\g}أWhgu_W=(@#H~흞-3Z8z+7ӿ+g҈-Lg*֮qN&g㙬Ӿʦ%Ron=J}kse:bΦ;M/rUȟ([ j+-]U,]sjWc~22+~v2$,➵ˆ~#o{5t^5n`Mr_osO%_S:b gH|͞氹H7&YCj%7ycl{41씞J^;,Cvmɶ~VGĥKBzՁ'fqd#I4dD_G$zg3ljt14s1uxSzcc;q2՚Du$)a@lipɷr7vZ~VIv8qG5vOjlN0Magg4z: ӻs5>*`W>4uۓA8y3ޟmiY]ZZ1OKMsәnOwL+\ŔdMFuFƤJR.CtoY5W3; ?,!nKdKؤrDr4MTC)ccgK+ ( )"͚bJ _L%{S?t@W2 EXF8R1@s;%9A@iധF'۬`sIS2u*oz0G`NœAZ =fp=*?%%Kĝuc{jmk͓i2LY-/cqT" 4zt sRwEki2Z"ϟI3yIU3K׿ yzim",gۏ VcMY}7S(p=Kq7,euKgίRҥ?-=w85i~}Kg!⦝[3ȃӪn[ʗ'8z;[$8H{ns҅, 9 ;=ׇ]~rlks&-a=,!ff><Ŝ‰ ,݆Gw5Kޛ:=zǜmq^xW-)KVpͲ؂ztcK7 KKH狯n3[gb/1w7[TkM[6(lmӃV/` >{سӧ5e_;4itpr-!wPoKy-Z .dirog{=KjeiݫW.Kߺ6tqw6,n$߲#/./p1?רꏝw/]._KwRɶכ[_5m g}or1n_&%IKֹsIϪfYq56.z{E6;[]#y?kk=S=k-򬞾ʺSXa[tW٧ y2y=Ⱦ"V%ϺE-/dإG='~v[.oBg~۷8~jo,ݳin%?k*R>agּo_rsd#}P|y~˫"V4ϡ&?63~僗z }zhM1a-^2ENN43Yz{w{~K>dϢ] :ݳ}XA-k|Y[?ݚ_cbӏ'/L?xYF,<׭{;1qp~½oyғtK=k7}? ~X~ (ĞJDсJL~JLD F8a?6b ?Dcʤ_+~R֯<GY(Weʢ_Q+~Q֯CYR(Weʠ_+~P֯?Y'Wdʞ_ѓ+y~O֯;YR'WdʜS'ֿȉo7ob6 XVM&ֿ=ߘo7cb0 XK%ֿ+nMu,f9ҿ!D"!DNW'a_49ҿ33vdi6mڦݵmvq1͚l񢦣]Lr:M; 4]21uNKز*:S٦ď҂oޝDm70Y.څ;?#1xM&\&ca|,_C%ZdKű6dbs$x6=akZ71 YC;BjsAFvK]׃Ӟ$H`XJ݃wSSz]FZ /&|G[N ~)-o Upgܷ~'S[)#_Uj>}U!-QD{*Kyzڿ/< vKOIB9҈ez/#K焤xmrj9!"Mfz/ss_WQ[:ސ??hF^!o*repP^>+v>O1 ,b=b% n!Kx!pTQ[zR!*5S9?N>{VvSQ-QU,k] f^ .~X.*dOw^7r._.poEuk懯Sefi^fTApTdC OATPed2PaICnSAULM>&CyYVRCNeBBUTh \ W*00T놞N,TmNРJ;f@A3>Gt0#aFÌ3wd)0`&1f<0 iKaìY - ]I-D3טKΤ\r5mR#D'nW lp2љ_<&TL**|b2/IRW˼wd}rqD. (trɴ1פ|2o 'P 4"eDr@bj_!_u^O)XJ *TDҏ#rzo'=5K_vmk?G-5~V7? ~6o}_)o*_(}_Uw+ !Khws폞~ >ohx#|?}+*HmsJ^cK*Y ClZd[+z5|gUNx+mx*B\K^xo`o%)Ob2$*n#JZĈr-qm(YbI)dL-fD7**^rL4Fx/ݒF2Մ1*35-lj0R@[ڈEHKn{#nD^-x/.{kdHy,ri\3FN[FՎtv;ⒽL[z* Ȗ#%#K˷Xi f2eI-+A˃b~y"n}%.t%ćJfr.*Kt3tiP ]EO"!|2`1> ]E%2TC0o*˿$.EOI`e`ԅ0%`;0[F]B~BZ+ٙTJ[^e B{cK!n9i|&~ϯ2nrUΤf\4eɫFD V_KϗOv/mYKo~v*}3[ʕk kQٯ^iZy8?̓?>Zpk#y,8f٢vEMQ_:s7KDmO֥MKzu\^U,_b'~_זOv]݉ڛuM1Ef)^Zw 2gNO&D;bǂvzFb'vlhV~qi&'})*hh5^H;1cZ1NJ&v='c:;^!v|}hUhCҁgi)ʎ0\G@Qo䇨V&qߒ@GȏB~Ce~_$? (?(&:() +ɏ/?fOO6]_̛9ߋo / y{́]1+w?-/uJd,nU!W)R!BeQ8;%c_pKn'N=&{#FԿ!f\okpVuaIq7}%vMg4' *;1Ĵs#;;:;yF^Ҫ760r)inJֿ7$Mw5I~kW$EwꆒTn=$jıíff3qs3>#bW$&m ^뱱IttG#+1&>hlҐZkAE/^[캺,/LHBNx!I = w˃~z£˝$QV!O췖$}e6]n@b>(g%X&IuWq-EIeUO՗W@l\,2-%qNݟDo_$~&wĶ>_[I\UWĿA?=X eUݎ$a\6m} \MIHJ2$2F [J$$t̄c̏Y)2< eL {ws؟}9vkm7D6NCgYہ3=%ެ&gސKcNy\ ;p\ұPf|ȿ8o )\oذ^u Mp o]"zSF&DY ngF H۰wώCҭ_A>ƙA bo2G R $V=l]|6x˂IA6i{]雝SVH@9w$-..o<T )^5xfm@yY6g&P\{qUTH>:j 6τй0~&u!D}"(K ci#q3z[5vLQ|,=vi!ZX=8+3>Zc5֟me]DԴ~Ae lR'k*ߚ͌{8\S7[{iC7=ֵYfJu yl*.X*{Ctܗ6jEa۵xbDL}1 5޳> [9Hν? `"#s 0lh±ҦIp\fŕ7xaS.i C?Ύ?jwͱI~9cqiSOLkQҒPp{ m&OAi=OceW @Z5֜6$+Yi-7\u k!3^x 514qmKG{dc2? '{N.{YCA).ԋּa|^_PbZ NpAA[΂b#rfԬd OK1.G3:Ǭ;ٽAr0qzK[/+fAxΥ< D Vmڱ6{)ǂuye%D {\()w!¸Hp/5*@s1>7(Qj"J_k <IӸ dzA~Yv'_/g&QƩf@Ԙ#[l3Bƶºeþǁ~^DKDb]b 7Y(ǿד3/Aanv31u}C?BG'MңAqo #rHz w\13>k2d ^oqzpn$sS3 _AxZ㶀ҭά 1 V͍?Ͳ8I5_[^'_!SKj۶u; "l ܂UX`d[Ϙ  lu0w?Lѩ{{n+{g *@"3jv^}NV(\F|aXydyG[ dG\hY lۇo- 㖡s@\A&ͷX [/E6'ֲvD3.p_1:#m566_'Z]x-+Hӽ\ E Цy0(O'D/h l[Ùx3[^p"*6~v`656DYebf=6ن}020dIsAx?L ۖlP4qJXJCC.B ;E#!ő>౺:i/m! k;apguw"D1y8_q}yo$ֻ8Q~#-Ya1nDf0=96#S>s"[`Bb "99ss>Ob\\_k!r\F A j#sD^ܫS?{\v*K!` uDoo xA[w(>h'>#6[c?nֳmaT/=jt Kv7pZ'޹Ю}~Lҽݹ}-5DnbH?H;~VB"X 'K߰"vy9@@=/U\ ([x-Fr>jqIG\Nu %@ԡ/&t9CфyDHT(ގJ: 5bAb{Ҥ3w?nHp>Κϭԅțڟx•-O^3j1~)\6td7H۝|ͽG[(tLQ{gAK_!;l,yz4Š !jVn 0}88̠6Ze*`|Q 8ryZ) *Ouhz$"t7(7Jǿ=âs2^P~߇ K }IyCAd|ye#<֯*~  1,nʕ{lV hʹ:>湉j~hߎ zFoi\K/Y׳ o>gOehDlQ8&OW@6Cr@xH!CfՆ-ήo r.>1ͧ*>AArIPZ`^ Z^Aeӽp@At ,Lcwˇ-pz3-Ն+}x+](vZIőt6o ްp:t]ѣ0k_,Y|ٺތهO9Mw!<~D_.>^&e[?|8x\K 'b¨5G*UVz!s'P/gfEFx]AVzPP|mn|fq||~>W{zY c6%>ϑBY7b8+P42 O _Ʋ>m'>_$>xbUj]$m]Օ ^^/"֫ArP+]zdIF͠L:O3R;- Xb,8' DgOUݑþhI#ʛ@ kl׍% z=ǁWJJ.O8|.3]O~_`"ͮ?H^t|hznʈp2.'+B#֟9gqnZ'-*%~N; <}8Sc=5;]8{= ъa {ڽ|"Se\eչƓ|2߿EL /9:DfF7a_9 >>\̟c꥗Fř3[`Le= 7^ b ,!F|[W 6wda x QwԵY asUv2a|;ijZh"f0 Z~9@?otï@Z`:=;86Vkyu>G% K(i6ߨӫ# poc{P~#>-e7w˓)'΁ROWAԳpwӁӄ9eaaV6qB?YׁgŚ>5E2s2CԞpBc7@W0gSrYlsP[>qkMgpޜk~gVA0Bq7εh{߷!uși}ނ|à|]<-(& ~||Z`ϷoÖ;JPY9 Ojz1NPAc7@a?82F;XiH6#my OmePY ܢku/ص4P <-Vs)cAq&eZ/gwȝ@qE@Φ7(mm /Yـ^Gqv2]!&<߅mk`#{+AՉ N $UؿDY[ k;{牯3=nze# ;_.|*+\TO>g*Y u@Crz$(,. +>Aww~Di#gm_:oeXԩCXl M7}[br9ߣNl7: w[N;D.nO^d4SeBԅN @ldϓ'H@r}̺V5+?ρXA+6r('ϗN\ \ÃE3UAw^Ϯv^Hg:N _2,)ٗdod+mE  r$q R!] :`OOyճY ji9'HjyO2`VAT!wŒx߲ QҬ'APtT\<ȿq6Hoc $gׂbCP~musm[B+pt0(v&Z\ RwLi[~$T?|kL",2]z{\մ>5zx.TP4;om2HL{}l|9|dz>F=̮גP \z }o$/K`Z[Gר՟s̿Bۃ@Z&`_Bo@:i|hNq]M9de@"rzj| HNkY:"Oxu>ϴB5Q[#&^;Ԯ#ϺgSA!]pK#\_9Ⱥ8b7C@'dX´}ϳ8e)~Ϫܾz3`Vk G rH:=k ]MxV01_OD=A~` .ٻ o~ESBt抿 hLZϊ,{2|}?$s8ܞIG{ |?wO[ܼb*?{׷ TW:eAQ Kz.YOiRp[ _ީƨ ]a>oXn$7 (I罖~o?£l{9vttD >7FzdKѳzq71}B 1< _GlܛHۀf qg v,hˋ4ף(~8珋b$ucԥcO7¶S5Kfص(ŅiۀbQ .ǔ h>%O@>*7f (ߵbgu?Z]e1[GzšG }v o f A!yUͷe6yIq}+CۛC쐾MA݇[ldǮknɜ& :M@jw_y=|r&43CY7\}-:Pc/u>6,= _F ʠg="ƽF} rϖR">=HQ .۰,f`qݷy-^ҊBU[%";T}&C"Yː?)qsCWQ}{VׯVׯFVׯVׯsׯsׯFsׯs'a;ܝHXN$,w' ݉!Dw"a;0H2H2H2H2H2H2H2H2H2H2H2I2I2I2I2I2I2I2I2I2IHHHHHHHHHHIIIIIIIIII:u&LjיԮ3]g]TT8gUv2cUͦدr~#ĂBLh"=ba >bF,CbꊩbA$#b$FbjXЈXa & :D,hBޱ4hBb%+bq%2bH,bF,nhAt 2` ! Oa|G45;]E1>hlaxPk:@|ɇ2_Mx8? H>Hi$0_)H TIoD Kq$ 'apS0B }{ }vLv #cjr垳{.Zj5 ݫ wG&CM,m7n:kz#1G m=bhC[z#1GLm=bjS[z#1G,m=biK[Xz#U Ԏ8gUT{Hk(i ,Ja6Qڣ|ZBsM;1<[h0xgMg"kTShU-hZ9d9AKLBfⓡ5DD a@LDgefHdi0( w͐, *%y/QqWKTjk!iA}L }V%1cHR)屖(hV CkLyNִ5Dд!: 5qEí3zRShԊhFF؏2#=)4"@k`jKCZ5sSrj*@ρ4AsQǚk0t`Y.:kꬁf5s*N0tWa]*.ꮢ e.C7w]n2ts e.S7w]n2usLe.S7w]nts,e.K7wY]nusle.[7wٺ]nusκ묛κ묛κ̦Y%6?I,5shO8GZr=g_$/}8;79T2;eSYWuӾ|cwZ<;dι8W9:=x.月<㡵k/hu՝ N?^ӹ3oz7+' E&'->8^LjO9h6`?_+_aO0sCLNnΑ$_믎,+z~Vs&Yr s#{[i19׷1lUҎsUgԲ%OMx\(wL22da9Y÷ pgt~vsHQ˱qg:s]-wgٹ{m+ΞW/ q.I lǹdIoٷ_'#@7s%o_s^sNik$֘V $6k 8{|>bS8WgL!a&'`A5cԌEw O=5A4Wߋ"_."|o,s'/S VaDxJS&`Ad.0u:p)LNm˘:x{>nOTxxzx*3<%^?Ox'-h$[=|-=\pYXi=3<.z rg^/t$KA ZR1)O n);J_Նʢ(ȚNO' NԒ xI^JsJAER1K)P7ZZZj"aRa'ZZXZXZ04c -, -!0շkDX?%` 8ƿCWA,?CWн?#«[ lk֌6Q@o濡~C P@}FfPЭ8' :NUjֵJV ޣABA(A:?- =FTңA#B=BH7t`:ZRڒ{sI?CQ|4oy ݇[}|(F hEߪBaC}ޑ|d'2VzQ:(wjnT:#( *w)mB}?uӿ{C==GS׳~}$Ǝlw BwB(R ?R뗍~|T}Qw8ZОСZN?W'DixK Յ@v1~ʞfrwPߡKs5i.-Ut1]/doBkJO e:NDf~B%DraWuW4}?$Hk@cew_>GGYҍvPk~Oy-MN7C 2FqVm$a Aq8mUU!V^QXY&G.WD" L!04Ūi[hȐh)F([D$>2 ה C2!tivꢩO& vI0FK"KnZNZm@GQNMjJ&Y(T2j3kuOiK!ӁjǧxDcLTVkAC?6Q}jR~IX #Do3mmmmmԛG4y?`/?Y\Yc}}.Ŏl2'w_x='/3|1oh嬟#Z9Vw:= ={$Mq˯|RMͺ:OUGzoK??7@wa5I#iDڬ(4r:GFC0%YQji|@mؑ~zBۑe"xj>[aDzȲD =s4hL`Ԑ߈/t>jCMMXg]eUƦcj<-a!,1f ǿK qĤaj.LmA4V>ǿ0sq߷hU֯!5ݚ >>zӽjzwW{dTY{AM^3k罃h>mx!#j%w7^UދȻ_6NrI8{9D,^?zzU^2~ >R]CG>rrD]F^~#oE:UBt/G[9R{,FVU|YMIRT{3{wӔ"T7G3hRRP Cl&P ū E5 Aq/JrC:>Y1& )DŽRF( ȕ )(Y1&6 (>RZQ B@/3@r#3)mĆPt&.m<@ne@qKf<hm aTxKKh:hƣfLjߍGM w!a͈ϐ^{ڈ:b ;Q#FvX-bQԣjlzA3k2a7'm7 UucMEM"l?s(Z8<kjFDjx roDȢo8#lō;^>`tZ TK(K\Kb*Ԥ/B*Ct(M^(l2$_%Rh&oVtrotl/inst/extdata/protist_mutation_rates.csv0000644000176200001440000000053612547574666021232 0ustar liggesusersspecies,mu,pop.size,genome.size Tetrahymena thermophila,7.61E-012,1.12E+008,1.04E+008 Paramecium tetraurelia,1.94E-011,1.24E+008,7.20E+007 Chlamydomonas reinhardtii,2.08E-010,1.00E+008,1.12E+008 Dictyostelium discoideum,2.9E-011,7.40E+006,3.40E+007 Saccharomyces cerevisiae,3.3E-010,1.00E+008,1.25E+008 Saccharomyces pombe,2E-010,1.00E+007,1.25E+008 rotl/inst/CITATION0000644000176200001440000000506613106416775013365 0ustar liggesusersc( bibentry( header = "To cite rotl in publications use:", bibtype = "Article", title = "{rotl}: an R package to interact with the Open Tree of Life data", author = personList(as.person("Francois Michonneau"), as.person("Joseph W. Brown"), as.person("David J. Winter")), journal = "Methods in Ecology and Evolution", year = "2016", volume = "7", number = "12", pages = "1476-1481", doi = "10.1111/2041-210X.12593", textVersion = paste("Michonneau, F., Brown, J. W. and Winter, D. J. (2016), rotl: an R package to interact with the Open Tree of Life data. Methods in Ecology and Evolution. 7(12):1476-1481. doi:10.1111/2041-210X.12593") ), bibentry( header = "You may also want to cite the paper for the Open Tree of Life", bibtype = "Article", title = "Synthesis of phylogeny and taxonomy into a comprehensive tree of life", , author = personList( as.person("Cody E. Hinchliff"), as.person("Stephen A. Smith"), as.person("James F. Allman"), as.person("J. Gordon Burleigh"), as.person("Ruchi Chaudhary"), as.person("Lyndon M. Coghill"), as.person("Keith A. Crandall"), as.person("Jiabin Deng"), as.person("Bryan T. Drew"), as.person("Romina Gazis"), as.person("Karl Gude"), as.person("David S. Hibbett"), as.person("Laura A. Katz"), as.person("H. Dail Laughinghouse IV"), as.person("Emily Jane McTavish"), as.person("Peter E. Midford"), as.person("Christopher L. Owen"), as.person("Richard H. Ree"), as.person("Jonathan A. Rees"), as.person("Douglas E. Soltis"), as.person("Tiffani Williams"), as.person("Karen A. Cranston")), journal = "Proceedings of the National Academy of Sciences", year = "2015", volume = "112", number = "41", pages = "12764-12769", doi = "10.1073/pnas.1423041112", textVersion = c("Hinchliff, C. E., et al. (2015). Synthesis of phylogeny and taxonomy into a comprehensive tree of life. Proceedings of the National Academy of Sciences 112.41 (2015): 12764-12769. doi:10.1073/pnas.1423041112") ) )