Skip to content

Commit

Permalink
Add files via upload
Browse files Browse the repository at this point in the history
  • Loading branch information
equitable-equations authored Aug 14, 2023
1 parent a61b649 commit 35a1dd5
Show file tree
Hide file tree
Showing 5 changed files with 946 additions and 0 deletions.
Binary file added paper/cooccurrence_tibble.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
209 changes: 209 additions & 0 deletions paper/fqar_refs.bib
Original file line number Diff line number Diff line change
@@ -0,0 +1,209 @@
%% This BibTeX bibliography file was created using BibDesk.
%% https://bibdesk.sourceforge.io/
%% Created for Andrew Gard at 2023-08-12 13:59:04 -0500
%% Saved with string encoding Unicode (UTF-8)
@article{JSSv059i10,
abstract = {A huge amount of effort is spent cleaning data to get it ready for analysis, but there has been little research on how to make data cleaning as easy and effective as possible. This paper tackles a small, but important, component of data cleaning: data tidying. Tidy datasets are easy to manipulate, model and visualize, and have a specific structure: each variable is a column, each observation is a row, and each type of observational unit is a table. This framework makes it easy to tidy messy datasets because only a small set of tools are needed to deal with a wide range of un-tidy datasets. This structure also makes it easier to develop tidy tools for data analysis, tools that both input and output tidy datasets. The advantages of a consistent data structure and matching tools are demonstrated with a case study free from mundane data manipulation chores.},
author = {Wickham, Hadley},
date-added = {2023-08-12 13:58:47 -0500},
date-modified = {2023-08-12 13:58:47 -0500},
doi = {10.18637/jss.v059.i10},
journal = {Journal of Statistical Software},
number = {10},
pages = {1--23},
title = {Tidy Data},
url = {https://www.jstatsoft.org/index.php/jss/article/view/v059i10},
volume = {59},
year = {2014},
bdsk-url-1 = {https://www.jstatsoft.org/index.php/jss/article/view/v059i10},
bdsk-url-2 = {https://doi.org/10.18637/jss.v059.i10}}

@article{matthews2015null,
author = {Matthews, Jeffrey W and Spyreas, Greg and Long, Colleen M},
date-added = {2023-08-11 13:27:00 -0500},
date-modified = {2023-08-11 13:27:00 -0500},
journal = {Ecological Indicators},
pages = {1--7},
publisher = {Elsevier},
title = {A null model test of Floristic Quality Assessment: Are plant species' Coefficients of Conservatism valid?},
volume = {52},
year = {2015}}

@article{bourdaghs2006properties,
author = {Bourdaghs, Michael and Johnston, Carol A and Regal, Ronald R},
date-added = {2023-08-11 12:48:37 -0500},
date-modified = {2023-08-11 12:48:37 -0500},
journal = {Wetlands},
number = {3},
pages = {718--735},
publisher = {Springer},
title = {Properties and performance of the floristic quality index in Great Lakes coastal wetlands},
volume = {26},
year = {2006}}

@inproceedings{wilhelm2017flora,
author = {Wilhelm, Gerould and Rericha, Laura},
date-added = {2023-08-10 14:34:57 -0500},
date-modified = {2023-08-10 14:34:57 -0500},
organization = {Indiana Academy of Science Indianapolis},
title = {Flora of the Chicago region: A floristic and ecological synthesis},
year = {2017}}

@article{oldham1995floristic,
author = {Oldham, MJ and Bakowsky, WD and Sutherland, DA},
date-added = {2022-08-30 10:59:12 -0500},
date-modified = {2022-08-30 10:59:12 -0500},
journal = {Ontario. Natural Heritage Information Center Report, Ministry of Natural Resources, Peterborough, Ontario, Canada},
title = {Floristic Quality Assessment System},
year = {1995},
bdsk-url-1 = {http://dx.doi.org/10.13140/RG.2.2.35685.91360}}

@article{freeman2012coefficients,
author = {Freeman, Craig C},
date-added = {2022-08-30 10:23:15 -0500},
date-modified = {2022-08-30 10:23:15 -0500},
journal = {Kansas Biological Survey \& RL McGregor Herbarium http://ksnhi. ku. edu/resources/plants},
title = {Coefficients of conservatism for Kansas vascular plants (2012) and selected life history attributes},
year = {2012}}

@article{bowles2006testing,
author = {Bowles, Marlin and Jones, Michael},
date-added = {2022-08-30 10:07:03 -0500},
date-modified = {2022-08-31 17:49:04 -0500},
journal = {Natural Areas Journal},
number = {1},
pages = {17--30},
publisher = {BioOne},
title = {Testing the efficacy of species richness and floristic quality assessment of quality, temporal change, and fire effects in tallgrass prairie natural areas},
url = {https://doi.org/10.3375/0885-8608(2006)26[17:TTEOSR]2.0.CO;2},
volume = {26},
year = {2006},
bdsk-url-1 = {https://doi.org/10.3375/0885-8608(2006)26%5B17:TTEOSR%5D2.0.CO;2}}

@article{bauer,
author = {Bauer, J., Koziol, L., & Bever, J.},
date-added = {2022-08-30 09:42:59 -0500},
date-modified = {2022-08-30 09:42:59 -0500},
journal = {AoB PLANTS},
title = {Ecology of Floristic Quality Assessment: testing for correlations between coefficients of conservatism, species traits and mycorrhizal responsiveness},
url = {https://doi.org/10.1093/aobpla/plx073},
volume = 10,
year = 2018,
bdsk-url-1 = {https://doi.org/10.1093/aobpla/plx073}}

@article{zinnen,
author = {Zinnen, J., Spyreas, Zaya, D., Matthews, J.},
date-added = {2022-08-30 09:42:52 -0500},
date-modified = {2022-08-30 10:16:57 -0500},
journal = {Ecological Indicators},
title = {Niche ecology in Floristic Quality Assessment: Are species with higher conservatism more specialized?},
url = {https://doi.org/10.1016/j.ecolind.2020.107078},
volume = 121,
year = 2021,
bdsk-url-1 = {https://doi.org/10.1016/j.ecolind.2020.107078}}

@webpage{naturecite,
date-added = {2022-08-25 13:21:07 -0500},
date-modified = {2022-08-25 13:22:08 -0500},
url = {https://www.naturecite.org/},
bdsk-url-1 = {https://www.naturecite.org/}}

@manual{rcore,
address = {Vienna, Austria},
author = {{R Core Team}},
date-added = {2022-08-25 13:07:50 -0500},
date-modified = {2022-08-25 13:07:58 -0500},
organization = {R Foundation for Statistical Computing},
title = {R: A Language and Environment for Statistical Computing},
url = {https://www.R-project.org/},
year = {2022},
bdsk-url-1 = {https://www.R-project.org/}}

@book{rericha,
author = {Gerould Wilhelm and Laura Rericha},
date-added = {2022-08-25 12:52:27 -0500},
date-modified = {2022-08-25 12:54:13 -0500},
publisher = {Indiana Academy of Sciences},
title = {Flora of the Chicago Region: A Floristic and Ecological Synthesis},
year = {2017}}

@article{ladd2015ecological,
author = {Ladd, Douglas and Thomas, Justin R},
date-added = {2022-08-25 12:40:17 -0500},
date-modified = {2022-08-31 17:58:47 -0500},
journal = {Phytoneuron},
number = {1},
pages = {1--274},
title = {Ecological checklist of the Missouri flora for floristic quality assessment},
url = {https://www.biodiversitylibrary.org/part/175050},
volume = {12},
year = {2015},
bdsk-url-1 = {https://www.biodiversitylibrary.org/part/175050}}

@manual{Wickham:2022vf,
author = {Hadley Wickham and Romain Fran{\c c}ois and Lionel Henry and Kirill M{\"u}ller},
date-added = {2022-08-25 12:36:12 -0500},
date-modified = {2022-08-25 12:36:12 -0500},
note = {R package version 1.0.9},
title = {dplyr: A Grammar of Data Manipulation},
url = {https://CRAN.R-project.org/package=dplyr},
year = {2022},
bdsk-url-1 = {https://CRAN.R-project.org/package=dplyr}}

@techreport{wilhelm1977,
author = {Gerould Wilhelm},
date-added = {2022-08-25 09:15:42 -0500},
date-modified = {2022-08-25 09:17:19 -0500},
institution = {Kane county urban development division},
title = {Ecological assessment of open land areas in Kane County, Illinois},
year = {1977}}

@inproceedings{swink1994plants,
author = {Swink, Floyd and Wilhelm, Gerould and others},
date-added = {2022-08-18 14:00:38 -0500},
date-modified = {2022-08-18 14:00:38 -0500},
organization = {Indiana Academy of Science},
title = {Plants of the Chicago region},
year = {1994}}

@inproceedings{spyreas2015users,
author = {Spyreas, Greg},
booktitle = {Wild Things Conference 2015},
date-added = {2022-08-18 13:59:15 -0500},
date-modified = {2022-08-31 19:41:34 -0500},
title = {A Users Guide to Floristic Quality Assessment (FQI and Mean C)},
url = {http://www.wildthingscommunity.org/wild-things-conferences/wild-things-2015},
year = {2015},
bdsk-url-1 = {http://www.wildthingscommunity.org/wild-things-conferences/wild-things-2015}}

@article{spyreas2019floristic,
author = {Spyreas, Greg},
date-added = {2022-08-18 13:58:45 -0500},
date-modified = {2022-08-18 13:58:45 -0500},
journal = {Ecosphere},
number = {8},
pages = {e02825},
publisher = {Wiley Online Library},
title = {Floristic Quality Assessment: a critique, a defense, and a primer},
volume = {10},
year = {2019}}

@article{freyman2016universal,
author = {Freyman, William A and Masters, Linda A and Packard, Stephen},
date-added = {2022-08-18 13:57:10 -0500},
date-modified = {2022-08-31 17:54:26 -0500},
journal = {Methods in Ecology and Evolution},
number = {3},
pages = {380--383},
publisher = {Wiley Online Library},
title = {The Universal Floristic Quality Assessment (FQA) Calculator: an online tool for ecological assessment and monitoring},
url = {https://doi.org/10.1111/2041-210X.12491},
volume = {7},
year = {2016},
bdsk-url-1 = {https://doi.org/10.1111/2041-210X.12491}}
631 changes: 631 additions & 0 deletions paper/paper.html

Large diffs are not rendered by default.

106 changes: 106 additions & 0 deletions paper/paper.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,106 @@
---
title: 'The fqar package: R tools for analyzing floristic quality assessment data'
tags:
- R
- ecology
- floristic quality assessment
authors:
- name: Andrew Gard
orcid: 0000-0003-4434-0755
equal-contrib: false
affiliation: 1
corresponding: true
- name: Alexia Myers
equal-contrib: false
affiliation: 1
- name: Irene Luwabelwa
equal-contrib: false
affiliation: 1
affiliations:
- name: Lake Forest College, Lake Forest IL, USA
index: 1
date: 18 August 2023
bibliography: fqar_refs.bib

---

# Summary

Floristic Quality Assessment (FQA) is a standardized method for rating the ecological value of natural areas based on the plant species found within them [@spyreas2015users]. Each species considered native to a particular region is assigned a *coefficient of conservatism*, C, on a scale of 0-10 by experts in local flora. Larger values of C correspond to species that tend to be found in undegraded sites, while lower values indicate species that are more tolerant to human impacts [@bauer]. An inventory of the site is conducted and the average of the C-values found there is computed. This *native mean C-value*, sometimes weighted by the total number of plant species identified to give the so-called *floristic quality index* [@bowles2006testing], is frequently used by land managers and other agents to quantify an area's state of conservancy [@zinnen].

In recent years, it has become increasingly standard for practitioners to upload their floristic quality assessments to a central repository, [universalfqa.org](https://universalfqa.org/) [@freyman2016universal], which already includes tens of thousands of assessments from over one hundred floristic quality databases. This large public data cache represents a potentially invaluable resource for quantitative ecologists, though it has so far gone largely unexplored due to a lack of both technical tools for inteacting programatically with the repository and statistical methods for analyzing the floristic quality data housed there.

`fqar` is an R [@rcore] package which facilitates the analysis of occurrence and co-occurrence of plant taxa at the regional level. Pulling data on-demand from [universalfqa.org](https://universalfqa.org/), it provides both organizational tools for handling the disparate sorts of data housed there and statistical ones for drawing novel conclusions from that data.

# Statement of need

The [universalfqa.org](https://universalfqa.org/) website is designed primarily to aid field botanists, allowing them to rapidly obtain floristic quality assessment results simply by uploading their site inventories to the repository. While it facilitates storage and sharing, [universalfqa.org](https://universalfqa.org/) does not provide users any tools for make constructive use of its data beyond simple viewing and downloading of individual assessments. This is in keeping with the original motivation for floristic quality assessment: to aid land managers in making conservation decisions.
The `fqar` package enables analysis with a wider lens, allowing users to consider database-wide records of plant taxa or characteristics. By examining entire collections of assessments simultaneously, ecologists may gain insights into floristic quality assessment as well as the various plant species it tracks. Among the wide range of questions made answerable by `fqar` are the following:

- what is the co-occurrence profile of a given species of interest? What other plants (or types of plants) is it most frequently identified alongside?

- which species in a given database might be misclassified? Based on their co-occurrence profiles, might some be more or less conservative than previously thought?

- what species are most commonly identified in certain regions? Which have been reported seldom or not at all?

- which non-native species have become widespread in particular regions? Which tend to be symptomatic of degraded areas, and which seem to be able to coexist alongside conservative native plants?

There is currently great need in the ecological community to validate and potentially refine the floristic quality assessment methodology [@spyreas2019floristic]. Because C-values, the metric on which FQA is ultimately based, are assigned based on the experience of small numbers of local experts, there are inevitable inconsistencies and irregularities which only a larger-scale reconsideration can address. Thus far the community has only been able to take preliminary or ad hoc steps in that direction [@matthews2015null], [@bourdaghs2006properties]. The `fqar` package will allow for a more deep, targeted analysis.

# Typical workflow

Analysts using `fqar` will typically download and reformat assessments of interest before using functions like `assessment_cooccurrence_summary` to analyze the data. The following workflow does just this for the *Flora of the Chicago Region* database, an updated version of the original floristic quality manual [@wilhelm2017flora]. Depending on the needs of the specific user, such analysis can be restricted to particular practitioners, organizations, or locations, or redirected entirely along the lines described in the previous section.

First, download all public assessments in the desired database and reshape them into a standard format:

```r
library(fqar)
chicago_fqas <- download_assessment_list(database_id = 80)
chicago_invs <- assessment_list_inventory(chicago_fqas)
```

The output of the former command is a list of data frames in the original format provided by [universalfqa.org](https://universalfqa.org/). Each of these data frames includes several different sorts of information: species-level observations, summary statistics, and metadata. The second command isolates the species inventories and stores them in a tidy format [@JSSv059i10].

Next, extract co-occurrence information from this collection of species inventories:

```r
chicago_cooccurrence <- assessment_cooccurrences(chicago_invs)
````

`fqar` provides tools for both quantitative and visual descriptions of the co-occurrence profile of given species.

```r
species_profile(chicago_invs, species = "Fragaria virginiana", native = TRUE) # a data frame
species_profile_plot(chicago_invs, species = "Fragaria virginiana", native = TRUE) # a visualization
```

![\label{fig:strawberry}](strawberry_plot.png)

Here we see that *Fragaria virginiana*, the wild strawberry, is listed with C $=0$ in the Chicago database but co-occurs with a wide variety of more conservative species. In particular, it has been found with 10's more frequently than it has with other 0's.

Summary co-occurrence information for the entire database can be extracted with `assessment_cooccurrences_summary`, which gives a complete listing of all observed species and their co-occurring mean C-values.

```r
chicago_summary <- assessment_cooccurrences(chicago_invs)
```

The data generated by functions like these will be invaluable in the validation and refinement of floristic quality assessment.

# Availability

The `fqar` package is freely available via the Comprehensive R Archive Network (CRAN).

`install.packages("fqar")`

Alternatively, the latest developmental version can be installed directly from GitHub:

`devtools::install_github("equitable-equations/fqar")`

Thorough documentation is provided. A long-form vignette gives a birds-eye overview of the package's functionality while help files for individual functions provide guidance on particular data analysis tasks.

# Acknowledgements

Partial funding for this project was provided by the James Rocco Program. The authors also wish to thanks Glenn Adelson, Ph.D (Lake Forest College) and Justin Thomas, M.Sc ([NatureCITE](https://www.naturecite.org/)) for their insight into floristic quality assessment.

# References

Binary file added paper/strawberry_plot.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.

0 comments on commit 35a1dd5

Please sign in to comment.