\documentclass{article}
%\documentclass[journal=esthag,manuscript=article]{achemso}
\usepackage{authblk}
\usepackage{amsfonts}
\usepackage[version=3]{mhchem}
\usepackage{textgreek}
\usepackage{pdflscape} % landscape pages
\usepackage{lmodern} % Might prevent warnigns about unabailable fonts
\usepackage[margin=1in]{geometry} % bigger margins
%\usepackage{lineno} % line numbers
%\linenumbers
\title{Field trip report: PEEC, May 2015:\\ Novel peptidase activities in diverse freshwaters of the Pocono Mountains, PA}
\author[1]{Andrew D. Steen}
\affil[1]{Department of Microbiology, University of Tennessee, Knoxville}
\author[2]{\authorcr Malcolm X Shabazz High School Aquatic Geochemistry Team}
\author[2]{\authorcr Patrick Murray}
\author[2]{Nicholas Ferriero}
\affil[2]{Malcolm X Shabazz High School}
\author[3]{\authorcr Jeff Rosalsky}
\affil[3]{Poconos Environmental Education Center}
\usepackage{Sweave}
\begin{document}
%\input{2015-05-30_PEEC_trip_report-concordance}
\maketitle
\abstract{Extracellular enzymes are a key intermediate in the global carbon cycle, responsible for the initial step in the microbial transformation of organic matter to \ce{CO2}. Protein is a particularly important component of organic matter, becuase it contains both carbon and nitrogen, and because its component parts (amino acids) are used by all organisms. More than 300 peptidases (protein-degrading enzymes) are known, but despite the fact that many investigators have extensively studied the ecology and geochemistry of peptidases (protein-degrading enzymes) in aquatic ecosystems, all previous research in freshwater systems are limited to the analysis of a single peptidase, leucyl aminopeptidase. The purpose of this field trip was to continue a field program begun in 2013 to assess the activities of five distinct peptidases in diverse freshwater environments near the Poconos Environmental Education Center in the Delaware Water Gap National Recreation Area in eastern Pennsylvania. We show that at least four distinct peptidases are active in these waters: arginyl aminopeptidase, glycyl aminopeptidase, leucyl aminopeptidase, and trypsin. Enzymes hydrolyzing proteins containing terminal pyroglutamic acid were not observed. Patterns of peptidase activity varied among water bodies, and the ecological controls on that variability were not apparent. These data form a subset of a 3-year, multisite peptidase activity dataset which we are in the process of preparing for publication.}
%%%%%%%%%%%%
% Intro
%%%%%%%%%%%%
\section{Introduction}
Land plants `fix' \ce{CO2} into organic carbon. Most of this is rapidly reoxidized to \ce{CO2}, but approximately 0.2\% is mobilized from soils and transported by rivers to the ocean, where it may be sequestered over geological timescales \cite{Galy2015}. The transport of terrestrial organic carbon to the ocean therefore represents a key term in the global carbon cycle, so it is critical to understand the factors that control how much terrestrial organic carbon reaches the ocean. A major sink is biological activity in rivers \cite{Cole2007}, which emit $7.5 \times 10^{15}$ grams of \ce{CO2} to the atmosphere per year.
Much of this \ce{CO2} production is mediated by microorganisms, which produce extracellular enzymes in order to break down complex organic molecules outside of the cell \cite{Arnosti2013}. The set of extracellular enzymes present in an environment therefore constrains the total amount of organic carbon the community can convert to \ce{CO2}. A full, mechanistic understanding of the global carbon cycle therefore requires a good understanding of the controls on the presence and activity of extracellular enzymes produced by microbial ecosystems.
For that reason, the environmental controls on microbial extracellular enzyme production have been intensively investigated \cite{Arnosti2011,Sinsabaugh2009,Arnosti2013}. Nearly all of these studies, however, rely on a small class of compounds (`fluorogenic substrate proxies') which are capable of reporting the activities of only a small handful of distinct enzymes \cite{German2011}. Notably, we are unaware of any studies of freshwater in which activities of peptidases (protein-degrading enzymes) were assayed using any compound other than leucine 7-amido-4-methylcoumarin (or related leucine-based compounds), which reports the activity of an enzyme called leucyl aminopeptidase (E.C. 3.4.11.1). We know a great deal about the dynamics and controls of this enzyme - but there are more than 300 formally-recognized peptidases, any of which could be active and geochemically important in freshwaters.
Work by Suzuki and colleagues \cite{Obayashi2005, Obayashi2008a, Obayashi2009} has shown that in coastal Japanese seawater, endopeptidases (peptidases that cut proteins from the middle) are consistently more active than aminopeptidases (peptidases that cut proteins from one end). Our group has also observed this pattern in deep marine sediments from the Baltic Sea \cite{Lloyd2013}.This pattern, however, is far from universal: in an Arctic fjord \cite{Steen2013} and the Amazon River (Steen et al. in prep), aminopeptidases are more active than endopeptidases. It seems, therefore that different sets of peptidases are present in different environments. The goals of this field trip were to address the following questions about freshwater peptidases:
\begin{itemize}
\item What is the range of peptidases present in ecologically diverse freshwaters of the Pocono mountains?
\item Do patterns of peptidase activities vary from place to place?
\item Are patterns of peptidases predicted by ecological factors such as the type of water body?
\end{itemize}
%%%%%%%%%%
% METHODS
%%%%%%%%%%
\section{Methods}
\subsection{Sites and sample collection}
% Map of sample sites
\begin{figure}
\centering
\includegraphics{2015-05-30_PEEC_trip_report-p_map}
\caption{Map of sampling sites. \label{p_map}}
\end{figure}
Samples were collected from ecologically diverse sites in the vicinity of Pocono Environmental Education Center (Fig \ref{p_map}). Sample locations and brief descriptions are given in Table \ref{sites.table}. Samples were collected from near shore in clean, 1-L polyethylene bottles. Sample temperature was measured in bulk water at the time of collection. Sample pH was measured onsite using pH paper, and again at the University of Tennessee using an electronic pH meter.
\subsection{Enzyme assays}
Five peptidase substrates, intended to assay five distinct classes of peptidase, were used (Table \ref{substrate.table}). Enzyme activity was determined roughly following the procedure described in (Steen and Arnosti Svalbard peptidases): for each sample and substrate, there were three live samples and one kiled control. The control was killed by briefly boiling the sample. Incubations were performed in individual 1-mL (`semi-micro`) methacrylate cuvettes. To each cuvette, 860 \textmugreek L unfiltered sample or killed control, 100 \textmugreek L phosphate buffer (100 mM, pH=7.5), and 40 \textmugreek L substrate (10 mM stock concentration, dissolved in 90\% MilliQ-\ce{H2O} / 10\% DMSO, for a final substrate concentration of 400 \textmugreek L) was added. 400 \textmugreek M substrate concentration was observed in 2013 to be approximately saturating for these samples and substrates. Cuvettes were capped and mixed thoroughly, and a \ce{t_0} fluorescence measurement was made. Cuvettes were incubated at room temperature (20-22 $^o$C) for two hours (less in some cases due to logistical constraints). Fluorescence was then measured approximately every 15 minutes during the incubation period using a Promega Quantifluor ST fluorimeter or a Promega Glomax Jr fluorimeter, in each case set to UV mode. For each sample, a calibration curve was obtained using pure AMC standard dissolved in MilliQ-\ce{H2O}, again mixed with 860 \textmugreek L sample, 100 \textmugreek phosphate buffer and an appropriate volume of water such that the total volume was always 1000 \textmugreek L.
\subsection{Data analysis}
Enzyme data were analyzed using the R statistical package \cite{RCoreTeam2013} and the \texttt{enzalyze} package \linebreak (http://github.com/adsteen/enzalyze).
%%%%%%%%%%%%
% Results
%%%%%%%%%%%%
\section{Results}
\subsection{Data quality control}
\begin{figure}
\centering
\includegraphics{2015-05-30_PEEC_trip_report-p_raw}
\caption{All raw data from the 2015 PEEC trip. \label{p_raw}}
\end{figure}
Prior to analysis, three obvious outlier data points were removed, out of 1140 total data points collected. Plots of raw data showed that, in general, fluorescence increased linearly as a function of time in the live samples, and was constant in the killed controls (Fig. \ref{p_raw}). Note that, since the gain of the three fluorimeters varied significantly, rates of fluorescence activity should not be compared among sites.
\subsection{Levels of peptidase activity}
\begin{figure}
\includegraphics{2015-05-30_PEEC_trip_report-p_summed}
\caption{Summed activities of peptidases at each site. \label{p_summed}}
\end{figure}
Activities were highest in small, algae-covered ponds and lower in clearer ponds/lakes, streams, and the Delaware River (Fig \ref{p_summed}). There was not a terribly obvious ecological pattern to the summed activities, however: Front Pond and Loch Lomond, for instance, are both ponds of several hundred meters in diameter free from surface macroalgae, although they were on opposite ends of the spectrum of summed peptidase activities.
\subsection{Patterns of peptidase activity}
\begin{figure}
\centering
\includegraphics{2015-05-30_PEEC_trip_report-p_v0}
\caption{Activities of individual peptidases at each site. \label{p_v0}}
\end{figure}
Some patterns in the activities of individual enzymes were evident (Fig \ref{p_v0}). Hydrolysis rates of Gly-AMC and Pyr-AMC were always very close to zero, whereas hydrolysis rates of Arg-AMC, Leu-AMC, and GlyGlyArg-AMC were generally much faster. Leu-AMC was often the fastest-hydrolyzed substrate, but in some cases GlyGlyArg-AMC was much more active.
\begin{figure}
\centering
\includegraphics{2015-05-30_PEEC_trip_report-leuVsOthers}
\caption{Hydrolysis rate of Leu-AMC vs Arg-AMC (left) and Leu-AMC vs GlyGlyArg-AMC \label{leu.vs.others}}
\end{figure}
There was a relatively tight relationship between hydrolysis rate of arginyl aminopeptidase and leucyl aminopeptidase (p = 0.00081) and between glycyl aminopeptidase and leucyl aminopeptidase (p = 0.0017), whereas there was no significant relationship between trypsin and leucyl aminopeptidase (p = 0.84, Fig \ref{leu.vs.others}). The close correspondence between leucyl aminopeptidase and arginyl aminopeptidase, but not trypsin, is also evident from principal components analysis of the full dataset (with pyroglutamyl aminopeptidase removed, because those rates were generally not distinguishable from zero).
\begin{figure}
\centering
\includegraphics{2015-05-30_PEEC_trip_report-pPCA}
\caption{Principal components biplot of enzyme activities (Pyroglutamyl acid removed due because activities were generally below the detection limit). \label{p_pca}}
\end{figure}
\section{Discussion}
\subsection{Levels of peptidase activity}
There was no clear factor driving summed peptidase activities. However, the lack of metadata makes it difficult to evaluate this further: for instance, knowing cell concentrations would be useful, as cell-specific enzyme activities might be more constant. It will be possible to collect such data in 2016.
\subsection{Patterns of peptidase activity}
Patterns of enzyme activities likewise varied. Because leucyl aminopeptidase, glycyl aminopeptidase, and arginyl aminopeptidase were all fairly tightly inter-correlated, the main axis of variation of enzyme activities was the ratio of endopeptidase activity (trypsin, which cleaves proteins in the middle) to aminopeptidase activities (the aminopeptidases, which remove aminopeptidases from the N-termini of proteins). This difference seems to point to a difference in microbial communities' strategies for obtaining protein: the communities at sites TW, PP and DR (i.e., those in the bottom half of the Fig \ref{p_pca}) primarily access protein by degrading it from the middle, whereas communities at sites AC, LL, and BS primarily access protein from the ends. We note that we did not assay for carboxypeptidases (enzymes that cleave single amino acids from the C-terminus of proteins) because reliable fluorogenic substrates for those peptidases are not available, and that other peptidases (e.g. other endopeptidases, dipeptidyl aminopeptidases, etc.) may be present but poorly assayed by the substrates we have used. Thus, other dimensions of variability in protein acquisition may exist. The results presented here show - for the first time in any aquatic system - that substantial variability exists in the pathways by which microbial communities access protein.
These results do not point to an obvious factor driving protein acquisition strategies among sites: for instance, sites AC and TW are both small streams, yet they are on opposite ends of the endopeptidase/aminopeptidase spectrum. Likewise, sites PP and LL are both midsize (ca. 100-400 m major axis) ponds that are largely free from visible macroalgae, but have opposite protein degradation strategies.
We may hypothesize that protein acquisition strategies are driven by some combination of environmental and biological factors, possibly including nutrient status, dissolved orgnaic matter concentration or composition, microbial community composition (including microscopic eukaryotes), or other factors. Untangling those factors will require careful characterization of the chemical and biological environment of each site.
A substantial body of literature clearly demonstrates differences in ecosystem function at all spatial scales, at the level of `gross` ecosystem function: for instance, rates of carbon preservation or \ce{CO2} production, N transformation, etc. This work shows that functional variation may exist at very fine scale of individual enzyme production as well.
\section{Project overview}
\subsection{Previous work}
The 2015 trip represents the third year of the University of Tennessee / Malcolm X Shabazz High School collaboration to investigate enzyme activities around PEEC. In the first year, we collected saturation curves (measurements of enzyme activities at varying substrate concentrations) which told us what the correct substrate concentration to use in future experiments was, and which demonstrated clearly that the increase in fluorescence we measure in our samples is due to enzyme activities rather than to some artifact. The 2014 dataset looks a lot like the 2015 dataset, although we have not analyzed it as carefully at this point.
An undergraduate student, Lauren Mullen, has collected a parallel dataset of about 15 sites, using the same substrates and protocols as described in this report, in waters around the University of Tennessee and in the Smokies Mountains. Those data will be analyzed by the end of June 2015, and collated with the data presented here.
\subsection{Future work}
\subsubsection{Coastal samples}
During the end of the 2015 school year, Patrick Murray is expecting to add to our dataset by meausring enzyme activities in samples of coastal and estuarine water bodies around Newark, NJ. These samples will considerably expand the range of ecosystems we have measured, and will provide us with a true headwaters-to-ocean dataset.
\subsubsection{Temporal stability}
Over three years, we have sampled a wide range of environments, but none more than three times. \textbf{It will be important to determine how much temporal variability exists in protein degradation pathways}. We will use two strategies to address this. First, we can compare several sites that have been sampled in all three years of the PEEC experiments. Second, we can select several sites in Tennessee to repeatedly sample (say 1-2 times per week) for several weeks. We have reason to believe that the patterns will be broadly stable: the Suzuki lab, which has been using a range of peptidase substrates since 2005 but which has restricted their investigation to a single location in southern coastal Japan, has found that endopeptidases are consistently more active than exopeptidases \cite{Obayashi2005, Obayashi2008a, Obayashi2009}.
\subsubsection{Data integration and publication}
Between the three years of PEEC experiments, the soon-to-be-collected data from coastal New Jersey, and the more recent, parallel work in east Tennessee, we have collected a substantial dataset about relative activities of the five enzymes listed in Table \ref{sites.table}. It will take some time to confirm that the data have all been analyzed in the same way and to integrate the various datasets and synthesized the results. We expect to perform that data integration and synthesis, and to submit a manuscript (probably to the open-access journal Frontiers in Aquatic Microbiology) by the fall of 2015.
%%%%%%%%%%
% Horizontal-format tables
%%%%%%%%%%
% Landscape environment for tables because they're both wide
\begin{landscape}
% Table of site characteristics
\begin{table}
\centering
\begin{tabular}{l c c c c r}
site & name & coordinates & temp., $^o$C & date-time & description \\
\hline
FP & Front Pond & 41.170668 N, 74.91492 W & 25 & 5/27/15 12:10 & clearwater pond \\
AC & Alicia's Creek & 41.16923333 N, 74.91406667 & 20 & 5/27/15 13:58 & first-order stream \\
PP & Pickerel Pond & 41.167504 N, 74.917862 W & 27 & 5/27/15 14:06 & clearwater pond \\
BS & Briscoe Swamp & 41.16796667 N, 74.9211 W & 21 & 5/28/15 08:55 & macroalgae-rich shallow swamp \\
TW & Tumbling Waters Creek & 41.15451667 N, 74.91775 W & 18 & 5/28/15 09:16 & fast-flowing second-order stream \\
LL & Loch Lomond & 41.20705 N, 74.89605 W & 23 & 5/28/15 09:40 & clearwater pond \\
DR & Delaware River & 41.13724 N, 74.926029 W & 25 & 5/28/15 12:35 & major river \\
BB1 & Basketball Court Pond 1\footnote{Jeff, does this pond have a name?} & pending & 23 & 5/28/15 13:53 & small, macroalgae-rich pond \\
BB2 & Basketball Court Pond 2 & pending & 23 & 5/28/15 13:58 & semi-connected shallow bay adjacent to BB1 \\
VP & Vernal Pool & 41.16935 N, 74.91406667 W & 23 & 5/28/15 13:38 & Vernal pool on Fossil Trail \\
\hline
\end{tabular}
\caption{Sites sampled in 2015. \label{sites.table}}
\end{table}
% Table of substrates and enzymes
\begin{table}
\centering
\begin{tabular}{l l r}
Substrate & Abbrev. & Enzyme \\
\hline
Arginine-AMC & Arg-AMC & arginyl aminopeptidase \\
Glycine-AMC & Gly-AMC & glycyl aminopeptidase \\
Leucine AMC & Leu-AMC & leucyl aminopeptidase \\
Pyroglutamic acid-AMC & Pyr-AMC & pyroglutamyl aminopeptidase\footnote{This is a functional name for a hypothetical peptidase which has not been formally described.} \\
Glycine-Glycine-Argnine-AMC & GlyGlyArg-AMC & trypsin \\
\end{tabular}
\caption{List of substrates used in this experiment and the enzymes they assay.}
\label{substrate.table}
\end{table}
\end{landscape}
%%%%%%%%%%%
% References
%%%%%%%%%%%
\bibliographystyle{plain}
\bibliography{PEECbib}
\end{document}