{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Comparison of 201905 Model Phytoplankton to HPLC Phytoplankton Abundances from Nina Nemcek"
]
},
{
"cell_type": "code",
"execution_count": 1,
"metadata": {
"papermill": {
"duration": 2.59497,
"end_time": "2020-11-16T18:41:27.623510",
"exception": false,
"start_time": "2020-11-16T18:41:25.028540",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"import numpy as np # this module handles arrays, but here we need it for its NaN value\n",
"import pandas as pd # this module contains a lot of tools for handling tabular data\n",
"from matplotlib import pyplot as plt\n",
"from salishsea_tools import evaltools as et\n",
"import datetime as dt\n",
"import os\n",
"import gsw\n",
"import pickle\n",
"import netCDF4 as nc\n",
"import cmocean\n",
"from scipy import stats as spst\n",
"from pandas.plotting import register_matplotlib_converters\n",
"register_matplotlib_converters()\n",
"%matplotlib inline"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Note: the crypto+hapto+prasino grouping was actually determined based on comparisons to the 201812 model run."
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Load data and matched model output"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"papermill": {
"duration": 0.021207,
"end_time": "2020-11-16T18:41:27.664289",
"exception": false,
"start_time": "2020-11-16T18:41:27.643082",
"status": "completed"
},
"tags": [
"parameters"
]
},
"outputs": [],
"source": [
"# Run configuration; this cell carries the papermill 'parameters' tag (see the cell metadata).\n",
"modSourceDir= '/results2/SalishSea/nowcast-green.201905/' # model results directory, passed to et.matchData as PATH\n",
"modver='201905' # model version label, used in the name of the matched-data pickle file\n",
"Chl_N=1.8 # Chl:N ratio; model phytoplankton fields are multiplied by this before comparison with observations\n",
"startYMD=(2015,1,1) # (year, month, day) used to build start_date\n",
"endYMD=(2018,12,31) # (year, month, day) used to build end_date"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"papermill": {
"duration": 0.021268,
"end_time": "2020-11-16T18:41:27.741462",
"exception": false,
"start_time": "2020-11-16T18:41:27.720194",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"# Expand the (year, month, day) parameter tuples into the datetime bounds of the comparison period.\n",
"start_date = dt.datetime(*startYMD[:3])\n",
"end_date = dt.datetime(*endYMD[:3]) #dt.datetime(2019,6,30)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {
"papermill": {
"duration": 0.020773,
"end_time": "2020-11-16T18:41:27.779566",
"exception": false,
"start_time": "2020-11-16T18:41:27.758793",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"# Suffix of the form _YYYYMMDD_YYYYMMDD built from the start and end dates.\n",
"datestr=f'_{start_date:%Y%m%d}_{end_date:%Y%m%d}'"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {
"papermill": {
"duration": 0.056725,
"end_time": "2020-11-16T18:41:29.562101",
"exception": false,
"start_time": "2020-11-16T18:41:29.505376",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"# Read the 'tmask', 'nav_lat' and 'nav_lon' variables from the mesh mask file.\n",
"# np.copy is applied to each slice, so the arrays stay usable after the with block has closed the dataset.\n",
"with nc.Dataset('/ocean/eolson/MEOPAR/NEMO-forcing/grid/mesh_mask201702_noLPE.nc') as mesh:\n",
"    tmask=np.copy(mesh.variables['tmask'][0,:,:,:]) # index 0 on the first axis (presumably time - TODO confirm)\n",
"    navlat=np.copy(mesh.variables['nav_lat'][:,:])\n",
"    navlon=np.copy(mesh.variables['nav_lon'][:,:])"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {
"papermill": {
"duration": 0.022584,
"end_time": "2020-11-16T18:41:27.819353",
"exception": false,
"start_time": "2020-11-16T18:41:27.796769",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"def subval(idf,colList):\n",
"    \"\"\"Coalesce several columns of a DataFrame into the first one listed.\n",
"\n",
"    Values that pandas regards as missing in colList[0] are filled from colList[1];\n",
"    values still missing are filled from colList[2], and so on in order of precedence.\n",
"    The fallback columns (everything after the first name) are then dropped.\n",
"\n",
"    :arg idf: table to modify; it is changed in place and also returned\n",
"    :type idf: pandas.DataFrame\n",
"    :arg colList: column names; the first is the column to keep, the rest are\n",
"                  fallbacks in order of precedence (any number, at least one)\n",
"    :type colList: sequence of str\n",
"    :returns: idf, with colList[0] filled in and the fallback columns removed\n",
"    :raises NotImplementedError: if fewer than two column names are given\n",
"    \"\"\"\n",
"    if len(colList)<2:\n",
"        raise NotImplementedError('Add to code to handle this case')\n",
"    keep=colList[0]\n",
"    merged=idf[keep]\n",
"    for fallback in colList[1:]:\n",
"        # both columns come from idf and share its index, so each row is filled from the same row\n",
"        merged=merged.fillna(idf[fallback])\n",
"    idf[keep]=merged\n",
"    idf.drop(columns=list(colList[1:]),inplace=True)\n",
"    return idf"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {
"papermill": {
"duration": 0.032863,
"end_time": "2020-11-16T18:41:27.869564",
"exception": false,
"start_time": "2020-11-16T18:41:27.836701",
"status": "completed"
},
"tags": []
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"matched_201905_20150101_20181231_NewALLO.pkl\n"
]
}
],
"source": [
"matched_pkl='matched_'+modver+datestr+'_NewALLO.pkl' # pickle file holding previously matched obs/model data\n",
"if os.path.isfile(matched_pkl):\n",
"    # NOTE(review): pickle.load can execute arbitrary code; only load files written by this notebook.\n",
"    # The file is opened in a with block so that the handle is closed as soon as the data are read.\n",
"    with open(matched_pkl,'rb') as f:\n",
"        data=pickle.load(f)\n",
"    print(matched_pkl)\n",
"else:\n",
" # define paths to the source files and eventual output file\n",
" flist=('/ocean/eolson/MEOPAR/obs/NemcekHPLC/bottlePhytoMerged2015_NewALLO.csv',\n",
" '/ocean/eolson/MEOPAR/obs/NemcekHPLC/bottlePhytoMerged2016_NewALLO.csv',\n",
" '/ocean/eolson/MEOPAR/obs/NemcekHPLC/bottlePhytoMerged2017_NewALLO.csv',\n",
" '/ocean/eolson/MEOPAR/obs/NemcekHPLC/bottlePhytoMerged2018_NewALLO.csv')#,\n",
" #'/ocean/eolson/MEOPAR/obs/NemcekHPLC/bottlePhytoMerged2019.csv')\n",
"\n",
" dfs=list()\n",
" for fname in flist:\n",
" idf=pd.read_csv(fname)\n",
" print(fname,sorted(idf.keys()))\n",
" dfs.append(idf)\n",
" df=pd.concat(dfs,ignore_index=True,sort=False); # concatenate the list into a single table\n",
"\n",
" df.drop(labels=['ADM:MISSION','ADM:PROJECT','ADM:SCIENTIST','Zone','Zone.1','Temperature:Draw',\n",
" 'Temperature:Draw [deg C (ITS90)]','Bottle:Firing_Sequence','Comments by sample_numbeR',\n",
" 'File Name','LOC:EVENT_NUMBER','Number_of_bin_records'\n",
" ],axis=1,inplace=True)\n",
"\n",
" #df=subval(df,('Dictyochophytes','Dictyo'))\n",
" df=subval(df,('Chlorophyll:Extracted [mg/m^3]','Chlorophyll:Extracted'))\n",
" #df=subval(df,('Dinoflagellates','Dinoflagellates-1'))\n",
" df=subval(df,('Fluorescence [mg/m^3]','Fluorescence:URU:Seapoint [mg/m^3]','Fluorescence:URU:Seapoint'))\n",
" df=subval(df,('Lat','LOC:LATITUDE'))\n",
" df=subval(df,('Lon','LOC:LONGITUDE'))\n",
" df=subval(df,('Nitrate_plus_Nitrite [umol/L]','Nitrate_plus_Nitrite'))\n",
" df=subval(df,('PAR [uE/m^2/sec]','PAR'))\n",
" df=subval(df,('Phaeo-Pigment:Extracted [mg/m^3]','Phaeo-Pigment:Extracted'))\n",
" df=subval(df,('Phosphate [umol/L]','Phosphate'))\n",
" df=subval(df,('Pressure [decibar]','Pressure'))\n",
" #df=subval(df,('Raphidophytes','Raphido'))\n",
" df=subval(df,('Salinity','Salinity [PSS-78]','Salinity:T1:C1 [PSS-78]'))\n",
" df=subval(df,('Salinity:Bottle','Salinity:Bottle [PSS-78]'))\n",
" df=subval(df,('Silicate [umol/L]','Silicate'))\n",
" #df=subval(df,('TchlA (ug/L)','TchlA'))\n",
" df=subval(df,('Temperature','Temperature [deg C (ITS90)]','Temperature:Secondary [deg C (ITS90)]'))\n",
" df=subval(df,('Transmissivity [*/metre]','Transmissivity'))\n",
"\n",
" df['Z']=np.where(pd.isna(df['Depth [metres]']),\n",
" -1*gsw.z_from_p(df['Pressure [decibar]'].values,df['Lat'].values),\n",
" df['Depth [metres]'])\n",
" df['p']=np.where(pd.isna(df['Pressure [decibar]']),\n",
" gsw.p_from_z(-1*df['Depth [metres]'].values,df['Lat'].values),\n",
" df['Pressure [decibar]'])\n",
" df['SA']=gsw.SA_from_SP(df['Salinity'].values,df['p'].values,df['Lon'].values,df['Lat'].values)\n",
" df['CT']=gsw.CT_from_t(df['SA'].values,df['Temperature'].values,df['p'].values)\n",
" df.rename({'TchlA':'TchlA (ug/L)','Raphido':'Raphidophytes','Dinoflagellates-1':'Dinoflagellates',\n",
" 'Dictyo':'Dictyochophytes'},axis=1, inplace=True, errors='raise')\n",
" df['dtUTC']=[dt.datetime.strptime(ii,'%Y-%m-%d %H:%M:%S') if isinstance(ii,str) else np.nan for ii in df['FIL:START TIME YYYY/MM/DD HH:MM:SS'] ]\n",
"\n",
" PATH= modSourceDir\n",
"\n",
" flen=1\n",
" namfmt='nowcast'\n",
" #varmap={'N':'nitrate','Si':'silicon','Ammonium':'ammonium'}\n",
" filemap={'nitrate':'ptrc_T','silicon':'ptrc_T','ammonium':'ptrc_T','diatoms':'ptrc_T','ciliates':'ptrc_T','flagellates':'ptrc_T','vosaline':'grid_T','votemper':'grid_T'}\n",
" #gridmap={'nitrate':'tmask','silicon':'tmask','ammonium':'tmask'}\n",
" fdict={'ptrc_T':1,'grid_T':1}\n",
"\n",
" data=et.matchData(df,filemap,fdict,start_date,end_date,namfmt,PATH,flen)\n",
"\n",
" with open('matched_'+modver+datestr+'_NewALLO.pkl','wb') as f:\n",
" pickle.dump(data,f)"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Index(['FIL:START TIME YYYY/MM/DD HH:MM:SS', 'LOC:STATION', 'Lat', 'Lon',\n",
" 'LOC:WATER DEPTH', 'Sample_Number', 'Temperature', 'Salinity',\n",
" 'Oxygen:Dissolved:CTD', 'pH:SBE:Nominal', 'Salinity:Bottle',\n",
" 'Flag:Salinity:Bottle', 'Flag:Chlorophyll:Extracted',\n",
" 'Flag:Nitrate_plus_Nitrite', 'Flag:Silicate', 'Flag:Phosphate',\n",
" 'Cruise', 'Oxygen:Dissolved', 'Flag:Oxygen:Dissolved', 'Diatoms-1',\n",
" 'Diatoms-2', 'Prasinophytes', 'Cryptophytes', 'Dinoflagellates',\n",
" 'Haptophytes', 'Dictyochophytes', 'Raphidophytes', 'Cyanobacteria',\n",
" 'TchlA (ug/L)', 'Pressure [decibar]', 'Transmissivity [*/metre]',\n",
" 'PAR [uE/m^2/sec]', 'PAR:Reference [uE/m^2/sec]',\n",
" 'Oxygen:Dissolved:SBE [mL/L]', 'Oxygen:Dissolved:SBE [umol/kg]',\n",
" 'Chlorophyll:Extracted [mg/m^3]', 'Phaeo-Pigment:Extracted [mg/m^3]',\n",
" 'Nitrate_plus_Nitrite [umol/L]', 'Silicate [umol/L]',\n",
" 'Phosphate [umol/L]', 'Bottle_Number', 'Oxygen:Dissolved [mL/L]',\n",
" 'Oxygen:Dissolved [umol/kg]', 'Depth [metres]', 'Fluorescence [mg/m^3]',\n",
" 'Oxygen:Dissolved:CTD [mL/L]', 'Oxygen:Dissolved:CTD [umol/kg]',\n",
" 'Depth:Nominal [metres]', 'Alkalinity:Total [umol/L]',\n",
" 'Flag:Alkalinity:Total', 'Carbon:Dissolved:Inorganic [umol/kg]',\n",
" 'Flag:Carbon:Dissolved:Inorganic', 'Z', 'p', 'SA', 'CT', 'dtUTC', 'j',\n",
" 'i', 'mod_nitrate', 'mod_silicon', 'mod_ammonium', 'mod_diatoms',\n",
" 'mod_ciliates', 'mod_flagellates', 'mod_vosaline', 'mod_votemper', 'k'],\n",
" dtype='object')"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data.keys()"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['SI', '59', '102', '75', '72', '69', 'ADCP', '65', '63', '62',\n",
" '56', '46', '42', '39', 'GE01', '27', '2', '3', 'BS', '6', '9',\n",
" '12', '14', '16', '22', '11', 'CPF2', 'CPF1', '24', '28', '38',\n",
" '41', 'BS17', '19', 'GEO1', 'BS11', 'SC-04', '66', 'BI2', 'JF2',\n",
" 'HARO59', 'SI03', '15', 'SC04', '40', 'qu39', 'Van1', 'BS-11',\n",
" 'adcp', 'QU39', 'CPF-2', 'CPF-1', 'Haro 59', 'BS2', 'IS-2', 'PEN1',\n",
" 'PEN2', 'PEN3'], dtype=object)"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['LOC:STATION'].unique()"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {
"papermill": {
"duration": 0.026848,
"end_time": "2020-11-16T18:41:27.913839",
"exception": false,
"start_time": "2020-11-16T18:41:27.886991",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"# Add up the seven HPLC groups listed below into a single 'other' column.\n",
"# The fold starts from 0.0 and adds the columns left to right.\n",
"data['other']=sum((data[el] for el in ('Cryptophytes', 'Cyanobacteria', 'Dictyochophytes', 'Dinoflagellates',\n",
"                                       'Haptophytes', 'Prasinophytes', 'Raphidophytes')), 0.0)"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {
"papermill": {
"duration": 0.104595,
"end_time": "2020-11-16T18:41:29.169217",
"exception": false,
"start_time": "2020-11-16T18:41:29.064622",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"def yd(idt):\n",
"    \"\"\"Return the day of the year (1 for January 1st) for a datetime or for each element of a collection.\n",
"\n",
"    :arg idt: a single datetime (datetime subclasses such as pandas.Timestamp included),\n",
"              or an iterable of them (list, array, pandas Series)\n",
"    :returns: an int for a single datetime, otherwise a list of int in input order\n",
"    \"\"\"\n",
"    def _day_of_year(d):\n",
"        # whole days elapsed since December 31st of the previous year, so January 1st gives 1\n",
"        return (d-dt.datetime(d.year-1,12,31)).days\n",
"    # isinstance rather than an exact type comparison, so datetime subclasses are treated as scalars\n",
"    if isinstance(idt,dt.datetime):\n",
"        return _day_of_year(idt)\n",
"    return [_day_of_year(ii) for ii in idt] # assume array or pandas\n",
"\n",
"data['yd']=yd(data['dtUTC'])\n",
"data['Year']=[ii.year for ii in data['dtUTC']]"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {
"papermill": {
"duration": 0.022354,
"end_time": "2020-11-16T18:41:28.515306",
"exception": false,
"start_time": "2020-11-16T18:41:28.492952",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"# define log transform function with slight shift to accommodate zero values\n",
"def logt(x,shift=.001):\n",
"    \"\"\"Return log10(x+shift).\n",
"\n",
"    :arg x: value(s) to transform; a scalar, numpy array or pandas object\n",
"    :arg shift: constant added before taking the logarithm so that zeros stay finite\n",
"    :returns: the base-10 logarithm of x+shift, in the same container type numpy returns for x\n",
"    \"\"\"\n",
"    return np.log10(x+shift)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Determine which HPLC groups have the highest biomass"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"2.1757399193548412"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Diatoms-1'].mean() ## Highest biomass"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.3043850806451614"
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Diatoms-2'].mean() ## include"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.03817540322580645"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Cyanobacteria'].mean() ## exclude due to low biomass"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.4574556451612899"
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Cryptophytes'].mean() ## include"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.21607862903225808"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Prasinophytes'].mean() ## include"
]
},
{
"cell_type": "code",
"execution_count": 18,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.23795766129032253"
]
},
"execution_count": 18,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Haptophytes'].mean() ## include"
]
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.039802419354838664"
]
},
"execution_count": 19,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Dictyochophytes'].mean() ## exclude due to low biomass"
]
},
{
"cell_type": "code",
"execution_count": 20,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.10347580645161288"
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Dinoflagellates'].mean() # exclude due to low biomass"
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.40433064516129036"
]
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data['Raphidophytes'].mean() ## Include"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [],
"source": [
"data['Month']=[ii.month for ii in data['dtUTC']]"
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [],
"source": [
"# numeric_only=True: the table also holds text columns, which cannot be averaged\n",
"# (pandas>=2.0 raises on them instead of silently dropping them).\n",
"monthlymean=data.groupby(['Month']).mean(numeric_only=True)"
]
},
{
"cell_type": "code",
"execution_count": 24,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Month\n",
"2 0.120424\n",
"3 3.233714\n",
"4 4.943088\n",
"5 2.529966\n",
"6 2.168265\n",
"7 0.551176\n",
"8 2.249000\n",
"9 0.941815\n",
"10 1.593719\n",
"11 0.785317\n",
"Name: Diatoms-1, dtype: float64"
]
},
"execution_count": 24,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"monthlymean['Diatoms-1']"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {},
"outputs": [],
"source": [
"# Sum of the monthly means of Diatoms-1, Raphidophytes and Diatoms-2.\n",
"# NOTE(review): Raphidophytes is also a term of the 'HPLCFlag' sum, so it is counted in both groups - confirm this is intended.\n",
"monthlymean['HPLCDiatoms']=(monthlymean['Diatoms-1']+monthlymean['Raphidophytes']+monthlymean['Diatoms-2'])"
]
},
{
"cell_type": "code",
"execution_count": 26,
"metadata": {},
"outputs": [],
"source": [
"# Sum of the monthly means of Cryptophytes, Haptophytes and Raphidophytes (presumably the flagellate counterpart of 'HPLCDiatoms').\n",
"# NOTE(review): the note at the top of the notebook and the 'CPH' column use crypto+hapto+prasino, whereas this sum has\n",
"# Raphidophytes in place of Prasinophytes; Raphidophytes is also part of 'HPLCDiatoms' - confirm this grouping is intended.\n",
"monthlymean['HPLCFlag']=(monthlymean['Cryptophytes']+monthlymean['Haptophytes']+monthlymean['Raphidophytes'])"
]
},
{
"cell_type": "code",
"execution_count": 27,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Month\n",
"2 0.337182\n",
"3 3.697286\n",
"4 5.422284\n",
"5 3.205103\n",
"6 3.780675\n",
"7 0.780706\n",
"8 4.946000\n",
"9 1.361207\n",
"10 2.194649\n",
"11 0.897024\n",
"Name: HPLCDiatoms, dtype: float64"
]
},
"execution_count": 27,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"monthlymean['HPLCDiatoms']"
]
},
{
"cell_type": "code",
"execution_count": 28,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/ksuchy/anaconda3/envs/py39/lib/python3.9/site-packages/pandas/core/groupby/groupby.py:1510: RuntimeWarning: divide by zero encountered in true_divide\n",
" result.iloc[:, cols].values / np.sqrt(self.count().iloc[:, cols]).values\n"
]
}
],
"source": [
"# Keep only numeric columns before aggregating: sem() raises on text columns in pandas>=2.0,\n",
"# and select_dtypes works on older pandas versions whose sem() has no numeric_only keyword.\n",
"# NOTE(review): this is the log transform of the standard error, not the standard error of log-transformed values - confirm intent.\n",
"monthlysem=logt(data.select_dtypes(include='number').groupby(['Month']).sem())"
]
},
{
"cell_type": "code",
"execution_count": 29,
"metadata": {},
"outputs": [],
"source": [
"# Log-transformed monthly means. Model fields are multiplied by Chl_N before the transform.\n",
"for _dest,_src in (('L10mod_diatoms','mod_diatoms'),\n",
"                   ('L10mod_flagellates','mod_flagellates')):\n",
"    monthlymean[_dest]=logt(monthlymean[_src]*Chl_N)\n",
"# Observed HPLC groups, total chlorophyll a and the combined HPLC groups are transformed directly.\n",
"for _dest,_src in (('L10Diatoms-1','Diatoms-1'),\n",
"                   ('L10Diatoms-2','Diatoms-2'),\n",
"                   ('L10Cryptophytes','Cryptophytes'),\n",
"                   ('L10Prasinophytes','Prasinophytes'),\n",
"                   ('L10Haptophytes','Haptophytes'),\n",
"                   ('L10Raphidophytes','Raphidophytes'),\n",
"                   ('L10TotalChla','TchlA (ug/L)'),\n",
"                   ('L10HPLCDiatoms','HPLCDiatoms'),\n",
"                   ('L10HPLCFlag','HPLCFlag')):\n",
"    monthlymean[_dest]=logt(monthlymean[_src])"
]
},
{
"cell_type": "code",
"execution_count": 30,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Month\n",
"2 -2.432694\n",
"3 -1.367311\n",
"4 -0.199868\n",
"5 0.144985\n",
"6 -0.174303\n",
"7 -0.161647\n",
"8 -0.892479\n",
"9 -1.197468\n",
"10 -1.436750\n",
"11 -1.700827\n",
"Name: L10mod_diatoms, dtype: float64"
]
},
"execution_count": 30,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"monthlymean['L10mod_diatoms']"
]
},
{
"cell_type": "code",
"execution_count": 31,
"metadata": {},
"outputs": [],
"source": [
"# define inverse log transform with same shift\n",
"def logt_inv(y):\n",
" return 10**y-.001"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Model vs Obs Plots for various model-obs groups"
]
},
{
"cell_type": "markdown",
"metadata": {
"papermill": {
"duration": 0.028767,
"end_time": "2020-11-16T18:41:32.112120",
"exception": false,
"start_time": "2020-11-16T18:41:32.083353",
"status": "completed"
},
"tags": []
},
"source": [
"### Correlation Coefficient Matrix"
]
},
{
"cell_type": "code",
"execution_count": 32,
"metadata": {
"papermill": {
"duration": 0.040984,
"end_time": "2020-11-16T18:41:31.918310",
"exception": false,
"start_time": "2020-11-16T18:41:31.877326",
"status": "completed"
},
"tags": []
},
"outputs": [],
"source": [
"# Scale each model group by Chl_N and add the three scaled columns into a model total.\n",
"for _dest,_src in (('mod_diatoms_chl','mod_diatoms'),\n",
"                   ('mod_flagellates_chl','mod_flagellates'),\n",
"                   ('mod_ciliates_chl','mod_ciliates')):\n",
"    data[_dest]=Chl_N*data[_src]\n",
"data['mod_TChl']=data['mod_diatoms_chl']+data['mod_flagellates_chl']+data['mod_ciliates_chl']\n",
"# Combined observed groups: crypto+prasino+hapto and the two diatom classes.\n",
"data['CPH']=data['Cryptophytes']+data['Prasinophytes']+data['Haptophytes']\n",
"data['DD']=data['Diatoms-1']+data['Diatoms-2']\n",
"# Columns entering the correlation and covariance matrices, in display order.\n",
"corrCols=['Diatoms-1', 'Diatoms-2','Cyanobacteria','Cryptophytes', 'Prasinophytes',\n",
"          'Haptophytes', 'Dictyochophytes','Dinoflagellates','Raphidophytes','DD','CPH','TchlA (ug/L)',\n",
"          'mod_diatoms_chl','mod_flagellates_chl','mod_ciliates_chl','mod_TChl']\n",
"dfVars=data.loc[:,corrCols]"
]
},
{
"cell_type": "code",
"execution_count": 33,
"metadata": {
"papermill": {
"duration": 0.046279,
"end_time": "2020-11-16T18:41:32.187547",
"exception": false,
"start_time": "2020-11-16T18:41:32.141268",
"status": "completed"
},
"tags": []
},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" Diatoms-1 | \n",
" Diatoms-2 | \n",
" Cyanobacteria | \n",
" Cryptophytes | \n",
" Prasinophytes | \n",
" Haptophytes | \n",
" Dictyochophytes | \n",
" Dinoflagellates | \n",
" Raphidophytes | \n",
" DD | \n",
" CPH | \n",
" TchlA (ug/L) | \n",
" mod_diatoms_chl | \n",
" mod_flagellates_chl | \n",
" mod_ciliates_chl | \n",
" mod_TChl | \n",
"
\n",
" \n",
" \n",
" \n",
" Diatoms-1 | \n",
" 1.000000 | \n",
" 0.129174 | \n",
" -0.044520 | \n",
" -0.104293 | \n",
" -0.155529 | \n",
" -0.089528 | \n",
" -0.038014 | \n",
" 0.068507 | \n",
" 0.186019 | \n",
" 0.986013 | \n",
" -0.143394 | \n",
" 0.799078 | \n",
" 0.329545 | \n",
" -0.107524 | \n",
" 0.086555 | \n",
" 0.240522 | \n",
"
\n",
" \n",
" Diatoms-2 | \n",
" 0.129174 | \n",
" 1.000000 | \n",
" 0.087055 | \n",
" 0.065789 | \n",
" 0.041872 | \n",
" 0.045439 | \n",
" 0.204256 | \n",
" 0.030159 | \n",
" 0.089479 | \n",
" 0.292639 | \n",
" 0.067138 | \n",
" 0.278908 | \n",
" 0.068727 | \n",
" -0.136186 | \n",
" -0.003254 | \n",
" -0.009364 | \n",
"
\n",
" \n",
" Cyanobacteria | \n",
" -0.044520 | \n",
" 0.087055 | \n",
" 1.000000 | \n",
" 0.455047 | \n",
" 0.673585 | \n",
" 0.265069 | \n",
" 0.134517 | \n",
" 0.111427 | \n",
" 0.471045 | \n",
" -0.028299 | \n",
" 0.565312 | \n",
" 0.323326 | \n",
" -0.064953 | \n",
" 0.271249 | \n",
" 0.028373 | \n",
" 0.083302 | \n",
"
\n",
" \n",
" Cryptophytes | \n",
" -0.104293 | \n",
" 0.065789 | \n",
" 0.455047 | \n",
" 1.000000 | \n",
" 0.629727 | \n",
" 0.330846 | \n",
" 0.059123 | \n",
" 0.105006 | \n",
" 0.151756 | \n",
" -0.089512 | \n",
" 0.850031 | \n",
" 0.145622 | \n",
" 0.107619 | \n",
" 0.283430 | \n",
" 0.018542 | \n",
" 0.238735 | \n",
"
\n",
" \n",
" Prasinophytes | \n",
" -0.155529 | \n",
" 0.041872 | \n",
" 0.673585 | \n",
" 0.629727 | \n",
" 1.000000 | \n",
" 0.273744 | \n",
" 0.115485 | \n",
" 0.043839 | \n",
" 0.193154 | \n",
" -0.142939 | \n",
" 0.760689 | \n",
" 0.115373 | \n",
" -0.114043 | \n",
" 0.288055 | \n",
" -0.032531 | \n",
" 0.043383 | \n",
"
\n",
" \n",
" Haptophytes | \n",
" -0.089528 | \n",
" 0.045439 | \n",
" 0.265069 | \n",
" 0.330846 | \n",
" 0.273744 | \n",
" 1.000000 | \n",
" 0.028364 | \n",
" -0.005455 | \n",
" -0.014300 | \n",
" -0.078695 | \n",
" 0.718854 | \n",
" 0.040637 | \n",
" -0.024129 | \n",
" 0.309359 | \n",
" 0.041182 | \n",
" 0.139303 | \n",
"
\n",
" \n",
" Dictyochophytes | \n",
" -0.038014 | \n",
" 0.204256 | \n",
" 0.134517 | \n",
" 0.059123 | \n",
" 0.115485 | \n",
" 0.028364 | \n",
" 1.000000 | \n",
" 0.070478 | \n",
" 0.073749 | \n",
" -0.002326 | \n",
" 0.079637 | \n",
" 0.084752 | \n",
" -0.061454 | \n",
" 0.083663 | \n",
" -0.033596 | \n",
" -0.014315 | \n",
"
\n",
" \n",
" Dinoflagellates | \n",
" 0.068507 | \n",
" 0.030159 | \n",
" 0.111427 | \n",
" 0.105006 | \n",
" 0.043839 | \n",
" -0.005455 | \n",
" 0.070478 | \n",
" 1.000000 | \n",
" 0.224567 | \n",
" 0.071130 | \n",
" 0.063264 | \n",
" 0.247006 | \n",
" 0.051962 | \n",
" 0.131246 | \n",
" 0.028659 | \n",
" 0.114278 | \n",
"
\n",
" \n",
" Raphidophytes | \n",
" 0.186019 | \n",
" 0.089479 | \n",
" 0.471045 | \n",
" 0.151756 | \n",
" 0.193154 | \n",
" -0.014300 | \n",
" 0.073749 | \n",
" 0.224567 | \n",
" 1.000000 | \n",
" 0.194417 | \n",
" 0.130332 | \n",
" 0.697246 | \n",
" 0.198755 | \n",
" -0.038571 | \n",
" 0.003086 | \n",
" 0.153761 | \n",
"
\n",
" \n",
" DD | \n",
" 0.986013 | \n",
" 0.292639 | \n",
" -0.028299 | \n",
" -0.089512 | \n",
" -0.142939 | \n",
" -0.078695 | \n",
" -0.002326 | \n",
" 0.071130 | \n",
" 0.194417 | \n",
" 1.000000 | \n",
" -0.126991 | \n",
" 0.817431 | \n",
" 0.329332 | \n",
" -0.126575 | \n",
" 0.082919 | \n",
" 0.230362 | \n",
"
\n",
" \n",
" CPH | \n",
" -0.143394 | \n",
" 0.067138 | \n",
" 0.565312 | \n",
" 0.850031 | \n",
" 0.760689 | \n",
" 0.718854 | \n",
" 0.079637 | \n",
" 0.063264 | \n",
" 0.130332 | \n",
" -0.126991 | \n",
" 1.000000 | \n",
" 0.127898 | \n",
" 0.004846 | \n",
" 0.377130 | \n",
" 0.017882 | \n",
" 0.196614 | \n",
"
\n",
" \n",
" TchlA (ug/L) | \n",
" 0.799078 | \n",
" 0.278908 | \n",
" 0.323326 | \n",
" 0.145622 | \n",
" 0.115373 | \n",
" 0.040637 | \n",
" 0.084752 | \n",
" 0.247006 | \n",
" 0.697246 | \n",
" 0.817431 | \n",
" 0.127898 | \n",
" 1.000000 | \n",
" 0.343112 | \n",
" -0.045938 | \n",
" 0.063879 | \n",
" 0.281355 | \n",
"
\n",
" \n",
" mod_diatoms_chl | \n",
" 0.329545 | \n",
" 0.068727 | \n",
" -0.064953 | \n",
" 0.107619 | \n",
" -0.114043 | \n",
" -0.024129 | \n",
" -0.061454 | \n",
" 0.051962 | \n",
" 0.198755 | \n",
" 0.329332 | \n",
" 0.004846 | \n",
" 0.343112 | \n",
" 1.000000 | \n",
" 0.188324 | \n",
" 0.462767 | \n",
" 0.842638 | \n",
"
\n",
" \n",
" mod_flagellates_chl | \n",
" -0.107524 | \n",
" -0.136186 | \n",
" 0.271249 | \n",
" 0.283430 | \n",
" 0.288055 | \n",
" 0.309359 | \n",
" 0.083663 | \n",
" 0.131246 | \n",
" -0.038571 | \n",
" -0.126575 | \n",
" 0.377130 | \n",
" -0.045938 | \n",
" 0.188324 | \n",
" 1.000000 | \n",
" 0.552138 | \n",
" 0.682743 | \n",
"
\n",
" \n",
" mod_ciliates_chl | \n",
" 0.086555 | \n",
" -0.003254 | \n",
" 0.028373 | \n",
" 0.018542 | \n",
" -0.032531 | \n",
" 0.041182 | \n",
" -0.033596 | \n",
" 0.028659 | \n",
" 0.003086 | \n",
" 0.082919 | \n",
" 0.017882 | \n",
" 0.063879 | \n",
" 0.462767 | \n",
" 0.552138 | \n",
" 1.000000 | \n",
" 0.696784 | \n",
"
\n",
" \n",
" mod_TChl | \n",
" 0.240522 | \n",
" -0.009364 | \n",
" 0.083302 | \n",
" 0.238735 | \n",
" 0.043383 | \n",
" 0.139303 | \n",
" -0.014315 | \n",
" 0.114278 | \n",
" 0.153761 | \n",
" 0.230362 | \n",
" 0.196614 | \n",
" 0.281355 | \n",
" 0.842638 | \n",
" 0.682743 | \n",
" 0.696784 | \n",
" 1.000000 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" Diatoms-1 Diatoms-2 Cyanobacteria Cryptophytes \\\n",
"Diatoms-1 1.000000 0.129174 -0.044520 -0.104293 \n",
"Diatoms-2 0.129174 1.000000 0.087055 0.065789 \n",
"Cyanobacteria -0.044520 0.087055 1.000000 0.455047 \n",
"Cryptophytes -0.104293 0.065789 0.455047 1.000000 \n",
"Prasinophytes -0.155529 0.041872 0.673585 0.629727 \n",
"Haptophytes -0.089528 0.045439 0.265069 0.330846 \n",
"Dictyochophytes -0.038014 0.204256 0.134517 0.059123 \n",
"Dinoflagellates 0.068507 0.030159 0.111427 0.105006 \n",
"Raphidophytes 0.186019 0.089479 0.471045 0.151756 \n",
"DD 0.986013 0.292639 -0.028299 -0.089512 \n",
"CPH -0.143394 0.067138 0.565312 0.850031 \n",
"TchlA (ug/L) 0.799078 0.278908 0.323326 0.145622 \n",
"mod_diatoms_chl 0.329545 0.068727 -0.064953 0.107619 \n",
"mod_flagellates_chl -0.107524 -0.136186 0.271249 0.283430 \n",
"mod_ciliates_chl 0.086555 -0.003254 0.028373 0.018542 \n",
"mod_TChl 0.240522 -0.009364 0.083302 0.238735 \n",
"\n",
" Prasinophytes Haptophytes Dictyochophytes \\\n",
"Diatoms-1 -0.155529 -0.089528 -0.038014 \n",
"Diatoms-2 0.041872 0.045439 0.204256 \n",
"Cyanobacteria 0.673585 0.265069 0.134517 \n",
"Cryptophytes 0.629727 0.330846 0.059123 \n",
"Prasinophytes 1.000000 0.273744 0.115485 \n",
"Haptophytes 0.273744 1.000000 0.028364 \n",
"Dictyochophytes 0.115485 0.028364 1.000000 \n",
"Dinoflagellates 0.043839 -0.005455 0.070478 \n",
"Raphidophytes 0.193154 -0.014300 0.073749 \n",
"DD -0.142939 -0.078695 -0.002326 \n",
"CPH 0.760689 0.718854 0.079637 \n",
"TchlA (ug/L) 0.115373 0.040637 0.084752 \n",
"mod_diatoms_chl -0.114043 -0.024129 -0.061454 \n",
"mod_flagellates_chl 0.288055 0.309359 0.083663 \n",
"mod_ciliates_chl -0.032531 0.041182 -0.033596 \n",
"mod_TChl 0.043383 0.139303 -0.014315 \n",
"\n",
" Dinoflagellates Raphidophytes DD CPH \\\n",
"Diatoms-1 0.068507 0.186019 0.986013 -0.143394 \n",
"Diatoms-2 0.030159 0.089479 0.292639 0.067138 \n",
"Cyanobacteria 0.111427 0.471045 -0.028299 0.565312 \n",
"Cryptophytes 0.105006 0.151756 -0.089512 0.850031 \n",
"Prasinophytes 0.043839 0.193154 -0.142939 0.760689 \n",
"Haptophytes -0.005455 -0.014300 -0.078695 0.718854 \n",
"Dictyochophytes 0.070478 0.073749 -0.002326 0.079637 \n",
"Dinoflagellates 1.000000 0.224567 0.071130 0.063264 \n",
"Raphidophytes 0.224567 1.000000 0.194417 0.130332 \n",
"DD 0.071130 0.194417 1.000000 -0.126991 \n",
"CPH 0.063264 0.130332 -0.126991 1.000000 \n",
"TchlA (ug/L) 0.247006 0.697246 0.817431 0.127898 \n",
"mod_diatoms_chl 0.051962 0.198755 0.329332 0.004846 \n",
"mod_flagellates_chl 0.131246 -0.038571 -0.126575 0.377130 \n",
"mod_ciliates_chl 0.028659 0.003086 0.082919 0.017882 \n",
"mod_TChl 0.114278 0.153761 0.230362 0.196614 \n",
"\n",
" TchlA (ug/L) mod_diatoms_chl mod_flagellates_chl \\\n",
"Diatoms-1 0.799078 0.329545 -0.107524 \n",
"Diatoms-2 0.278908 0.068727 -0.136186 \n",
"Cyanobacteria 0.323326 -0.064953 0.271249 \n",
"Cryptophytes 0.145622 0.107619 0.283430 \n",
"Prasinophytes 0.115373 -0.114043 0.288055 \n",
"Haptophytes 0.040637 -0.024129 0.309359 \n",
"Dictyochophytes 0.084752 -0.061454 0.083663 \n",
"Dinoflagellates 0.247006 0.051962 0.131246 \n",
"Raphidophytes 0.697246 0.198755 -0.038571 \n",
"DD 0.817431 0.329332 -0.126575 \n",
"CPH 0.127898 0.004846 0.377130 \n",
"TchlA (ug/L) 1.000000 0.343112 -0.045938 \n",
"mod_diatoms_chl 0.343112 1.000000 0.188324 \n",
"mod_flagellates_chl -0.045938 0.188324 1.000000 \n",
"mod_ciliates_chl 0.063879 0.462767 0.552138 \n",
"mod_TChl 0.281355 0.842638 0.682743 \n",
"\n",
" mod_ciliates_chl mod_TChl \n",
"Diatoms-1 0.086555 0.240522 \n",
"Diatoms-2 -0.003254 -0.009364 \n",
"Cyanobacteria 0.028373 0.083302 \n",
"Cryptophytes 0.018542 0.238735 \n",
"Prasinophytes -0.032531 0.043383 \n",
"Haptophytes 0.041182 0.139303 \n",
"Dictyochophytes -0.033596 -0.014315 \n",
"Dinoflagellates 0.028659 0.114278 \n",
"Raphidophytes 0.003086 0.153761 \n",
"DD 0.082919 0.230362 \n",
"CPH 0.017882 0.196614 \n",
"TchlA (ug/L) 0.063879 0.281355 \n",
"mod_diatoms_chl 0.462767 0.842638 \n",
"mod_flagellates_chl 0.552138 0.682743 \n",
"mod_ciliates_chl 1.000000 0.696784 \n",
"mod_TChl 0.696784 1.000000 "
]
},
"execution_count": 33,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dfVars.corr()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"##### Strongest correlations:\n",
"Model diatoms and:\n",
"- Total chla: 0.343112\n",
"- Diatoms-1: 0.329545\n",
"- Diatoms-1+Diatoms-2: 0.329332\n",
"\n",
"Model flagellates and:\n",
"- crypto+hapto+prasino: 0.377130\n",
"- haptophytes: 0.309359\n",
"- prasinophytes: 0.288055\n",
"- cryptophytes: 0.283430\n",
"- cyanobacteria: 0.271249 (but remember that cyanobacteria abundances are low)"
]
},
{
"cell_type": "markdown",
"metadata": {
"papermill": {
"duration": 0.028561,
"end_time": "2020-11-16T18:41:31.976144",
"exception": false,
"start_time": "2020-11-16T18:41:31.947583",
"status": "completed"
},
"tags": []
},
"source": [
"### Variance-Covariance Matrix"
]
},
{
"cell_type": "code",
"execution_count": 34,
"metadata": {
"papermill": {
"duration": 0.049078,
"end_time": "2020-11-16T18:41:32.054432",
"exception": false,
"start_time": "2020-11-16T18:41:32.005354",
"status": "completed"
},
"tags": []
},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" Diatoms-1 | \n",
" Diatoms-2 | \n",
" Cyanobacteria | \n",
" Cryptophytes | \n",
" Prasinophytes | \n",
" Haptophytes | \n",
" Dictyochophytes | \n",
" Dinoflagellates | \n",
" Raphidophytes | \n",
" DD | \n",
" CPH | \n",
" TchlA (ug/L) | \n",
" mod_diatoms_chl | \n",
" mod_flagellates_chl | \n",
" mod_ciliates_chl | \n",
" mod_TChl | \n",
"
\n",
" \n",
" \n",
" \n",
" Diatoms-1 | \n",
" 17.030227 | \n",
" 0.383433 | \n",
" -0.014114 | \n",
" -0.180451 | \n",
" -0.176579 | \n",
" -0.147258 | \n",
" -0.029133 | \n",
" 0.111324 | \n",
" 2.290018 | \n",
" 17.413661 | \n",
" -0.504288 | \n",
" 19.195920 | \n",
" 2.849766 | \n",
" -0.540311 | \n",
" 0.080426 | \n",
" 2.389881 | \n",
"
\n",
" \n",
" Diatoms-2 | \n",
" 0.383433 | \n",
" 0.517381 | \n",
" 0.004810 | \n",
" 0.019841 | \n",
" 0.008286 | \n",
" 0.013027 | \n",
" 0.027284 | \n",
" 0.008542 | \n",
" 0.191999 | \n",
" 0.900814 | \n",
" 0.041154 | \n",
" 1.167819 | \n",
" 0.103589 | \n",
" -0.119279 | \n",
" -0.000527 | \n",
" -0.016217 | \n",
"
\n",
" \n",
" Cyanobacteria | \n",
" -0.014114 | \n",
" 0.004810 | \n",
" 0.005901 | \n",
" 0.014656 | \n",
" 0.014236 | \n",
" 0.008116 | \n",
" 0.001919 | \n",
" 0.003371 | \n",
" 0.107947 | \n",
" -0.009303 | \n",
" 0.037008 | \n",
" 0.144586 | \n",
" -0.010456 | \n",
" 0.025373 | \n",
" 0.000491 | \n",
" 0.015408 | \n",
"
\n",
" \n",
" Cryptophytes | \n",
" -0.180451 | \n",
" 0.019841 | \n",
" 0.014656 | \n",
" 0.175789 | \n",
" 0.072638 | \n",
" 0.055288 | \n",
" 0.004603 | \n",
" 0.017336 | \n",
" 0.189807 | \n",
" -0.160610 | \n",
" 0.303715 | \n",
" 0.355411 | \n",
" 0.094552 | \n",
" 0.144700 | \n",
" 0.001750 | \n",
" 0.241003 | \n",
"
\n",
" \n",
" Prasinophytes | \n",
" -0.176579 | \n",
" 0.008286 | \n",
" 0.014236 | \n",
" 0.072638 | \n",
" 0.075690 | \n",
" 0.030017 | \n",
" 0.005900 | \n",
" 0.004749 | \n",
" 0.158524 | \n",
" -0.168293 | \n",
" 0.178345 | \n",
" 0.184770 | \n",
" -0.065746 | \n",
" 0.096499 | \n",
" -0.002015 | \n",
" 0.028737 | \n",
"
\n",
" \n",
" Haptophytes | \n",
" -0.147258 | \n",
" 0.013027 | \n",
" 0.008116 | \n",
" 0.055288 | \n",
" 0.030017 | \n",
" 0.158861 | \n",
" 0.002099 | \n",
" -0.000856 | \n",
" -0.017002 | \n",
" -0.134231 | \n",
" 0.244167 | \n",
" 0.094285 | \n",
" -0.020153 | \n",
" 0.150141 | \n",
" 0.003696 | \n",
" 0.133684 | \n",
"
\n",
" \n",
" Dictyochophytes | \n",
" -0.029133 | \n",
" 0.027284 | \n",
" 0.001919 | \n",
" 0.004603 | \n",
" 0.005900 | \n",
" 0.002099 | \n",
" 0.034487 | \n",
" 0.005154 | \n",
" 0.040856 | \n",
" -0.001849 | \n",
" 0.012603 | \n",
" 0.091620 | \n",
" -0.023915 | \n",
" 0.018919 | \n",
" -0.001405 | \n",
" -0.006401 | \n",
"
\n",
" \n",
" Dinoflagellates | \n",
" 0.111324 | \n",
" 0.008542 | \n",
" 0.003371 | \n",
" 0.017336 | \n",
" 0.004749 | \n",
" -0.000856 | \n",
" 0.005154 | \n",
" 0.155056 | \n",
" 0.263792 | \n",
" 0.119866 | \n",
" 0.021229 | \n",
" 0.566188 | \n",
" 0.042876 | \n",
" 0.062930 | \n",
" 0.002541 | \n",
" 0.108347 | \n",
"
\n",
" \n",
" Raphidophytes | \n",
" 2.290018 | \n",
" 0.191999 | \n",
" 0.107947 | \n",
" 0.189807 | \n",
" 0.158524 | \n",
" -0.017002 | \n",
" 0.040856 | \n",
" 0.263792 | \n",
" 8.899071 | \n",
" 2.482017 | \n",
" 0.331329 | \n",
" 12.107873 | \n",
" 1.242441 | \n",
" -0.140106 | \n",
" 0.002073 | \n",
" 1.104408 | \n",
"
\n",
" \n",
" DD | \n",
" 17.413661 | \n",
" 0.900814 | \n",
" -0.009303 | \n",
" -0.160610 | \n",
" -0.168293 | \n",
" -0.134231 | \n",
" -0.001849 | \n",
" 0.119866 | \n",
" 2.482017 | \n",
" 18.314475 | \n",
" -0.463135 | \n",
" 20.363739 | \n",
" 2.953355 | \n",
" -0.659590 | \n",
" 0.079900 | \n",
" 2.373664 | \n",
"
\n",
" \n",
" CPH | \n",
" -0.504288 | \n",
" 0.041154 | \n",
" 0.037008 | \n",
" 0.303715 | \n",
" 0.178345 | \n",
" 0.244167 | \n",
" 0.012603 | \n",
" 0.021229 | \n",
" 0.331329 | \n",
" -0.463135 | \n",
" 0.726227 | \n",
" 0.634466 | \n",
" 0.008653 | \n",
" 0.391340 | \n",
" 0.003431 | \n",
" 0.403424 | \n",
"
\n",
" \n",
" TchlA (ug/L) | \n",
" 19.195920 | \n",
" 1.167819 | \n",
" 0.144586 | \n",
" 0.355411 | \n",
" 0.184770 | \n",
" 0.094285 | \n",
" 0.091620 | \n",
" 0.566188 | \n",
" 12.107873 | \n",
" 20.363739 | \n",
" 0.634466 | \n",
" 33.885888 | \n",
" 4.185330 | \n",
" -0.325619 | \n",
" 0.083726 | \n",
" 3.943436 | \n",
"
\n",
" \n",
" mod_diatoms_chl | \n",
" 2.849766 | \n",
" 0.103589 | \n",
" -0.010456 | \n",
" 0.094552 | \n",
" -0.065746 | \n",
" -0.020153 | \n",
" -0.023915 | \n",
" 0.042876 | \n",
" 1.242441 | \n",
" 2.953355 | \n",
" 0.008653 | \n",
" 4.185330 | \n",
" 1.205209 | \n",
" 0.160073 | \n",
" 0.076402 | \n",
" 1.441683 | \n",
"
\n",
" \n",
" mod_flagellates_chl | \n",
" -0.540311 | \n",
" -0.119279 | \n",
" 0.025373 | \n",
" 0.144700 | \n",
" 0.096499 | \n",
" 0.150141 | \n",
" 0.018919 | \n",
" 0.062930 | \n",
" -0.140106 | \n",
" -0.659590 | \n",
" 0.391340 | \n",
" -0.325619 | \n",
" 0.160073 | \n",
" 0.599467 | \n",
" 0.064289 | \n",
" 0.823829 | \n",
"
\n",
" \n",
" mod_ciliates_chl | \n",
" 0.080426 | \n",
" -0.000527 | \n",
" 0.000491 | \n",
" 0.001750 | \n",
" -0.002015 | \n",
" 0.003696 | \n",
" -0.001405 | \n",
" 0.002541 | \n",
" 0.002073 | \n",
" 0.079900 | \n",
" 0.003431 | \n",
" 0.083726 | \n",
" 0.076402 | \n",
" 0.064289 | \n",
" 0.022616 | \n",
" 0.163307 | \n",
"
\n",
" \n",
" mod_TChl | \n",
" 2.389881 | \n",
" -0.016217 | \n",
" 0.015408 | \n",
" 0.241003 | \n",
" 0.028737 | \n",
" 0.133684 | \n",
" -0.006401 | \n",
" 0.108347 | \n",
" 1.104408 | \n",
" 2.373664 | \n",
" 0.403424 | \n",
" 3.943436 | \n",
" 1.441683 | \n",
" 0.823829 | \n",
" 0.163307 | \n",
" 2.428820 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" Diatoms-1 Diatoms-2 Cyanobacteria Cryptophytes \\\n",
"Diatoms-1 17.030227 0.383433 -0.014114 -0.180451 \n",
"Diatoms-2 0.383433 0.517381 0.004810 0.019841 \n",
"Cyanobacteria -0.014114 0.004810 0.005901 0.014656 \n",
"Cryptophytes -0.180451 0.019841 0.014656 0.175789 \n",
"Prasinophytes -0.176579 0.008286 0.014236 0.072638 \n",
"Haptophytes -0.147258 0.013027 0.008116 0.055288 \n",
"Dictyochophytes -0.029133 0.027284 0.001919 0.004603 \n",
"Dinoflagellates 0.111324 0.008542 0.003371 0.017336 \n",
"Raphidophytes 2.290018 0.191999 0.107947 0.189807 \n",
"DD 17.413661 0.900814 -0.009303 -0.160610 \n",
"CPH -0.504288 0.041154 0.037008 0.303715 \n",
"TchlA (ug/L) 19.195920 1.167819 0.144586 0.355411 \n",
"mod_diatoms_chl 2.849766 0.103589 -0.010456 0.094552 \n",
"mod_flagellates_chl -0.540311 -0.119279 0.025373 0.144700 \n",
"mod_ciliates_chl 0.080426 -0.000527 0.000491 0.001750 \n",
"mod_TChl 2.389881 -0.016217 0.015408 0.241003 \n",
"\n",
" Prasinophytes Haptophytes Dictyochophytes \\\n",
"Diatoms-1 -0.176579 -0.147258 -0.029133 \n",
"Diatoms-2 0.008286 0.013027 0.027284 \n",
"Cyanobacteria 0.014236 0.008116 0.001919 \n",
"Cryptophytes 0.072638 0.055288 0.004603 \n",
"Prasinophytes 0.075690 0.030017 0.005900 \n",
"Haptophytes 0.030017 0.158861 0.002099 \n",
"Dictyochophytes 0.005900 0.002099 0.034487 \n",
"Dinoflagellates 0.004749 -0.000856 0.005154 \n",
"Raphidophytes 0.158524 -0.017002 0.040856 \n",
"DD -0.168293 -0.134231 -0.001849 \n",
"CPH 0.178345 0.244167 0.012603 \n",
"TchlA (ug/L) 0.184770 0.094285 0.091620 \n",
"mod_diatoms_chl -0.065746 -0.020153 -0.023915 \n",
"mod_flagellates_chl 0.096499 0.150141 0.018919 \n",
"mod_ciliates_chl -0.002015 0.003696 -0.001405 \n",
"mod_TChl 0.028737 0.133684 -0.006401 \n",
"\n",
" Dinoflagellates Raphidophytes DD CPH \\\n",
"Diatoms-1 0.111324 2.290018 17.413661 -0.504288 \n",
"Diatoms-2 0.008542 0.191999 0.900814 0.041154 \n",
"Cyanobacteria 0.003371 0.107947 -0.009303 0.037008 \n",
"Cryptophytes 0.017336 0.189807 -0.160610 0.303715 \n",
"Prasinophytes 0.004749 0.158524 -0.168293 0.178345 \n",
"Haptophytes -0.000856 -0.017002 -0.134231 0.244167 \n",
"Dictyochophytes 0.005154 0.040856 -0.001849 0.012603 \n",
"Dinoflagellates 0.155056 0.263792 0.119866 0.021229 \n",
"Raphidophytes 0.263792 8.899071 2.482017 0.331329 \n",
"DD 0.119866 2.482017 18.314475 -0.463135 \n",
"CPH 0.021229 0.331329 -0.463135 0.726227 \n",
"TchlA (ug/L) 0.566188 12.107873 20.363739 0.634466 \n",
"mod_diatoms_chl 0.042876 1.242441 2.953355 0.008653 \n",
"mod_flagellates_chl 0.062930 -0.140106 -0.659590 0.391340 \n",
"mod_ciliates_chl 0.002541 0.002073 0.079900 0.003431 \n",
"mod_TChl 0.108347 1.104408 2.373664 0.403424 \n",
"\n",
" TchlA (ug/L) mod_diatoms_chl mod_flagellates_chl \\\n",
"Diatoms-1 19.195920 2.849766 -0.540311 \n",
"Diatoms-2 1.167819 0.103589 -0.119279 \n",
"Cyanobacteria 0.144586 -0.010456 0.025373 \n",
"Cryptophytes 0.355411 0.094552 0.144700 \n",
"Prasinophytes 0.184770 -0.065746 0.096499 \n",
"Haptophytes 0.094285 -0.020153 0.150141 \n",
"Dictyochophytes 0.091620 -0.023915 0.018919 \n",
"Dinoflagellates 0.566188 0.042876 0.062930 \n",
"Raphidophytes 12.107873 1.242441 -0.140106 \n",
"DD 20.363739 2.953355 -0.659590 \n",
"CPH 0.634466 0.008653 0.391340 \n",
"TchlA (ug/L) 33.885888 4.185330 -0.325619 \n",
"mod_diatoms_chl 4.185330 1.205209 0.160073 \n",
"mod_flagellates_chl -0.325619 0.160073 0.599467 \n",
"mod_ciliates_chl 0.083726 0.076402 0.064289 \n",
"mod_TChl 3.943436 1.441683 0.823829 \n",
"\n",
" mod_ciliates_chl mod_TChl \n",
"Diatoms-1 0.080426 2.389881 \n",
"Diatoms-2 -0.000527 -0.016217 \n",
"Cyanobacteria 0.000491 0.015408 \n",
"Cryptophytes 0.001750 0.241003 \n",
"Prasinophytes -0.002015 0.028737 \n",
"Haptophytes 0.003696 0.133684 \n",
"Dictyochophytes -0.001405 -0.006401 \n",
"Dinoflagellates 0.002541 0.108347 \n",
"Raphidophytes 0.002073 1.104408 \n",
"DD 0.079900 2.373664 \n",
"CPH 0.003431 0.403424 \n",
"TchlA (ug/L) 0.083726 3.943436 \n",
"mod_diatoms_chl 0.076402 1.441683 \n",
"mod_flagellates_chl 0.064289 0.823829 \n",
"mod_ciliates_chl 0.022616 0.163307 \n",
"mod_TChl 0.163307 2.428820 "
]
},
"execution_count": 34,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dfVars.cov()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"##### Largest covariances:\n",
"Model diatoms and:\n",
"- TChlA: 4.185330\n",
"- Diatoms-1+Diatoms-2 (DD): 2.953355\n",
"- Diatoms-1: 2.849766\n",
"- Raphidophytes: 1.242441\n",
"\n",
"Model flagellates and:\n",
"- crypto+hapto+prasino (CPH): 0.391340\n",
"- haptophytes: 0.150141\n",
"- cryptophytes: 0.144700"
]
},
{
"cell_type": "markdown",
"metadata": {
"papermill": {
"duration": 0.030535,
"end_time": "2020-11-16T18:41:32.395616",
"exception": false,
"start_time": "2020-11-16T18:41:32.365081",
"status": "completed"
},
"tags": []
},
"source": [
"### Correlation coefficient matrix with log-transformed values:"
]
},
{
"cell_type": "code",
"execution_count": 35,
"metadata": {
"papermill": {
"duration": 0.047132,
"end_time": "2020-11-16T18:41:32.473848",
"exception": false,
"start_time": "2020-11-16T18:41:32.426716",
"status": "completed"
},
"tags": []
},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" Diatoms-1 | \n",
" Diatoms-2 | \n",
" Cyanobacteria | \n",
" Cryptophytes | \n",
" Prasinophytes | \n",
" Haptophytes | \n",
" Dictyochophytes | \n",
" Dinoflagellates | \n",
" Raphidophytes | \n",
" CPH | \n",
" TchlA (ug/L) | \n",
" mod_diatoms_chl | \n",
" mod_flagellates_chl | \n",
" mod_ciliates_chl | \n",
" mod_TChl | \n",
"
\n",
" \n",
" \n",
" \n",
" Diatoms-1 | \n",
" 1.000000 | \n",
" 0.158963 | \n",
" -0.183906 | \n",
" -0.200691 | \n",
" -0.330748 | \n",
" -0.178564 | \n",
" -0.022753 | \n",
" 0.257098 | \n",
" -0.044532 | \n",
" -0.240631 | \n",
" 0.620741 | \n",
" 0.381332 | \n",
" -0.121685 | \n",
" 0.098088 | \n",
" 0.158253 | \n",
"
\n",
" \n",
" Diatoms-2 | \n",
" 0.158963 | \n",
" 1.000000 | \n",
" -0.070727 | \n",
" -0.017724 | \n",
" -0.081120 | \n",
" -0.206987 | \n",
" 0.260879 | \n",
" 0.110120 | \n",
" -0.069205 | \n",
" -0.095680 | \n",
" 0.117311 | \n",
" -0.054775 | \n",
" -0.295843 | \n",
" -0.045642 | \n",
" -0.179840 | \n",
"
\n",
" \n",
" Cyanobacteria | \n",
" -0.183906 | \n",
" -0.070727 | \n",
" 1.000000 | \n",
" 0.308677 | \n",
" 0.391266 | \n",
" 0.322685 | \n",
" 0.341206 | \n",
" 0.001006 | \n",
" 0.323720 | \n",
" 0.387215 | \n",
" 0.114417 | \n",
" -0.177385 | \n",
" 0.423884 | \n",
" 0.162395 | \n",
" 0.141110 | \n",
"
\n",
" \n",
" Cryptophytes | \n",
" -0.200691 | \n",
" -0.017724 | \n",
" 0.308677 | \n",
" 1.000000 | \n",
" 0.705089 | \n",
" 0.328445 | \n",
" 0.337350 | \n",
" 0.256664 | \n",
" 0.383761 | \n",
" 0.872284 | \n",
" 0.077971 | \n",
" -0.057914 | \n",
" 0.290401 | \n",
" 0.036045 | \n",
" 0.120324 | \n",
"
\n",
" \n",
" Prasinophytes | \n",
" -0.330748 | \n",
" -0.081120 | \n",
" 0.391266 | \n",
" 0.705089 | \n",
" 1.000000 | \n",
" 0.299601 | \n",
" 0.401870 | \n",
" 0.140807 | \n",
" 0.462423 | \n",
" 0.698793 | \n",
" -0.023818 | \n",
" -0.289977 | \n",
" 0.340049 | \n",
" 0.021557 | \n",
" 0.023916 | \n",
"
\n",
" \n",
" Haptophytes | \n",
" -0.178564 | \n",
" -0.206987 | \n",
" 0.322685 | \n",
" 0.328445 | \n",
" 0.299601 | \n",
" 1.000000 | \n",
" 0.204290 | \n",
" 0.047297 | \n",
" 0.189056 | \n",
" 0.576696 | \n",
" 0.063931 | \n",
" -0.102367 | \n",
" 0.250856 | \n",
" 0.062734 | \n",
" 0.100466 | \n",
"
\n",
" \n",
" Dictyochophytes | \n",
" -0.022753 | \n",
" 0.260879 | \n",
" 0.341206 | \n",
" 0.337350 | \n",
" 0.401870 | \n",
" 0.204290 | \n",
" 1.000000 | \n",
" 0.267118 | \n",
" 0.337107 | \n",
" 0.328808 | \n",
" 0.131390 | \n",
" -0.229019 | \n",
" 0.120689 | \n",
" -0.086112 | \n",
" -0.078591 | \n",
"
\n",
" \n",
" Dinoflagellates | \n",
" 0.257098 | \n",
" 0.110120 | \n",
" 0.001006 | \n",
" 0.256664 | \n",
" 0.140807 | \n",
" 0.047297 | \n",
" 0.267118 | \n",
" 1.000000 | \n",
" 0.354625 | \n",
" 0.246911 | \n",
" 0.416244 | \n",
" 0.176141 | \n",
" 0.109616 | \n",
" 0.039243 | \n",
" 0.135781 | \n",
"
\n",
" \n",
" Raphidophytes | \n",
" -0.044532 | \n",
" -0.069205 | \n",
" 0.323720 | \n",
" 0.383761 | \n",
" 0.462423 | \n",
" 0.189056 | \n",
" 0.337107 | \n",
" 0.354625 | \n",
" 1.000000 | \n",
" 0.370869 | \n",
" 0.227029 | \n",
" -0.102750 | \n",
" 0.287205 | \n",
" 0.039728 | \n",
" 0.080884 | \n",
"
\n",
" \n",
" CPH | \n",
" -0.240631 | \n",
" -0.095680 | \n",
" 0.387215 | \n",
" 0.872284 | \n",
" 0.698793 | \n",
" 0.576696 | \n",
" 0.328808 | \n",
" 0.246911 | \n",
" 0.370869 | \n",
" 1.000000 | \n",
" 0.125576 | \n",
" -0.084175 | \n",
" 0.324159 | \n",
" 0.059914 | \n",
" 0.130502 | \n",
"
\n",
" \n",
" TchlA (ug/L) | \n",
" 0.620741 | \n",
" 0.117311 | \n",
" 0.114417 | \n",
" 0.077971 | \n",
" -0.023818 | \n",
" 0.063931 | \n",
" 0.131390 | \n",
" 0.416244 | \n",
" 0.227029 | \n",
" 0.125576 | \n",
" 1.000000 | \n",
" 0.405982 | \n",
" 0.160721 | \n",
" 0.208456 | \n",
" 0.367118 | \n",
"
\n",
" \n",
" mod_diatoms_chl | \n",
" 0.381332 | \n",
" -0.054775 | \n",
" -0.177385 | \n",
" -0.057914 | \n",
" -0.289977 | \n",
" -0.102367 | \n",
" -0.229019 | \n",
" 0.176141 | \n",
" -0.102750 | \n",
" -0.084175 | \n",
" 0.405982 | \n",
" 1.000000 | \n",
" 0.674353 | \n",
" 0.749027 | \n",
" 0.831184 | \n",
"
\n",
" \n",
" mod_flagellates_chl | \n",
" -0.121685 | \n",
" -0.295843 | \n",
" 0.423884 | \n",
" 0.290401 | \n",
" 0.340049 | \n",
" 0.250856 | \n",
" 0.120689 | \n",
" 0.109616 | \n",
" 0.287205 | \n",
" 0.324159 | \n",
" 0.160721 | \n",
" 0.674353 | \n",
" 1.000000 | \n",
" 0.914387 | \n",
" 0.947829 | \n",
"
\n",
" \n",
" mod_ciliates_chl | \n",
" 0.098088 | \n",
" -0.045642 | \n",
" 0.162395 | \n",
" 0.036045 | \n",
" 0.021557 | \n",
" 0.062734 | \n",
" -0.086112 | \n",
" 0.039243 | \n",
" 0.039728 | \n",
" 0.059914 | \n",
" 0.208456 | \n",
" 0.749027 | \n",
" 0.914387 | \n",
" 1.000000 | \n",
" 0.959662 | \n",
"
\n",
" \n",
" mod_TChl | \n",
" 0.158253 | \n",
" -0.179840 | \n",
" 0.141110 | \n",
" 0.120324 | \n",
" 0.023916 | \n",
" 0.100466 | \n",
" -0.078591 | \n",
" 0.135781 | \n",
" 0.080884 | \n",
" 0.130502 | \n",
" 0.367118 | \n",
" 0.831184 | \n",
" 0.947829 | \n",
" 0.959662 | \n",
" 1.000000 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" Diatoms-1 Diatoms-2 Cyanobacteria Cryptophytes \\\n",
"Diatoms-1 1.000000 0.158963 -0.183906 -0.200691 \n",
"Diatoms-2 0.158963 1.000000 -0.070727 -0.017724 \n",
"Cyanobacteria -0.183906 -0.070727 1.000000 0.308677 \n",
"Cryptophytes -0.200691 -0.017724 0.308677 1.000000 \n",
"Prasinophytes -0.330748 -0.081120 0.391266 0.705089 \n",
"Haptophytes -0.178564 -0.206987 0.322685 0.328445 \n",
"Dictyochophytes -0.022753 0.260879 0.341206 0.337350 \n",
"Dinoflagellates 0.257098 0.110120 0.001006 0.256664 \n",
"Raphidophytes -0.044532 -0.069205 0.323720 0.383761 \n",
"CPH -0.240631 -0.095680 0.387215 0.872284 \n",
"TchlA (ug/L) 0.620741 0.117311 0.114417 0.077971 \n",
"mod_diatoms_chl 0.381332 -0.054775 -0.177385 -0.057914 \n",
"mod_flagellates_chl -0.121685 -0.295843 0.423884 0.290401 \n",
"mod_ciliates_chl 0.098088 -0.045642 0.162395 0.036045 \n",
"mod_TChl 0.158253 -0.179840 0.141110 0.120324 \n",
"\n",
" Prasinophytes Haptophytes Dictyochophytes \\\n",
"Diatoms-1 -0.330748 -0.178564 -0.022753 \n",
"Diatoms-2 -0.081120 -0.206987 0.260879 \n",
"Cyanobacteria 0.391266 0.322685 0.341206 \n",
"Cryptophytes 0.705089 0.328445 0.337350 \n",
"Prasinophytes 1.000000 0.299601 0.401870 \n",
"Haptophytes 0.299601 1.000000 0.204290 \n",
"Dictyochophytes 0.401870 0.204290 1.000000 \n",
"Dinoflagellates 0.140807 0.047297 0.267118 \n",
"Raphidophytes 0.462423 0.189056 0.337107 \n",
"CPH 0.698793 0.576696 0.328808 \n",
"TchlA (ug/L) -0.023818 0.063931 0.131390 \n",
"mod_diatoms_chl -0.289977 -0.102367 -0.229019 \n",
"mod_flagellates_chl 0.340049 0.250856 0.120689 \n",
"mod_ciliates_chl 0.021557 0.062734 -0.086112 \n",
"mod_TChl 0.023916 0.100466 -0.078591 \n",
"\n",
" Dinoflagellates Raphidophytes CPH TchlA (ug/L) \\\n",
"Diatoms-1 0.257098 -0.044532 -0.240631 0.620741 \n",
"Diatoms-2 0.110120 -0.069205 -0.095680 0.117311 \n",
"Cyanobacteria 0.001006 0.323720 0.387215 0.114417 \n",
"Cryptophytes 0.256664 0.383761 0.872284 0.077971 \n",
"Prasinophytes 0.140807 0.462423 0.698793 -0.023818 \n",
"Haptophytes 0.047297 0.189056 0.576696 0.063931 \n",
"Dictyochophytes 0.267118 0.337107 0.328808 0.131390 \n",
"Dinoflagellates 1.000000 0.354625 0.246911 0.416244 \n",
"Raphidophytes 0.354625 1.000000 0.370869 0.227029 \n",
"CPH 0.246911 0.370869 1.000000 0.125576 \n",
"TchlA (ug/L) 0.416244 0.227029 0.125576 1.000000 \n",
"mod_diatoms_chl 0.176141 -0.102750 -0.084175 0.405982 \n",
"mod_flagellates_chl 0.109616 0.287205 0.324159 0.160721 \n",
"mod_ciliates_chl 0.039243 0.039728 0.059914 0.208456 \n",
"mod_TChl 0.135781 0.080884 0.130502 0.367118 \n",
"\n",
" mod_diatoms_chl mod_flagellates_chl mod_ciliates_chl \\\n",
"Diatoms-1 0.381332 -0.121685 0.098088 \n",
"Diatoms-2 -0.054775 -0.295843 -0.045642 \n",
"Cyanobacteria -0.177385 0.423884 0.162395 \n",
"Cryptophytes -0.057914 0.290401 0.036045 \n",
"Prasinophytes -0.289977 0.340049 0.021557 \n",
"Haptophytes -0.102367 0.250856 0.062734 \n",
"Dictyochophytes -0.229019 0.120689 -0.086112 \n",
"Dinoflagellates 0.176141 0.109616 0.039243 \n",
"Raphidophytes -0.102750 0.287205 0.039728 \n",
"CPH -0.084175 0.324159 0.059914 \n",
"TchlA (ug/L) 0.405982 0.160721 0.208456 \n",
"mod_diatoms_chl 1.000000 0.674353 0.749027 \n",
"mod_flagellates_chl 0.674353 1.000000 0.914387 \n",
"mod_ciliates_chl 0.749027 0.914387 1.000000 \n",
"mod_TChl 0.831184 0.947829 0.959662 \n",
"\n",
" mod_TChl \n",
"Diatoms-1 0.158253 \n",
"Diatoms-2 -0.179840 \n",
"Cyanobacteria 0.141110 \n",
"Cryptophytes 0.120324 \n",
"Prasinophytes 0.023916 \n",
"Haptophytes 0.100466 \n",
"Dictyochophytes -0.078591 \n",
"Dinoflagellates 0.135781 \n",
"Raphidophytes 0.080884 \n",
"CPH 0.130502 \n",
"TchlA (ug/L) 0.367118 \n",
"mod_diatoms_chl 0.831184 \n",
"mod_flagellates_chl 0.947829 \n",
"mod_ciliates_chl 0.959662 \n",
"mod_TChl 1.000000 "
]
},
"execution_count": 35,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dflog=pd.DataFrame()\n",
"for el in ['Diatoms-1', 'Diatoms-2','Cyanobacteria','Cryptophytes', 'Prasinophytes', \n",
" 'Haptophytes', 'Dictyochophytes','Dinoflagellates','Raphidophytes','CPH','TchlA (ug/L)',\n",
" 'mod_diatoms_chl','mod_flagellates_chl','mod_ciliates_chl','mod_TChl']:\n",
" dflog[el]=logt(data[el])\n",
"dflog.corr()"
]
},
{
"cell_type": "markdown",
"metadata": {
"papermill": {
"duration": 0.030079,
"end_time": "2020-11-16T18:41:32.247688",
"exception": false,
"start_time": "2020-11-16T18:41:32.217609",
"status": "completed"
},
"tags": []
},
"source": [
"### Covariance matrix with log-transformed values:"
]
},
{
"cell_type": "code",
"execution_count": 36,
"metadata": {
"papermill": {
"duration": 0.056303,
"end_time": "2020-11-16T18:41:32.334217",
"exception": false,
"start_time": "2020-11-16T18:41:32.277914",
"status": "completed"
},
"tags": []
},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" Diatoms-1 | \n",
" Diatoms-2 | \n",
" Cyanobacteria | \n",
" Cryptophytes | \n",
" Prasinophytes | \n",
" Haptophytes | \n",
" Dictyochophytes | \n",
" Dinoflagellates | \n",
" Raphidophytes | \n",
" CPH | \n",
" TchlA (ug/L) | \n",
" mod_diatoms_chl | \n",
" mod_flagellates_chl | \n",
" mod_ciliates_chl | \n",
" mod_TChl | \n",
"
\n",
" \n",
" \n",
" \n",
" Diatoms-1 | \n",
" 1.707049 | \n",
" 0.223426 | \n",
" -0.191222 | \n",
" -0.156507 | \n",
" -0.337293 | \n",
" -0.224417 | \n",
" -0.022976 | \n",
" 0.263191 | \n",
" -0.054699 | \n",
" -0.169667 | \n",
" 0.364806 | \n",
" 0.476603 | \n",
" -0.084867 | \n",
" 0.038920 | \n",
" 0.104432 | \n",
"
\n",
" \n",
" Diatoms-2 | \n",
" 0.223426 | \n",
" 1.157251 | \n",
" -0.060550 | \n",
" -0.011380 | \n",
" -0.068113 | \n",
" -0.214188 | \n",
" 0.216906 | \n",
" 0.092818 | \n",
" -0.069990 | \n",
" -0.055547 | \n",
" 0.056765 | \n",
" -0.056367 | \n",
" -0.169885 | \n",
" -0.014911 | \n",
" -0.097714 | \n",
"
\n",
" \n",
" Cyanobacteria | \n",
" -0.191222 | \n",
" -0.060550 | \n",
" 0.633347 | \n",
" 0.146625 | \n",
" 0.243042 | \n",
" 0.247024 | \n",
" 0.209872 | \n",
" 0.000628 | \n",
" 0.242199 | \n",
" 0.166302 | \n",
" 0.040958 | \n",
" -0.135042 | \n",
" 0.180073 | \n",
" 0.039249 | \n",
" 0.056720 | \n",
"
\n",
" \n",
" Cryptophytes | \n",
" -0.156507 | \n",
" -0.011380 | \n",
" 0.146625 | \n",
" 0.356259 | \n",
" 0.328485 | \n",
" 0.188575 | \n",
" 0.155626 | \n",
" 0.120032 | \n",
" 0.215341 | \n",
" 0.280974 | \n",
" 0.020934 | \n",
" -0.033067 | \n",
" 0.092525 | \n",
" 0.006534 | \n",
" 0.036274 | \n",
"
\n",
" \n",
" Prasinophytes | \n",
" -0.337293 | \n",
" -0.068113 | \n",
" 0.243042 | \n",
" 0.328485 | \n",
" 0.609223 | \n",
" 0.224942 | \n",
" 0.242433 | \n",
" 0.086112 | \n",
" 0.339321 | \n",
" 0.294348 | \n",
" -0.008362 | \n",
" -0.216512 | \n",
" 0.141680 | \n",
" 0.005110 | \n",
" 0.009428 | \n",
"
\n",
" \n",
" Haptophytes | \n",
" -0.224417 | \n",
" -0.214188 | \n",
" 0.247024 | \n",
" 0.188575 | \n",
" 0.224942 | \n",
" 0.925289 | \n",
" 0.151881 | \n",
" 0.035647 | \n",
" 0.170967 | \n",
" 0.299372 | \n",
" 0.027662 | \n",
" -0.094195 | \n",
" 0.128808 | \n",
" 0.018326 | \n",
" 0.048811 | \n",
"
\n",
" \n",
" Dictyochophytes | \n",
" -0.022976 | \n",
" 0.216906 | \n",
" 0.209872 | \n",
" 0.155626 | \n",
" 0.242433 | \n",
" 0.151881 | \n",
" 0.597360 | \n",
" 0.161760 | \n",
" 0.244945 | \n",
" 0.137147 | \n",
" 0.045678 | \n",
" -0.169324 | \n",
" 0.049793 | \n",
" -0.020213 | \n",
" -0.030679 | \n",
"
\n",
" \n",
" Dinoflagellates | \n",
" 0.263191 | \n",
" 0.092818 | \n",
" 0.000628 | \n",
" 0.120032 | \n",
" 0.086112 | \n",
" 0.035647 | \n",
" 0.161760 | \n",
" 0.613904 | \n",
" 0.261217 | \n",
" 0.104403 | \n",
" 0.146699 | \n",
" 0.132020 | \n",
" 0.045846 | \n",
" 0.009338 | \n",
" 0.053734 | \n",
"
\n",
" \n",
" Raphidophytes | \n",
" -0.054699 | \n",
" -0.069990 | \n",
" 0.242199 | \n",
" 0.215341 | \n",
" 0.339321 | \n",
" 0.170967 | \n",
" 0.244945 | \n",
" 0.261217 | \n",
" 0.883823 | \n",
" 0.188160 | \n",
" 0.096005 | \n",
" -0.092404 | \n",
" 0.144130 | \n",
" 0.011343 | \n",
" 0.038407 | \n",
"
\n",
" \n",
" CPH | \n",
" -0.169667 | \n",
" -0.055547 | \n",
" 0.166302 | \n",
" 0.280974 | \n",
" 0.294348 | \n",
" 0.299372 | \n",
" 0.137147 | \n",
" 0.104403 | \n",
" 0.188160 | \n",
" 0.291239 | \n",
" 0.030483 | \n",
" -0.043455 | \n",
" 0.093382 | \n",
" 0.009820 | \n",
" 0.035571 | \n",
"
\n",
" \n",
" TchlA (ug/L) | \n",
" 0.364806 | \n",
" 0.056765 | \n",
" 0.040958 | \n",
" 0.020934 | \n",
" -0.008362 | \n",
" 0.027662 | \n",
" 0.045678 | \n",
" 0.146699 | \n",
" 0.096005 | \n",
" 0.030483 | \n",
" 0.202329 | \n",
" 0.174689 | \n",
" 0.038590 | \n",
" 0.028476 | \n",
" 0.083405 | \n",
"
\n",
" \n",
" mod_diatoms_chl | \n",
" 0.476603 | \n",
" -0.056367 | \n",
" -0.135042 | \n",
" -0.033067 | \n",
" -0.216512 | \n",
" -0.094195 | \n",
" -0.169324 | \n",
" 0.132020 | \n",
" -0.092404 | \n",
" -0.043455 | \n",
" 0.174689 | \n",
" 0.996790 | \n",
" 0.547935 | \n",
" 0.528631 | \n",
" 0.718548 | \n",
"
\n",
" \n",
" mod_flagellates_chl | \n",
" -0.084867 | \n",
" -0.169885 | \n",
" 0.180073 | \n",
" 0.092525 | \n",
" 0.141680 | \n",
" 0.128808 | \n",
" 0.049793 | \n",
" 0.045846 | \n",
" 0.144130 | \n",
" 0.093382 | \n",
" 0.038590 | \n",
" 0.547935 | \n",
" 0.662337 | \n",
" 0.526045 | \n",
" 0.667923 | \n",
"
\n",
" \n",
" mod_ciliates_chl | \n",
" 0.038920 | \n",
" -0.014911 | \n",
" 0.039249 | \n",
" 0.006534 | \n",
" 0.005110 | \n",
" 0.018326 | \n",
" -0.020213 | \n",
" 0.009338 | \n",
" 0.011343 | \n",
" 0.009820 | \n",
" 0.028476 | \n",
" 0.528631 | \n",
" 0.526045 | \n",
" 0.499697 | \n",
" 0.587392 | \n",
"
\n",
" \n",
" mod_TChl | \n",
" 0.104432 | \n",
" -0.097714 | \n",
" 0.056720 | \n",
" 0.036274 | \n",
" 0.009428 | \n",
" 0.048811 | \n",
" -0.030679 | \n",
" 0.053734 | \n",
" 0.038407 | \n",
" 0.035571 | \n",
" 0.083405 | \n",
" 0.718548 | \n",
" 0.667923 | \n",
" 0.587392 | \n",
" 0.749744 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" Diatoms-1 Diatoms-2 Cyanobacteria Cryptophytes \\\n",
"Diatoms-1 1.707049 0.223426 -0.191222 -0.156507 \n",
"Diatoms-2 0.223426 1.157251 -0.060550 -0.011380 \n",
"Cyanobacteria -0.191222 -0.060550 0.633347 0.146625 \n",
"Cryptophytes -0.156507 -0.011380 0.146625 0.356259 \n",
"Prasinophytes -0.337293 -0.068113 0.243042 0.328485 \n",
"Haptophytes -0.224417 -0.214188 0.247024 0.188575 \n",
"Dictyochophytes -0.022976 0.216906 0.209872 0.155626 \n",
"Dinoflagellates 0.263191 0.092818 0.000628 0.120032 \n",
"Raphidophytes -0.054699 -0.069990 0.242199 0.215341 \n",
"CPH -0.169667 -0.055547 0.166302 0.280974 \n",
"TchlA (ug/L) 0.364806 0.056765 0.040958 0.020934 \n",
"mod_diatoms_chl 0.476603 -0.056367 -0.135042 -0.033067 \n",
"mod_flagellates_chl -0.084867 -0.169885 0.180073 0.092525 \n",
"mod_ciliates_chl 0.038920 -0.014911 0.039249 0.006534 \n",
"mod_TChl 0.104432 -0.097714 0.056720 0.036274 \n",
"\n",
" Prasinophytes Haptophytes Dictyochophytes \\\n",
"Diatoms-1 -0.337293 -0.224417 -0.022976 \n",
"Diatoms-2 -0.068113 -0.214188 0.216906 \n",
"Cyanobacteria 0.243042 0.247024 0.209872 \n",
"Cryptophytes 0.328485 0.188575 0.155626 \n",
"Prasinophytes 0.609223 0.224942 0.242433 \n",
"Haptophytes 0.224942 0.925289 0.151881 \n",
"Dictyochophytes 0.242433 0.151881 0.597360 \n",
"Dinoflagellates 0.086112 0.035647 0.161760 \n",
"Raphidophytes 0.339321 0.170967 0.244945 \n",
"CPH 0.294348 0.299372 0.137147 \n",
"TchlA (ug/L) -0.008362 0.027662 0.045678 \n",
"mod_diatoms_chl -0.216512 -0.094195 -0.169324 \n",
"mod_flagellates_chl 0.141680 0.128808 0.049793 \n",
"mod_ciliates_chl 0.005110 0.018326 -0.020213 \n",
"mod_TChl 0.009428 0.048811 -0.030679 \n",
"\n",
" Dinoflagellates Raphidophytes CPH TchlA (ug/L) \\\n",
"Diatoms-1 0.263191 -0.054699 -0.169667 0.364806 \n",
"Diatoms-2 0.092818 -0.069990 -0.055547 0.056765 \n",
"Cyanobacteria 0.000628 0.242199 0.166302 0.040958 \n",
"Cryptophytes 0.120032 0.215341 0.280974 0.020934 \n",
"Prasinophytes 0.086112 0.339321 0.294348 -0.008362 \n",
"Haptophytes 0.035647 0.170967 0.299372 0.027662 \n",
"Dictyochophytes 0.161760 0.244945 0.137147 0.045678 \n",
"Dinoflagellates 0.613904 0.261217 0.104403 0.146699 \n",
"Raphidophytes 0.261217 0.883823 0.188160 0.096005 \n",
"CPH 0.104403 0.188160 0.291239 0.030483 \n",
"TchlA (ug/L) 0.146699 0.096005 0.030483 0.202329 \n",
"mod_diatoms_chl 0.132020 -0.092404 -0.043455 0.174689 \n",
"mod_flagellates_chl 0.045846 0.144130 0.093382 0.038590 \n",
"mod_ciliates_chl 0.009338 0.011343 0.009820 0.028476 \n",
"mod_TChl 0.053734 0.038407 0.035571 0.083405 \n",
"\n",
" mod_diatoms_chl mod_flagellates_chl mod_ciliates_chl \\\n",
"Diatoms-1 0.476603 -0.084867 0.038920 \n",
"Diatoms-2 -0.056367 -0.169885 -0.014911 \n",
"Cyanobacteria -0.135042 0.180073 0.039249 \n",
"Cryptophytes -0.033067 0.092525 0.006534 \n",
"Prasinophytes -0.216512 0.141680 0.005110 \n",
"Haptophytes -0.094195 0.128808 0.018326 \n",
"Dictyochophytes -0.169324 0.049793 -0.020213 \n",
"Dinoflagellates 0.132020 0.045846 0.009338 \n",
"Raphidophytes -0.092404 0.144130 0.011343 \n",
"CPH -0.043455 0.093382 0.009820 \n",
"TchlA (ug/L) 0.174689 0.038590 0.028476 \n",
"mod_diatoms_chl 0.996790 0.547935 0.528631 \n",
"mod_flagellates_chl 0.547935 0.662337 0.526045 \n",
"mod_ciliates_chl 0.528631 0.526045 0.499697 \n",
"mod_TChl 0.718548 0.667923 0.587392 \n",
"\n",
" mod_TChl \n",
"Diatoms-1 0.104432 \n",
"Diatoms-2 -0.097714 \n",
"Cyanobacteria 0.056720 \n",
"Cryptophytes 0.036274 \n",
"Prasinophytes 0.009428 \n",
"Haptophytes 0.048811 \n",
"Dictyochophytes -0.030679 \n",
"Dinoflagellates 0.053734 \n",
"Raphidophytes 0.038407 \n",
"CPH 0.035571 \n",
"TchlA (ug/L) 0.083405 \n",
"mod_diatoms_chl 0.718548 \n",
"mod_flagellates_chl 0.667923 \n",
"mod_ciliates_chl 0.587392 \n",
"mod_TChl 0.749744 "
]
},
"execution_count": 36,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"\n",
"dflog.cov()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Individual phytoplankton groups compared to model groups (1:1 correspondence not expected)"
]
},
{
"cell_type": "code",
"execution_count": 37,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Text(0.001584893192461114, 10, 'r = 0.33')"
]
},
"execution_count": 37,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"