Comparison of plot characteristics and digitized deadwood

Author

Janne Mäyrä

Published

December 22, 2022

Code

from drone_detector.utils import * 
from drone_detector.imports import *
import rasterio.mask as rio_mask
import seaborn as sns
sns.set_style('whitegrid')
import warnings
warnings.filterwarnings("ignore")
sys.path.append('..')
from src.tree_functions import *

The following shows how we compared the field-measured data from both study sites and annotations that are located within these plots.

1 Hiidenportti

Read data and do some wrangling.

Code

# Hiidenportti inputs: annotated deadwood polygons, circular field plots,
# plot-level field data, the virtual plot grid and conservation areas.
field_data_path = Path('../data/hiidenportti')
anns = gpd.read_file('../../data/raw/hiidenportti/virtual_plots/all_deadwood_hiidenportti.geojson')
plot_circles = gpd.read_file(field_data_path / 'plot_circles.geojson')
field_data = pd.read_csv(field_data_path / 'all_plot_data.csv')
virtual_plot_grid = gpd.read_file(field_data_path / 'envelopes_with_trees.geojson')
conservation_areas = gpd.read_file('../data/common/LsAlueValtio.shp')

# Keep the conservation areas that intersect the bounding box of the
# annotations and clip them to the virtual plot grid.
cons_hp = gpd.clip(
    conservation_areas.loc[conservation_areas.geometry.intersects(box(*anns.total_bounds))],
    virtual_plot_grid,
)

Filter plot circles so that only those present in scenes remain.

Code

# Flag (1/0) the plot circles that are contained in at least one virtual plot.
plot_circles['in_vplot'] = plot_circles.apply(
    lambda circle: int(any(virtual_plot_grid.geometry.contains(circle.geometry))), axis=1)
plot_circles['id'] = plot_circles['id'].astype(int)

# Keep only the flagged circles and the field data rows that belong to them.
plot_circles = plot_circles[plot_circles.in_vplot == 1]
field_data = field_data[field_data.id.isin(plot_circles.id.unique())]

# Replace dots in the column names with underscores.
field_data = field_data.rename(columns=lambda name: name.replace('.', '_'))

# Plot id plus every column whose name mentions 'dw'.
dw_cols = ['id', *(name for name in field_data.columns if 'dw' in name)]
plot_dw_data = field_data.loc[:, dw_cols].copy()

Read individual tree measurements.

Code

# Load the individual tree measurements and keep only the trees whose plot
# is present in plot_dw_data.
tree_data = (
    pd.read_csv(field_data_path / 'hp_tree_data_fixed_1512.csv')
    .loc[lambda trees: trees.plot_id.isin(plot_dw_data.id.unique())]
)

Count the number of deadwood (n_dw), fallen deadwood (n_ddw) and standing deadwood (n_udw) from the individual field data measurements.

Code

# Per-plot counts from the individual tree measurements:
# all trees, tree_class 4 (n_ddw, fallen) and tree_class 3 (n_udw, standing).
plot_dw_data['n_dw_plot'] = plot_dw_data.id.apply(
    lambda plot_id: (tree_data.plot_id == plot_id).sum())
plot_dw_data['n_ddw_plot'] = plot_dw_data.id.apply(
    lambda plot_id: ((tree_data.plot_id == plot_id) & (tree_data.tree_class == 4)).sum())
plot_dw_data['n_udw_plot'] = plot_dw_data.id.apply(
    lambda plot_id: ((tree_data.plot_id == plot_id) & (tree_data.tree_class == 3)).sum())

Code

def match_circular_plot(row, plots):
    """Return the id of the first plot whose geometry intersects ``row.geometry``.

    ``plots`` is walked with ``itertuples()``; every record must expose ``id``
    and ``geometry``. The matching id is cast to ``int``. ``None`` is returned
    when no plot intersects the row.
    """
    matching_ids = (
        int(plot.id)
        for plot in plots.itertuples()
        if row.geometry.intersects(plot.geometry)
    )
    return next(matching_ids, None)

Code

# Tag every annotation with the id of the first plot circle it intersects.
anns['plot_id'] = anns.apply(match_circular_plot, axis=1, args=(plot_circles,))

# Overlay the annotations with the plot circles and store plot_id as int.
anns_in_plots = anns.overlay(plot_circles[['geometry']]).assign(
    plot_id=lambda clipped: clipped.plot_id.astype(int))

Count the number of annotated deadwood instances in each circular field plot, as well as note which of the circular plots are located in the conserved areas.

Code

# Annotation counts per plot id, computed once up front instead of being
# recomputed for every row: all annotations, groundwood == 2 (n_ddw) and
# groundwood == 1 (n_udw).
_ann_counts = anns_in_plots.plot_id.value_counts()
_ddw_ann_counts = anns_in_plots[anns_in_plots.groundwood == 2].plot_id.value_counts()
_udw_ann_counts = anns_in_plots[anns_in_plots.groundwood == 1].plot_id.value_counts()

# Plots without any matching annotation are missing from the counts and get 0.
plot_dw_data['n_dw_ann'] = plot_dw_data.apply(lambda row: _ann_counts.get(row.id, 0), axis=1)
plot_dw_data['n_ddw_ann'] = plot_dw_data.apply(lambda row: _ddw_ann_counts.get(row.id, 0), axis=1)
plot_dw_data['n_udw_ann'] = plot_dw_data.apply(lambda row: _udw_ann_counts.get(row.id, 0), axis=1)

# Attach the circle geometry of each plot and promote the table to a
# GeoDataFrame in the CRS of the plot circles.
plot_dw_data['geometry'] = plot_dw_data.apply(
    lambda row: plot_circles[plot_circles.id == row.id].geometry.iloc[0], axis=1)
plot_dw_data = gpd.GeoDataFrame(plot_dw_data, crs=plot_circles.crs)

# conservation = 1 when some conservation area polygon contains the whole plot.
plot_dw_data['conservation'] = plot_dw_data.apply(
    lambda row: 1 if any(cons_hp.geometry.contains(row.geometry)) else 0, axis=1)

Add information about conservation area to tree data.

Code

# Each tree takes the conservation flag of the plot it was measured on.
tree_data['conservation'] = tree_data.plot_id.apply(
    lambda plot_id: plot_dw_data.loc[plot_dw_data.id == plot_id, 'conservation'].unique()[0])

Plot the numbers. These show that we were able to annotate slightly less deadwood than what was measured in the field. On the other hand, especially in managed forests, there were also several cases with more fallen deadwood annotations than field-measured fallen deadwood. As the resolution of our data makes it impossible to accurately tell whether a fallen trunk had a DBH of less than 100 mm, some of the annotations may be of trunks that were deemed too thin to be measured in the field. Another likely reason for the differences is that the canopy obscured the deadwood instances, as the average canopy cover percentage was around 61 % for the field plots.

Code

# Sum field-measured (*_plot) and annotated (*_ann) counts per conservation class.
pd.pivot_table(
    plot_dw_data,
    index='conservation',
    values=['n_ddw_plot', 'n_udw_plot', 'n_ddw_ann', 'n_udw_ann'],
    aggfunc='sum',
    margins=True,
)

	n_ddw_ann	n_ddw_plot	n_udw_ann	n_udw_plot
conservation
0	248	217	49	75
1	48	96	10	24
All	296	313	59	99

Get plot-wise canopy cover percentage based on LiDAR derived canopy height model as the percentage of plot area with height more than 2 meters.

Code

# Canopy cover per plot: share of CHM pixels above 2 among pixels that are >= 0.
# NOTE(review): this assumes pixels masked out by rio_mask.mask carry a
# negative nodata value, so that `>= 0` excludes them — confirm for this raster.
with rio.open('../../data/raw/hiidenportti/full_mosaics/CHM_Hiidenportti_epsg.tif') as src:
    crs = src.crs
    pcts = []
    for plot in plot_dw_data.itertuples():
        chm, _ = rio_mask.mask(src, [plot.geometry], crop=True)
        pcts.append(np.count_nonzero(chm > 2) / np.count_nonzero(chm >= 0))

plot_dw_data['canopy_cover_pct'] = pcts

plot_dw_data.pivot_table(
    index=['conservation'],
    values=['canopy_cover_pct'],
    aggfunc=['min', 'max', 'mean', 'std', 'count'],
    margins=True,
)

	min	max	mean	std	count
	canopy_cover_pct	canopy_cover_pct	canopy_cover_pct	canopy_cover_pct	canopy_cover_pct
conservation
0	0.142006	0.947162	0.593817	0.187985	51
1	0.083333	0.855172	0.641549	0.176416	20
All	0.083333	0.947162	0.607263	0.184815	71

Overall the conserved forests are a bit more dense, but not that much.

Plot the relationship between annotated deadwood and field-measured deadwood. Each dot is a single field plot.

For annotated groundwood, as the annotations can be twisted due to e.g. orthorectification errors, we use the longest side of the smallest rotated rectangle that can be fit around the polygon as a proxy for the trunk length.

Diameter can be approximated with the following approach. For each polygon,

Get minimum rotated rectangle
Draw three lines that are perpendicular to the longer side of the minimum rotated rectangle, starting from the points of 10%, 50% and 90% of the length of the minimum rotated rectangle
Intersect these lines with the polygon. The diameter is the mean length of these intersecting lines.

This is not the same as DBH, but close enough.

Code

# Trunk length of every annotation, computed with get_len from its geometry.
anns_in_plots['tree_length'] = anns_in_plots.geometry.apply(get_len)

Compare the distributions of the downed trunk lengths. Both graphs only take the parts within the plots into account. Lengths are binned into 1m bins.

As expected, the annotated fallen deadwood were clearly shorter than the field-measured fallen deadwood. Most of the annotated fallen deadwood were shorter than 2 meters, while field-measured trees were typically longer than 5 meters. This is most likely due to the canopy obscuring parts of the fallen deadwood, so that some of the longer trees are annotated as multiple shorter ones. When comparing the difference in total lengths of field-measured trees and annotated trees, denser canopy cover typically also meant a larger difference.

As expected, annotated trunks are clearly on average shorter than field measured.

Compare the measured DBH for downed trees and estimated diameter of annotated downed deadwood. For annotated deadwood, the diameter is estimated for the whole tree, not only for the part within the field plot. DBHs are binned into 50mm bins.

When comparing the DBH distributions for fallen deadwood, the diameter classes 125-150mm, 150-175mm and 175-200mm were clearly overrepresented in the annotated data. As these DBH classes were also the most common among the field data, the reason for this could be the same as with the length differences: the visible trees are partially obscured by the canopy.

Aggregate the above, first field data.

Code

# Length and DBH statistics for tree_class 4 trees with a positive DBH.
tree_data.loc[(tree_data.tree_class == 4) & (tree_data.DBH > 0)].pivot_table(
    index=['conservation'],
    values=['l', 'DBH'],
    aggfunc=['mean', 'min', 'max', 'count'],
    margins=True,
)

	mean		min		max		count
	DBH	l	DBH	l	DBH	l	DBH	l
conservation
0	133.786875	6.768601	15.558197	0.518478	450.000000	16.700000	217	217
1	185.538932	7.588368	39.167120	0.214113	580.560964	18.000666	96	96
All	149.659711	7.020031	15.558197	0.214113	580.560964	18.000666	313	313

Then annotations.

Code

# Length and diameter statistics for annotations with groundwood == 2.
anns_in_plots[anns_in_plots.groundwood == 2].pivot_table(
    index=['conservation'],
    values=['tree_length', 'diam'],
    aggfunc=['mean', 'min', 'max', 'count'],
    margins=True,
)

	mean		min		max		count
	diam	tree_length	diam	tree_length	diam	tree_length	diam	tree_length
conservation
0	175.046987	1.818960	16.64560	0.095362	381.292305	6.485503	236	236
1	208.354703	2.083887	27.32243	0.149797	625.927586	5.907329	60	60
All	181.798551	1.872662	16.64560	0.095362	625.927586	6.485503	296	296

Check the relationship between canopy cover and deadwood types. First standing deadwood.

Code

# Canopy cover against the number of field-measured standing deadwood,
# one panel per conservation class.
g = sns.lmplot(data=plot_dw_data, x='n_udw_plot', y='canopy_cover_pct',
               col='conservation', hue='conservation', ci=1, legend=False)
# Assumes the panels are ordered conservation 0, then 1 — confirm.
for ax, title in zip(g.axes[0], ('Managed forests', 'Protected forests')):
    ax.set_title(title)
    ax.set_xticks(range(0, 10, 2))
# Label typo fixed ('ffor' -> 'for') so it matches the other figures.
g.set_ylabels('Canopy cover percentage for field plots')
g.set_xlabels('Number of field-measured standing deadwood within plots')
plt.show()

Code

# Same summary of groundwood == 2 annotations as shown earlier in this section.
anns_in_plots[anns_in_plots.groundwood == 2].pivot_table(
    index=['conservation'],
    values=['tree_length', 'diam'],
    aggfunc=['mean', 'min', 'max', 'count'],
    margins=True,
)

	mean		min		max		count
	diam	tree_length	diam	tree_length	diam	tree_length	diam	tree_length
conservation
0	175.046987	1.818960	16.64560	0.095362	381.292305	6.485503	236	236
1	208.354703	2.083887	27.32243	0.149797	625.927586	5.907329	60	60
All	181.798551	1.872662	16.64560	0.095362	625.927586	6.485503	296	296

Code

# Canopy cover against the number of annotated standing deadwood,
# one panel per conservation class.
g = sns.lmplot(
    data=plot_dw_data, x='n_udw_ann', y='canopy_cover_pct',
    col='conservation', hue='conservation', ci=1, legend=False,
)
for ax, title in zip(g.axes[0], ('Managed forests', 'Protected forests')):
    ax.set_title(title)
    ax.set_xticks(range(0, 10, 2))
g.set_xlabels('Number of annotated standing deadwood').set_ylabels('Canopy cover percentage for field plots')
plt.show()

Then fallen deadwood

Code

# Canopy cover against the number of field-measured fallen deadwood,
# one panel per conservation class.
g = sns.lmplot(
    data=plot_dw_data, x='n_ddw_plot', y='canopy_cover_pct',
    col='conservation', hue='conservation', ci=1, legend=False,
)
for ax, title in zip(g.axes[0], ('Managed forests', 'Protected forests')):
    ax.set_title(title)
    ax.set_xticks(range(0, 21, 2))
g.set_xlabels('Number of field-measured fallen deadwood within plots').set_ylabels('Canopy cover percentage for field plots')
plt.show()

Code

# Canopy cover against the number of annotated fallen deadwood,
# one panel per conservation class.
g = sns.lmplot(data=plot_dw_data, x='n_ddw_ann', y='canopy_cover_pct',
               col='conservation', hue='conservation', legend=False, ci=1)
# Assumes the panels are ordered conservation 0, then 1 — confirm.
for ax, title in zip(g.axes[0], ('Managed forests', 'Protected forests')):
    ax.set_title(title)
    ax.set_xticks(range(0, 21, 2))
# The previous labels described total groundwood lengths, but this figure
# shows canopy cover (y) against the annotated fallen deadwood count (x).
g.set_ylabels('Canopy cover percentage for field plots')
g.set_xlabels('Number of annotated fallen deadwood')
plt.show()

Plot the total lengths of groundwood located within a single field plot.

Code

# Field counts per plot: tree_class 3 (stand) and tree_class 4 or 5 (fall).
plot_dw_data['n_dw_stand_field'] = plot_dw_data.id.apply(
    lambda plot_id: ((tree_data.plot_id == plot_id) & (tree_data.tree_class == 3)).sum())
plot_dw_data['n_dw_fall_field'] = plot_dw_data.id.apply(
    lambda plot_id: ((tree_data.plot_id == plot_id) & tree_data.tree_class.isin([4, 5])).sum())
plot_dw_data['n_dw_tot_field'] = plot_dw_data['n_dw_stand_field'] + plot_dw_data['n_dw_fall_field']

# Total field-measured length (column `l`) of tree_class 4 trees per plot.
plot_dw_data['l_gw_field'] = plot_dw_data.id.apply(
    lambda plot_id: tree_data.loc[
        (tree_data.plot_id == plot_id) & (tree_data.tree_class == 4), 'l'].sum())

# Total annotated trunk length per plot.
# NOTE(review): fallen annotations are selected elsewhere with `groundwood == 2`;
# confirm that `layer == 'groundwood'` selects the same rows.
plot_dw_data['l_gw_ann'] = plot_dw_data.id.apply(
    lambda plot_id: anns_in_plots.loc[
        (anns_in_plots.plot_id == plot_id) & (anns_in_plots.layer == 'groundwood'),
        'tree_length'].sum())

Total lengths for annotations are generally much less than field-measured.

Plot the difference in the numbers of annotated deadwood.

Code

# Field count minus annotated count; positive means more field-measured trees.
plot_dw_data['n_ddw_plot_diff'] = plot_dw_data['n_ddw_plot'].sub(plot_dw_data['n_ddw_ann'])
plot_dw_data['n_udw_plot_diff'] = plot_dw_data['n_udw_plot'].sub(plot_dw_data['n_udw_ann'])

Text(0.5, 1.0, 'Conserved forests')

Typically more fallen deadwood is left unannotated if the canopy cover is high.

Text(0.5, 1.0, 'Conserved forests')

For standing deadwood the same effect is not present, at least it can’t be seen as clearly.

Code

# Difference between the `l_ddw` column and the total annotated length per plot.
plot_dw_data['l_dw_plot_diff'] = plot_dw_data['l_ddw'].sub(plot_dw_data['l_gw_ann'])

Relation between canopy cover percentage and total lengths of groundwood in field plots.

Estimate within-plot volume of downed deadwood from annotations.

Code

# Volume of every annotation, estimated with cut_cone_volume from its geometry.
anns_in_plots['v_ddw'] = anns_in_plots.geometry.apply(cut_cone_volume)

# Total annotated volume per plot for annotations on the 'groundwood' layer.
plot_dw_data['v_ddw_ann'] = plot_dw_data.id.apply(
    lambda plot_id: anns_in_plots.loc[
        (anns_in_plots.plot_id == plot_id) & (anns_in_plots.layer == 'groundwood'),
        'v_ddw'].sum())

# Scale the field volumes by pi * 9**2 / 10000 — presumably from per-hectare
# values to a circular plot with a 9 m radius; confirm against the field data.
plot_dw_data['v_dw_plot'] = plot_dw_data['v_dw'].div(10000).mul(np.pi).mul(9**2)
plot_dw_data['v_ddw_plot'] = plot_dw_data['v_ddw'].div(10000).mul(np.pi).mul(9**2)
plot_dw_data['v_udw_plot'] = plot_dw_data['v_dw_plot'].sub(plot_dw_data['v_ddw_plot'])

Compare statistics for the total volume of fallen deadwood. First field data.

Code

# Distribution of the `v_ddw` column per conservation class.
plot_dw_data.pivot_table(
    index=['conservation'],
    values=['v_ddw'],
    aggfunc=['min', 'max', 'mean', 'median', 'std', 'count'],
    margins=True,
)

	min	max	mean	median	std	count
	v_ddw	v_ddw	v_ddw	v_ddw	v_ddw	v_ddw
conservation
0	0.0	97.300652	22.922567	14.343594	26.380391	51
1	0.0	139.171786	42.482418	28.313861	42.481488	20
All	0.0	139.171786	28.432385	15.575737	32.641219	71

Then estimation based on annotations.

Code

# Distribution of the `v_ddw_ann_ha` column per conservation class.
plot_dw_data.pivot_table(
    index=['conservation'],
    values=['v_ddw_ann_ha'],
    aggfunc=['min', 'max', 'mean', 'median', 'std', 'count'],
    margins=True,
)

	min	max	mean	median	std	count
	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha
conservation
0	0.0	64.201482	11.277266	6.746180	13.582354	51
1	0.0	43.360494	9.047403	5.115679	11.749208	20
All	0.0	64.201482	10.649135	5.661624	13.048417	71

Plot the difference between volume based on field data and estimated volume based on annotations.

<seaborn.axisgrid.FacetGrid>

Again, denser canopy means generally more difference.

2 Sudenpesänkangas

Read data and do some wrangling.

Code

# Sudenpesänkangas (Evo) inputs. Annotations and the virtual plot grid are
# reprojected to EPSG:3067.
evo_fd_path = Path('../data/sudenpesankangas/')
evo_anns = gpd.read_file(
    '../../data/raw/sudenpesankangas/virtual_plots/sudenpesankangas_deadwood.geojson'
).to_crs('epsg:3067')
evo_plot_circles = gpd.read_file(evo_fd_path / 'plot_circles.geojson')
evo_plot_circles['id'] = evo_plot_circles['id'].astype(int)

# Tree-level field data: semicolon-separated with decimal commas; the gx/gy
# columns become point geometries in EPSG:3067.
evo_field_data = pd.read_csv(evo_fd_path / 'puutiedot_sudenpesänkangas.csv', sep=';', decimal=',')
evo_field_data = gpd.GeoDataFrame(
    evo_field_data,
    geometry=gpd.points_from_xy(evo_field_data.gx, evo_field_data.gy),
    crs='epsg:3067',
)
evo_grid = gpd.read_file(evo_fd_path / 'vplots.geojson').to_crs('epsg:3067')
evo_field_data['plotid'] = evo_field_data.kaid + 1000
# Only rows with puuluo 3 or 4 are kept.
evo_field_data = evo_field_data[evo_field_data.puuluo.isin([3, 4])]

# Conservation areas intersecting the annotation bounding box, clipped to the grid.
cons_evo = gpd.clip(
    conservation_areas.loc[conservation_areas.geometry.intersects(box(*evo_anns.total_bounds))],
    evo_grid,
)

def match_plotid_spk(geom, plots):
    """Return the ``id`` of the first plot whose geometry contains ``geom``.

    ``plots`` is walked with ``itertuples()``; every record must expose ``id``
    and ``geometry``. The id is returned unchanged (no type conversion).
    ``None`` is returned when no plot contains ``geom``.
    """
    containing_ids = (
        plot.id for plot in plots.itertuples() if plot.geometry.contains(geom)
    )
    return next(containing_ids, None)

# Plot-level field data comes from two space-separated files; the x/y columns
# of each become point geometries in EPSG:3067.
evo_plots_updated = pd.read_csv(evo_fd_path/'Koealatunnukset_Evo_2018.txt', sep=' ')
evo_plots_luke = pd.read_csv(evo_fd_path/'Koealatunnukset_Evo_2018_LUKE.txt', sep=' ')
evo_plots_updated = gpd.GeoDataFrame(evo_plots_updated,
                                     geometry=gpd.points_from_xy(evo_plots_updated.x,
                                                                 evo_plots_updated.y),
                                     crs='epsg:3067')
evo_plots_luke = gpd.GeoDataFrame(evo_plots_luke,
                                  geometry=gpd.points_from_xy(evo_plots_luke.x,
                                                              evo_plots_luke.y),
                                  crs='epsg:3067')
evo_plots = pd.concat([evo_plots_updated, evo_plots_luke])
# Replace dots in the column names with underscores.
evo_plots.rename(columns={c: c.replace('.', '_') for c in evo_plots.columns}, inplace=True)

# Id of the plot circle containing each plot point (None when there is none).
evo_plots['spk_id'] = evo_plots.geometry.apply(lambda point: match_plotid_spk(point, evo_plot_circles))

# Drop plots without a matching circle. `subset` is passed as a list because
# a bare string label is only accepted by newer pandas versions.
evo_plots.dropna(subset=['spk_id'], inplace=True)

# Replace the point geometry with the geometry of the matched circle.
evo_plots['geometry'] = evo_plots.spk_id.apply(
    lambda plot_id: evo_plot_circles[evo_plot_circles.id == plot_id].geometry.iloc[0])

# From here on the circle id is the plot id.
evo_plots.drop(columns=['id'], inplace=True)
evo_plots.rename(columns={'spk_id': 'id'}, inplace=True)

# conservation = 1 when the circle intersects any conservation area. The union
# of the areas is built once instead of once per plot.
_cons_evo_union = cons_evo.geometry.unary_union
evo_plots['conservation'] = evo_plots.geometry.apply(
    lambda circle: 1 if _cons_evo_union.intersects(circle) else 0)

# Provisional plot id parsed from the second '_'-separated part of vplot_id;
# used only to keep the plots that have annotations.
evo_anns['plot_id'] = evo_anns.apply(lambda row: int(row.vplot_id.split('_')[1]), axis=1)

evo_plots = evo_plots[evo_plots.id.isin(evo_anns.plot_id.unique())]

# Final plot id: the first circular plot each annotation intersects. Then
# overlay the annotations with the plot circles.
evo_anns['plot_id'] = evo_anns.apply(lambda row: match_circular_plot(row, evo_plots), axis=1)
evo_anns = evo_anns.overlay(evo_plots[['geometry']])

Add canopy density based on LiDAR derived canopy height model. The density is the percentage of field plot area with height above 2 meters.

Code

# Canopy cover per plot: share of CHM pixels above 2 among pixels that are >= 0.
# NOTE(review): this assumes pixels masked out by rio_mask.mask carry a
# negative nodata value, so that `>= 0` excludes them — confirm for this raster.
with rio.open('../../data/raw/sudenpesankangas/full_mosaics/sudenpesankangas_chm.tif') as src:
    pcts = []
    for plot in evo_plots.itertuples():
        chm, _ = rio_mask.mask(src, [plot.geometry], crop=True)
        pcts.append(np.count_nonzero(chm > 2) / np.count_nonzero(chm >= 0))

evo_plots['canopy_cover_pct'] = pcts

evo_plots.pivot_table(
    index=['conservation'],
    values=['canopy_cover_pct'],
    aggfunc=['min', 'max', 'mean', 'std', 'count'],
    margins=True,
)

	min	max	mean	std	count
	canopy_cover_pct	canopy_cover_pct	canopy_cover_pct	canopy_cover_pct	canopy_cover_pct
conservation
0	0.237288	0.989960	0.782452	0.200439	42
1	0.678000	0.991992	0.869878	0.085901	29
All	0.237288	0.991992	0.818162	0.168393	71

As seen here, canopies in Evo are far more dense than in Hiidenportti.

Count the number of deadwood instances similarly as for Hiidenportti data and plot the relationship between them.

Code

# Annotation counts per plot id, computed once up front instead of being
# recomputed for every row: all annotations, label == 'groundwood' (n_ddw)
# and every other label (n_udw).
_evo_ann_counts = evo_anns.plot_id.value_counts()
_evo_ddw_ann_counts = evo_anns[evo_anns.label == 'groundwood'].plot_id.value_counts()
_evo_udw_ann_counts = evo_anns[evo_anns.label != 'groundwood'].plot_id.value_counts()

# Plots without any matching annotation are missing from the counts and get 0.
evo_plots['n_dw_ann'] = evo_plots.apply(lambda row: _evo_ann_counts.get(int(row.id), 0), axis=1)
evo_plots['n_ddw_ann'] = evo_plots.apply(lambda row: _evo_ddw_ann_counts.get(int(row.id), 0), axis=1)
evo_plots['n_udw_ann'] = evo_plots.apply(lambda row: _evo_udw_ann_counts.get(int(row.id), 0), axis=1)

# Scale the field counts by pi * 9**2 / 10000 — presumably from per-hectare
# values to a circular plot with a 9 m radius; confirm against the field data.
evo_plots['n_dw_plot'] = np.round((evo_plots['n_dw']/10000)*np.pi*9**2).astype(int)
evo_plots['n_ddw_plot'] = np.round((evo_plots['n_ddw']/10000)*np.pi*9**2).astype(int)
evo_plots['n_udw_plot'] = evo_plots.n_dw_plot - evo_plots.n_ddw_plot

# Recompute conservation: 1 only when a single conservation polygon contains
# the whole plot. This overwrites the earlier intersects-based flag.
evo_plots['conservation'] = evo_plots.apply(
    lambda row: 1 if any(cons_evo.geometry.contains(row.geometry)) else 0, axis=1)

evo_plots.pivot_table(index='conservation', values=['n_ddw_plot', 'n_udw_plot', 'n_ddw_ann', 'n_udw_ann'],
                      aggfunc='sum', margins=True)

	n_ddw_ann	n_ddw_plot	n_udw_ann	n_udw_plot
conservation
0	65	14	14	68
1	22	29	29	92
All	87	43	43	160

For Evo dataset, we were able to annotate twice as much groundwood as there are in total in the field data, and only a quarter of the number of standing deadwood. Because Evo dataset is missing the field-measured information for deadwood height, we were not able to check whether the missing standing deadwood were, for instance, only a couple of meters tall and thus hidden below the canopy. Compared to Hiidenportti, the forest canopy in Evo was significantly thicker, as the average canopy cover percentage in the field plots was around 82%.

Plot the plot-wise differences between field-measurements and annotations.

Code

# Canopy cover against the field-measured standing deadwood count, per conservation class.
g = sns.lmplot(
    data=evo_plots, x='n_udw_plot', y='canopy_cover_pct',
    col='conservation', hue='conservation', ci=0,
)
g.set_xlabels('Field-measured standing deadwood').set_ylabels('Canopy cover percentage in circular plot')
plt.show()

Code

# Canopy cover against the annotated standing deadwood count, per conservation class.
g = sns.lmplot(
    data=evo_plots, x='n_udw_ann', y='canopy_cover_pct',
    col='conservation', hue='conservation', ci=0,
)
g.set_xlabels('Number of annotated standing deadwood').set_ylabels('Canopy cover percentage in circular plot')
plt.show()

Code

# Canopy cover against the field-measured fallen deadwood count, per conservation class.
g = sns.lmplot(
    data=evo_plots, x='n_ddw_plot', y='canopy_cover_pct',
    col='conservation', hue='conservation', ci=0,
)
g.set_xlabels('Number of field-measured fallen deadwood').set_ylabels('Canopy cover percentage in circular plot')
plt.show()

Code

# Canopy cover against the annotated fallen deadwood count, per conservation class.
g = sns.lmplot(
    data=evo_plots, x='n_ddw_ann', y='canopy_cover_pct',
    col='conservation', hue='conservation', ci=0,
)
g.set_xlabels('Number of annotated fallen deadwood').set_ylabels('Canopy cover percentage in circular plot')
plt.show()

Again, denser canopy indicates less annotated fallen data.

Same plots but for differences in numbers.

Code

# Field count minus annotated count; positive means more field-measured trees.
evo_plots['n_ddw_diff'] = evo_plots['n_ddw_plot'].sub(evo_plots['n_ddw_ann'])
evo_plots['n_udw_diff'] = evo_plots['n_udw_plot'].sub(evo_plots['n_udw_ann'])

First for fallen deadwood.

<seaborn.axisgrid.FacetGrid>

Then for standing deadwood.

<seaborn.axisgrid.FacetGrid>

See whether there is any relation between the number of annotated fallen deadwood and canopy cover.

<seaborn.axisgrid.FacetGrid>

Or the difference between the number of annotations (positive means more field data than annotated data) and canopy cover.

Code

# Field count minus annotated count for all deadwood.
evo_plots['n_dw_plot_diff'] = evo_plots['n_dw_plot'].sub(evo_plots['n_dw_ann'])

<seaborn.axisgrid.FacetGrid>

Again, denser canopy indicates less annotated groundwood, and here also deadwood in general. However, Evo has such a low number of fallen deadwood that evaluating that is difficult.

As Evo data doesn’t have field-measured deadwood lengths, we can’t plot that relationship. We can, however, plot the DBH distributions, even though Evo dataset only has 43 downed deadwood with dbh measured.

Code

# Keep the trees measured on the retained plots and give each tree the
# conservation flag of its plot.
evo_field_data = evo_field_data[evo_field_data.plotid.isin(evo_plots.id.unique())]
evo_field_data['conservation'] = evo_field_data.plotid.apply(
    lambda plot_id: evo_plots.loc[evo_plots.id == plot_id, 'conservation'].unique()[0])

Some statistics for field data.

Code

# Statistics for rows with puuluo == 4 and a positive lapimitta_mm.
evo_field_data.loc[(evo_field_data.puuluo == 4) & (evo_field_data.lapimitta_mm > 0)].pivot_table(
    index=['conservation'],
    values=['est_pituus_m', 'lapimitta_mm'],
    aggfunc=['mean', 'min', 'max', 'count'],
    margins=True,
)

	mean		min		max		count
	est_pituus_m	lapimitta_mm	est_pituus_m	lapimitta_mm	est_pituus_m	lapimitta_mm	est_pituus_m	lapimitta_mm
conservation
0	13.609571	169.357143	5.934	55	34.211	552	14	14
1	11.905690	115.896552	5.446	45	28.101	445	29	29
All	12.460442	133.302326	5.446	45	34.211	552	43	43

Same for annotated data.

Code

# Trunk length of every annotation, then statistics for the 'groundwood' label.
evo_anns['tree_length'] = evo_anns.geometry.apply(get_len)
evo_anns[evo_anns.label == 'groundwood'].pivot_table(
    index=['conservation'],
    values=['tree_length', 'diam'],
    aggfunc=['mean', 'min', 'max', 'count'],
    margins=True,
)

	mean		min		max		count
	diam	tree_length	diam	tree_length	diam	tree_length	diam	tree_length
conservation
0	200.620326	2.520178	44.682490	0.251763	760.781151	9.225878	63	63
1	237.091999	2.592576	139.506761	0.535882	612.397653	6.664814	24	24
All	210.681477	2.540150	44.682490	0.251763	760.781151	9.225878	87	87

Volume estimations for Evo data are really inaccurate, as most field data measurements are zero.

Code

# Volume of every annotation, estimated with cut_cone_volume from its geometry.
evo_anns['v_ddw'] = evo_anns.geometry.apply(cut_cone_volume)

# Total annotated volume per plot for annotations labelled 'groundwood'.
evo_plots['v_ddw_ann'] = evo_plots.id.apply(
    lambda plot_id: evo_anns.loc[
        (evo_anns.plot_id == plot_id) & (evo_anns.label == 'groundwood'),
        'v_ddw'].sum())

Statistics for the volume of fallen deadwood, first based on field data (`v_ddw`) and then based on annotations (`v_ddw_ann_ha`).

Code

# Distribution of the `v_ddw` column per conservation class.
evo_plots.pivot_table(
    index=['conservation'],
    values=['v_ddw'],
    aggfunc=['min', 'max', 'mean', 'median', 'std', 'count'],
    margins=True,
)

	min	max	mean	median	std	count
	v_ddw	v_ddw	v_ddw	v_ddw	v_ddw	v_ddw
conservation
0	0.0	123.004587	5.522673	0.0	23.497052	42
1	0.0	98.258093	6.338610	0.0	18.873961	29
All	0.0	123.004587	5.855943	0.0	21.587804	71

Code

# Distribution of the `v_ddw_ann_ha` column per conservation class.
evo_plots.pivot_table(
    index=['conservation'],
    values=['v_ddw_ann_ha'],
    aggfunc=['min', 'max', 'mean', 'median', 'std', 'count'],
    margins=True,
)

	min	max	mean	median	std	count
	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha	v_ddw_ann_ha
conservation
0	0.0	96.060293	7.991108	0.0	19.252499	42
1	0.0	71.154407	5.065659	0.0	13.517535	29
All	0.0	96.060293	6.796206	0.0	17.096402	71