import pandas as pd
# Exploratory walk-through of the surveys table: load it, inspect it,
# then summarise and plot it by plot, sex and species.
# Bare expressions (e.g. ``surveys_df.shape``) only display a value when run
# interactively (notebook / REPL); in a plain script they are evaluated and
# discarded.

# --- Load and inspect -------------------------------------------------------
surveys_df = pd.read_csv("data/surveys.csv")
surveys_df.columns
surveys_df.shape
surveys_df.head(15)
surveys_df.tail()

# --- Distinct values --------------------------------------------------------
site_names = pd.unique(surveys_df['plot_id'])
site_names
surveys_df['plot_id'].nunique()
surveys_df['species_id'].nunique()
# pd.unique() keeps NaN as a distinct value while nunique() drops NaN by
# default, so this difference is non-zero only if plot_id has missing values.
len(site_names) - surveys_df['plot_id'].nunique()

# --- Grouped summaries ------------------------------------------------------
grouped_data = surveys_df.groupby('sex')
grouped_data['sex'].count()

grouped_data2 = surveys_df.groupby(['plot_id', 'sex'])
# numeric_only=True restricts the mean to numeric columns. Without it,
# pandas >= 2.0 raises TypeError when any non-grouping column is non-numeric
# (older versions silently dropped such columns).
grouped_data2.mean(numeric_only=True)

grouped_data3 = surveys_df.groupby('plot_id')
grouped_data3['weight'].describe()

# Number of non-null record_id values per species.
species_counts = surveys_df.groupby('species_id')['record_id'].count()
print(species_counts)

# --- Plots ------------------------------------------------------------------
# Mean weight per plot.
grouped_ave = surveys_df.groupby('plot_id')['weight'].mean()
grouped_ave.plot(kind='bar')

# Non-null value count of every column, per sex.
grouped_total = surveys_df.groupby('sex').count()
grouped_total.plot(kind='bar')

# Total weight per (plot, sex), drawn as bars stacked by sex.
by_site_sex = surveys_df.groupby(['plot_id', 'sex'])
# NOTE: despite the name, this holds summed weights, not counts; the name is
# kept unchanged in case code elsewhere refers to it.
site_sex_count = by_site_sex['weight'].sum()
# unstack() moves the inner index level (sex) into columns, giving one row
# per plot and one column per sex.
spc = site_sex_count.unstack()
s_plot = spc.plot(kind='bar', stacked=True, title="Total weight by site and sex")
s_plot.set_ylabel("Weight")
s_plot.set_xlabel("Plot")