# HIDDEN
from datascience import *
%matplotlib inline
import matplotlib.pyplot as plots
plots.style.use('fivethirtyeight')
import numpy as np
values = make_array(2, 3, 3, 9)
sum(values)/len(values)
np.average(values)
np.mean(values)
(2 + 3 + 3 + 9)/4
2*(1/4) + 3*(2/4) + 9*(1/4)
values_table = Table().with_columns('value', values)
values_table
bins_for_display = np.arange(0.5, 10.6, 1)
values_table.hist(0, bins = bins_for_display)
twos = 2 * np.ones(10)
threes = 3 * np.ones(20)
nines = 9 * np.ones(10)
new_vals = np.append(np.append(twos, threes), nines)
new_vals
len(new_vals)
Table().with_column('value', new_vals).hist(bins = bins_for_display)
np.average(values)
np.average(new_vals)
####################################
nba = Table.read_table('nba2013.csv')
nba.labels
nba.hist('Height', bins=np.arange(65.5, 90.5))
heights = nba.column('Height')
percentile(50, heights)
np.average(heights)
sd_table = Table().with_columns('Value', values)
sd_table
average_value = np.average(sd_table.column(0))
average_value
deviations = values - average_value
sd_table = sd_table.with_column('Deviation', deviations)
sd_table
sum(deviations)
sd_table = sd_table.with_columns('Squared Deviation', deviations ** 2)
sd_table
# Variance of the data
variance = np.mean(sd_table.column('Squared Deviation'))
variance
# Standard Deviation (SD) is the square root of the variance
sd = variance ** 0.5
sd
np.std(values)