Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Binary file modified __pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file modified q01_cond_prob/__pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file modified q01_cond_prob/__pycache__/build.cpython-36.pyc
Binary file not shown.
14 changes: 11 additions & 3 deletions q01_cond_prob/build.py
Original file line number Diff line number Diff line change
@@ -1,12 +1,20 @@
# Make `/` perform true (float) division by default on Python 2.7
from __future__ import division

import pandas as pd

# Load the house-pricing dataset once at import time; the path is relative,
# so it is resolved against the current working directory.
df = pd.read_csv('data/house_pricing.csv')

def cond_prob(df):
    """Return the probability that three randomly drawn houses are all in OldTown.

    The houses are drawn without replacement, so with ``N`` rows in total and
    ``h`` rows whose ``Neighborhood`` equals ``'OldTown'`` the result is
    ``h/N * (h-1)/(N-1) * (h-2)/(N-2)``.

    Args:
        df: DataFrame with a ``Neighborhood`` column.

    Returns:
        float: The probability. ``0.0`` is returned when ``df`` has fewer
        than three rows, because three distinct houses cannot be drawn.
    """
    all_houses = df.shape[0]
    if all_houses < 3:
        # The denominator below would be zero (ZeroDivisionError); no triple
        # of distinct houses exists, so the event is impossible.
        return 0.0

    old_town_houses = df[df['Neighborhood'] == 'OldTown'].shape[0]

    # Ordered triples of OldTown houses over ordered triples of any houses.
    # With 0, 1 or 2 OldTown houses one factor is zero, so the product is 0.
    favourable = old_town_houses * (old_town_houses - 1) * (old_town_houses - 2)
    possible = all_houses * (all_houses - 1) * (all_houses - 2)

    # Converting the numerator first keeps this a true division even where
    # `/` on two ints would truncate.
    return float(favourable) / possible

# Module-level invocation: runs on import and discards the returned probability.
cond_prob(df)


# Enter Code Here



Binary file modified q01_cond_prob/tests/__pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file not shown.
Binary file modified q02_confidence_interval/__pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file modified q02_confidence_interval/__pycache__/build.cpython-36.pyc
Binary file not shown.
22 changes: 20 additions & 2 deletions q02_confidence_interval/build.py
Original file line number Diff line number Diff line change
@@ -1,13 +1,31 @@
# Default imports
import math
import scipy.stats as stats
import pandas as pd
import numpy as np

# Load the dataset at import time and use the GrLivArea column as the sample.
df = pd.read_csv('data/house_pricing.csv')
sample = df['GrLivArea']
# Standard-normal quantile at 0.95 (about 1.645).
# NOTE(review): applied symmetrically around the mean this gives a 90%
# two-sided interval; a 95% two-sided interval would need q = 0.975 —
# confirm which one the exercise intends.
z_critical = stats.norm.ppf(q = 0.95)

def confidence_interval(sample):
    """Return a z-based confidence interval for the mean of ``sample``.

    The margin of error is the module-level ``z_critical`` multiplied by the
    standard error of the mean, ``sample.std() / sqrt(n)``.

    Args:
        sample: Object exposing ``mean()`` and ``std()`` (the module passes a
            pandas Series).

    Returns:
        tuple: ``(lower, upper)`` bounds of the interval.
    """
    sample_mean = sample.mean()
    sample_size = np.size(sample)

    # math.sqrt rather than ``n ** (1 / 2)``: where `/` on two ints truncates
    # (Python 2 without ``from __future__ import division``) the exponent
    # becomes 0 and the standard error silently stops shrinking with n.
    standard_error = sample.std() / math.sqrt(sample_size)
    margin_of_error = z_critical * standard_error

    return sample_mean - margin_of_error, sample_mean + margin_of_error

# Module-level invocation: runs on import and discards the returned bounds.
confidence_interval(sample)







# Write your solution here :



Binary file not shown.
Binary file not shown.
Binary file modified q03_t_test/__pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file modified q03_t_test/__pycache__/build.cpython-36.pyc
Binary file not shown.
13 changes: 11 additions & 2 deletions q03_t_test/build.py
Original file line number Diff line number Diff line change
@@ -1,9 +1,18 @@
# Default imports
import scipy.stats as stats
import pandas as pd
import numpy as np

# Load the house-pricing dataset once at import time; the path is relative,
# so it is resolved against the current working directory.
df = pd.read_csv('data/house_pricing.csv')

def t_statistic(df):
    """Run a one-sample t-test of OldTown living area against the overall mean.

    The sample is ``GrLivArea`` for rows whose ``Neighborhood`` equals
    ``'OldTown'``; the hypothesised population mean is the mean of
    ``GrLivArea`` over all rows.

    Args:
        df: DataFrame with ``Neighborhood`` and ``GrLivArea`` columns.

    Returns:
        tuple: ``(p_value, test_result)``. ``p_value`` is the p-value reported
        by ``scipy.stats.ttest_1samp`` (two-sided by default) and
        ``test_result`` is True when it falls below the 0.1 significance
        level, i.e. the null hypothesis of equal means is rejected.
    """
    # NOTE(review): the previous code compared the p-value with a critical
    # t value (a quantity on a different scale), which could never be True.
    # The 0.1 level is taken from the ``1 - 0.1`` quantile it used — confirm
    # against the exercise specification.
    significance_level = 0.1

    old_town_area = df[df['Neighborhood'] == 'OldTown']['GrLivArea']
    # Only the p-value is needed; discarding the statistic also avoids a
    # local that shadows this function's own name.
    _, p_value = stats.ttest_1samp(a=old_town_area,
                                   popmean=df['GrLivArea'].mean())
    test_result = p_value < significance_level

    return p_value, test_result

# Module-level invocation: runs on import and discards the returned tuple.
t_statistic(df)


# Enter Code Here

Binary file modified q03_t_test/tests/__pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file modified q03_t_test/tests/__pycache__/test_q03_t_test.cpython-36.pyc
Binary file not shown.
Binary file modified q04_chi2_test/__pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file modified q04_chi2_test/__pycache__/build.cpython-36.pyc
Binary file not shown.
13 changes: 11 additions & 2 deletions q04_chi2_test/build.py
Original file line number Diff line number Diff line change
@@ -1,10 +1,19 @@
# Default imports
import scipy.stats as stats
import pandas as pd


# Load the house-pricing dataset once at import time; the path is relative,
# so it is resolved against the current working directory.
df = pd.read_csv('data/house_pricing.csv')

def chi_square(df):
    """Chi-square test of independence between LandSlope and binned SalePrice.

    ``SalePrice`` is split into three equal-frequency bins with ``pd.qcut``,
    cross-tabulated against ``LandSlope``, and the resulting frequency table
    is passed to ``scipy.stats.chi2_contingency``.

    Args:
        df: DataFrame with ``LandSlope`` and ``SalePrice`` columns.

    Returns:
        tuple: ``(p_value, test_result)`` where ``test_result`` is True when
        ``p_value`` is below 0.05.
    """
    # qcut assigns labels to bins in ascending order, so the cheapest third
    # has to be listed first; the reversed order mislabelled the bins (the
    # p-value is unaffected by the naming).
    price_band = pd.qcut(df['SalePrice'], 3, labels=['Low', 'Med', 'High'])
    freq_table = pd.crosstab(df['LandSlope'], price_band)

    # chi2_contingency returns (statistic, p-value, dof, expected); only the
    # p-value is used here.
    _, p_value, _, _ = stats.chi2_contingency(freq_table)
    test_result = p_value < 0.05

    return p_value, test_result

# Enter Code Here
# Module-level invocation: runs on import and discards the returned tuple.
chi_square(df)


Binary file modified q04_chi2_test/tests/__pycache__/__init__.cpython-36.pyc
Binary file not shown.
Binary file not shown.