我使用了此代码,但由于KeyError:“状态”而出现错误 将熊猫作为pd导入 将numpy导入为np 从scipy.stats导入ttest_ind
unitowns = get_list_of_university_towns()
bottom = get_recession_bottom()
start = get_recession_start()
hdata = convert_housing_data_to_quarters()
bstart = hdata.columns[hdata.columns.get_loc(start) - 1]
hdata['ratio'] = hdata[bstart] - hdata[bottom]
hdata = hdata[[bottom, bstart, 'ratio']]
hdata = hdata.reset_index()
unitowns_hdata = pd.merge(hdata,unitowns,how='inner',on=['State','RegionName'])
unitowns_hdata['uni'] = True
hdata2 = pd.merge(hdata, unitowns_hdata, how='outer', on=['State','RegionName',bottom, bstart, 'ratio'])
hdata2['uni'] = hdata2['uni'].fillna(False)
ut = hdata2[hdata2['uni'] == True]
nut = hdata2[hdata2['uni'] == False]
t,p = ttest_ind(ut['ratio'].dropna(), nut['ratio'].dropna())
different = True if p<0.01 else False
better = "university town" if ut['ratio'].mean() < nut['ratio'].mean() else "non-university town"
return(different, p, better)
run_ttest()