get_hospital_costs_data = function(path='~/Projects/Reading/N_Z/Zelterman/Data/hospital_costs.txt'){
    ## Read the hospital costs data set and return it as a data frame.
    ##
    ## Book reference kept from the original source:
    ##   xpdf ../EBook/Applied_Linear_Models_with_R.pdf -z 200 183 &
    ##
    ## Arguments:
    ##   path: whitespace-delimited text file without a header row; defaults
    ##         to the location this function has always read from.
    ##
    ## Returns:
    ##   A data frame with the columns hospital, avg_paid_medicare,
    ##   avg_paid_insurance, postsurgical_length, cases, n_in_hospital_deaths
    ##   and in_hospital_death_rate.  The last column is an ordered factor
    ##   with levels below < normal < above.  A '.' entry in the file is read
    ##   as NA in any column.
    ##
    data = read.table(path, header=FALSE, skip=0, na.strings='.',
                      col.names=c('hospital', 'avg_paid_medicare', 'avg_paid_insurance',
                                  'postsurgical_length', 'cases', 'n_in_hospital_deaths',
                                  'in_hospital_death_rate'))

    ## Convert in_hospital_death_rate into a factor with meaningful names:
    ##   '-' -> 'below', '0' -> 'normal', '+' -> 'above'
    ##
    ## The recode is done in one factor() call rather than with logical masks:
    ## a mask built with `==` contains NA wherever the column is missing, and
    ## subscripted assignment into a data frame stops with an error on an NA
    ## index.  With factor(), missing or unrecognised codes simply become NA.
    ##
    ## as.character() keeps this working whether read.table() returned the
    ## column as character, factor, or integer (a file holding only '0').
    ihdr_char = as.character(data$in_hospital_death_rate)
    data$in_hospital_death_rate = factor(ihdr_char,
                                         levels=c('-', '0', '+'),
                                         labels=c('below', 'normal', 'above'),
                                         ordered=TRUE)

    return(data)
}