require(readxl)
require(dplyr)
require(tidyverse)
require(ggplot2)
getwd() # the relative path "LE.xls" below is resolved against this directory

# Read the spreadsheet and convert the result to a plain data.frame.
LE_A <- read_xls("LE.xls")
LE_A <- as.data.frame(LE_A)

# Select the columns needed for the linear regression evaluation.
LE_GDP <- select(
  LE_A,
  LE, GDP, Inc_resources, Year, Country, Status, Population
)

# Drop every row that has a missing value in any of the selected columns.
LE_GDP_C <- na.omit(LE_GDP)

# Add log_gdp as a new column instead of overwriting GDP.
LE_GDP_C$log_gdp <- log(LE_GDP_C$GDP)
str(LE_GDP_C)

# Emit a re-creatable definition of the first six rows of the modelling
# columns. The original line called the namespace `datapasts` (apparently a
# typo for `datapasta`) and subset the helper's return value instead of the
# data frame; base R `dput()` serves the same purpose without an extra package.
dput(head(LE_GDP_C[, c("LE", "log_gdp", "Year")], 6))
# Fit a separate linear regression of sqrt(LE) on log_gdp for each year and
# collect the R-squared of every fit into one data frame (one row per year,
# columns `year` and `RSquared`).
#
# The year column of LE_GDP_C is named `Year` (capital Y). `$` partial
# matching is case-sensitive, so `LE_GDP_C$year` evaluated to NULL and the
# original loop iterated over nothing, leaving finalResult empty.
finalResult <- purrr::map(unique(LE_GDP_C$Year), function(modelYear) {
  # Restrict the data to the observations of the current year.
  yearData <- LE_GDP_C %>% dplyr::filter(Year == modelYear)
  myModel <- lm(sqrt(LE) ~ log_gdp, data = yearData)
  data.frame(year = modelYear, RSquared = summary(myModel)$r.squared)
}) %>%
  dplyr::bind_rows()