library(readxl)
# Session setup and data load: reads the first sheet of reg_JJA.xlsx into
# `dane` and removes the rows whose TmaxPoznań value is missing.

# NOTE(review): warn = -1 silences every warning for the rest of the session,
# including any raised while the workbook is being read. Consider removing it
# or narrowing it to the specific call that is known to be noisy.
options(warn = -1)
# NOTE(review): hard-coded working directory; the script only runs where
# ~/Pulpit/ exists and contains reg_JJA.xlsx.
setwd("~/Pulpit/")
dane <- read_excel("reg_JJA.xlsx", sheet = 1)
# str(dane)

# Row positions with a missing response value.
ind <- which(is.na(dane$TmaxPoznań))
# Guard the removal: when nothing is missing `ind` is integer(0), and
# dane[-integer(0), ] selects zero rows, i.e. it would silently discard the
# whole data set instead of leaving it untouched.
if (length(ind) > 0) {
  dane <- dane[-ind, ]
}
# First model: linear regression of TmaxPoznań on the columns PCA1..PCA6
# of `dane`.
model <- lm(
  TmaxPoznań ~ PCA1 + PCA2 + PCA3 + PCA4 + PCA5 + PCA6,
  data = dane
)

# Histogram of the residuals. Title and axis label are spelled out so the
# figure carries the same annotations as a direct hist(resid(model)) call.
res_model <- resid(model)
hist(res_model, main = "Histogram of resid(model)", xlab = "resid(model)")

# Predicted (x) against observed (y) values, with the line y = x in red.
pred_model <- predict(model)
obs_tmax <- dane$TmaxPoznań
plot(
  pred_model, obs_tmax,
  xlab = "predict(model)", ylab = "dane$TmaxPoznań"
)
abline(a = 0, b = 1, col = "red")

# The `##` lines below appear to be console output captured from an earlier
# run; they are kept verbatim.
summary(model)
##
## Call:
## lm(formula = TmaxPoznań ~ PCA1 + PCA2 + PCA3 + PCA4 + PCA5 +
## PCA6, data = dane)
##
## Residuals:
## Min 1Q Median 3Q Max
## -12.2159 -1.9253 -0.0166 1.9493 11.3257
##
## Coefficients:
## Estimate Std. Error t value Pr(>|t|)
## (Intercept) -2.477e-15 4.372e-02 0.00 1
## PCA1 -1.662e+00 4.373e-02 -38.02 <2e-16 ***
## PCA2 2.188e+00 4.373e-02 50.04 <2e-16 ***
## PCA3 6.200e-01 4.373e-02 14.18 <2e-16 ***
## PCA4 -6.330e-01 4.373e-02 -14.47 <2e-16 ***
## PCA5 7.082e-01 4.373e-02 16.20 <2e-16 ***
## PCA6 -7.176e-01 4.373e-02 -16.41 <2e-16 ***
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 2.966 on 4593 degrees of freedom
## Multiple R-squared: 0.5157, Adjusted R-squared: 0.5151
## F-statistic: 815.2 on 6 and 4593 DF, p-value: < 2.2e-16

# Correlation between predicted and observed values.
cor(pred_model, obs_tmax)
## [1] 0.7181438
# Second model, using a larger number of PCA columns (PCA1..PCA12) as
# predictors of TmaxPoznań.
model2 <- lm(
  TmaxPoznań ~ PCA1 + PCA2 + PCA3 + PCA4 + PCA5 + PCA6 +
    PCA7 + PCA8 + PCA9 + PCA10 + PCA11 + PCA12,
  data = dane
)

# Histogram of the residuals. Title and axis label are spelled out so the
# figure carries the same annotations as a direct hist(resid(model2)) call.
res_model2 <- resid(model2)
hist(res_model2, main = "Histogram of resid(model2)", xlab = "resid(model2)")

# Predicted (x) against observed (y) values, with the line y = x in red.
pred_model2 <- predict(model2)
obs_tmax <- dane$TmaxPoznań
plot(
  pred_model2, obs_tmax,
  xlab = "predict(model2)", ylab = "dane$TmaxPoznań"
)
abline(a = 0, b = 1, col = "red")

# Correlation between predicted and observed values. The `##` lines in this
# section appear to be console output captured from an earlier run; they are
# kept verbatim.
cor(pred_model2, obs_tmax)
## [1] 0.746994

summary(model2)
##
## Call:
## lm(formula = TmaxPoznań ~ PCA1 + PCA2 + PCA3 + PCA4 + PCA5 +
## PCA6 + PCA7 + PCA8 + PCA9 + PCA10 + PCA11 + PCA12, data = dane)
##
## Residuals:
## Min 1Q Median 3Q Max
## -12.2863 -1.8715 -0.0017 1.8778 10.8171
##
## Coefficients:
## Estimate Std. Error t value Pr(>|t|)
## (Intercept) -1.340e-15 4.180e-02 0.000 1.0000
## PCA1 -1.662e+00 4.180e-02 -39.768 < 2e-16 ***
## PCA2 2.188e+00 4.180e-02 52.342 < 2e-16 ***
## PCA3 6.200e-01 4.180e-02 14.831 < 2e-16 ***
## PCA4 -6.330e-01 4.180e-02 -15.142 < 2e-16 ***
## PCA5 7.082e-01 4.180e-02 16.942 < 2e-16 ***
## PCA6 -7.176e-01 4.180e-02 -17.166 < 2e-16 ***
## PCA7 3.113e-01 4.180e-02 7.447 1.14e-13 ***
## PCA8 4.088e-01 4.180e-02 9.779 < 2e-16 ***
## PCA9 -2.973e-01 4.180e-02 -7.112 1.32e-12 ***
## PCA10 -3.522e-01 4.180e-02 -8.426 < 2e-16 ***
## PCA11 5.330e-01 4.180e-02 12.751 < 2e-16 ***
## PCA12 7.747e-02 4.180e-02 1.853 0.0639 .
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 2.835 on 4587 degrees of freedom
## Multiple R-squared: 0.558, Adjusted R-squared: 0.5568
## F-statistic: 482.6 on 12 and 4587 DF, p-value: < 2.2e-16