aboutsummaryrefslogtreecommitdiff
path: root/R_LinR/main.r
diff options
context:
space:
mode:
authorleshe4ka46 <alex9102naid1@ya.ru>2025-11-15 16:30:38 +0300
committerleshe4ka46 <alex9102naid1@ya.ru>2025-11-18 14:05:14 +0300
commit2ade61411a014b3eed24bd2b382687d55233a9b5 (patch)
tree1b91eb11d38a0a053a7a806fedadb8c8a676738b /R_LinR/main.r
parent5aaff9711387ce1ea1ec8ee5c5b4ecd9e1ea3dd1 (diff)
R(Cluster)
Diffstat (limited to 'R_LinR/main.r')
-rwxr-xr-xR_LinR/main.r26
1 files changed, 26 insertions, 0 deletions
diff --git a/R_LinR/main.r b/R_LinR/main.r
new file mode 100755
index 0000000..d7b5856
--- /dev/null
+++ b/R_LinR/main.r
@@ -0,0 +1,26 @@
+#!/usr/bin/env Rscript
+
+# Load the input table; the path is resolved against the working directory.
+df <- read.csv("zeta.csv")
+
+# Keep only rows with sex == "F" whose mean education, mean household income
+# and mean age lie strictly inside the ranges below, then drop the zcta and
+# sex columns. subset() discards rows where the condition is FALSE or NA, so
+# one combined condition selects the same rows as a chain of separate calls.
+# Each range is applied exactly once.
+df <- subset(
+  df,
+  sex == "F" &
+    8 < meaneducation & meaneducation < 18 &
+    10000 < meanhouseholdincome & meanhouseholdincome < 200000 &
+    20 < meanage & meanage < 60,
+  select = -c(zcta, sex)
+)
+
+# Base-10 logarithm of the mean household income.
+df$log_income <- log10(df$meanhouseholdincome)
+
+# Positional rename of all columns.
+# NOTE(review): assumes exactly six columns remain at this point, in this
+# order -- confirm against the CSV header.
+names(df) <- c("X", "age", "education", "employment", "income", "log_income")
+
+library(ggplot2)
+
+# Scatter plot of log_income against age, with points drawn at 20% opacity.
+# The plot is left as a bare top-level expression, so it is rendered only
+# when top-level values are auto-printed (as they are under Rscript).
+ggplot(data = df, mapping = aes(x = age, y = log_income)) +
+  labs(title = "log_income(age)", x = "age", y = "income") +
+  geom_point(alpha = 0.2)
+
+# Least-squares linear fit of log_income on age.
+model <- lm(formula = log_income ~ age, data = df)
+
+# Print the fitted model, then its summary. The summary is a bare top-level
+# expression and relies on auto-printing.
+print(model)
+summary(model)