#!/usr/bin/env Rscript
# Linear regression of log10(mean household income) on mean age for the
# female rows of zeta.csv, with a scatter plot of the same two variables.
#
# Provenance: R_LinR/main.r as added by commit
# 2ade61411a014b3eed24bd2b382687d55233a9b5 ("R(Cluster)", leshe4ka46,
# 2025-11-15).

library(ggplot2)

# Load ----
df <- read.csv("zeta.csv")

# Filter ----
# Keep female rows whose education, income and age lie strictly inside the
# ranges below, then drop the zcta and sex columns. subset() discards rows
# whose condition evaluates to NA, so a single combined condition keeps the
# same rows as a chain of per-column subset() calls.
df <- subset(
  df,
  sex == "F" &
    8 < meaneducation & meaneducation < 18 &
    10000 < meanhouseholdincome & meanhouseholdincome < 200000 &
    20 < meanage & meanage < 60,
  select = -c(zcta, sex)
)

# Derive ----
df$log_income <- log10(df$meanhouseholdincome)

# Rename ----
# The renaming is positional, so it is only correct when exactly these six
# columns remain; fail loudly instead of silently mislabelling columns.
# NOTE(review): "X" is presumably a row-index column and "employment" the
# fourth remaining column of zeta.csv -- confirm against the file.
new_names <- c("X", "age", "education", "employment", "income", "log_income")
stopifnot(ncol(df) == length(new_names))
names(df) <- new_names

# Plot ----
# The y axis shows the log10-transformed income, so label it as such.
scatter <- ggplot(df, aes(x = age, y = log_income)) +
  geom_point(alpha = 0.2) +
  labs(x = "age", y = "log10(income)", title = "log_income(age)")
# Print explicitly so the plot is rendered under source() as well as Rscript.
print(scatter)

# Model ----
model <- lm(log_income ~ age, data = df)

print(model)
# Explicit print() for the same reason as the plot above.
print(summary(model))