R 과소표집

1 개요

R undersampling
R 과소표집, R 언더샘플링
# Undersampling example: shrink the majority class (Math, 5 rows) down to the
# size of the minority class (Chem, 3 rows) so both classes end up with the
# same number of rows in the final data frame.
df <- read.table(header = TRUE, stringsAsFactors = FALSE, text = "
name  major gpa
Alice Math  3.3
Bob   Math  3.4
Carol Math  3.5
Dave  Math  3.6
Erin  Math  3.7
Frank Chem  3.8
Grace Chem  3.9
Heidi Chem  4.0
")
library(dplyr, warn.conflicts = FALSE)

# Split the data by class.
df_Math <- df[df$major == "Math", ]
df_Chem <- df[df$major == "Chem", ]

# Randomly keep only as many majority rows as there are minority rows.
# The target size is derived from the data instead of being hard-coded, so
# the example stays balanced if rows are added to or removed from either class.
# Sampling is without replacement (the slice_sample() default); call
# set.seed() beforehand if a reproducible draw is needed.
df_Math <- slice_sample(df_Math, n = nrow(df_Chem))

# Recombine the classes; make.row.names = FALSE renumbers the rows 1..n
# instead of carrying over the original row labels.
df <- rbind(df_Math, df_Chem, make.row.names = FALSE)
print(df)

2 같이 보기

문서 댓글 ({{ doc_comments.length }})
{{ comment.name }} {{ comment.created | snstime }}