1、RStudio 的相关设置要改成 UTF-8。位置:(1)Tools → Global Options → Default text encoding;(2)File → Save with Encoding
2、数据文本要转换为 UTF-8 编码。工具:Notepad++;操作:Encoding → Convert to UTF-8,然后保存。
3、读取数据时,在 read.csv 或其他读取函数中,添加指定文件编码的参数 fileEncoding = "UTF-8"
重编码是指根据同一个变量和/或其他变量的现有值创建新值的过程,例如将符合某个条件的值重新赋值。这里主要介绍两种常见的方法:
#第一种方法
# Example data: four people with their ages.
per <- data.frame(
  name = c("张三", "李四", "王五", "赵六"),
  age = c(23, 45, 34, 1000)
)
per

# Treat the age 1000 as a missing value.
per$age <- replace(per$age, per$age == 1000, NA)

# Derive the age-group column. Every row starts unclassified (NA); which()
# drops rows whose age is NA, so those rows keep NA in the new column.
per$age1 <- NA_character_
per$age1[which(per$age < 30)] <- "young"
per$age1[which(per$age >= 30 & per$age < 50)] <- "middle age"
per
# Method 2: do the recoding inside within(), where the columns of `per` can be
# referenced by their bare names and the modified data frame is returned.
per <- data.frame(
  name = c("张三", "李四", "王五", "赵六"),
  age = c(23, 45, 34, 1000)
)
per <- within(per, {
  # Treat the age 1000 as a missing value, as the first method does; without
  # this step the rebuilt data frame would keep 1000 in the age column.
  age[age == 1000] <- NA

  # Start with every row unclassified, as a full-length character vector, so
  # the column type does not depend on which rules happen to match.
  age1 <- rep(NA_character_, length(age))

  # A single-value assignment skips NA entries of the logical index, so rows
  # with a missing age stay NA in age1.
  age1[age < 30] <- "young"
  age1[age >= 30 & age < 50] <- "middle age"
})
per