DAY6-琦
2021-07-12 本文已影响0人
见期
加载和安装R包
1.镜像设置
# Open the user-level startup file for editing.
# NOTE(review): the options() call below is presumably what should be saved
# in that file so every new session picks up the mirrors -- confirm.
file.edit("~/.Rprofile")
options(
  repos = c(CRAN = "https://mirrors.tuna.tsinghua.edu.cn/CRAN/"), # Tsinghua CRAN mirror
  BioC_mirror = "https://mirrors.ustc.edu.cn/bioc/"               # USTC Bioconductor mirror
)
data:image/s3,"s3://crabby-images/b94c8/b94c8208749de6693c721fbcbe2c3a627996f508" alt=""
2.检查
# Print the currently configured CRAN repositories and Bioconductor mirror.
getOption("repos")
getOption("BioC_mirror")
3.安装+加载
# Point CRAN at the Tsinghua mirror and Bioconductor at the USTC mirror
# for the current session.
options(repos = c(CRAN = "https://mirrors.tuna.tsinghua.edu.cn/CRAN/"))
options(BioC_mirror = "https://mirrors.ustc.edu.cn/bioc/")
# Install dplyr only when it is missing, so re-running these lines does not
# download and reinstall the package every time.
if (!requireNamespace("dplyr", quietly = TRUE)) {
  install.packages("dplyr")
}
library(dplyr)
dplyr是要安装并加载的R包的名字
data:image/s3,"s3://crabby-images/c0ca8/c0ca8cb3316f416737ca58d2ab087ed9ae8e7d1f" alt=""
data:image/s3,"s3://crabby-images/531c0/531c06ed0477756a461beeb76f1dc50f0cf30add" alt=""
# Example data: rows 1-2, 51-52 and 101-102 of the built-in iris data set
# (all columns kept).
test <- iris[c(1L, 2L, 51L, 52L, 101L, 102L), ]
data:image/s3,"s3://crabby-images/5576a/5576ab575488664af0a7f14efea273bc6bd0b068" alt=""
dplyr五个基础函数
1.新增列
# Add a column `new` holding the product of Sepal.Length and Sepal.Width.
test %>%
  mutate(new = Sepal.Length * Sepal.Width)
data:image/s3,"s3://crabby-images/83a37/83a372e67a593d099d6d1e5a7cdad507bb136f03" alt=""
2.筛选列
# Keep only the first column, selected by position.
test %>%
  select(1)
data:image/s3,"s3://crabby-images/5b748/5b7480b2e13f4711a4e99a296f4c3002aed19df0" alt=""
# Keep the second and third columns, selected by position.
test %>%
  select(2, 3)
data:image/s3,"s3://crabby-images/48d31/48d310c078eb95dec08f6b59f7b20b9b9f979bc4" alt=""
# Select a column by its name.
test %>%
  select(Sepal.Length)
data:image/s3,"s3://crabby-images/665d4/665d4efb5c245388d8e973ff00be0b97ce334600" alt=""
3.筛选行
# Keep only the rows whose Species is "setosa".
test %>%
  filter(Species == "setosa")
data:image/s3,"s3://crabby-images/3d21f/3d21f689390fe03847e43dc2c69305ac4ac3cd17" alt=""
# Keep rows that are "setosa" AND have Sepal.Length above 5; filter() combines
# comma-separated conditions with a logical AND.
filter(test, Species == "setosa", Sepal.Length > 5)
data:image/s3,"s3://crabby-images/65943/659439101fa661d76e53c7d8b782037c394d8595" alt=""
data:image/s3,"s3://crabby-images/f262d/f262dc24a438f20f542a6cc7531ee48def20b237" alt=""
# Keep rows whose Species is one of the listed values.
test %>%
  filter(Species %in% c("setosa", "versicolor"))
data:image/s3,"s3://crabby-images/30ec2/30ec22084f70ef06e1583b951c543b5dccac50ad" alt=""
4.排序
# Sort by Sepal.Length; arrange() orders from smallest to largest by default.
test %>%
  arrange(Sepal.Length)
data:image/s3,"s3://crabby-images/584d8/584d87132b2d5faeabd979bfd240451d7699a929" alt=""
# Sort by Sepal.Length from largest to smallest using desc().
test %>%
  arrange(desc(Sepal.Length))
data:image/s3,"s3://crabby-images/01e19/01e197ff04c9407985e34c8e76abf15403d31c95" alt=""
5.汇总
# Mean and standard deviation of Sepal.Length over all rows of `test`.
test %>%
  summarise(mean(Sepal.Length), sd(Sepal.Length))
# Show `test` grouped by Species (the data itself is unchanged; only grouping
# metadata is attached).
test %>%
  group_by(Species)
data:image/s3,"s3://crabby-images/28fc5/28fc50214858b8c089cdf681325fb74c217ceb95" alt=""
# Mean and standard deviation of Sepal.Length computed separately per Species.
test %>%
  group_by(Species) %>%
  summarise(mean(Sepal.Length), sd(Sepal.Length))
data:image/s3,"s3://crabby-images/efee6/efee66fe4575c49f906a556cf316c9647443ee5b" alt=""
dplyr两个实用技能
data:image/s3,"s3://crabby-images/d8f8e/d8f8e241b8aa7ca826ff5b69757afef54d83b31e" alt=""
dplyr处理关系数据
# Keep character columns as character (not factor) in data frames.
# FALSE is spelled out because `F` is an ordinary variable that can be
# reassigned, whereas FALSE is a reserved constant.
options(stringsAsFactors = FALSE)
# First example table for the join demos: key column `x` plus a label `z`.
test1 <- data.frame(
  x = c("b", "e", "f", "x"),
  z = c("A", "B", "C", "D"),
  stringsAsFactors = FALSE
)
test1
data:image/s3,"s3://crabby-images/ed3f0/ed3f017a5bcfbf0e3591e80ae809cdfd1f26557a" alt=""
# Second example table for the join demos: key column `x` plus a numeric `y`.
# FALSE is spelled out because `F` is an ordinary variable that can be
# reassigned, whereas FALSE is a reserved constant.
test2 <- data.frame(
  x = c("a", "b", "c", "d", "e", "f"),
  y = c(1, 2, 3, 4, 5, 6),
  stringsAsFactors = FALSE
)
test2
data:image/s3,"s3://crabby-images/adbe2/adbe27ecf55621e007db0154fab6319d62388ee4" alt=""
# Inner join: only rows whose `x` appears in both tables.
test1 %>%
  inner_join(test2, by = "x")
# Left join with test1 on the left: every test1 row is kept.
test1 %>%
  left_join(test2, by = "x")
# Left join with test2 on the left: every test2 row is kept.
test2 %>%
  left_join(test1, by = "x")
data:image/s3,"s3://crabby-images/4ff67/4ff6766ff1668e94a50d5650a2533c56e5ffd839" alt=""
data:image/s3,"s3://crabby-images/e86dd/e86dd9757bc954da3a25aa60334734502bc9b2cc" alt=""
data:image/s3,"s3://crabby-images/6a490/6a490cf6f10a026ed9abf00b9a96a399cdf74c79" alt=""
data:image/s3,"s3://crabby-images/cbb1d/cbb1d342f8d705637862b4a9129c20381fcefe9a" alt=""
data:image/s3,"s3://crabby-images/283c2/283c2db04955648259e680d8353dead8873785b8" alt=""