一、数据的输出 R中提供了write.table(),cat()等函数来导出数据。不过值得指出的是R语言能够导出的数据格式是有限的,比如在基本包中,我们能够导出数据的格式只有txt,csv。 现在介绍一下两个函数的用法: write.table(x, file = “”, append =FALSE, quote = TRUE, sep = ” “, eol = “\n”, na = “NA = c(“escape”, “double”), fileEncoding = “”) write.csv(…) write.csv2(…) write.csv(),write.csv2()可以看做write.table ()的变体,我们知道write.csv(),与参数sep=“,”的write.table()是等效的。 sep = ” “, fill = FALSE, labels = NULL, append = FALSE) cat()作为一个输出函数与dos命令差不多,也是将数据集或数据写入文件中,常用参数和write.table
, header=FALSE, sep=","); #指定分隔符 data3 <- read.csv("3.xxx", header=FALSE, sep="\t") 2、数据的导出 导出文本文件 write.table KEN', 'John'); cname <- c("小明", "小刚"); f <- data.frame(age, name, cname, stringsAsFactors = FALSE); write.table (f, file='f.csv', sep=',', fileEncoding = "UTF-8") #去除行号 write.table(f, file='f.csv', sep=',', fileEncoding = "UTF-8", row.names=FALSE) #去除列名 write.table(f, file='f.csv', sep=',', fileEncoding = "UTF-8", row.names =FALSE, col.names=FALSE) #去除引号 write.table(f, file='f.csv', sep=',', fileEncoding = "UTF-8",
sep="\t"表示以制表符作为分隔符读取文件 x <- readClipboard()#读取剪贴板的内容 二.写入文件 x <- read.table("input.txt",header = T) write.table (x,file="c:/users/lzp/Desktop/Rdata/newfile.txt") write.table (x,file=newfile.txt)#x为想要储存的对象,file为命名 write.table (x,file=newfile.csv,sep="\t") write.table (x,file=newfile.csv,sep="\t",row.names = FALSE ) #写入文件时去掉行名 write.table (x,file=newfile.csv,sep="\t",quote=FALSE,append=FALSE,na="NA")#quote=FALSE,表示字符串去掉引号 ;append=FALSE,当文件名相同时覆盖原文件 write.table (x,file=gzfile (newfile.csv.gz),sep="\t", quote=FALSE
/new_input.txt") # 写入文件> write.table(table_demo, ". /new_input.csv", sep = ",") # 写入文件,每一行的分隔符使用“,”> write.table(table_demo, ". /new_input.csv", sep = ",", row.names = F) # 写入文件时不要R添加序号> write.table(table_demo, ". /new_input.txt", quote = F) # 写入文件时,去掉每一个变量的引号> write.table(table_demo, ". # 写入的时候NA值用其他代替> write.table(mtcars, gzfile("mtcars.txt.gz")) # 写入文件直接压缩读写R格式文件> saveRDS(iris, ".
如下所示,是我以前的代码; dim(dat) expFile='expFile.txt' write.table(dat,file = expFile,sep = '\t',quote = F) groupFiles ='groupFiles.txt' head(groupinfo) write.table(groupinfo,file = groupFiles,sep = '\t',quote = F,col.names = F,row.names = F) head(geneInfor) geneFile='geneFile.txt' write.table(geneInfor,file = geneFile,sep 提供的中国区chatGPT的查询方式: 求助了chatGPT 我采纳了它的第一个建议,然后试着对比一下: # 代码段1 start_time1 <- Sys.time() # Your code here write.table
= TRUE) realdata1$groups_n<-as.numeric(realdata1$groups) ####建模数据 tab <- summary(modeldata$groups) write.table (tab, "clipboard", sep = "\t") t1 <- summary(modeldata$groups)/dim(modeldata)[1] write.table(t1, "clipboard (tab, "clipboard", sep = "\t") # 每组占比 更新至excel t2 <- summary(realdata1$groups)/dim(realdata1)[1] write.table ##### 观测PSI大于0.2的变量##### xx<-tapply(Data$未结清贷款笔数, substr(aa$申请日期,1,7),mean, na.rm = TRUE) write.table (tab, "clipboard", sep = "\t") # 拒绝原因2 tab <- summary(subData$RJ_reason2) write.table(tab, "clipboard
数据文件 2 read.csv() #读取.csv格式的数据,read.table的一种特定应用 3 excel数据文件读取 4 scan #比read.table更加灵活 5 保存为.Rdata 6 write.table () #常用导出数据函数 write.table(x, file = "", append = FALSE, quote = TRUE, sep = " ", eol = "\ (f, file ="f.csv") #以逗号分隔数据列,含行号(默认),含列名(默认),字符串带引号 > write.table (f,file ="f.csv", sep =",") ,不含行号,不含列名,字符串不带引号 > write.table (f,file ="f.csv", row.names = FALSE, col.names =FALSE, quote =FALSE ) 7 CSV格式导出 #write.table的一种特定应用 通过函数write.csv()保存为一个.csv文件 write.csv() #保存为一个.csv文件 > x <- c(1:3)
/tidydata") write.table(GSE100910_new, ". hspc),2)] rownames(gse112438_hspc) <- ids_gse112438_hspc gse112438_hspc[is.na(gse112438_hspc)] = 0 write.table _lymphocytes) <- ids_gse112438_lymphocytes gse112438_lymphocytes[is.na(gse112438_lymphocytes)] = 0 write.table _eosinophils) <- ids_gse112438_eosinophils gse112438_eosinophils[is.na(gse112438_eosinophils)] = 0 write.table gse112438_monocytes) <- ids_gse112438_monocytes gse112438_monocytes[is.na(gse112438_monocytes)] = 0 write.table
rod.csv",row.names = 1) #报错rod = read.csv("rod.csv")#3.数据框导出 注意这里导出的write.csv(ex2,file = "example.csv") write.table (ex2,file = "example.txt")#补充base包中read.table()read.csv()read.delim()write.table()write.csv()readr包中library
read.table() #通常用于读取txt格式 4.将数据框导出,成为表格文件 *csv格式:write.csv() write.csv(test,file="example.csv") txt格式:write.table () write.table(test,file="example.txt") 5.R特有的数据保存格式:Rdata save()保存; load()加载 ex1<- read.table("ex1.txt
normal_expre <- exprs(eset.rma) probeid <- rownames(normal_expre) normal_expre <- cbind(probeid,normal_expre) write.table normal.expres.txt",header = T,sep = "\t") probe_expres <- merge(normal_expres,cancer_expres,by = "probeid") write.table geneidfactor) geneid <- rownames(gene_exp_matrix) gene_exp_matrix2 <- cbind(geneid,gene_exp_matrix) write.table [loc,2] genesymbol <- rownames(gene_exp_matrix) gene_exp_matrix3<-cbind(genesymbol,gene_exp_matrix) write.table lmFit(rt.design) fit2<- eBayes(fit) allDiff<- topTable(fit2,adjust = "fdr",coef = 2,number = 200000) write.table
id_dsct <- cbind(id,dsct = dsct$Pathways) 保存所有的metacyc数据库的pathway id及通路描述 write.table(id_dsct,file = pic_output <- read_tsv("feature-table.biom.tsv",col_names = T) metacyc_input <- pic_output$`OTU-ID` write.table F,sep ="\t") stamp_input <- merge(pic_output,id_dsct,all.x = T,by.x = "OTU-ID",by.y = "Pathways") write.table
FALSE, altHypothesis = "greaterAbs") countMatDiff = cbind(dataS, normDDS, res) head(countMatDiff) write.table , file="D_edgeR.txt", sep="\t", quote=F, col.names = NA) # DESeq2 out <- as.data.frame(comp1.deseq) write.table out[ which(out$p.value < 0.05), c("seqnames", "start", "end", "strand", "Fold")] write.table out[ which(out$p.value < 0.05), c("seqnames", "start", "end", "strand", "Fold")] write.table - annotatePeak(bed, tssRegion=c(-3000, 3000), TxDb=txdb, addFlankGeneInfo=TRUE, flankDistance=4000) write.table
test.txt",sep="\t") #指定分隔符,默认为"",多个分隔符相邻会自动识别为一个 #输出csv文件 write.csv(csv,file = "test.csv") #输出txt文件 write.table ) 保存变量可保存上次操作的各种数据,数据框、向量等,方便下次操作 读取变量前,最好清空当前的变量 文件读写-进阶 base read.table() read.csv() read.delim() write.table
image.png 开始正题 常用的文件读取命令read.table和read.csv 常用的文件存入命令write.table和write.csv 读文件前,文件格式(分隔符)、注释内容、行名、列名等需要了解 sep = '\t',fill=T,skip=66,header=T) ####dim(询问数据类型的维度) dim(d) dim(f) head(d) head(f) tail(d) tail(f) write.table
函数对列做处理,除以每列之和 result <- apply(b,2,function(x)x/(sum(x))*100) #检查每列之和是不是100% colSums(result) #数据导出 write.table b=a[-(1:2),] #每个元素除以每列之和 result=sweep(b,2,colSums(b),"/")*100 #检查每列之和是不是100% colSums(result) #保存结果 write.table
ordered_tags$table allDiff=allDiff[is.na(allDiff$FDR)==FALSE,] diff=allDiff newData=y$pseudo.counts # write.table diffSig, file="edger_diffSig.csv") # # diffUp = diff[(diff$FDR < padj & (diff$logFC>foldChange)),] # write.table edger_up.xls",sep="\t",quote=F) # diffDown = diff[(diff$FDR < padj & (diff$logFC<(-foldChange))),] # write.table
hang = 0.03, addGuide = TRUE, guideHang = 0.05) dev.off() write.table (merge$oldMEs,file="oldMEs.txt"); write.table(merge$newMEs,file="newMEs.txt"); image.png 第五步是表型和模块的相关性 = cor(MEs, bac_traits, use = "p"); moduleTraitPvalue = corPvalueStudent(moduleTraitCor, nSamples); write.table (moduleTraitCor,file="moduleTrait_correlation.txt"); write.table(moduleTraitPvalue,file="moduleTrait_pValue.txt
#查看合并后的字符串向量1和字符串向量2的交集 index=combine1 %in% combine2 #取出原始的数据框的交集数据 result1=df1[index,] #保存数据框交集的结果 write.table intersect函数 #加载dplyr包 library(dplyr) #直接利用dplyr包里面的intersect函数对数据框取交集 result2=intersect(df1,df2) #保存交集结果 write.table data.table) #将数据框转换成data.table格式,然后利用fintersect函数取交集 result3=fintersect(setDT(df1), setDT(df2)) #保存交集结果 write.table
导出数据为csv文件 #第一个参数是需要导出的数据名称 #第二个参数是导出后新文件的名称 #第三个参数是指文件的分隔符 #导出数据和导入数据的参数类似,只是所使用的函数不同 write.table(mydata 导出数据为tsv文件 write.table(mydata, "c:/mydata.tsv", sep="\t") 3. 导出数据为txt文件 write.table(mydata, "c:/mydata.txt") Tips: (1)使用?function()的形式查阅函数的帮助信息,比如?