R语言学习-绘制热图初步

> txt <- "ID;Zygote;2_cell;4_cell;8_cell
+ Gene_1;1;2;3;4
+ Gene_2;6;5;4;5
+ Gene_3;0.6;0.5;0.4;0.4"
> txt
[1] "ID;Zygote;2_cell;4_cell;8_cell\nGene_1;1;2;3;4\nGene_2;6;5;4;5\nGene_3;0.6;0.5;0.4;0.4"
> data2 <- read.table(text = txt,sep = ";",header = T,row.names = 1)  ##还可以这样创建数据框呢
> data2  ##列名中以数字开头的列名都加上了X。所以要尽量避免命名时以数字开头。加上check.names = F 可取消加X。
       Zygote X2_cell X4_cell X8_cell
Gene_1    1.0     2.0     3.0     4.0
Gene_2    6.0     5.0     4.0     5.0
Gene_3    0.6     0.5     0.4     0.4
> data2 <- read.table(text = txt,sep = ";",header = T,row.names = 1,check.names = F)
> data2
       Zygote 2_cell 4_cell 8_cell
Gene_1    1.0    2.0    3.0    4.0
Gene_2    6.0    5.0    4.0    5.0
Gene_3    0.6    0.5    0.4    0.4

> txt <- "ID;Zygote;2_cell;4_cell;8_cell;  ##这里句尾不能有分号
+ + Gene_1;1;2;3;4
+ + Gene_2;6;5;4;5
+ + Gene_3;0.6;0.5;0.4;0.4"
> data3 <- read.table(text = txt,sep = ";",header = T,row.names = 1)
Error in scan(file = file, what = what, sep = sep, quote = quote, dec = dec,  : 
  line 1 did not have 6 elements

##开始创建数据框

#先用matrix()将vector转变为矩阵，在as.data.frame()
#ncol：指定列数
#byrow = T：先按行填充vector内容，我还以为有bycol，后面试了下，没有这个参数!_!
> data <- c(1:6,6:1,6:1,1:6,(6:1)/10,(1:6)/10,(1:6)/10,(6:1)/10,1:6,6:1,6:1,1:6,6:1,1:6,1:6,6:1)
> data <- as.data.frame(matrix(data,ncol = 12,byrow = T))
> data
   V1  V2  V3  V4  V5  V6  V7  V8  V9 V10 V11 V12
1 1.0 2.0 3.0 4.0 5.0 6.0 6.0 5.0 4.0 3.0 2.0 1.0
2 6.0 5.0 4.0 3.0 2.0 1.0 1.0 2.0 3.0 4.0 5.0 6.0
3 0.6 0.5 0.4 0.3 0.2 0.1 0.1 0.2 0.3 0.4 0.5 0.6
4 0.1 0.2 0.3 0.4 0.5 0.6 0.6 0.5 0.4 0.3 0.2 0.1
5 1.0 2.0 3.0 4.0 5.0 6.0 6.0 5.0 4.0 3.0 2.0 1.0
6 6.0 5.0 4.0 3.0 2.0 1.0 1.0 2.0 3.0 4.0 5.0 6.0
7 6.0 5.0 4.0 3.0 2.0 1.0 1.0 2.0 3.0 4.0 5.0 6.0
8 1.0 2.0 3.0 4.0 5.0 6.0 6.0 5.0 4.0 3.0 2.0 1.0
> data_bycol <- c(1:6,6:1,6:1,1:6,(6:1)/10,(1:6)/10,(1:6)/10,(6:1)/10,1:6,6:1,6:1,1:6,6:1,1:6,1:6,6:1)
> data <- as.data.frame(matrix(data_bycol,ncol = 12,bycol = T))
Error in matrix(data_bycol, ncol = 12, bycol = T) : 参数没有用(bycol = T)

#增加列名
#colnames()
> colnames(data) <- c("Zygote","2_cell","4_cell","8_cell","Morula","ICM","ESC","4 week PGC","7 week PGC","10 week PGC","17 week PGC","00cyte")
> data
  Zygote 2_cell 4_cell 8_cell Morula ICM ESC 4 week PGC 7 week PGC
1    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
2    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
3    0.6    0.5    0.4    0.3    0.2 0.1 0.1        0.2        0.3
4    0.1    0.2    0.3    0.4    0.5 0.6 0.6        0.5        0.4
5    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
6    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
7    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
8    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
  10 week PGC 17 week PGC 00cyte
1         3.0         2.0    1.0
2         4.0         5.0    6.0
3         0.4         0.5    0.6
4         0.3         0.2    0.1
5         3.0         2.0    1.0
6         4.0         5.0    6.0
7         4.0         5.0    6.0
8         3.0         2.0    1.0
#增加行名
#rownames()
> rownames(data) <- paste("Gene",1:8,sep = "_")
> data
       Zygote 2_cell 4_cell 8_cell Morula ICM ESC 4 week PGC 7 week PGC
Gene_1    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_2    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_3    0.6    0.5    0.4    0.3    0.2 0.1 0.1        0.2        0.3
Gene_4    0.1    0.2    0.3    0.4    0.5 0.6 0.6        0.5        0.4
Gene_5    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_6    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_7    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_8    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
       10 week PGC 17 week PGC 00cyte
Gene_1         3.0         2.0    1.0
Gene_2         4.0         5.0    6.0
Gene_3         0.4         0.5    0.6
Gene_4         0.3         0.2    0.1
Gene_5         3.0         2.0    1.0
Gene_6         4.0         5.0    6.0
Gene_7         4.0         5.0    6.0
Gene_8         3.0         2.0    1.0
> class(data)
[1] "data.frame"
###paste(a,b,c...,sep = " ")
###连接a b c...多个R对象，将其转变为字符串之后连起来

> paste(1:12, c("st", "nd", "rd", rep("th", 9)))
 [1] "1 st"  "2 nd"  "3 rd"  "4 th"  "5 th"  "6 th"  "7 th"  "8 th" 
 [9] "9 th"  "10 th" "11 th" "12 th"
> paste(1:12, c("st", "nd", "rd", rep("th", 9)),sep = "")
 [1] "1st"  "2nd"  "3rd"  "4th"  "5th"  "6th"  "7th"  "8th"  "9th"  "10th"
[11] "11th" "12th"
> paste0(1:12, c("st", "nd", "rd", rep("th", 9)))  ##看起来paste0()和paste(...,sep = "")是等价的
 [1] "1st"  "2nd"  "3rd"  "4th"  "5th"  "6th"  "7th"  "8th"  "9th"  "10th"
[11] "11th" "12th"
> paste(1:12, c("st", "nd", "rd", rep("th", 9)),13:24,sep = "")
 [1] "1st13"  "2nd14"  "3rd15"  "4th16"  "5th17"  "6th18"  "7th19" 
 [8] "8th20"  "9th21"  "10th22" "11th23" "12th24"

###转换数据格式

#先安装并加载所需R包

> install.packages(c("reshape2","ggplot2")) ##复习一下同时安装多个包
> library(reshape2)
> library(ggplot2)

#转换数据之前，给data加上一列，使之与行名一致。

> data$ID <- rownames(data)##直接$ID创建新列，然后通过rownames()或者data的行名，赋值给data。有没有其他方式？我这里想了想用cbind()应该怎么实现
> data
       Zygote 2_cell 4_cell 8_cell Morula ICM ESC 4 week PGC 7 week PGC
Gene_1    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_2    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_3    0.6    0.5    0.4    0.3    0.2 0.1 0.1        0.2        0.3
Gene_4    0.1    0.2    0.3    0.4    0.5 0.6 0.6        0.5        0.4
Gene_5    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_6    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_7    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_8    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
       10 week PGC 17 week PGC 00cyte     ID
Gene_1         3.0         2.0    1.0 Gene_1
Gene_2         4.0         5.0    6.0 Gene_2
Gene_3         0.4         0.5    0.6 Gene_3
Gene_4         0.3         0.2    0.1 Gene_4
Gene_5         3.0         2.0    1.0 Gene_5
Gene_6         4.0         5.0    6.0 Gene_6
Gene_7         4.0         5.0    6.0 Gene_7
Gene_8         3.0         2.0    1.0 Gene_8
> data2 <- cbind(data,rownames(data))##没想到直接把rownames(data)作为新列名了。。。所以下面新建了一个列名
> data2
       Zygote 2_cell 4_cell 8_cell Morula ICM ESC 4 week PGC 7 week PGC
Gene_1    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_2    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_3    0.6    0.5    0.4    0.3    0.2 0.1 0.1        0.2        0.3
Gene_4    0.1    0.2    0.3    0.4    0.5 0.6 0.6        0.5        0.4
Gene_5    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_6    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_7    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_8    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
       10 week PGC 17 week PGC 00cyte     ID rownames(data)
Gene_1         3.0         2.0    1.0 Gene_1         Gene_1
Gene_2         4.0         5.0    6.0 Gene_2         Gene_2
Gene_3         0.4         0.5    0.6 Gene_3         Gene_3
Gene_4         0.3         0.2    0.1 Gene_4         Gene_4
Gene_5         3.0         2.0    1.0 Gene_5         Gene_5
Gene_6         4.0         5.0    6.0 Gene_6         Gene_6
Gene_7         4.0         5.0    6.0 Gene_7         Gene_7
Gene_8         3.0         2.0    1.0 Gene_8         Gene_8
> data2 <- cbind(data,ID_2 = rownames(data)) ##bingo！
> data2
       Zygote 2_cell 4_cell 8_cell Morula ICM ESC 4 week PGC 7 week PGC
Gene_1    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_2    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_3    0.6    0.5    0.4    0.3    0.2 0.1 0.1        0.2        0.3
Gene_4    0.1    0.2    0.3    0.4    0.5 0.6 0.6        0.5        0.4
Gene_5    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
Gene_6    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_7    6.0    5.0    4.0    3.0    2.0 1.0 1.0        2.0        3.0
Gene_8    1.0    2.0    3.0    4.0    5.0 6.0 6.0        5.0        4.0
       10 week PGC 17 week PGC 00cyte     ID   ID_2
Gene_1         3.0         2.0    1.0 Gene_1 Gene_1
Gene_2         4.0         5.0    6.0 Gene_2 Gene_2
Gene_3         0.4         0.5    0.6 Gene_3 Gene_3
Gene_4         0.3         0.2    0.1 Gene_4 Gene_4
Gene_5         3.0         2.0    1.0 Gene_5 Gene_5
Gene_6         4.0         5.0    6.0 Gene_6 Gene_6
Gene_7         4.0         5.0    6.0 Gene_7 Gene_7
Gene_8         3.0         2.0    1.0 Gene_8 Gene_8

posted @ 2020-05-24 15:36 月光边境Eric 阅读(469) 评论(0) 编辑收藏举报

会员力量，点亮园子希望

刷新页面返回顶部

月光边境Eric

R语言学习-绘制热图初步

公告