# 绘制数据集每一列的直方图，并添加核密度曲线
#install.packages("tidyr")
library(ggplot2)
library(tidyr)
# Reshape columns 2-13 of `data` into long form: one row per
# (column_name, value) pair, so each original column can get its own facet.
# pivot_longer() replaces the superseded gather().
# NOTE(review): the positional range 2:13 presumably skips a leading year
# column -- confirm against the actual layout of `data`.
dataset_long <- pivot_longer(
  data[2:13],
  cols = everything(),
  names_to = "column_name",
  values_to = "value"
)

# Base layer: histogram scaled to density (so it shares the y axis with the
# kernel density curve), split into one panel per column with free axes.
# after_stat(density) replaces the `..density..` notation, which is
# deprecated since ggplot2 3.4.0.
plot1 <- ggplot(dataset_long, aes(x = value)) +
  geom_histogram(
    aes(y = after_stat(density)),
    bins = 20,
    color = "black",
    fill = "white"
  ) +
  geom_density(color = "red") +
  labs(x = "Value", y = "Density") +
  ggtitle("核密度曲线图") +
  facet_wrap(~ column_name, scales = "free")

# Display the figure, then save it to disk.
# NOTE(review): the output path is absolute and machine-specific.
plot1
ggsave(
  "D:/Users/sf253/Desktop/研一上/R+python/R/数据探索性分析/各列直方图+核密度曲线.png",
  plot = plot1,
  dpi = 300,
  width = 10,
  height = 6
)
# 为每一列绘制时序图：每个子图的横坐标是年份，纵坐标是对应列的值
library(tidyr)
# Reshape `data` into long form, keeping the year column (年份) as the
# identifier: one row per (year, variable, value) triple.
# pivot_longer() replaces the superseded gather().
data_long <- pivot_longer(
  data,
  cols = -年份,
  names_to = "variable",
  values_to = "value"
)

# Print the reshaped data for a quick visual check. pivot_longer() returns a
# tibble, so this shows a truncated preview rather than every row.
data_long

# One line chart per variable: year on the x axis, the variable's value on
# the y axis, with independent axes per panel.
plot2 <- ggplot(data = data_long, aes(x = 年份, y = value)) +
  geom_line(color = "red") +
  facet_wrap(~ variable, scales = "free") +
  labs(x = "Year", y = "Value") +
  ggtitle("时序图") +
  # Show y-axis tick labels in scientific notation.
  scale_y_continuous(labels = scales::scientific_format())

# Display the figure, then save it to disk.
# NOTE(review): the output path is absolute and machine-specific.
plot2
ggsave(
  "D:/Users/sf253/Desktop/研一上/R+python/R/数据探索性分析/各列时序图.png",
  plot = plot2,
  dpi = 300,
  width = 10,
  height = 6
)
# Scatterplot matrix of every pair of columns in `data` (base graphics).
graphics::pairs(x = data, main = "Correlation Plot")