# 数理统计
#####采集报告数据筛选######
library(tidyverse)
library(readxl)
# Import data ------------------------------------------------------------------
# Read the raw records from the Excel workbook; the relative path is resolved
# against the current working directory.
df <- read_excel(path = "YS_NEW.xls")
# Grouped summaries ------------------------------------------------------------

# Count the rows of `data` per street (`街道名称`) and per level of `var`, then
# spread the levels of `var` into columns so that each street is a single row.
#   data: data frame with a `街道名称` column and the column passed as `var`.
#   var:  unquoted name of the categorical column to cross-tabulate.
#   fill: value used for street/level combinations that have no rows. The
#         default NULL keeps pivot_wider()'s own default, which leaves them NA;
#         pass 0 to get explicit zero counts.
# Returns a tibble with `街道名称` plus one count column per level of `var`.
count_wide_by_street <- function(data, var, fill = NULL) {
  data %>%
    count(`街道名称`, {{ var }}) %>%
    pivot_wider(names_from = {{ var }}, values_from = "n", values_fill = fill)
}

# Total number of records. print() is explicit so the figure is also shown when
# the script is run through source(), which does not auto-print top-level values.
print(df %>% count())

# Number of records per street.
df0 <- df %>% count(`街道名称`)

# Street-by-category count tables, one per attribute column.
df1 <- count_wide_by_street(df, `租赁来源`)
df2 <- count_wide_by_street(df, `租赁类型`)
df3 <- count_wide_by_street(df, `月租金价格`)
df4 <- count_wide_by_street(df, `出租使用面积`)
df5 <- count_wide_by_street(df, `电梯配备`)
df6 <- count_wide_by_street(df, `装修程度`)

# Mean of `租金均价` per street. mean() is called without na.rm, so a street
# with any missing value in that column yields NA.
df7 <- df %>%
  group_by(`街道名称`) %>%
  summarize(租金均价 = mean(`租金均价`))
# Combine tables ---------------------------------------------------------------
# Merge the per-street tables into one wide table with one row per street.
# The join key is stated explicitly: without `by`, inner_join() joins on every
# column name the two tables share. A category label that appears in more than
# one pivoted table (for example an `NA` column produced by missing values)
# would then silently become an extra key and drop streets whose counts differ.
# With `by` fixed, such clashing columns are kept and told apart by the
# default .x / .y suffixes instead.
df_group <- df0 %>%
  inner_join(df1, by = "街道名称") %>%
  inner_join(df2, by = "街道名称") %>%
  inner_join(df3, by = "街道名称") %>%
  inner_join(df4, by = "街道名称") %>%
  inner_join(df5, by = "街道名称") %>%
  inner_join(df6, by = "街道名称") %>%
  inner_join(df7, by = "街道名称")
# Row ordering -----------------------------------------------------------------
# Streets listed in the desired row order.
x <- c(
  "珞南街道", "洪山街道", "关山街道", "卓刀泉街道", "狮子山街道",
  "梨园街道", "和平街道", "张家湾街道", "青菱街道"
)
# Position of each street, derived from `x` so the two vectors cannot drift
# apart when a street is added or removed. as.numeric() keeps `num` a double,
# matching the previous literal c(1, 2, ..., 9).
y <- as.numeric(seq_along(x))
df_num <- data.frame(num = y, 街道名称 = x)
# Joining from the lookup table puts the summary rows in the order of `x`,
# because the result follows the row order of the left table. Being an inner
# join, it also drops any street that is missing from either side. The key is
# given explicitly so no other shared column name can become a join key.
df_group2 <- df_num %>%
  inner_join(df_group, by = "街道名称")
# 按列排序--------------------------------------------------------------------
df_group3 <-select(df_group2,
`num`,`街道名