平均値のgeom_densityとshade confidence intervalにvlineを追加するR

異なる投稿を読み終えたら、hereのように濃度プロットに平均値のvlineを追加する方法を見つけました。上記のリンクに記載されているデータを使用してください：平均値のgeom_densityとshade confidence intervalにvlineを追加するR

1）geom_ribbonを使用して平均周りに95％信頼区間を追加するにはどうすればよいですか？シスつの曲線下の領域にVLINEを制限することができる方法

#computation of the standard error of the mean 
sem<-sd(x)/sqrt(length(x)) 
#95% confidence intervals of the mean 
c(mean(x)-2*sem,mean(x)+2*sem)

2）のように計算することができますか？下の図では、カーブの外にあるラインのプロットが表示されます。私の本当の問題に非常に近い

サンプル・データは、上記のリンクで、実際のデータを用いてhttps://www.dropbox.com/s/bvvfdpgekbjyjh0/test.csv?dl=0

UPDATE

で見つけることができ、私は、@ビートルートの答えを使用して、以下を試してみました。

# Find the mean of each group 
dat=me 
library(dplyr) 
library(plyr) 
cdat <- ddply(data,.(direction,cond), summarise, rating.mean=mean(rating,na.rm=T))# summarize by season and variable 
cdat 

#ggplot 
p=ggplot(data,aes(x = rating)) + 
    geom_density(aes(colour = cond),size=1.3,adjust=4)+ 
    facet_grid(.~direction, scales="free")+ 
    xlab(NULL) + ylab("Density") 
p=p+coord_cartesian(xlim = c(0, 130))+scale_color_manual(name="",values=c("blue","#00BA38","#F8766D"))+ 
    scale_fill_manual(values=c("blue", "#00BA38", "#F8766D"))+ 
    theme(legend.title = element_text(colour="black", size=15, face="plain"))+ 
    theme(legend.text = element_text(colour="black", size = 15, face = "plain"))+ 
    theme(title = red.bold.italic.text, axis.title = red.bold.italic.text)+ 
    theme(strip.text.x = element_text(size=20, color="black",face="plain"))+ # facet labels 
    ggtitle("SAMPLE A") +theme(plot.title = element_text(size = 20, face = "bold"))+ 
    theme(axis.text = blue.bold.italic.16.text)+ theme(legend.position = "none")+ 
    geom_vline(data=cdat, aes(xintercept=rating.mean, color=cond),linetype="dotted",size=1) 
p

## implementing @beetroot's code to restrict lines under the curve and shade CIs around the mean 
# I will use ddply for mean and CIs 
cdat <- ddply(data,.(direction,cond), summarise, rating.mean=mean(rating,na.rm=T), 
       sem = sd(rating,na.rm=T)/sqrt(length(rating)), 
       ci.low = mean(rating,na.rm=T) - 2*sem, 
       ci.upp = mean(rating,na.rm=T) + 2*sem)# summarize by direction and variable 


#In order to limit the lines to the outline of the curves you first need to find out which y values 
#of the curves correspond to the means, e.g. by accessing the density values with ggplot_build and 
#using approx: 

    cdat.dens <- ggplot_build(ggplot(data, aes(x=rating, colour=cond)) + 
           facet_grid(.~direction, scales="free")+ 
           geom_density(aes(colour = cond),size=1.3,adjust=4))$data[[1]] %>% 
    mutate(cond = ifelse(group==1, "A", 
         ifelse(group==2, "B","C"))) %>% 
    left_join(cdat) %>% 
    select(y, x, cond, rating.mean, sem, ci.low, ci.upp) %>% 
    group_by(cond) %>% 
    mutate(dens.mean = approx(x, y, xout = rating.mean)[[2]], 
     dens.cilow = approx(x, y, xout = ci.low)[[2]], 
     dens.ciupp = approx(x, y, xout = ci.upp)[[2]]) %>% 
    select(-y, -x) %>% 
    slice(1) 

cdat.dens 

#--- 
#You can then combine everything with various geom_segments: 

    ggplot(data, aes(x=rating, colour=cond)) + 
    geom_density(data = data, aes(x = rating, colour = cond),size=1.3,adjust=4) +facet_grid(.~direction, scales="free")+ 
    geom_segment(data = cdat.dens, aes(x = rating.mean, xend = rating.mean, y = 0, yend = dens.mean, colour = cond), 
       linetype = "dashed", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.low, xend = ci.low, y = 0, yend = dens.cilow, colour = cond), 
       linetype = "dotted", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.upp, xend = ci.upp, y = 0, yend = dens.ciupp, colour = cond), 
       linetype = "dotted", size = 1)

これを与える：

あなたは平均値とのCIは、元のプロットのように整列されていないわかります。 @beetrootを正しくしないのは何ですか？そのような

出典

2017-02-01 code123

私はgeom_rectを使用します。 yminとymaxを+/- Infに設定してください –

曲線に限定するには、密度をあらかじめ計算しておく必要があります。 – Axeman

また、http://stackoverflow.com/questions/12429333/how-to-shade-a-region-under-a-curve-using-ggplot2 – Axeman

リンクからのデータを使用して、平均値を計算することができ、それ自体とCI（私はdplyr、plyrの後継者を使用することをお勧め）：

set.seed(1234) 
dat <- data.frame(cond = factor(rep(c("A","B"), each=200)), 
        rating = c(rnorm(200),rnorm(200, mean=.8))) 

library(ggplot2) 
library(dplyr) 
cdat <- dat %>% 
    group_by(cond) %>% 
    summarise(rating.mean = mean(rating), 
      sem = sd(rating)/sqrt(length(rating)), 
      ci.low = mean(rating) - 2*sem, 
      ci.upp = mean(rating) + 2*sem)

アウトラインに行を制限するために曲線のどのy値が平均値に対応しているかを最初に調べる必要がある曲線の例Axemanはあなたがベースポリゴンを作成することができます指摘したように

ggplot() + 
    geom_density(data = dat, aes(x = rating, colour = cond)) + 
    geom_segment(data = cdat.dens, aes(x = rating.mean, xend = rating.mean, y = 0, yend = dens.mean, colour = cond), 
      linetype = "dashed", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.low, xend = ci.low, y = 0, yend = dens.cilow, colour = cond), 
      linetype = "dotted", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.upp, xend = ci.upp, y = 0, yend = dens.ciupp, colour = cond), 
       linetype = "dotted", size = 1)

：ggplot_buildと密度値にアクセスしapproxを使用することにより：

cdat.dens <- ggplot_build(ggplot(dat, aes(x=rating, colour=cond)) + geom_density())$data[[1]] %>% 
    mutate(cond = ifelse(group == 1, "A", "B")) %>% 
    left_join(cdat) %>% 
    select(y, x, cond, rating.mean, sem, ci.low, ci.upp) %>% 
    group_by(cond) %>% 
    mutate(dens.mean = approx(x, y, xout = rating.mean)[[2]], 
     dens.cilow = approx(x, y, xout = ci.low)[[2]], 
     dens.ciupp = approx(x, y, xout = ci.upp)[[2]]) %>% 
    select(-y, -x) %>% 
    slice(1) 

> cdat.dens 
Source: local data frame [2 x 8] 
Groups: cond [2] 

    cond rating.mean  sem  ci.low  ci.upp dens.mean dens.cilow dens.ciupp 
    <chr>  <dbl>  <dbl>  <dbl>  <dbl>  <dbl>  <dbl>  <dbl> 
1  A -0.05775928 0.07217200 -0.2021033 0.08658471 0.3865929 0.403623 0.3643583 
2  B 0.87324927 0.07120697 0.7308353 1.01566320 0.3979347 0.381683 0.4096153

あなたはその後、様々なgeom_segment秒ですべてを組み合わせることができますthis answerで説明されているように、リボン領域にあります。

だからあなたのデータのためにあなたがそうのような追加の行サブセットと追加することができます。

ribbon <- ggplot_build(ggplot(dat, aes(x=rating, colour=cond)) + geom_density())$data[[1]] %>% 
    mutate(cond = ifelse(group == 1, "A", "B")) %>% 
    left_join(cdat.dens) %>% 
    group_by(cond) %>% 
    filter(x >= ci.low & x <= ci.upp) %>% 
    select(cond, x, y) 

ribbon <- rbind(data.frame(cond = c("A", "B"), x = c(-0.2021033, 0.7308353), y = c(0, 0)), 
       as.data.frame(ribbon), 
       data.frame(cond = c("A", "B"), x = c(0.08658471, 1.01566320), y = c(0, 0)))

、プロットにgeom_polygonを追加する：

ggplot() + 
    geom_polygon(data = ribbon, aes(x = x, y = y, fill = cond), alpha = .5) + 
    geom_density(data = dat, aes(x = rating, colour = cond)) + 
    geom_segment(data = cdat.dens, aes(x = rating.mean, xend = rating.mean, y = 0, yend = dens.mean, colour = cond), 
      linetype = "dashed", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.low, xend = ci.low, y = 0, yend = dens.cilow, colour = cond), 
      linetype = "dotted", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.upp, xend = ci.upp, y = 0, yend = dens.ciupp, colour = cond), 
       linetype = "dotted", size = 1)

ここです実際のデータに適合したコードです。これは、1つの代わりに2つのグループを組み込むことがちょうど少しトリッキーです：

cdat <- dat %>% 
    group_by(direction, cond) %>% 
    summarise(rating.mean = mean(rating, na.rm = TRUE), 
      sem = sd(rating, na.rm = TRUE)/sqrt(length(rating)), 
      ci.low = mean(rating, na.rm = TRUE) - 2*sem, 
      ci.upp = mean(rating, na.rm = TRUE) + 2*sem) 

cdat.dens <- ggplot_build(ggplot(dat, aes(x=rating, colour=interaction(direction, cond))) + geom_density())$data[[1]] %>% 
    mutate(cond = ifelse((group == 1 | group == 2 | group == 3 | group == 4), "A", 
         ifelse((group == 5 | group == 6 | group == 7 | group == 8), "B", "C")), 
     direction = ifelse((group == 1 | group == 5 | group == 9), "EAST", 
          ifelse((group == 2 | group == 6 | group == 10), "NORTH", 
            ifelse((group == 3 | group == 7 | group == 11), "SOUTH", "WEST")))) %>% 
    left_join(cdat) %>% 
    select(y, x, cond, direction, rating.mean, sem, ci.low, ci.upp) %>% 
    group_by(cond, direction) %>% 
    mutate(dens.mean = approx(x, y, xout = rating.mean)[[2]], 
     dens.cilow = approx(x, y, xout = ci.low)[[2]], 
     dens.ciupp = approx(x, y, xout = ci.upp)[[2]]) %>% 
    select(-y, -x) %>% 
    slice(1) 

ggplot() + 
    geom_density(data = dat, aes(x = rating, colour = cond)) + 
    geom_segment(data = cdat.dens, aes(x = rating.mean, xend = rating.mean, y = 0, yend = dens.mean, colour = cond), 
       linetype = "dashed", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.low, xend = ci.low, y = 0, yend = dens.cilow, colour = cond), 
       linetype = "dotted", size = 1) + 
    geom_segment(data = cdat.dens, aes(x = ci.upp, xend = ci.upp, y = 0, yend = dens.ciupp, colour = cond), 
       linetype = "dotted", size = 1) + 
    facet_wrap(~direction)

出典

2017-02-01 08:45:14 beetroot

よろしくお願いします。これはすばらしく見える。私は自分のデータでそれを試し、あなたに知らせます。再度、感謝します。 – code123

私はあなたが上記で提供したデータにあなたのコードを使用できますか？私の実際のデータには、「A」、「B」、「C」、および「東」、「西」、「南」、「北」という追加の変数「方向」があります。究極の目的は、私が間違いなく行うことができる 'facet_grid（。〜direction、scales =" free "）を使って濃度を表示することです。私はさらに多くのグループを持っていますが、上のリンクの新しく提供されたデータ 'test.csv'へのあなたの答えは私を始めなければなりません。ありがとう。 – code123

あなたの質問の中にあなたのデータの 'dput（）'を入れて、あなたが何をしたのかを示して、あなたの答えから抜け出した箇所を説明してください。 – beetroot

平均値のgeom_densityとshade confidence intervalにvlineを追加するR

答えて

関連する問題