title author date
N. Alcala

Code to produce Fig. 2D from Dayton et al. (Submitted)

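Load libraries (the code below relies on readxl for `read_xlsx`, the tidyverse for dplyr/stringr/ggplot2, and ggridges for `geom_density_ridges2`)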

Define colors

Colors for each experiment (organoid and parental tumor families), type, and grades:

# Colour for each experiment (organoid and parental tumor family), keyed by
# experiment name. Values are 8-digit hex strings; entries are listed in
# three runs by name prefix (LNET, LCNEC, SINET).
colors_org <- c(
  # LNET experiments
  LNET2   = "#aade87ff",
  LNET6   = "#5fd38dff",
  LNET13  = "#16502dff",
  LNET14  = "#6f917cff",
  LNET5   = "#e6a73cff",
  LNET10  = "#ff9955ff",
  LNET15  = "#ffd42aff",
  LNET16  = "#ff6600ff",
  LNET18  = "#d0742fff",
  LNET20  = "#f6e62bff",
  # LCNEC experiments
  LCNEC3  = "#ff8080ff",
  LCNEC4  = "#d35f5fff",
  LCNEC23 = "#ff5555ff",
  # SINET experiments
  SINET7  = "#2ad4ffff",
  SINET8  = "#80b3ffff",
  SINET9  = "#5f8dd3ff",
  SINET12 = "#5fbcd3ff",
  SINET21 = "#0066ffff",
  SINET22 = "#2c5aa0ff"
)

# Colour for each tumor type, keyed by type name (8-digit hex strings).
colors_types <- c(
  SI       = "#5bc2f0ff",
  Lung     = "#9b9972ff",
  Pancreas = "#8d5fd3ff"
)

# Colour for each grade, keyed by grade label (8-digit hex strings).
# "G1/G2" needs quoting because the slash is not valid in a bare name.
colors_grades <- c(
  G1      = "#58b873f9",
  G2      = "#ff9955ff",
  G3      = "#f0677dff",
  "G1/G2" = "#58c1f0ff"
)

Load data

Data is in TableS1.xlsx, second tab (see supplementary files from the paper)

# Read the expression table from the second sheet of TableS1.xlsx, skipping
# the first two rows. Column types are fixed explicitly: the second column
# is numeric and the other four are text.
expr_genes_KI67.tib <- read_xlsx(
  "TableS1.xlsx",
  sheet = 2,
  skip = 2,
  col_types = c("text", "numeric", "text", "text", "text")
)

Plot Figure 2D

Figure presenting the expression of MKI67 in organoids and reference tumors:

# Rows drawn as ridgelines: reference samples, excluding type SCLC and rows
# whose Grade is "NA" (filter() also drops rows where the comparison itself
# evaluates to NA).
reference_expr <- expr_genes_KI67.tib %>%
  filter(Experiment == "Reference", Type != "SCLC", Grade != "NA")

# Rows drawn as points: non-reference samples whose name ends in "p"
# followed by any run of digits/dots.
# NOTE(review): presumably these are the organoid passages -- confirm
# against Table S1.
organoid_expr <- expr_genes_KI67.tib %>%
  filter(Experiment != "Reference", str_detect(Sample, "p[0-9.]*$"))

# One density ridge per grade for the reference samples, with the
# non-reference samples overlaid as points on a log10 TPM axis.
ggplot(reference_expr, aes(y = Grade, x = Expression.TPM, fill = Grade)) +
  geom_density_ridges2(scale = 1.5, colour = NA) +
  # Each point is drawn twice: a larger white disc underneath a smaller
  # black one, which leaves a white halo around every black point.
  geom_point(
    data = organoid_expr,
    size = 4, shape = 16, colour = "white", fill = "black"
  ) +
  geom_point(
    data = organoid_expr,
    size = 2.7, shape = 16, colour = "black", fill = "black"
  ) +
  theme_classic() +
  labs(
    y = "Histopathological type",
    x = expression(italic(MKI67)~" Expression (TPM)")
  ) +
  # Dashed vertical guide at 1 TPM.
  geom_vline(xintercept = 1, linetype = "dashed") +
  # NOTE(review): the limits use the scale's default out-of-bounds handling,
  # which drops values outside [0.01, 200] instead of clamping them, even
  # though the first tick is labelled "≤0.01" -- confirm this is intended.
  scale_x_log10(
    breaks = c(0.01, 0.1, 1, 10, 100),
    limits = c(0.01, 200),
    labels = c("≤0.01", 0.1, 1, 10, 100)
  ) +
  # Grade palette at 50% opacity.
  scale_fill_manual(values = alpha(colors_grades, 0.5))

Compute a few stats

Compute mean expression levels per grade and tumor type, in organoids and reference samples: first over all samples, then restricted to samples whose name contains `p` followed by a digit

# Mean Expression.TPM for every (is-reference, Type, Grade) combination
# across all samples. The grouping and summary expressions are deliberately
# left unnamed so the printed column headers are the expressions themselves.
expr_genes_KI67.tib %>%
  group_by(Experiment == "Reference", Type, Grade) %>%
  summarise(mean(Expression.TPM))
## # A tibble: 10 × 4
## # Groups:   Experiment == "Reference", Type [7]
##    `Experiment == "Reference"` Type  Grade `mean(Expression.TPM)`
##    <lgl>                       <chr> <chr>                  <dbl>
##  1 FALSE                       LCNEC G3                     39.0 
##  2 FALSE                       LNET  G1                      1.15
##  3 FALSE                       LNET  G2                      5.51
##  4 FALSE                       SINET G1/G2                   1.02
##  5 TRUE                        LCNEC G3                     37.8 
##  6 TRUE                        LNET  G1                      1.10
##  7 TRUE                        LNET  G2                   4268.  
##  8 TRUE                        LNET  NA                      2.05
##  9 TRUE                        SCLC  G3                     71.4 
## 10 TRUE                        SINET G1/G2                   3.54
# Same per-group mean of Expression.TPM, but only over samples whose name
# contains "p" immediately followed by a digit.
expr_genes_KI67.tib %>%
  filter(str_detect(Sample, "p[0-9]")) %>%
  group_by(Experiment == "Reference", Type, Grade) %>%
  summarise(mean(Expression.TPM))
## # A tibble: 4 × 4
## # Groups:   Experiment == "Reference", Type [3]
##   `Experiment == "Reference"` Type  Grade `mean(Expression.TPM)`
##   <lgl>                       <chr> <chr>                  <dbl>
## 1 FALSE                       LCNEC G3                    38.8  
## 2 FALSE                       LNET  G1                     1.45 
## 3 FALSE                       LNET  G2                     4.28 
## 4 FALSE                       SINET G1/G2                  0.691

Session Info

