Data description

The female filial 1 generation of NZBxW mice was used for this study. Tissue from spleen, kidney, liver and lung cells were extracted, prepared and stained according to the guidelines for the use of flow cytometry and cell sorting in immunological studies. The data set can be downloaded from FlowRepository. Compensation, elimination of dublets and dead cells, gating to CD44+ T cells were pre-processed with simple two dimensional scatter plots in FlowJo.

Example analysis with PRI - Pattern Recognition with Immune cells

We chose two examples how to create the binplots with three and four marker combinations, respectively. Only the parameters in the beginning need to be adjusted.

Load libraries

We operated on R v3.2.4 Revised. Library ‘flowCore’ v1.36.9 was installed via BioConductor to read the fcs-files. Help and plot functions are accumulated in ‘YH_bintriploT_functions.R’.

rm(list = ls())
fcs = new.env()
library(flowCore)
source("/data/PRI manuscript/R/standalone/YH_binplot_functions.R")

Data import

The file “TL160721_OHiPU_S23_CD4.fcs” was used to create Figure 1e+f and has 334276 cells after preprocession. The file “export_SG20170627_4hP+I_011_CD44.fcs” was used to create Figure 6e and has 73639 cells after preprocession. Cells were transformed with inverse hyperbolic sine (asinh), which is a common transformation method for flow cytometry data [doi:10.1186/1471-2105-11-546]. Change the path according to your download folder.

path.folder = file.path("","data","PRI\ manuscript","R","fcs_examples")
file.tri = "TL160721_OHiPU_S23_CD4.fcs"
file.quad = "export_SG20170627_4hP+I_011_CD44.fcs"
####### data for bin plots with 3 parameters (example from Figure 1e+f)
# read the alias vs channel mapping from keyword() option
data.tri = read.FCS(file=file.path(path.folder,file.tri),which.lines=1)
keys.tri = keyword(data.tri)
aliases = unlist(keyword(data.tri, c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6S","$P7S","$P8S","$P9S","$P10S",
                                     "$P11S","$P12S","$P13S","$P14S","$P15S",
                                     "$P16S")))
channels = unlist(keyword(data.tri,c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6N","$P7N","$P8N","$P9N","$P10N",
                                     "$P11N","$P12N","$P13N","$P14N","$P15N",
                                     "$P16N")))
map.tri <- data.frame(alias = aliases, channels = channels)
# load data
exprs.tri= as.data.frame(exprs(read.FCS(file=file.path(path.folder,file.tri),
                    channel_alias = map.tri, transformation=NULL)))
# rename column names
for ( i in 1:ncol(exprs.tri)) {
  colnames(exprs.tri)[i] = strsplit(colnames(exprs.tri)[i]," ")[[1]][1]
}
# transform data with asinh()
exprs.tri= asinh(exprs.tri)
########################################
####### data for bin plots with 4 parameters (example from Figure 6e)
data.quad = read.FCS(file=file.path(path.folder,file.quad),which.lines=1)
keys.quad = keyword(data.quad)
aliases.quad = unlist(keyword(data.quad,c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6S","$P7S","$P8S","$P9S","$P10S",
                                     "$P11S","$P12S","$P13S")))
channels.quad = unlist(keyword(data.quad,c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6N","$P7N","$P8N","$P9N","$P10N",
                                     "$P11N","$P12N","$P13N")))
map.quad <- data.frame(alias = aliases.quad, channels = channels.quad)
# load data
exprs.quad= as.data.frame(exprs(read.FCS(file=file.path(path.folder,file.quad),
                    channel_alias = map.quad, transformation=NULL)))
# rename column names
for ( i in 1:ncol(exprs.quad)) {
  colnames(exprs.quad)[i] = strsplit(colnames(exprs.quad)[i]," ")[[1]][1]
}
colnames(exprs.quad)[5] = "IFN-g"
colnames(exprs.quad)[10] = "CXCR5"
# transform data with asinh()
exprs.quad= asinh(exprs.quad)
########################################

binplot with three parameters

The range of parameter X (TNF-a) and parameter Y (CD44) on x and y axis, respectively, are categorized into bins of size 0.2x0.2. With the cells in each bin, different statistical methods can be plotted into a color-coded manner. Here, cell density and mean fluorescence intensity of parameter Z (MFI) are displayed in pseudo-color. All parameters were included in the analysis and bins with less than 10 cells were excluded. This minimum count of cells was used to balance the impact of identifying comparatively rare subpopulations while retaining the statistical power. Examples are shown from Figure 1e.

### INITIATING PARAMETERS
featX = "TNFa"
featY = "CD44"
featZ1 = "IFNg"
cutoffs.man = c(6.6,9,5)
binSize = 0.2
### PLOTTING PARAMETERS FOR TWO PLOTS
par(mfrow = c(1,2),
    cex.lab = 1.4, cex.axis = 1.4,
    mgp = c(2.0, 0, 0),
    mar = c(2.4,2,2.5,0),
    oma = c(1,1,1,1))
### CALL PLOT FUNCTIONS
fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "density",
  binsize = binSize,
  cutoffs = cutoffs.man
)
fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "MFI",
  binsize = binSize,
  cutoffs = cutoffs.man
)

Binplot with three parameters and using cutoff of parameter Z

The use of the cutoff of parameter Z can result in an additional advantage. Frequency of parameter Z (IFN-g) producing cells (%) and mean fluorescence intensity of parameter Z producing cells (MFI+) can then be displayed. Examples are shown from Figure 1e+1f.

### INITIATING PARAMETERS
featX = "TNFa"
featY = "CD44"
featZ1 = "IFNg"
cutoffs.man = c(6.6,9,5)
binSize = 0.2
### PLOTTING PARAMETERS FOR TWO PLOTS
par(mfrow = c(1,2),
    cex.lab = 1.4, cex.axis = 1.4,
    mgp = c(2.0, 0, 0),
    mar = c(2.4,2,2.5,0),
    oma = c(1,1,1,1))
### CALL PLOT FUNCTIONS
  
fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "freq",
  binsize = binSize,
  cutoffs = cutoffs.man
)
fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "MFI+",
  binsize = binSize,
  cutoffs = cutoffs.man
)

Binplot with four parameters

Additionally, frequency of double producing cells (parameter Z1 and Z2) are introduced in green scales. Examples are shown from Figure 6e.

### INITIATING PARAMETERS
featX = "PD1"
featY = "IFNg"
featZ1 = "CXCR5"
featZ2 = "Bcl6"
cutoffs.man = c(6.982,7.479,7.783,7.346)
binSize = 0.2
### plotting options
maxfreq = 80
### PLOTTING PARAMETERS FOR TWO PLOTS
par(mfrow = c(1,2),
    cex.lab = 1.4, cex.axis = 1.4,
    mgp = c(2.0, 0, 0),
    mar = c(2,2,2,0),
    oma = c(2,2,2,1))
### PLOT BIN CONSTRUCT
fcs$binplot_construct(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  binsize = binSize,
  plot.range = c(3,11,3,11)
)
### PLOT HEATMAP
fcs$binplot_freq_doublepos(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  feat.Z1 = featZ1,
  feat.Z2 = featZ2,
  cutoffs = cutoffs.man,
  maxfreq = maxfreq,
  binsize = binSize,
  plot.range = c(3,11,3,11)
)
############## PLOT #2
### INITIATING PARAMETERS
featX = "PD1"
featY = "IFNg"
featZ1 = "IL21"
featZ2 = "Bcl6"
cutoffs.man = c(6.982,7.479,7.696,7.346)
binSize = 0.2
### plotting options
maxfreq = 50
### PLOT BIN CONSTRUCT
fcs$binplot_construct(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  binsize = binSize,
  plot.range = c(3,11,3,11)
)
### PLOT HEATMAP
fcs$binplot_freq_doublepos(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  feat.Z1 = featZ1,
  feat.Z2 = featZ2,
  cutoffs = cutoffs.man,
  binsize = binSize,
  maxfreq = maxfreq,
  plot.range = c(3,11,3,11)
)

In regards to 3D-surface plots, frequency bin tables are provided and exported from PRI and created with package ‘plotly’ v4.7.1. Examples are shown from Figure 6g.

library(plotly)
featX = "PD1"
featY = "IFNg"
featZ1 = "Bcl6"
cutoffs.man = c(6.982,7.479,7.346)
binSize = 0.2
binplot.table.Z1 = fcs$binplot_table(
  data = exprs.quad, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "freq",
  binsize = binSize,
  cutoffs = cutoffs.man,
  plotting = FALSE
)
featZ2 = "IL21"
cutoffs.man = c(6.982,7.479,7.696)
binplot.table.Z2 = fcs$binplot_table(
  data = exprs.quad, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ2, 
  calc = "freq",
  binsize = binSize,
  cutoffs = cutoffs.man,
  plotting = FALSE
)
x=seq(2,12,by=0.2)
y=seq(2,12,by=0.2)
scene = list(xaxis=list(title= "PD-1"),
    yaxis=list(title="IFN-g"),
    zaxis=list(title="freq",range=c(0,85)),
    cameraposition=list(c(-0.1, 0.4, -1, 0.33), c(0.0, 0, 0.0), 2)
)
### UNCOMMENT TO PLOT
### Figure with Bcl6
# plot_ly(showscale = TRUE) %>% add_surface(x=x,y=y,z=t(binplot.table.Z1), cmin=0, cmax=82,colors="Greens",reversescale=F) %>% layout(scene=scene)
### Figure with IL21 
# plot_ly(showscale = TRUE) %>% add_surface(x=x,y=y,z=t(binplot.table.Z2), cmin=0, cmax=82,colors="Greens",reversescale=F) %>% layout(scene=scene)
---
title: "Data analysis with PRI - Pattern Recognition with Immune cells"
author: "Yen Hoang"
date: "22 July 2019"
output: html_notebook
---

```{r setup, include=FALSE}
knitr::opts_chunk$set(echo = TRUE)
```


## Data description

The female filial 1 generation of NZBxW mice was used for this study. Tissue from spleen, kidney, liver and lung cells were extracted, prepared and stained according to the guidelines for the use of flow cytometry and cell sorting in immunological studies. The data set can be downloaded from [FlowRepository](http://flowrepository.org). Compensation, elimination of dublets and dead cells, gating to CD44+ T cells were pre-processed with simple two dimensional scatter plots in  [FlowJo](http://flowjo.com).

## Example analysis with PRI - Pattern Recognition with Immune cells
We chose two examples how to create the binplots with three and four marker combinations, respectively. Only the parameters in the beginning need to be adjusted.

### Load libraries
We operated on [R v3.2.4 Revised](http://www.r-project.org). Library 'flowCore' v1.36.9 was installed via [BioConductor](https://www.bioconductor.org/) to read the fcs-files. Help and plot functions are accumulated in 'YH_bintriploT_functions.R'. 
```{r load functions}
rm(list = ls())
fcs = new.env()
library(flowCore)
source("/data/PRI manuscript/R/standalone/YH_binplot_functions.R")
```


### Data import
The file "TL160721_OHiPU_S23_CD4.fcs" was used to create Figure 1e+f and has 334276 cells after preprocession. The file "export_SG20170627_4hP+I_011_CD44.fcs" was used to create Figure 6e and has 73639 cells after preprocession. Cells were transformed with inverse hyperbolic sine (asinh), which is a common transformation method for flow cytometry data [doi:10.1186/1471-2105-11-546]. Change the path according to your download folder. 
```{r data import1}
path.folder = file.path("","data","PRI\ manuscript","R","fcs_examples")

file.tri = "TL160721_OHiPU_S23_CD4.fcs"
file.quad = "export_SG20170627_4hP+I_011_CD44.fcs"

####### data for bin plots with 3 parameters (example from Figure 1e+f)
# read the alias vs channel mapping from keyword() option
data.tri = read.FCS(file=file.path(path.folder,file.tri),which.lines=1)
keys.tri = keyword(data.tri)
aliases = unlist(keyword(data.tri, c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6S","$P7S","$P8S","$P9S","$P10S",
                                     "$P11S","$P12S","$P13S","$P14S","$P15S",
                                     "$P16S")))
channels = unlist(keyword(data.tri,c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6N","$P7N","$P8N","$P9N","$P10N",
                                     "$P11N","$P12N","$P13N","$P14N","$P15N",
                                     "$P16N")))
map.tri <- data.frame(alias = aliases, channels = channels)

# load data
exprs.tri= as.data.frame(exprs(read.FCS(file=file.path(path.folder,file.tri),
                    channel_alias = map.tri, transformation=NULL)))
# rename column names
for ( i in 1:ncol(exprs.tri)) {
  colnames(exprs.tri)[i] = strsplit(colnames(exprs.tri)[i]," ")[[1]][1]
}
# transform data with asinh()
exprs.tri= asinh(exprs.tri)
########################################

####### data for bin plots with 4 parameters (example from Figure 6e)
data.quad = read.FCS(file=file.path(path.folder,file.quad),which.lines=1)
keys.quad = keyword(data.quad)
aliases.quad = unlist(keyword(data.quad,c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6S","$P7S","$P8S","$P9S","$P10S",
                                     "$P11S","$P12S","$P13S")))
channels.quad = unlist(keyword(data.quad,c("$P1N","$P2N","$P3N","$P4N","$P5N",
                                     "$P6N","$P7N","$P8N","$P9N","$P10N",
                                     "$P11N","$P12N","$P13N")))
map.quad <- data.frame(alias = aliases.quad, channels = channels.quad)

# load data
exprs.quad= as.data.frame(exprs(read.FCS(file=file.path(path.folder,file.quad),
                    channel_alias = map.quad, transformation=NULL)))
# rename column names
for ( i in 1:ncol(exprs.quad)) {
  colnames(exprs.quad)[i] = strsplit(colnames(exprs.quad)[i]," ")[[1]][1]
}
colnames(exprs.quad)[5] = "IFN-g"
colnames(exprs.quad)[10] = "CXCR5"
# transform data with asinh()
exprs.quad= asinh(exprs.quad)

########################################
```

### binplot with three parameters
The range of parameter X (TNF-a) and parameter Y (CD44) on x and y axis, respectively, are categorized into bins of size 0.2x0.2. With the cells in each bin, different statistical methods can be plotted into a color-coded manner. Here, cell density and mean fluorescence intensity of parameter Z (MFI) are displayed in pseudo-color. All parameters were included in the analysis and bins with less than 10 cells were excluded. This minimum count of cells was used to balance the impact of identifying comparatively rare subpopulations while retaining the statistical power. Examples are shown from Figure 1e.

```{r triplot1}
### INITIATING PARAMETERS
featX = "TNFa"
featY = "CD44"
featZ1 = "IFNg"
cutoffs.man = c(6.6,9,5)
binSize = 0.2

### PLOTTING PARAMETERS FOR TWO PLOTS
par(mfrow = c(1,2),
    cex.lab = 1.4, cex.axis = 1.4,
    mgp = c(2.0, 0, 0),
    mar = c(2.4,2,2.5,0),
    oma = c(1,1,1,1))

### CALL PLOT FUNCTIONS
fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "density",
  binsize = binSize,
  cutoffs = cutoffs.man
)

fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "MFI",
  binsize = binSize,
  cutoffs = cutoffs.man
)
```

### Binplot with three parameters and using cutoff of parameter Z
The use of the cutoff of parameter Z can result in an additional advantage. Frequency of parameter Z (IFN-g) producing cells (%) and mean fluorescence intensity of parameter Z producing cells (MFI+) can then be displayed.  Examples are shown from Figure 1e+1f.
```{r triplot2}
### INITIATING PARAMETERS
featX = "TNFa"
featY = "CD44"
featZ1 = "IFNg"
cutoffs.man = c(6.6,9,5)
binSize = 0.2

### PLOTTING PARAMETERS FOR TWO PLOTS
par(mfrow = c(1,2),
    cex.lab = 1.4, cex.axis = 1.4,
    mgp = c(2.0, 0, 0),
    mar = c(2.4,2,2.5,0),
    oma = c(1,1,1,1))
### CALL PLOT FUNCTIONS
  
fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "freq",
  binsize = binSize,
  cutoffs = cutoffs.man
)

fcs$binplot_table(
  data = exprs.tri, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "MFI+",
  binsize = binSize,
  cutoffs = cutoffs.man
)
```



### Binplot with four parameters
Additionally, frequency of double producing cells (parameter Z1 and Z2) are introduced in green scales. Examples are shown from Figure 6e.
```{r quadplot}
### INITIATING PARAMETERS
featX = "PD1"
featY = "IFNg"
featZ1 = "CXCR5"
featZ2 = "Bcl6"
cutoffs.man = c(6.982,7.479,7.783,7.346)
binSize = 0.2
### plotting options
maxfreq = 80

### PLOTTING PARAMETERS FOR TWO PLOTS
par(mfrow = c(1,2),
    cex.lab = 1.4, cex.axis = 1.4,
    mgp = c(2.0, 0, 0),
    mar = c(2,2,2,0),
    oma = c(2,2,2,1))

### PLOT BIN CONSTRUCT
fcs$binplot_construct(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  binsize = binSize,
  plot.range = c(3,11,3,11)
)

### PLOT HEATMAP
fcs$binplot_freq_doublepos(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  feat.Z1 = featZ1,
  feat.Z2 = featZ2,
  cutoffs = cutoffs.man,
  maxfreq = maxfreq,
  binsize = binSize,
  plot.range = c(3,11,3,11)
)

############## PLOT #2
### INITIATING PARAMETERS
featX = "PD1"
featY = "IFNg"
featZ1 = "IL21"
featZ2 = "Bcl6"
cutoffs.man = c(6.982,7.479,7.696,7.346)
binSize = 0.2
### plotting options
maxfreq = 50


### PLOT BIN CONSTRUCT
fcs$binplot_construct(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  binsize = binSize,
  plot.range = c(3,11,3,11)
)

### PLOT HEATMAP
fcs$binplot_freq_doublepos(
  data = exprs.quad,
  feat.X = featX,
  feat.Y = featY,
  feat.Z1 = featZ1,
  feat.Z2 = featZ2,
  cutoffs = cutoffs.man,
  binsize = binSize,
  maxfreq = maxfreq,
  plot.range = c(3,11,3,11)
)
```

In regards to 3D-surface plots, frequency bin tables are provided and exported from PRI and created with package 'plotly' v4.7.1. Examples are shown from Figure 6g.

```{r surface plots}
library(plotly)
featX = "PD1"
featY = "IFNg"
featZ1 = "Bcl6"
cutoffs.man = c(6.982,7.479,7.346)
binSize = 0.2

binplot.table.Z1 = fcs$binplot_table(
  data = exprs.quad, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ1, 
  calc = "freq",
  binsize = binSize,
  cutoffs = cutoffs.man,
  plotting = FALSE
)

featZ2 = "IL21"
cutoffs.man = c(6.982,7.479,7.696)

binplot.table.Z2 = fcs$binplot_table(
  data = exprs.quad, 
  feat.X = featX, 
  feat.Y = featY, 
  feat.Z1 = featZ2, 
  calc = "freq",
  binsize = binSize,
  cutoffs = cutoffs.man,
  plotting = FALSE
)


x=seq(2,12,by=0.2)
y=seq(2,12,by=0.2)
scene = list(xaxis=list(title= "PD-1"),
    yaxis=list(title="IFN-g"),
    zaxis=list(title="freq",range=c(0,85)),
    cameraposition=list(c(-0.1, 0.4, -1, 0.33), c(0.0, 0, 0.0), 2)
)
### UNCOMMENT TO PLOT
### Figure with Bcl6
# plot_ly(showscale = TRUE) %>% add_surface(x=x,y=y,z=t(binplot.table.Z1), cmin=0, cmax=82,colors="Greens",reversescale=F) %>% layout(scene=scene)
### Figure with IL21 
# plot_ly(showscale = TRUE) %>% add_surface(x=x,y=y,z=t(binplot.table.Z2), cmin=0, cmax=82,colors="Greens",reversescale=F) %>% layout(scene=scene)
```
