<!DOCTYPE html>

<html xmlns="http://www.w3.org/1999/xhtml">

<head>

<meta charset="utf-8" />
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<meta name="generator" content="pandoc" />


<meta name="author" content="Siming Zhao" />

<meta name="date" content="2018-12-02" />

<title>Differential expression analysis--EdgeR log likelihood ratio tests</title>

<script src="site_libs/jquery-1.11.3/jquery.min.js"></script>
<meta name="viewport" content="width=device-width, initial-scale=1" />
<link href="site_libs/bootstrap-3.3.5/css/cosmo.min.css" rel="stylesheet" />
<script src="site_libs/bootstrap-3.3.5/js/bootstrap.min.js"></script>
<script src="site_libs/bootstrap-3.3.5/shim/html5shiv.min.js"></script>
<script src="site_libs/bootstrap-3.3.5/shim/respond.min.js"></script>
<script src="site_libs/jqueryui-1.11.4/jquery-ui.min.js"></script>
<link href="site_libs/tocify-1.9.1/jquery.tocify.css" rel="stylesheet" />
<script src="site_libs/tocify-1.9.1/jquery.tocify.js"></script>
<script src="site_libs/navigation-1.1/tabsets.js"></script>
<link href="site_libs/highlightjs-9.12.0/textmate.css" rel="stylesheet" />
<script src="site_libs/highlightjs-9.12.0/highlight.js"></script>
<link href="site_libs/font-awesome-5.0.13/css/fa-svg-with-js.css" rel="stylesheet" />
<script src="site_libs/font-awesome-5.0.13/js/fontawesome-all.min.js"></script>
<script src="site_libs/font-awesome-5.0.13/js/fa-v4-shims.min.js"></script>

<style type="text/css">code{white-space: pre;}</style>
<style type="text/css">
  pre:not([class]) {
    background-color: white;
  }
</style>
<script type="text/javascript">
if (window.hljs) {
  hljs.configure({languages: []});
  hljs.initHighlightingOnLoad();
  if (document.readyState && document.readyState === "complete") {
    window.setTimeout(function() { hljs.initHighlighting(); }, 0);
  }
}
</script>



<style type="text/css">
h1 {
  font-size: 34px;
}
h1.title {
  font-size: 38px;
}
h2 {
  font-size: 30px;
}
h3 {
  font-size: 24px;
}
h4 {
  font-size: 18px;
}
h5 {
  font-size: 16px;
}
h6 {
  font-size: 12px;
}
.table th:not([align]) {
  text-align: left;
}
</style>


</head>

<body>

<style type = "text/css">
.main-container {
  max-width: 940px;
  margin-left: auto;
  margin-right: auto;
}
code {
  color: inherit;
  background-color: rgba(0, 0, 0, 0.04);
}
img {
  max-width:100%;
  height: auto;
}
.tabbed-pane {
  padding-top: 12px;
}
.html-widget {
  margin-bottom: 20px;
}
button.code-folding-btn:focus {
  outline: none;
}
</style>


<style type="text/css">
/* padding for bootstrap navbar */
body {
  padding-top: 51px;
  padding-bottom: 40px;
}
/* offset scroll position for anchor links (for fixed navbar)  */
.section h1 {
  padding-top: 56px;
  margin-top: -56px;
}

.section h2 {
  padding-top: 56px;
  margin-top: -56px;
}
.section h3 {
  padding-top: 56px;
  margin-top: -56px;
}
.section h4 {
  padding-top: 56px;
  margin-top: -56px;
}
.section h5 {
  padding-top: 56px;
  margin-top: -56px;
}
.section h6 {
  padding-top: 56px;
  margin-top: -56px;
}
</style>

<script>
// manage active state of menu based on current page
$(document).ready(function () {
  // active menu anchor
  href = window.location.pathname
  href = href.substr(href.lastIndexOf('/') + 1)
  if (href === "")
    href = "index.html";
  var menuAnchor = $('a[href="' + href + '"]');

  // mark it active
  menuAnchor.parent().addClass('active');

  // if it's got a parent navbar menu mark it active as well
  menuAnchor.closest('li.dropdown').addClass('active');
});
</script>


<div class="container-fluid main-container">

<!-- tabsets -->
<script>
$(document).ready(function () {
  window.buildTabsets("TOC");
});
</script>

<!-- code folding -->




<script>
$(document).ready(function ()  {

    // move toc-ignore selectors from section div to header
    $('div.section.toc-ignore')
        .removeClass('toc-ignore')
        .children('h1,h2,h3,h4,h5').addClass('toc-ignore');

    // establish options
    var options = {
      selectors: "h1,h2,h3",
      theme: "bootstrap3",
      context: '.toc-content',
      hashGenerator: function (text) {
        return text.replace(/[.\\/?&!#<>]/g, '').replace(/\s/g, '_').toLowerCase();
      },
      ignoreSelector: ".toc-ignore",
      scrollTo: 0
    };
    options.showAndHide = true;
    options.smoothScroll = true;

    // tocify
    var toc = $("#TOC").tocify(options).data("toc-tocify");
});
</script>

<style type="text/css">

#TOC {
  margin: 25px 0px 20px 0px;
}
@media (max-width: 768px) {
#TOC {
  position: relative;
  width: 100%;
}
}


.toc-content {
  padding-left: 30px;
  padding-right: 40px;
}

div.main-container {
  max-width: 1200px;
}

div.tocify {
  width: 20%;
  max-width: 260px;
  max-height: 85%;
}

@media (min-width: 768px) and (max-width: 991px) {
  div.tocify {
    width: 25%;
  }
}

@media (max-width: 767px) {
  div.tocify {
    width: 100%;
    max-width: none;
  }
}

.tocify ul, .tocify li {
  line-height: 20px;
}

.tocify-subheader .tocify-item {
  font-size: 0.90em;
  padding-left: 25px;
  text-indent: 0;
}

.tocify .list-group-item {
  border-radius: 0px;
}


</style>

<!-- setup 3col/9col grid for toc_float and main content  -->
<div class="row-fluid">
<div class="col-xs-12 col-sm-4 col-md-3">
<div id="TOC" class="tocify">
</div>
</div>

<div class="toc-content col-xs-12 col-sm-8 col-md-9">




<div class="navbar navbar-default  navbar-fixed-top" role="navigation">
  <div class="container">
    <div class="navbar-header">
      <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
        <span class="icon-bar"></span>
        <span class="icon-bar"></span>
        <span class="icon-bar"></span>
      </button>
      <a class="navbar-brand" href="index.html">cropseq</a>
    </div>
    <div id="navbar" class="navbar-collapse collapse">
      <ul class="nav navbar-nav">
        <li>
  <a href="index.html">Home</a>
</li>
<li>
  <a href="about.html">About</a>
</li>
<li>
  <a href="license.html">License</a>
</li>
      </ul>
      <ul class="nav navbar-nav navbar-right">
        <li>
  <a href="https://github.com/simingz/cropseq">
    <span class="fa fa-github"></span>
     
  </a>
</li>
      </ul>
    </div><!--/.nav-collapse -->
  </div><!--/.container -->
</div><!--/.navbar -->

<!-- Add a small amount of space between sections. -->
<style type="text/css">
div.section {
  padding-top: 12px;
}
</style>

<div class="fluid-row" id="header">



<h1 class="title toc-ignore">Differential expression analysis–EdgeR log likelihood ratio tests</h1>
<h4 class="author"><em>Siming Zhao</em></h4>
<h4 class="date"><em>December 2, 2018</em></h4>

</div>


<p><strong>Last updated:</strong> 2018-12-17</p>
<strong>workflowr checks:</strong> <small>(Click a bullet for more information)</small>
<ul>
<li>
<details>
<p><summary> <strong style="color:red;">✖</strong> <strong>R Markdown file:</strong> uncommitted changes </summary> The R Markdown is untracked by Git. To know which version of the R Markdown file created these results, you’ll want to first commit it to the Git repo. If you’re still working on the analysis, you can ignore this warning. When you’re finished, you can run <code>wflow_publish</code> to commit the R Markdown file and build the HTML.</p>
</details>
</li>
<li>
<details>
<p><summary> <strong style="color:blue;">✔</strong> <strong>Environment:</strong> empty </summary></p>
<p>Great job! The global environment was empty. Objects defined in the global environment can affect the analysis in your R Markdown file in unknown ways. For reproduciblity it’s best to always run the code in an empty environment.</p>
</details>
</li>
<li>
<details>
<p><summary> <strong style="color:blue;">✔</strong> <strong>Seed:</strong> <code>set.seed(20181119)</code> </summary></p>
<p>The command <code>set.seed(20181119)</code> was run prior to running the code in the R Markdown file. Setting a seed ensures that any results that rely on randomness, e.g. subsampling or permutations, are reproducible.</p>
</details>
</li>
<li>
<details>
<p><summary> <strong style="color:blue;">✔</strong> <strong>Session information:</strong> recorded </summary></p>
<p>Great job! Recording the operating system, R version, and package versions is critical for reproducibility.</p>
</details>
</li>
<li>
<details>
<p><summary> <strong style="color:blue;">✔</strong> <strong>Repository version:</strong> <a href="https://github.com/simingz/cropseq/tree/49ecf6e2cf5686b9d11690f78c565c7361d08d6e" target="_blank">49ecf6e</a> </summary></p>
Great! You are using Git for version control. Tracking code development and connecting the code version to the results is critical for reproducibility. The version displayed above was the version of the Git repository at the time these results were generated. <br><br> Note that you need to be careful to ensure that all relevant files for the analysis have been committed to Git prior to generating the results (you can use <code>wflow_publish</code> or <code>wflow_git_commit</code>). workflowr only checks the R Markdown file, but you know if there are other scripts or data files that it depends on. Below is the status of the Git repository when the results were generated:
<pre><code>
Ignored files:
    Ignored:    .Rhistory
    Ignored:    .Rproj.user/
    Ignored:    analysis/Quality_metrics_cache/
    Ignored:    analysis/figure/

Untracked files:
    Untracked:  analysis/EdgeR-LRT.Rmd
    Untracked:  docs/figure/DEseq2-LRT.Rmd/

Unstaged changes:
    Modified:   analysis/DEseq2-LRT.Rmd

</code></pre>
Note that any generated files, e.g. HTML, png, CSS, etc., are not included in this status report because it is ok for generated content to have uncommitted changes.
</details>
</li>
</ul>
<hr />
<p>Load data</p>
<pre class="r"><code>source(&quot;code/summary_functions.R&quot;)
library(dplyr)
load(&quot;data/DE_input.Rd&quot;)
glocus &lt;- &quot;VPS45&quot;
dim(dm)[1]</code></pre>
<pre><code>NULL</code></pre>
<pre class="r"><code>gcount &lt;- dm[1:(dim(dm)[1]-76), colnames(dm1dfagg)[dm1dfagg[glocus,] &gt;0 &amp; nlocus==1]]
# negative control cells defined as neg gRNA targeted cells
ncount &lt;- dm[1:(dim(dm)[1]-76), colnames(dm1dfagg)[dm1dfagg[&quot;neg&quot;,] &gt;0 &amp; nlocus==1]]
coldata &lt;- data.frame(row.names = c(colnames(gcount),colnames(ncount)),     
                      condition=c(rep(&#39;G&#39;,dim(gcount)[2]),rep(&#39;N&#39;,dim(ncount)[2])))
countall &lt;- cbind(gcount,ncount)
totalcount &lt;- apply(countall,1,sum)
cellpercent &lt;-  apply(countall,1,function(x) length(x[x&gt;0])/length(x))</code></pre>
<p>edgeR log likelihood ratio tests function</p>
<pre class="r"><code>library(edgeR)
run_edgeR &lt;- function(y) {
  # y is DGElist object
  y &lt;- calcNormFactors(y)
  group=coldata$condition
  design &lt;- model.matrix(~group)
  y &lt;- estimateDisp(y,design)

  fitlrt &lt;- glmFit(y,design)
  lrt &lt;- glmLRT(fitlrt,coef=2)
  summ_pvalues(lrt$table$PValue)
  out &lt;- topTags(lrt, n=Inf, adjust.method = &quot;BH&quot;)
  outsig &lt;- subset(out$table,FDR &lt;0.1)
  print(paste0(&quot;There are &quot;,dim(outsig)[1], &quot; genes passed FDR &lt;0.1 cutoff&quot;))
  print(knitr::kable(signif(as.matrix(head(out$table[order(out$table$PValue),])),digit=2)))
  return(out)
}</code></pre>
<div id="run-edgerno-filtering" class="section level2">
<h2>Run edgeR–No filtering</h2>
<pre class="r"><code>y &lt;- DGEList(counts= countall,group=coldata$condition)
res &lt;- run_edgeR(y)</code></pre>
<p><img src="figure/EdgeR-LRT.Rmd/edgeRall-1.png" width="672" style="display: block; margin: auto;" /></p>
<pre><code>[1] &quot;There are 0 genes passed FDR &lt;0.1 cutoff&quot;

                      logFC   logCPM   LR    PValue    FDR
-------------------  ------  -------  ---  --------  -----
ENSG00000175899.14    -1.50      6.9   20   8.5e-06   0.12
ENSG00000176956.12    -2.60      6.6   19   1.1e-05   0.12
ENSG00000100097.11    -2.20      6.6   19   1.2e-05   0.12
ENSG00000100300.17    -1.50      6.4   14   1.5e-04   0.97
ENSG00000119906.11     1.10      6.4   14   1.9e-04   0.97
ENSG00000185900.9     -0.79      6.3   14   2.2e-04   0.97</code></pre>
</div>
<div id="run-edgerat-least-one-cell-umi-0" class="section level2">
<h2>Run edgeR–at least one cell UMI &gt; 0</h2>
<pre class="r"><code>y &lt;- DGEList(counts= countall[totalcount&gt;0,],group=coldata$condition)
res &lt;- run_edgeR(y)</code></pre>
<p><img src="figure/EdgeR-LRT.Rmd/edgeR%3E0-1.png" width=“672” style=“display: block; margin: auto;” /&gt;</p>
<pre><code>[1] &quot;There are 3 genes passed FDR &lt;0.1 cutoff&quot;

                      logFC   logCPM   LR    PValue     FDR
-------------------  ------  -------  ---  --------  ------
ENSG00000175899.14    -1.50      6.9   20   8.5e-06   0.062
ENSG00000176956.12    -2.60      6.6   19   1.1e-05   0.062
ENSG00000100097.11    -2.20      6.6   19   1.2e-05   0.062
ENSG00000100300.17    -1.50      6.4   14   1.5e-04   0.510
ENSG00000119906.11     1.10      6.4   14   1.9e-04   0.510
ENSG00000185900.9     -0.79      6.3   14   2.2e-04   0.510</code></pre>
</div>
<div id="run-edger3-cells-with-umi-0" class="section level2">
<h2>Run edgeR–3% cells with UMI &gt; 0</h2>
<pre class="r"><code>y &lt;- DGEList(counts= countall[cellpercent &gt; 0.03,],group=coldata$condition)
res &lt;- run_edgeR(y)</code></pre>
<p><img src="figure/EdgeR-LRT.Rmd/edgeR0.03-1.png" width="672" style="display: block; margin: auto;" /></p>
<pre><code>[1] &quot;There are 3 genes passed FDR &lt;0.1 cutoff&quot;

                      logFC   logCPM   LR    PValue     FDR
-------------------  ------  -------  ---  --------  ------
ENSG00000176956.12    -2.70      6.6   21   4.1e-06   0.023
ENSG00000100097.11    -2.30      6.6   21   5.3e-06   0.023
ENSG00000175899.14    -1.50      6.9   21   5.9e-06   0.023
ENSG00000100300.17    -1.50      6.4   15   1.1e-04   0.340
ENSG00000219626.8     -1.00      6.5   14   2.0e-04   0.360
ENSG00000185900.9     -0.79      6.3   14   2.1e-04   0.360</code></pre>
</div>
<div id="run-edger10-cells-with-umi-0" class="section level2">
<h2>Run edgeR–10% cells with UMI &gt; 0</h2>
<pre class="r"><code>y &lt;- DGEList(counts= countall[cellpercent &gt; 0.1,],group=coldata$condition)
res &lt;- run_edgeR(y)</code></pre>
<p><img src="figure/EdgeR-LRT.Rmd/edgeR0.1-1.png" width="672" style="display: block; margin: auto;" /></p>
<pre><code>[1] &quot;There are 2 genes passed FDR &lt;0.1 cutoff&quot;

                      logFC   logCPM   LR    PValue    FDR
-------------------  ------  -------  ---  --------  -----
ENSG00000175899.14    -1.50      6.9   20   7.0e-06   0.04
ENSG00000100097.11    -2.20      6.6   20   8.4e-06   0.04
ENSG00000100300.17    -1.50      6.4   15   1.3e-04   0.42
ENSG00000119906.11     1.10      6.5   14   1.8e-04   0.44
ENSG00000219626.8     -0.98      6.5   14   2.3e-04   0.44
ENSG00000078061.12    -0.83      6.6   13   3.5e-04   0.46</code></pre>
</div>
<div id="run-edger20-cells-with-umi-0" class="section level2">
<h2>Run edgeR–20% cells with UMI &gt; 0</h2>
<pre class="r"><code>y &lt;- DGEList(counts= countall[cellpercent &gt; 0.2,],group=coldata$condition)
res &lt;- run_edgeR(y)</code></pre>
<p><img src="figure/EdgeR-LRT.Rmd/edgeR0.2-1.png" width="672" style="display: block; margin: auto;" /></p>
<pre><code>[1] &quot;There are 1 genes passed FDR &lt;0.1 cutoff&quot;

                      logFC   logCPM   LR    PValue     FDR
-------------------  ------  -------  ---  --------  ------
ENSG00000175899.14    -1.50      6.9   19   1.2e-05   0.093
ENSG00000119906.11     1.10      6.5   14   1.7e-04   0.490
ENSG00000219626.8     -0.99      6.5   14   2.2e-04   0.490
ENSG00000078061.12    -0.82      6.6   13   3.4e-04   0.490
ENSG00000131669.9      0.73      6.9   12   4.5e-04   0.490
ENSG00000141219.15     0.95      6.4   12   4.6e-04   0.490</code></pre>
</div>
<div id="parameters-used" class="section level2">
<h2>Parameters used</h2>
<ul>
<li>We used data processed after QC step <a href="Quality_metrics.html">here</a>.<br />
</li>
<li>targeted locus, choose VPS45.</li>
</ul>
</div>
<div id="session-information" class="section level2">
<h2>Session information</h2>
<pre class="r"><code>sessionInfo()</code></pre>
<pre><code>R version 3.5.1 (2018-07-02)
Platform: x86_64-apple-darwin14.5.0 (64-bit)
Running under: OS X El Capitan 10.11.6

Matrix products: default
BLAS: /System/Library/Frameworks/Accelerate.framework/Versions/A/Frameworks/vecLib.framework/Versions/A/libBLAS.dylib
LAPACK: /System/Library/Frameworks/Accelerate.framework/Versions/A/Frameworks/vecLib.framework/Versions/A/libLAPACK.dylib

locale:
[1] en_US.UTF-8/en_US.UTF-8/en_US.UTF-8/C/en_US.UTF-8/en_US.UTF-8

attached base packages:
[1] grid      stats     graphics  grDevices utils     datasets  methods  
[8] base     

other attached packages:
[1] gridExtra_2.3   lattice_0.20-35 edgeR_3.22.5    limma_3.36.5   
[5] Matrix_1.2-14   dplyr_0.7.6    

loaded via a namespace (and not attached):
 [1] Rcpp_1.0.0        compiler_3.5.1    pillar_1.3.0     
 [4] git2r_0.23.0      highr_0.7         workflowr_1.1.1  
 [7] bindr_0.1.1       R.methodsS3_1.7.1 R.utils_2.7.0    
[10] tools_3.5.1       digest_0.6.18     evaluate_0.12    
[13] tibble_1.4.2      gtable_0.2.0      pkgconfig_2.0.2  
[16] rlang_0.3.0.1     yaml_2.2.0        bindrcpp_0.2.2   
[19] stringr_1.3.1     knitr_1.20        locfit_1.5-9.1   
[22] rprojroot_1.3-2   tidyselect_0.2.4  glue_1.3.0       
[25] R6_2.3.0          rmarkdown_1.10    purrr_0.2.5      
[28] magrittr_1.5      whisker_0.3-2     backports_1.1.2  
[31] htmltools_0.3.6   splines_3.5.1     assertthat_0.2.0 
[34] stringi_1.2.4     crayon_1.3.4      R.oo_1.22.0      </code></pre>
</div>

<!-- Adjust MathJax settings so that all math formulae are shown using
TeX fonts only; see
http://docs.mathjax.org/en/latest/configuration.html.  This will make
the presentation more consistent at the cost of the webpage sometimes
taking slightly longer to load. Note that this only works because the
footer is added to webpages before the MathJax javascript. -->
<script type="text/x-mathjax-config">
  MathJax.Hub.Config({
    "HTML-CSS": { availableFonts: ["TeX"] }
  });
</script>

<hr>
<p>
  This reproducible <a href="http://rmarkdown.rstudio.com">R Markdown</a>
  analysis was created with
  <a href="https://github.com/jdblischak/workflowr">workflowr</a> 1.1.1
</p>
<hr>


</div>
</div>

</div>

<script>

// add bootstrap table styles to pandoc tables
function bootstrapStylePandocTables() {
  $('tr.header').parent('thead').parent('table').addClass('table table-condensed');
}
$(document).ready(function () {
  bootstrapStylePandocTables();
});


</script>

<!-- dynamically load mathjax for compatibility with self-contained -->
<script>
  (function () {
    var script = document.createElement("script");
    script.type = "text/javascript";
    script.src  = "https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML";
    document.getElementsByTagName("head")[0].appendChild(script);
  })();
</script>

</body>
</html>