<!DOCTYPE html> <html xmlns="http://www.w3.org/1999/xhtml"> <head> <meta charset="utf-8" /> <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> <meta name="generator" content="pandoc" /> <meta name="author" content="Yuxin Zou" /> <title>Mash Missing Whole Row</title> <script src="site_libs/jquery-1.11.3/jquery.min.js"></script> <meta name="viewport" content="width=device-width, initial-scale=1" /> <link href="site_libs/bootstrap-3.3.5/css/cosmo.min.css" rel="stylesheet" /> <script src="site_libs/bootstrap-3.3.5/js/bootstrap.min.js"></script> <script src="site_libs/bootstrap-3.3.5/shim/html5shiv.min.js"></script> <script src="site_libs/bootstrap-3.3.5/shim/respond.min.js"></script> <script src="site_libs/jqueryui-1.11.4/jquery-ui.min.js"></script> <link href="site_libs/tocify-1.9.1/jquery.tocify.css" rel="stylesheet" /> <script src="site_libs/tocify-1.9.1/jquery.tocify.js"></script> <script src="site_libs/navigation-1.1/tabsets.js"></script> <script src="site_libs/navigation-1.1/codefolding.js"></script> <link href="site_libs/highlightjs-9.12.0/textmate.css" rel="stylesheet" /> <script src="site_libs/highlightjs-9.12.0/highlight.js"></script> <link href="site_libs/font-awesome-4.5.0/css/font-awesome.min.css" rel="stylesheet" /> <style type="text/css">code{white-space: pre;}</style> <style type="text/css"> pre:not([class]) { background-color: white; } </style> <script type="text/javascript"> if (window.hljs) { hljs.configure({languages: []}); hljs.initHighlightingOnLoad(); if (document.readyState && document.readyState === "complete") { window.setTimeout(function() { hljs.initHighlighting(); }, 0); } } </script> <style type="text/css"> h1 { font-size: 34px; } h1.title { font-size: 38px; } h2 { font-size: 30px; } h3 { font-size: 24px; } h4 { font-size: 18px; } h5 { font-size: 16px; } h6 { font-size: 12px; } .table th:not([align]) { text-align: left; } </style> </head> <body> <style type = "text/css"> .main-container { max-width: 940px; margin-left: auto; margin-right: auto; } code { color: inherit; background-color: rgba(0, 0, 0, 0.04); } img { max-width:100%; height: auto; } .tabbed-pane { padding-top: 12px; } button.code-folding-btn:focus { outline: none; } </style> <style type="text/css"> /* padding for bootstrap navbar */ body { padding-top: 51px; padding-bottom: 40px; } /* offset scroll position for anchor links (for fixed navbar) */ .section h1 { padding-top: 56px; margin-top: -56px; } .section h2 { padding-top: 56px; margin-top: -56px; } .section h3 { padding-top: 56px; margin-top: -56px; } .section h4 { padding-top: 56px; margin-top: -56px; } .section h5 { padding-top: 56px; margin-top: -56px; } .section h6 { padding-top: 56px; margin-top: -56px; } </style> <script> // manage active state of menu based on current page $(document).ready(function () { // active menu anchor href = window.location.pathname href = href.substr(href.lastIndexOf('/') + 1) if (href === "") href = "index.html"; var menuAnchor = $('a[href="' + href + '"]'); // mark it active menuAnchor.parent().addClass('active'); // if it's got a parent navbar menu mark it active as well menuAnchor.closest('li.dropdown').addClass('active'); }); </script> <div class="container-fluid main-container"> <!-- tabsets --> <script> $(document).ready(function () { window.buildTabsets("TOC"); }); </script> <!-- code folding --> <style type="text/css"> .code-folding-btn { margin-bottom: 4px; } </style> <script> $(document).ready(function () { window.initializeCodeFolding("hide" === "show"); }); </script> <script> $(document).ready(function () { // move toc-ignore selectors from section div to header $('div.section.toc-ignore') .removeClass('toc-ignore') .children('h1,h2,h3,h4,h5').addClass('toc-ignore'); // establish options var options = { selectors: "h1,h2,h3", theme: "bootstrap3", context: '.toc-content', hashGenerator: function (text) { return text.replace(/[.\\/?&!#<>]/g, '').replace(/\s/g, '_').toLowerCase(); }, ignoreSelector: ".toc-ignore", scrollTo: 0 }; options.showAndHide = true; options.smoothScroll = true; // tocify var toc = $("#TOC").tocify(options).data("toc-tocify"); }); </script> <style type="text/css"> #TOC { margin: 25px 0px 20px 0px; } @media (max-width: 768px) { #TOC { position: relative; width: 100%; } } .toc-content { padding-left: 30px; padding-right: 40px; } div.main-container { max-width: 1200px; } div.tocify { width: 20%; max-width: 260px; max-height: 85%; } @media (min-width: 768px) and (max-width: 991px) { div.tocify { width: 25%; } } @media (max-width: 767px) { div.tocify { width: 100%; max-width: none; } } .tocify ul, .tocify li { line-height: 20px; } .tocify-subheader .tocify-item { font-size: 0.90em; padding-left: 25px; text-indent: 0; } .tocify .list-group-item { border-radius: 0px; } </style> <!-- setup 3col/9col grid for toc_float and main content --> <div class="row-fluid"> <div class="col-xs-12 col-sm-4 col-md-3"> <div id="TOC" class="tocify"> </div> </div> <div class="toc-content col-xs-12 col-sm-8 col-md-9"> <div class="navbar navbar-default navbar-fixed-top" role="navigation"> <div class="container"> <div class="navbar-header"> <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar"> <span class="icon-bar"></span> <span class="icon-bar"></span> <span class="icon-bar"></span> </button> <a class="navbar-brand" href="index.html">mash_application</a> </div> <div id="navbar" class="navbar-collapse collapse"> <ul class="nav navbar-nav"> <li> <a href="index.html">Home</a> </li> <li> <a href="about.html">About</a> </li> <li> <a href="license.html">License</a> </li> </ul> <ul class="nav navbar-nav navbar-right"> <li> <a href="https://github.com/jdblischak/workflowr"> <span class="fa fa-github"></span> </a> </li> </ul> </div><!--/.nav-collapse --> </div><!--/.container --> </div><!--/.navbar --> <!-- Add a small amount of space between sections. --> <style type="text/css"> div.section { padding-top: 12px; } </style> <div class="fluid-row" id="header"> <div class="btn-group pull-right"> <button type="button" class="btn btn-default btn-xs dropdown-toggle" data-toggle="dropdown" aria-haspopup="true" aria-expanded="false"><span>Code</span> <span class="caret"></span></button> <ul class="dropdown-menu" style="min-width: 50px;"> <li><a id="rmd-show-all-code" href="#">Show All Code</a></li> <li><a id="rmd-hide-all-code" href="#">Hide All Code</a></li> </ul> </div> <h1 class="title toc-ignore">Mash Missing Whole Row</h1> <h4 class="author"><em>Yuxin Zou</em></h4> <h4 class="date"><em>2018-2-28</em></h4> </div> <!-- Update knitr chunk options --> <!-- Insert the date the file was last updated --> <p><strong>Last updated:</strong> 2018-03-06</p> <!-- Insert the code version (Git commit SHA1) if Git repository exists and R package git2r is installed --> <p><strong>Code version:</strong> 193208d</p> <div id="r5" class="section level1"> <h1>R=5</h1> <pre class="r"><code>library(mashr)</code></pre> <pre><code>Loading required package: ashr</code></pre> <pre class="r"><code>set.seed(2018) data = simple_sims(500, err_sd = 0.1) data.miss = data # select missing rows missing.row = sample(1:nrow(data$Bhat), nrow(data$Bhat)/4) missing.ind = matrix(0, nrow = nrow(data$B), ncol=ncol(data$B)) missing.ind[missing.row,] = 1 # set missing rows to NA missing = which(missing.ind == 1) data.miss$Bhat[missing] = NA data.miss$Shat[missing] = NA missing1 = is.na(data.miss$Bhat[,1]) # set the missing value with large standard deviation data.large.dev = data.miss data.large.dev$Bhat[is.na(data.miss$Bhat)] = 0 data.large.dev$Shat[is.na(data.miss$Shat)] = 1000</code></pre> <div id="ee-model" class="section level2"> <h2>EE model</h2> <pre class="r"><code># with missing values mash.data.missing = mash_set_data(Bhat=data.large.dev$Bhat, Shat=data.large.dev$Shat) U.c = cov_canonical(mash.data.missing) mash.model.missing = mash(mash.data.missing, U.c, verbose = FALSE) # delete missing values data.miss.na = data.miss data.miss.na$Bhat = na.omit(data.miss$Bhat) data.miss.na$Shat = na.omit(data.miss$Shat) mash.data.missing.na = mash_set_data(Bhat=data.miss.na$Bhat, Shat= data.miss.na$Shat) U.c = cov_canonical(mash.data.missing.na) mash.model.missing.na = mash(mash.data.missing.na, U.c, verbose=FALSE)</code></pre> <pre><code>Warning in REBayes::KWDual(A, rep(1, k), normalize(w), control = control): estimated mixing distribution has some negative values: consider reducing rtol</code></pre> <pre><code>Warning in mixIP(matrix_lik = structure(c(1, 0.204132576568413, 0.736530341806702, : Optimization step yields mixture weights that are either too small, or negative; weights have been corrected and renormalized after the optimization.</code></pre> <pre class="r"><code>par(mfrow=c(1,2)) barplot(get_estimated_pi(mash.model.missing), las=2, cex.names = 0.7, main='with missing values') barplot(get_estimated_pi(mash.model.missing.na), las=2, cex.names = 0.7, main = 'delete missing values')</code></pre> <p><img src="figure/mash_missing_whole_row.Rmd/unnamed-chunk-4-1.png" width="672" style="display: block; margin: auto;" /></p> <pre class="r"><code>par(mfrow=c(1,1))</code></pre> </div> <div id="ez-model" class="section level2"> <h2>EZ model</h2> <pre class="r"><code># with missing values mash.data.missing.1 = mash_set_data(Bhat=data.large.dev$Bhat, Shat=data.large.dev$Shat, alpha = 1) U.c = cov_canonical(mash.data.missing.1) mash.model.missing.1 = mash(mash.data.missing.1, U.c, verbose = FALSE)</code></pre> <pre><code>FIXME: 'compute_posterior_matrices' in Rcpp does not transfer EZ to EE</code></pre> <pre class="r"><code># delete missing values mash.data.missing.na.1 = mash_set_data(Bhat=data.miss.na$Bhat, Shat= data.miss.na$Shat, alpha = 1) U.c = cov_canonical(mash.data.missing.na.1) mash.model.missing.na.1 = mash(mash.data.missing.na.1, U.c, verbose=FALSE)</code></pre> <pre><code>Warning in REBayes::KWDual(A, rep(1, k), normalize(w), control = control): estimated mixing distribution has some negative values: consider reducing rtol</code></pre> <pre><code>Warning in mixIP(matrix_lik = structure(c(1, 0.204132576568412, 0.736530341806701, : Optimization step yields mixture weights that are either too small, or negative; weights have been corrected and renormalized after the optimization.</code></pre> <pre><code>FIXME: 'compute_posterior_matrices' in Rcpp does not transfer EZ to EE</code></pre> <pre class="r"><code>par(mfrow=c(1,2)) barplot(get_estimated_pi(mash.model.missing.1), las=2, cex.names = 0.7, main='with missing values') barplot(get_estimated_pi(mash.model.missing.na.1), las=2, cex.names = 0.7, main='delete missing values')</code></pre> <p><img src="figure/mash_missing_whole_row.Rmd/unnamed-chunk-6-1.png" width="672" style="display: block; margin: auto;" /></p> <pre class="r"><code>par(mfrow=c(1,1))</code></pre> </div> </div> <div id="r60" class="section level1"> <h1>R=60</h1> <pre class="r"><code>set.seed(2018) data = simple_sims(500, ncond = 60, err_sd = 0.1) data.miss = data missing.row = sample(1:nrow(data$Bhat), nrow(data$Bhat)/4) missing.ind = matrix(0, nrow = nrow(data$B), ncol=ncol(data$B)) missing.ind[missing.row,] = 1 missing = which(missing.ind == 1) data.miss$Bhat[missing] = NA data.miss$Shat[missing] = NA missing1 = is.na(data.miss$Bhat[,1]) # Set the missing value with large standard deviation data.large.dev = data.miss data.large.dev$Bhat[is.na(data.miss$Bhat)] = 0 data.large.dev$Shat[is.na(data.miss$Shat)] = 1000</code></pre> <div id="ee-model-1" class="section level2"> <h2>EE model</h2> <div id="with-missing-values" class="section level3"> <h3>With missing values</h3> <pre class="r"><code>mash.data.missing = mash_set_data(Bhat=data.large.dev$Bhat, Shat=data.large.dev$Shat) U.c = cov_canonical(mash.data.missing) mash.model.missing = mash(mash.data.missing, U.c, verbose = FALSE) barplot(get_estimated_pi(mash.model.missing), las=2, cex.names = 0.7)</code></pre> <p><img src="figure/mash_missing_whole_row.Rmd/unnamed-chunk-8-1.png" width="672" style="display: block; margin: auto;" /> The weights learned from the data are correct.</p> </div> <div id="delete-missing-values" class="section level3"> <h3>Delete missing values</h3> <pre class="r"><code>data.miss.na = data.miss data.miss.na$Bhat = na.omit(data.miss$Bhat) data.miss.na$Shat = na.omit(data.miss$Shat) mash.data.missing.na = mash_set_data(Bhat=data.miss.na$Bhat, Shat= data.miss.na$Shat) U.c = cov_canonical(mash.data.missing.na) mash.model.missing.na = mash(mash.data.missing.na, U.c, verbose=FALSE)</code></pre> <pre><code>Warning in REBayes::KWDual(A, rep(1, k), normalize(w), control = control): estimated mixing distribution has some negative values: consider reducing rtol</code></pre> <pre><code>Warning in mixIP(matrix_lik = structure(c(0.240920767436896, 0.337563330121546, : Optimization step yields mixture weights that are either too small, or negative; weights have been corrected and renormalized after the optimization.</code></pre> <pre class="r"><code>barplot(get_estimated_pi(mash.model.missing.na), las=2, cex.names = 0.7)</code></pre> <p><img src="figure/mash_missing_whole_row.Rmd/unnamed-chunk-9-1.png" width="672" style="display: block; margin: auto;" /> The estimated weights are very weird and incorrect. It ignores the null matrix.</p> </div> </div> <div id="ez-model-1" class="section level2"> <h2>EZ model</h2> <div id="with-missing-values-1" class="section level3"> <h3>With missing values</h3> <pre class="r"><code>mash.data.missing.1 = mash_set_data(Bhat=data.large.dev$Bhat, Shat=data.large.dev$Shat, alpha = 1) U.c = cov_canonical(mash.data.missing.1) mash.model.missing.1 = mash(mash.data.missing.1, U.c, verbose = FALSE)</code></pre> <pre><code>Warning in REBayes::KWDual(A, rep(1, k), normalize(w), control = control): estimated mixing distribution has some negative values: consider reducing rtol</code></pre> <pre><code>Warning in mixIP(matrix_lik = structure(c(0.240920767436896, 0.33756333012155, : Optimization step yields mixture weights that are either too small, or negative; weights have been corrected and renormalized after the optimization.</code></pre> <pre><code>FIXME: 'compute_posterior_matrices' in Rcpp does not transfer EZ to EE</code></pre> <pre class="r"><code>barplot(get_estimated_pi(mash.model.missing.1), las=2, cex.names = 0.7)</code></pre> <p><img src="figure/mash_missing_whole_row.Rmd/unnamed-chunk-10-1.png" width="672" style="display: block; margin: auto;" /></p> </div> <div id="delete-missing-values-1" class="section level3"> <h3>Delete missing values</h3> <pre class="r"><code>mash.data.missing.na.1 = mash_set_data(Bhat=data.miss.na$Bhat, Shat= data.miss.na$Shat, alpha = 1) U.c = cov_canonical(mash.data.missing.na.1) mash.model.missing.na.1 = mash(mash.data.missing.na.1, U.c, verbose=FALSE)</code></pre> <pre><code>Warning in REBayes::KWDual(A, rep(1, k), normalize(w), control = control): estimated mixing distribution has some negative values: consider reducing rtol</code></pre> <pre><code>Warning in mixIP(matrix_lik = structure(c(0.240920767436896, 0.33756333012155, : Optimization step yields mixture weights that are either too small, or negative; weights have been corrected and renormalized after the optimization.</code></pre> <pre><code>FIXME: 'compute_posterior_matrices' in Rcpp does not transfer EZ to EE</code></pre> <pre class="r"><code>barplot(get_estimated_pi(mash.model.missing.na.1), las=2, cex.names = 0.7)</code></pre> <p><img src="figure/mash_missing_whole_row.Rmd/unnamed-chunk-11-1.png" width="672" style="display: block; margin: auto;" /> The estimated weights are different.</p> </div> </div> </div> <div id="subgroups" class="section level1"> <h1>Subgroups</h1> <p>The weired covariance structure is caused by the high dimension of R.</p> <p>If we separate conditions into several groups, the covariance structure will be correct.</p> <p>We show this for the EZ model R=60.</p> <pre class="r"><code>mash.data.missing.1.sub1 = mash_set_data(Bhat=data.large.dev$Bhat[,1:20], Shat=data.large.dev$Shat[,1:20], alpha = 1) U.c = cov_canonical(mash.data.missing.1.sub1) mash.model.missing.1.sub1 = mash(mash.data.missing.1.sub1, U.c, verbose = FALSE)</code></pre> <pre><code>FIXME: 'compute_posterior_matrices' in Rcpp does not transfer EZ to EE</code></pre> <pre class="r"><code>mash.data.missing.1.sub2 = mash_set_data(Bhat=data.large.dev$Bhat[,21:40], Shat=data.large.dev$Shat[,21:40], alpha = 1) U.c = cov_canonical(mash.data.missing.1.sub2) mash.model.missing.1.sub2 = mash(mash.data.missing.1.sub2, U.c, verbose = FALSE)</code></pre> <pre><code>FIXME: 'compute_posterior_matrices' in Rcpp does not transfer EZ to EE</code></pre> <pre class="r"><code>mash.data.missing.1.sub3 = mash_set_data(Bhat=data.large.dev$Bhat[,41:60], Shat=data.large.dev$Shat[,41:60], alpha = 1) U.c = cov_canonical(mash.data.missing.1.sub3) mash.model.missing.1.sub3 = mash(mash.data.missing.1.sub3, U.c, verbose = FALSE)</code></pre> <pre><code>FIXME: 'compute_posterior_matrices' in Rcpp does not transfer EZ to EE</code></pre> <pre class="r"><code>par(mfcol=c(3,1)) barplot(get_estimated_pi(mash.model.missing.1.sub1), las=2, cex.names = 0.7, main='condition 1:20') barplot(get_estimated_pi(mash.model.missing.1.sub2), las=2, cex.names = 0.7, main='condition 21:40') barplot(get_estimated_pi(mash.model.missing.1.sub3), las=2, cex.names = 0.7, main='condition 41:60')</code></pre> <p><img src="figure/mash_missing_whole_row.Rmd/unnamed-chunk-12-1.png" width="672" style="display: block; margin: auto;" /></p> <pre class="r"><code>par(mfcol=c(1,1))</code></pre> </div> <div id="session-information" class="section level1"> <h1>Session information</h1> <!-- Insert the session information into the document --> <pre class="r"><code>sessionInfo()</code></pre> <pre><code>R version 3.4.3 (2017-11-30) Platform: x86_64-apple-darwin15.6.0 (64-bit) Running under: macOS High Sierra 10.13.3 Matrix products: default BLAS: /Library/Frameworks/R.framework/Versions/3.4/Resources/lib/libRblas.0.dylib LAPACK: /Library/Frameworks/R.framework/Versions/3.4/Resources/lib/libRlapack.dylib locale: [1] en_US.UTF-8/en_US.UTF-8/en_US.UTF-8/C/en_US.UTF-8/en_US.UTF-8 attached base packages: [1] stats graphics grDevices utils datasets methods base other attached packages: [1] mashr_0.2-6 ashr_2.2-7 loaded via a namespace (and not attached): [1] Rcpp_0.12.15 knitr_1.20 magrittr_1.5 [4] REBayes_1.2 MASS_7.3-47 doParallel_1.0.11 [7] pscl_1.5.2 SQUAREM_2017.10-1 lattice_0.20-35 [10] foreach_1.4.4 plyr_1.8.4 stringr_1.3.0 [13] tools_3.4.3 parallel_3.4.3 grid_3.4.3 [16] rmeta_2.16 git2r_0.20.0 htmltools_0.3.6 [19] iterators_1.0.9 assertthat_0.2.0 yaml_2.1.17 [22] rprojroot_1.2 digest_0.6.13 Matrix_1.2-12 [25] codetools_0.2-15 evaluate_0.10.1 rmarkdown_1.8 [28] stringi_1.1.6 compiler_3.4.3 Rmosek_8.0.69 [31] backports_1.1.2 mvtnorm_1.0-7 truncnorm_1.0-8 </code></pre> </div> <!-- Adjust MathJax settings so that all math formulae are shown using TeX fonts only; see http://docs.mathjax.org/en/latest/configuration.html. This will make the presentation more consistent at the cost of the webpage sometimes taking slightly longer to load. Note that this only works because the footer is added to webpages before the MathJax javascript. --> <script type="text/x-mathjax-config"> MathJax.Hub.Config({ "HTML-CSS": { availableFonts: ["TeX"] } }); </script> <hr> <p> This <a href="http://rmarkdown.rstudio.com">R Markdown</a> site was created with <a href="https://github.com/jdblischak/workflowr">workflowr</a> </p> <hr> <!-- To enable disqus, uncomment the section below and provide your disqus_shortname --> <!-- disqus <div id="disqus_thread"></div> <script type="text/javascript"> /* * * CONFIGURATION VARIABLES: EDIT BEFORE PASTING INTO YOUR WEBPAGE * * */ var disqus_shortname = 'rmarkdown'; // required: replace example with your forum shortname /* * * DON'T EDIT BELOW THIS LINE * * */ (function() { var dsq = document.createElement('script'); dsq.type = 'text/javascript'; dsq.async = true; dsq.src = '//' + disqus_shortname + '.disqus.com/embed.js'; (document.getElementsByTagName('head')[0] || document.getElementsByTagName('body')[0]).appendChild(dsq); })(); </script> <noscript>Please enable JavaScript to view the <a href="http://disqus.com/?ref_noscript">comments powered by Disqus.</a></noscript> <a href="http://disqus.com" class="dsq-brlink">comments powered by <span class="logo-disqus">Disqus</span></a> --> </div> </div> </div> <script> // add bootstrap table styles to pandoc tables function bootstrapStylePandocTables() { $('tr.header').parent('thead').parent('table').addClass('table table-condensed'); } $(document).ready(function () { bootstrapStylePandocTables(); }); </script> <!-- dynamically load mathjax for compatibility with self-contained --> <script> (function () { var script = document.createElement("script"); script.type = "text/javascript"; script.src = "https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML"; document.getElementsByTagName("head")[0].appendChild(script); })(); </script> </body> </html>