Przeglądaj źródła

Convert to sub-figures! And add some more plots

Ryan C. Thompson 5 lat temu
rodzic
commit
bb2c13b0c5

BIN
graphics/CD4-csaw/ChIP-seq/H3K27me3-neighborhood-PCA.png


BIN
graphics/CD4-csaw/ChIP-seq/H3K27me3-neighborhood-clusters.png


BIN
graphics/CD4-csaw/ChIP-seq/H3K27me3-neighborhood-expression.png


BIN
graphics/CD4-csaw/IDR/D4659vsD5053_epic.pdf


BIN
graphics/CD4-csaw/IDR/D4659vsD5053_macs.pdf


+ 565 - 610
thesis.lyx

@@ -24,29 +24,11 @@
 \lfoot{}
 \cfoot{\thepage} % Page number bottom center
 
-% https://tex.stackexchange.com/questions/65680/automatically-bold-first-sentence-of-a-floats-caption
-\usepackage{xstring}
-\usepackage{etoolbox}
-\usepackage{caption}
-
-\captionsetup{labelfont=bf,tableposition=top}
-
-\makeatletter
-\newcommand\formatlabel[1]{%
-    \noexpandarg
-    \IfSubStr{#1}{.}{%
-      \StrBefore{#1}{.}[\firstcaption]%
-      \StrBehind{#1}{.}[\secondcaption]%
-      \textbf{\firstcaption.} \secondcaption}{%
-      #1}%
-      }
-
-
-\patchcmd{\@caption}{#3}{\formatlabel{#3}}
-\makeatother
-
 % Allow FloatBarrier command
 \usepackage{placeins}
+
+% This one breaks subfigs so it's disabled
+% https://tex.stackexchange.com/questions/65680/automatically-bold-first-sentence-of-a-floats-caption
 \end_preamble
 \use_default_options true
 \begin_modules
@@ -724,6 +706,13 @@ Maybe fix up the excessive axis ranges for these plots?
 \begin_layout Standard
 \begin_inset Float figure
 wide false
+sideways true
+status collapsed
+
+\begin_layout Plain Layout
+\align center
+\begin_inset Float figure
+wide false
 sideways false
 status collapsed
 
@@ -732,8 +721,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/rnaseq-compare/ensmebl-vs-entrez-star-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId rna-comp-subfig
 
 \end_inset
 
@@ -755,9 +744,10 @@ Comparison of STAR quantification between Ensembl and Entrez gene identifiers
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -768,8 +758,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/rnaseq-compare/ensmebl-vs-entrez-shoal-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId rna-comp-subfig
 
 \end_inset
 
@@ -792,9 +782,10 @@ Comparison of Salmon+Shoal quantification between Ensembl and Entrez gene
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -805,8 +796,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/rnaseq-compare/star-vs-hisat2-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId rna-comp-subfig
 
 \end_inset
 
@@ -830,7 +821,8 @@ Comparison of quantification between STAR and HISAT2 for identical annotation
 
 \end_layout
 
-\begin_layout Standard
+\begin_layout Plain Layout
+\align center
 \begin_inset Float figure
 wide false
 sideways false
@@ -841,8 +833,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/rnaseq-compare/star-vs-salmon-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId rna-comp-subfig
 
 \end_inset
 
@@ -864,9 +856,10 @@ Comparison of quantification between STAR and Salmon for identical annotation
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -877,8 +870,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/rnaseq-compare/salmon-vs-kallisto-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId rna-comp-subfig
 
 \end_inset
 
@@ -901,9 +894,10 @@ n
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -914,8 +908,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/rnaseq-compare/salmon-vs-shoal-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId rna-comp-subfig
 
 \end_inset
 
@@ -940,24 +934,22 @@ Comparison of quantification between Salmon with and without Shoal for identical
 
 \end_layout
 
-\begin_layout Itemize
-Ultimately selected shoal as quantification, Ensembl as annotation.
- Why? Running downstream analyses with all quant methods and both annotations
- showed very little practical difference, so choice was not terribly important.
- Prefer shoal due to theoretical advantages.
- To note in discussion: reproducible workflow made it easy to do this, enabling
- an informed decision.
-\end_layout
-
-\begin_layout Standard
-\begin_inset ERT
-status collapsed
+\begin_layout Plain Layout
+\begin_inset Caption Standard
 
 \begin_layout Plain Layout
+\begin_inset CommandInset label
+LatexCommand label
+name "fig:RNA-norm-comp"
+
+\end_inset
+
+RNA-seq comparisons
+\end_layout
+
+\end_inset
 
 
-\backslash
-FloatBarrier
 \end_layout
 
 \end_inset
@@ -965,6 +957,15 @@ FloatBarrier
 
 \end_layout
 
+\begin_layout Itemize
+Ultimately selected shoal as quantification, Ensembl as annotation.
+ Why? Running downstream analyses with all quant methods and both annotations
+ showed very little practical difference, so choice was not terribly important.
+ Prefer shoal due to theoretical advantages.
+ To note in discussion: reproducible workflow made it easy to do this, enabling
+ an informed decision.
+\end_layout
+
 \begin_layout Subsection
 RNA-seq has a large confounding batch effect
 \end_layout
@@ -1013,7 +1014,7 @@ name "fig:RNA-seq-weights-vs-covars"
 
 \end_inset
 
-RNA-seq sample weights, grouped by experimental and technical covariates
+RNA-seq sample weights, grouped by experimental and technical covariates.
 \end_layout
 
 \end_inset
@@ -1026,19 +1027,32 @@ RNA-seq sample weights, grouped by experimental and technical covariates
 
 \end_layout
 
+\begin_layout Itemize
+Batch 1 is garbage quality.
+ Analyses involving batch 1 samples are expected to yield poor statistical
+ power.
+\end_layout
+
 \begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
 status collapsed
 
+\begin_layout Plain Layout
+\align center
+\begin_inset Float figure
+wide false
+sideways false
+status collapsed
+
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
 	filename graphics/CD4-csaw/RNA-seq/PCA-no-batchsub-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 75col%
+	groupId rna-pca-subfig
 
 \end_inset
 
@@ -1057,7 +1071,7 @@ name "fig:RNA-PCA-no-batchsub"
 
 \end_inset
 
-RNA-seq PCoA plot showing clear batch effect
+Before batch correction
 \end_layout
 
 \end_inset
@@ -1070,32 +1084,20 @@ RNA-seq PCoA plot showing clear batch effect
 
 \end_layout
 
-\begin_layout Standard
+\begin_layout Plain Layout
+\align center
 \begin_inset Float figure
 wide false
 sideways false
 status collapsed
 
-\begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Probably don't need this
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/RNA-seq/PCA-naive-batchsub-CROP.png
+	filename graphics/CD4-csaw/RNA-seq/PCA-combat-batchsub-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 75col%
+	groupId rna-pca-subfig
 
 \end_inset
 
@@ -1110,16 +1112,11 @@ Probably don't need this
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:RNA-PCA-limma-batchsub"
-
-\end_inset
-
-RNA-seq PCoA plot showing clear batch effect
-\end_layout
+name "fig:RNA-PCA-ComBat-batchsub"
 
 \end_inset
 
-
+After batch correction with ComBat
 \end_layout
 
 \end_inset
@@ -1127,20 +1124,6 @@ RNA-seq PCoA plot showing clear batch effect
 
 \end_layout
 
-\begin_layout Standard
-\begin_inset Float figure
-wide false
-sideways false
-status collapsed
-
-\begin_layout Plain Layout
-\align center
-\begin_inset Graphics
-	filename graphics/CD4-csaw/RNA-seq/PCA-combat-batchsub-CROP.png
-	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
-
 \end_inset
 
 
@@ -1154,11 +1137,11 @@ status collapsed
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:RNA-PCA-ComBat-batchsub"
+name "fig:RNA-PCA"
 
 \end_inset
 
-RNA-seq PCoA plot showing clear batch effect
+PCoA plots of RNA-seq data showing effect of batch correction.
 \end_layout
 
 \end_inset
@@ -1176,46 +1159,22 @@ RNA-seq batch effect can be partially corrected, but still induces uncorrectable
  biases in downstream analysis
 \end_layout
 
-\begin_layout Standard
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Figures showing p-value histograms for within-batch and cross-batch contrasts,
- showing that cross-batch contrasts have attenuated signal, as do comparisons
- within the bad batch
-\end_layout
-
-\end_inset
-
-
+\begin_layout Subsection
+ChIP-seq blacklisting is important
 \end_layout
 
 \begin_layout Standard
-\begin_inset ERT
+\begin_inset Float figure
+wide false
+sideways false
 status collapsed
 
 \begin_layout Plain Layout
-
-
-\backslash
-FloatBarrier
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
-\begin_layout Subsection
-ChIP-seq blacklisting is important
-\end_layout
-
-\begin_layout Standard
+\align center
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
@@ -1223,7 +1182,7 @@ status open
 	filename graphics/CD4-csaw/csaw/CCF-plots-PAGE2-CROP.pdf
 	lyxscale 50
 	width 100col%
-	groupId colwidth
+	groupId ccf-subfig
 
 \end_inset
 
@@ -1255,11 +1214,12 @@ Cross-correlation plots with blacklisted reads removed
 
 \end_layout
 
-\begin_layout Standard
+\begin_layout Plain Layout
+\align center
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
@@ -1267,7 +1227,7 @@ status open
 	filename graphics/CD4-csaw/csaw/CCF-plots-noBL-PAGE2-CROP.pdf
 	lyxscale 50
 	width 100col%
-	groupId colwidth
+	groupId ccf-subfig
 
 \end_inset
 
@@ -1299,17 +1259,24 @@ Cross-correlation plots without removing blacklisted reads
 
 \end_layout
 
-\begin_layout Subsection
-ChIP-seq peak calling
+\begin_layout Plain Layout
+\begin_inset Caption Standard
+
+\begin_layout Plain Layout
+
+\series bold
+\begin_inset CommandInset label
+LatexCommand label
+name "fig:CCF-master"
+
+\end_inset
+
+Strand cross-correlation plots for ChIP-seq data.
 \end_layout
 
-\begin_layout Standard
-\begin_inset Flex TODO Note (inline)
-status open
+\end_inset
+
 
-\begin_layout Plain Layout
-Replace these figures with a single table of # of peaks called at chosen
- IDR threshold, showing that SICER has more
 \end_layout
 
 \end_inset
@@ -1317,19 +1284,30 @@ Replace these figures with a single table of # of peaks called at chosen
 
 \end_layout
 
+\begin_layout Subsection
+ChIP-seq peak calling
+\end_layout
+
 \begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
-status open
+\align center
+\begin_inset Float figure
+wide false
+sideways false
+status collapsed
 
 \begin_layout Plain Layout
-Re-generate IDR rank consistency plots for SICER and MACS side-by-side
-\end_layout
+\align center
+\begin_inset Graphics
+	filename graphics/CD4-csaw/IDR/D4659vsD5053_epic-PAGE1-CROP.pdf
+	lyxscale 50
+	width 40theight%
+	groupId idr-rc-subfig
 
 \end_inset
 
@@ -1340,19 +1318,15 @@ Re-generate IDR rank consistency plots for SICER and MACS side-by-side
 \begin_inset Caption Standard
 
 \begin_layout Plain Layout
-
-\series bold
-\begin_inset CommandInset label
-LatexCommand label
-name "fig:IDR-RC-H3K4me2"
+Peak ranks from SICER peak caller
+\end_layout
 
 \end_inset
 
-Irreproducible Discovery Rate consistency plots for H3K4me2
-\end_layout
 
-\end_inset
+\end_layout
 
+\begin_layout Plain Layout
 
 \end_layout
 
@@ -1361,18 +1335,36 @@ Irreproducible Discovery Rate consistency plots for H3K4me2
 
 \end_layout
 
-\begin_layout Standard
+\begin_layout Plain Layout
+\align center
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
-status open
+\align center
+\begin_inset Graphics
+	filename graphics/CD4-csaw/IDR/D4659vsD5053_macs-PAGE1-CROP.pdf
+	lyxscale 50
+	width 40theight%
+	groupId idr-rc-subfig
+
+\end_inset
+
+
+\end_layout
 
 \begin_layout Plain Layout
-Re-generate IDR rank consistency plots for SICER and MACS side-by-side
+\begin_inset Caption Standard
+
+\begin_layout Plain Layout
+Peak ranks from MACS peak caller
+\end_layout
+
+\end_inset
+
+
 \end_layout
 
 \end_inset
@@ -1388,16 +1380,18 @@ Re-generate IDR rank consistency plots for SICER and MACS side-by-side
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:IDR-RC-H3K4me3"
-
-\end_inset
-
-Irreproducible Discovery Rate consistency plots for H3K4me3
-\end_layout
+name "fig:IDR-rank-consist"
 
 \end_inset
 
+Irreproducible Discovery Rate rank consistency plots for H3K27me3.
 
+\series default
+ Peaks are ranked by the scores assigned by the peak caller in each donor,
+ and then the ranks are plotted against each other.
+ Higher ranks are more significant.
+ Peaks meeting various thresholds of reproducibility, measured by the irreproduc
+ible discovery rate (IDR), are shaded accordingly.
 \end_layout
 
 \end_inset
@@ -1405,42 +1399,7 @@ Irreproducible Discovery Rate consistency plots for H3K4me3
 
 \end_layout
 
-\begin_layout Standard
-\begin_inset Float figure
-wide false
-sideways false
-status open
-
 \begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Re-generate IDR rank consistency plots for SICER and MACS side-by-side
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
-\begin_layout Plain Layout
-\begin_inset Caption Standard
-
-\begin_layout Plain Layout
-
-\series bold
-\begin_inset CommandInset label
-LatexCommand label
-name "fig:IDR-RC-H3K27me3"
-
-\end_inset
-
-Irreproducible Discovery Rate consistency plots for H3K27me3
-\end_layout
-
-\end_inset
-
 
 \end_layout
 
@@ -1450,41 +1409,20 @@ Irreproducible Discovery Rate consistency plots for H3K27me3
 \end_layout
 
 \begin_layout Standard
-Figures 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:IDR-RC-H3K4me2"
-plural "false"
-caps "false"
-noprefix "false"
-
-\end_inset
-
-, 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:IDR-RC-H3K4me3"
-plural "false"
-caps "false"
-noprefix "false"
-
-\end_inset
-
-, and 
+Figure 
 \begin_inset CommandInset ref
 LatexCommand ref
-reference "fig:IDR-RC-H3K27me3"
+reference "fig:IDR-rank-consist"
 plural "false"
 caps "false"
 noprefix "false"
 
 \end_inset
 
- show the IDR rank-consistency plots for peaks called in an arbitrarily-chosen
+ shows the IDR rank-consistency plots for peaks called in an arbitrarily-chosen
  pair of donors.
- For all 3 histone marks, when the peaks for each donor are ranked according
- to their scores, SICER produces much more reproducible results between
- donors.
+ when the peaks for each donor are ranked according to their scores, SICER
+ produces much more reproducible results between donors.
  This is consistent with SICER's stated goal of identifying broad peaks,
  in contrast to MACS, which is designed for identifying sharp peaks.
  Based on this observation, the SICER peak calls were used for all downstream
@@ -1496,19 +1434,6 @@ noprefix "false"
 ChIP-seq normalization
 \end_layout
 
-\begin_layout Standard
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Maybe just one of these figures and then say the other 2 were similar
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
 \begin_layout Standard
 \begin_inset Float figure
 wide false
@@ -1534,70 +1459,48 @@ status open
 \begin_layout Plain Layout
 
 \series bold
-MA plot of H3K4me2 read counts in 10kb bins for two arbitrary samples
-\end_layout
-
-\end_inset
-
-
-\end_layout
+\begin_inset CommandInset label
+LatexCommand label
+name "fig:MA-plot-bigbins"
 
 \end_inset
 
-
+MA plot of H3K4me2 read counts in 10kb bins for two arbitrary samples.
 \end_layout
 
-\begin_layout Standard
-\begin_inset Float figure
-wide false
-sideways false
-status open
-
-\begin_layout Plain Layout
-\align center
-\begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-sample-MAplot-bins-CROP.png
-	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
-
 \end_inset
 
 
 \end_layout
 
-\begin_layout Plain Layout
-\begin_inset Caption Standard
-
-\begin_layout Plain Layout
-
-\series bold
-MA plot of H3K4me3 read counts in 10kb bins for two arbitrary samples
-\end_layout
-
 \end_inset
 
 
 \end_layout
 
-\end_inset
-
-
+\begin_layout Subsection
+ChIP-seq must be corrected for hidden confounding factors
 \end_layout
 
 \begin_layout Standard
 \begin_inset Float figure
 wide false
-sideways false
+sideways true
 status open
 
+\begin_layout Plain Layout
+\begin_inset Float figure
+wide false
+sideways false
+status collapsed
+
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-sample-MAplot-bins-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-PCA-raw-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId pcoa-subfig
 
 \end_inset
 
@@ -1610,12 +1513,13 @@ status open
 \begin_layout Plain Layout
 
 \series bold
-MA plot of H3K27me3 read counts in 10kb bins for two arbitrary samples
-\end_layout
+\begin_inset CommandInset label
+LatexCommand label
+name "fig:PCoA-H3K4me2-bad"
 
 \end_inset
 
-
+H3K4me2, no correction
 \end_layout
 
 \end_inset
@@ -1623,47 +1527,13 @@ MA plot of H3K27me3 read counts in 10kb bins for two arbitrary samples
 
 \end_layout
 
-\begin_layout Subsection
-ChIP-seq must be corrected for hidden confounding factors
-\end_layout
-
-\begin_layout Standard
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Consolidate figures 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:PCoA-H3K4me2-bad"
-plural "false"
-caps "false"
-noprefix "false"
-
-\end_inset
-
- through 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:PCoA-H3K27me3-good"
-plural "false"
-caps "false"
-noprefix "false"
-
 \end_inset
 
- into 1 2x3 grid lettered A through F.
- For now, just refer to them as if they were a single figure.
- Also, do the good PCoA plots belong in the results section since they are
- also used there?
-\end_layout
 
+\begin_inset space \hfill{}
 \end_inset
 
 
-\end_layout
-
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -1672,10 +1542,10 @@ status collapsed
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-PCA-raw-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-PCA-raw-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId pcoa-subfig
 
 \end_inset
 
@@ -1690,11 +1560,11 @@ status collapsed
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:PCoA-H3K4me2-bad"
+name "fig:PCoA-H3K4me3-bad"
 
 \end_inset
 
-PCoA plot of H3K4me2 windows, before subtracting surrogate variables
+H3K4me3, no correction
 \end_layout
 
 \end_inset
@@ -1705,21 +1575,22 @@ PCoA plot of H3K4me2 windows, before subtracting surrogate variables
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-PCA-SVsub-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-PCA-raw-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId pcoa-subfig
 
 \end_inset
 
@@ -1734,11 +1605,11 @@ status open
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:PCoA-H3K4me2-good"
+name "fig:PCoA-H3K27me3-bad"
 
 \end_inset
 
-PCoA plot of H3K4me2 windows, after subtracting surrogate variables
+H3K27me3, no correction
 \end_layout
 
 \end_inset
@@ -1751,7 +1622,7 @@ PCoA plot of H3K4me2 windows, after subtracting surrogate variables
 
 \end_layout
 
-\begin_layout Standard
+\begin_layout Plain Layout
 \begin_inset Float figure
 wide false
 sideways false
@@ -1760,10 +1631,10 @@ status collapsed
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-PCA-raw-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-PCA-SVsub-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId pcoa-subfig
 
 \end_inset
 
@@ -1778,11 +1649,11 @@ status collapsed
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:PCoA-H3K4me3-bad"
+name "fig:PCoA-H3K4me2-good"
 
 \end_inset
 
-PCoA plot of H3K4me3 windows, before subtracting surrogate variables
+H3K4me2, SVs subtracted
 \end_layout
 
 \end_inset
@@ -1793,21 +1664,22 @@ PCoA plot of H3K4me3 windows, before subtracting surrogate variables
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
 	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-PCA-SVsub-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId pcoa-subfig
 
 \end_inset
 
@@ -1826,7 +1698,7 @@ name "fig:PCoA-H3K4me3-good"
 
 \end_inset
 
-PCoA plot of H3K4me3 windows, after subtracting surrogate variables
+H3K4me3 windows, SVs subtracted
 \end_layout
 
 \end_inset
@@ -1837,9 +1709,10 @@ PCoA plot of H3K4me3 windows, after subtracting surrogate variables
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -1848,10 +1721,10 @@ status collapsed
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-PCA-raw-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-PCA-SVsub-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId pcoa-subfig
 
 \end_inset
 
@@ -1866,16 +1739,11 @@ status collapsed
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:PCoA-H3K27me3-bad"
-
-\end_inset
-
-PCoA plot of H3K27me3 windows, before subtracting surrogate variables
-\end_layout
+name "fig:PCoA-H3K27me3-good"
 
 \end_inset
 
-
+H3K27me3, SVs subtracted
 \end_layout
 
 \end_inset
@@ -1883,20 +1751,6 @@ PCoA plot of H3K27me3 windows, before subtracting surrogate variables
 
 \end_layout
 
-\begin_layout Standard
-\begin_inset Float figure
-wide false
-sideways false
-status open
-
-\begin_layout Plain Layout
-\align center
-\begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-PCA-SVsub-CROP.png
-	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
-
 \end_inset
 
 
@@ -1910,11 +1764,12 @@ status open
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:PCoA-H3K27me3-good"
+name "fig:PCoA-ChIP"
 
 \end_inset
 
-PCoA plot of H3K27me3 windows, after subtracting surrogate variables
+PCoA plots of ChIP-seq sliding window data, before and after subtracting
+ surrogate variables (SVs).
 \end_layout
 
 \end_inset
@@ -1922,29 +1777,17 @@ PCoA plot of H3K27me3 windows, after subtracting surrogate variables
 
 \end_layout
 
-\end_inset
-
-
-\end_layout
+\begin_layout Plain Layout
 
-\begin_layout Itemize
-Figures showing BCV plots with and without SVA for each histone mark?
 \end_layout
 
-\begin_layout Standard
-\begin_inset ERT
-status collapsed
-
-\begin_layout Plain Layout
+\end_inset
 
 
-\backslash
-FloatBarrier
 \end_layout
 
-\end_inset
-
- 
+\begin_layout Itemize
+Figures showing BCV plots with and without SVA for each histone mark?
 \end_layout
 
 \begin_layout Subsection
@@ -1955,6 +1798,12 @@ MOFA recovers biologically relevant variation from blind analysis by correlating
 \begin_layout Standard
 \begin_inset Float figure
 wide false
+sideways true
+status collapsed
+
+\begin_layout Plain Layout
+\begin_inset Float figure
+wide false
 sideways false
 status open
 
@@ -1963,8 +1812,8 @@ status open
 \begin_inset Graphics
 	filename graphics/CD4-csaw/MOFA-varExplaiend-matrix-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 45col%
+	groupId mofa-subfig
 
 \end_inset
 
@@ -1984,11 +1833,20 @@ name "fig:mofa-varexplained"
 \end_inset
 
 Variance explained in each data set by each latent factor estimated by MOFA.
-\end_layout
 
+\series default
+ For each latent factor (LF) learned by MOFA, the variance explained by
+ that factor in each data set (
+\begin_inset Quotes eld
 \end_inset
 
+view
+\begin_inset Quotes erd
+\end_inset
 
+) is shown by the shading of the cells in the lower section.
+ The upper section shows the total fraction of each data set's variance
+ that is explained by all LFs combined.
 \end_layout
 
 \end_inset
@@ -1996,46 +1854,25 @@ Variance explained in each data set by each latent factor estimated by MOFA.
 
 \end_layout
 
-\begin_layout Itemize
-Figure 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:mofa-varexplained"
-plural "false"
-caps "false"
-noprefix "false"
+\end_inset
 
+
+\begin_inset space \hfill{}
 \end_inset
 
- shows that LF1, 4, and 5 explain substantial var in all data sets
-\end_layout
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
 status open
 
-\begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Maybe drop this one
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/MOFA-LF-distributions-CROP.png
+	filename graphics/CD4-csaw/MOFA-LF-scatter-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 45col%
+	groupId mofa-subfig
 
 \end_inset
 
@@ -2050,16 +1887,16 @@ Maybe drop this one
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:mofa-lf-dist"
-
-\end_inset
-
-Sample distribution for each latent factor estimated by MOFA.
-\end_layout
+name "fig:mofa-lf-scatter"
 
 \end_inset
 
+Scatter plots of specific pairs of MOFA latent factors.
 
+\series default
+ LFs 1, 4, and 5 explain substantial variation in all data sets, so they
+ are plotted against each other in order to reveal patterns of variation
+ that are shared across all data sets.
 \end_layout
 
 \end_inset
@@ -2067,33 +1904,6 @@ Sample distribution for each latent factor estimated by MOFA.
 
 \end_layout
 
-\begin_layout Standard
-\begin_inset Float figure
-wide false
-sideways false
-status open
-
-\begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Talk about how this supports the convergence hypothesis
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
-\begin_layout Plain Layout
-\align center
-\begin_inset Graphics
-	filename graphics/CD4-csaw/MOFA-LF-scatter-CROP.png
-	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
-
 \end_inset
 
 
@@ -2107,11 +1917,11 @@ Talk about how this supports the convergence hypothesis
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:mofa-lf-scatter"
+name "fig:MOFA-master"
 
 \end_inset
 
-Scatter plots of specific pairs of MOFA latent factors.
+MOFA latent factors separate technical confounders from 
 \end_layout
 
 \end_inset
@@ -2125,17 +1935,21 @@ Scatter plots of specific pairs of MOFA latent factors.
 \end_layout
 
 \begin_layout Itemize
-Figures 
+Figure 
 \begin_inset CommandInset ref
 LatexCommand ref
-reference "fig:mofa-lf-dist"
+reference "fig:mofa-varexplained"
 plural "false"
 caps "false"
 noprefix "false"
 
 \end_inset
 
- and 
+ shows that LF1, 4, and 5 explain substantial var in all data sets
+\end_layout
+
+\begin_layout Itemize
+Figure 
 \begin_inset CommandInset ref
 LatexCommand ref
 reference "fig:mofa-lf-scatter"
@@ -2145,8 +1959,8 @@ noprefix "false"
 
 \end_inset
 
- show that those same 3 LFs, (1, 4, & 5) also correlate best with the experiment
-al factors (cell type & time point)
+ shows that those same 3 LFs, (1, 4, & 5) also correlate best with the experimen
+tal factors (cell type & time point)
 \end_layout
 
 \begin_layout Itemize
@@ -2157,7 +1971,7 @@ LF2 is clearly the RNA-seq batch effect
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
@@ -2980,7 +2794,7 @@ effective promoter radii
 \begin_inset Quotes erd
 \end_inset
 
- were used for all further promoter-based analyses.
+ were used to define the promoter regions for all further analyses.
 \end_layout
 
 \begin_layout Standard
@@ -3056,13 +2870,20 @@ wide false
 sideways false
 status collapsed
 
+\begin_layout Plain Layout
+\align center
+\begin_inset Float figure
+wide false
+sideways false
+status collapsed
+
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
 	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-promoter-PCA-group-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 45col%
+	groupId pcoa-prom-subfig
 
 \end_inset
 
@@ -3092,9 +2913,10 @@ PCoA plot of H3K4me2 promoters, after subtracting surrogate variables
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -3105,8 +2927,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-promoter-PCA-group-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 45col%
+	groupId pcoa-prom-subfig
 
 \end_inset
 
@@ -3138,7 +2960,8 @@ PCoA plot of H3K4me3 promoters, after subtracting surrogate variables
 
 \end_layout
 
-\begin_layout Standard
+\begin_layout Plain Layout
+\align center
 \begin_inset Float figure
 wide false
 sideways false
@@ -3149,8 +2972,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-promoter-PCA-group-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 45col%
+	groupId pcoa-prom-subfig
 
 \end_inset
 
@@ -3180,9 +3003,10 @@ PCoA plot of H3K27me3 promoters, after subtracting surrogate variables
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
@@ -3193,8 +3017,8 @@ status collapsed
 \begin_inset Graphics
 	filename graphics/CD4-csaw/RNA-seq/PCA-final-23-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 45col%
+	groupId pcoa-prom-subfig
 
 \end_inset
 
@@ -3224,6 +3048,31 @@ RNA-seq PCoA showing principal coordiantes 2 and 3.
 \end_inset
 
 
+\end_layout
+
+\begin_layout Plain Layout
+\begin_inset Caption Standard
+
+\begin_layout Plain Layout
+
+\series bold
+\begin_inset CommandInset label
+LatexCommand label
+name "fig:PCoA-promoters"
+
+\end_inset
+
+PCoA plots for promoter ChIP-seq and expression RNA-seq data
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
+\end_inset
+
+
 \end_layout
 
 \begin_layout Standard
@@ -3682,38 +3531,31 @@ literal "false"
 \end_layout
 
 \begin_layout Standard
-Figures 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:PCoA-H3K4me2-prom"
-plural "false"
-caps "false"
-noprefix "false"
+\begin_inset Flex TODO Note (inline)
+status open
+
+\begin_layout Plain Layout
+Check up on figure refs in this paragraph
+\end_layout
 
 \end_inset
 
-, 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:PCoA-H3K4me3-prom"
-plural "false"
-caps "false"
-noprefix "false"
 
-\end_inset
+\end_layout
 
-, and 
+\begin_layout Standard
+Figure 
 \begin_inset CommandInset ref
 LatexCommand ref
-reference "fig:PCoA-H3K27me3-prom"
+reference "fig:PCoA-promoters"
 plural "false"
 caps "false"
 noprefix "false"
 
 \end_inset
 
- show the patterns of variation in all 3 histone marks in the promoter regions
- of the genome using principal coordinate analysis.
+ shows the patterns of variation in all 3 histone marks in the promoter
+ regions of the genome using principal coordinate analysis.
  All 3 marks show a noticeable convergence between the naive and memory
  samples at day 14, visible as an overlapping of the day 14 groups on each
  plot.
@@ -3781,22 +3623,6 @@ This result feels shallow, somehow.
 \end_inset
 
 
-\end_layout
-
-\begin_layout Standard
-\begin_inset ERT
-status collapsed
-
-\begin_layout Plain Layout
-
-
-\backslash
-FloatBarrier
-\end_layout
-
-\end_inset
-
-
 \end_layout
 
 \begin_layout Subsection
@@ -3821,29 +3647,23 @@ For the figures in this section, the group labels are arbitrary, so if time
 \begin_layout Standard
 \begin_inset Float figure
 wide false
-sideways false
-status open
-
-\begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
+sideways true
 status open
 
 \begin_layout Plain Layout
-These really need to be sub-figures A, B, and C.
-\end_layout
-
-\end_inset
-
-
-\end_layout
+\align center
+\begin_inset Float figure
+wide false
+sideways false
+status collapsed
 
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
 	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-neighborhood-clusters-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId covprof-subfig
 
 \end_inset
 
@@ -3862,71 +3682,33 @@ name "fig:H3K4me2-neighborhood-clusters"
 
 \end_inset
 
-K-means clustering of promoter H3K4me2 relative coverage depth in naive
- day 0 samples.
- 
-\series default
-H3K4me2 ChIP-seq reads were binned into 500-bp windows tiled across each
- promoter from 5
-\begin_inset space ~
-\end_inset
-
-kbp upstream to 5
-\begin_inset space ~
-\end_inset
-
-kbp downstream, and the logCPM values were normalized within each promoter
- to an average of 0, yielding relative coverage depths.
- These were then grouped using K-means clustering with 
-\begin_inset Formula $K=6$
-\end_inset
-
-, and the average bin values were plotted for each cluster.
- The 
-\begin_inset Formula $x$
-\end_inset
-
--axis is the genomic coordinate of each bin relative to the the transcription
- start site, and the 
-\begin_inset Formula $y$
-\end_inset
+Average relative coverage for each bin in each cluster
+\end_layout
 
--axis is the mean relative coverage depth of that bin across all promoters
- in the cluster.
- Each line represents the average 
-\begin_inset Quotes eld
 \end_inset
 
-shape
-\begin_inset Quotes erd
-\end_inset
 
- of the promoter coverage for promoters in that cluster.
 \end_layout
 
 \end_inset
 
 
-\end_layout
-
+\begin_inset space \hfill{}
 \end_inset
 
 
-\end_layout
-
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
 	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-neighborhood-PCA-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId covprof-subfig
 
 \end_inset
 
@@ -3945,23 +3727,8 @@ name "fig:H3K4me2-neighborhood-pca"
 
 \end_inset
 
-PCA of promoter H3K4me2 relative coverage depth in naive day 0 samples,
- colored by K-means cluster membership.
+PCA of relative coverage depth, colored by K-means cluster membership.
  
-\series default
-PCA was performed on the same relative promoter coverage values used for
- K-means clustering in Figure 
-\begin_inset CommandInset ref
-LatexCommand ref
-reference "fig:H3K4me2-neighborhood-clusters"
-plural "false"
-caps "false"
-noprefix "false"
-
-\end_inset
-
-, and the first two principal components were plotted, coloring each point
- by its K-means cluster identity.
 \end_layout
 
 \end_inset
@@ -3972,21 +3739,22 @@ noprefix "false"
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
 	filename graphics/CD4-csaw/ChIP-seq/H3K4me2-neighborhood-expression-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId covprof-subfig
 
 \end_inset
 
@@ -4005,11 +3773,49 @@ name "fig:H3K4me2-neighborhood-expression"
 
 \end_inset
 
-Gene expression distributions grouped by H3K4me2 promoter coverage K-means
- clustering.
+Gene expression grouped by promoter coverage clusters.
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
+\begin_layout Plain Layout
+\begin_inset Caption Standard
+
+\begin_layout Plain Layout
+
+\series bold
+K-means clustering of promoter H3K4me2 relative coverage depth in naive
+ day 0 samples.
  
 \series default
-For each of the clusters in Figure 
+H3K4me2 ChIP-seq reads were binned into 500-bp windows tiled across each
+ promoter from 5
+\begin_inset space ~
+\end_inset
+
+kbp upstream to 5
+\begin_inset space ~
+\end_inset
+
+kbp downstream, and the logCPM values were normalized within each promoter
+ to an average of 0, yielding relative coverage depths.
+ These were then grouped using K-means clustering with 
+\begin_inset Formula $K=6$
+\end_inset
+
+,
+\series bold
+ 
+\series default
+and the average bin values were plotted for each cluster (
 \begin_inset CommandInset ref
 LatexCommand ref
 reference "fig:H3K4me2-neighborhood-clusters"
@@ -4019,7 +3825,51 @@ noprefix "false"
 
 \end_inset
 
+).
+ The 
+\begin_inset Formula $x$
+\end_inset
+
+-axis is the genomic coordinate of each bin relative to the the transcription
+ start site, and the 
+\begin_inset Formula $y$
+\end_inset
+
+-axis is the mean relative coverage depth of that bin across all promoters
+ in the cluster.
+ Each line represents the average 
+\begin_inset Quotes eld
+\end_inset
+
+shape
+\begin_inset Quotes erd
+\end_inset
+
+ of the promoter coverage for promoters in that cluster.
+ PCA was performed on the same data, and the first two principal components
+ were plotted, coloring each point by its K-means cluster identity (
+\begin_inset CommandInset ref
+LatexCommand ref
+reference "fig:H3K4me2-neighborhood-pca"
+plural "false"
+caps "false"
+noprefix "false"
+
+\end_inset
 
+).
+ For each cluster, the distribution of gene expression values was plotted
+ (
+\begin_inset CommandInset ref
+LatexCommand ref
+reference "fig:H3K4me2-neighborhood-expression"
+plural "false"
+caps "false"
+noprefix "false"
+
+\end_inset
+
+.
 \end_layout
 
 \end_inset
@@ -4035,16 +3885,23 @@ noprefix "false"
 \begin_layout Standard
 \begin_inset Float figure
 wide false
-sideways false
+sideways true
 status open
 
+\begin_layout Plain Layout
+\align center
+\begin_inset Float figure
+wide false
+sideways false
+status collapsed
+
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-neighborhood-clusters-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-neighborhood-clusters-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId covprof-subfig
 
 \end_inset
 
@@ -4059,11 +3916,11 @@ status open
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:H3K4me3-neighborhood-clusters"
+name "fig:H3K27me3-neighborhood-clusters"
 
 \end_inset
 
-RNA-seq PCoA showing principal coordiantes 2 and 3.
+Average relative coverage for each bin in each cluster
 \end_layout
 
 \end_inset
@@ -4074,21 +3931,22 @@ RNA-seq PCoA showing principal coordiantes 2 and 3.
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-neighborhood-PCA-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-neighborhood-PCA-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId covprof-subfig
 
 \end_inset
 
@@ -4103,11 +3961,11 @@ status open
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:H3K4me3-neighborhood-pca-1"
+name "fig:H3K27me3-neighborhood-pca"
 
 \end_inset
 
-RNA-seq PCoA showing principal coordiantes 2 and 3.
+PCA of relative coverage depth, colored by K-means cluster membership.
 \end_layout
 
 \end_inset
@@ -4118,21 +3976,22 @@ RNA-seq PCoA showing principal coordiantes 2 and 3.
 \end_inset
 
 
-\end_layout
+\begin_inset space \hfill{}
+\end_inset
+
 
-\begin_layout Standard
 \begin_inset Float figure
 wide false
 sideways false
-status open
+status collapsed
 
 \begin_layout Plain Layout
 \align center
 \begin_inset Graphics
-	filename graphics/CD4-csaw/ChIP-seq/H3K4me3-neighborhood-expression-CROP.png
+	filename graphics/CD4-csaw/ChIP-seq/H3K27me3-neighborhood-expression-CROP.png
 	lyxscale 25
-	width 100col%
-	groupId colwidth-raster
+	width 30col%
+	groupId covprof-subfig
 
 \end_inset
 
@@ -4147,11 +4006,107 @@ status open
 \series bold
 \begin_inset CommandInset label
 LatexCommand label
-name "fig:H3K4me3-neighborhood-expression-1"
+name "fig:H3K27me3-neighborhood-expression"
 
 \end_inset
 
-RNA-seq PCoA showing principal coordiantes 2 and 3.
+Gene expression grouped by promoter coverage clusters.
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
+\begin_layout Plain Layout
+\begin_inset Caption Standard
+
+\begin_layout Plain Layout
+
+\series bold
+K-means clustering of promoter H3K27me3 relative coverage depth in naive
+ day 0 samples.
+ 
+\series default
+H3K27me3 ChIP-seq reads were binned into 500-bp windows tiled across each
+ promoter from 5
+\begin_inset space ~
+\end_inset
+
+kbp upstream to 5
+\begin_inset space ~
+\end_inset
+
+kbp downstream, and the logCPM values were normalized within each promoter
+ to an average of 0, yielding relative coverage depths.
+ These were then grouped using K-means clustering with 
+\begin_inset Formula $K=6$
+\end_inset
+
+,
+\series bold
+ 
+\series default
+and the average bin values were plotted for each cluster (
+\begin_inset CommandInset ref
+LatexCommand ref
+reference "fig:H3K27me3-neighborhood-clusters"
+plural "false"
+caps "false"
+noprefix "false"
+
+\end_inset
+
+).
+ The 
+\begin_inset Formula $x$
+\end_inset
+
+-axis is the genomic coordinate of each bin relative to the the transcription
+ start site, and the 
+\begin_inset Formula $y$
+\end_inset
+
+-axis is the mean relative coverage depth of that bin across all promoters
+ in the cluster.
+ Each line represents the average 
+\begin_inset Quotes eld
+\end_inset
+
+shape
+\begin_inset Quotes erd
+\end_inset
+
+ of the promoter coverage for promoters in that cluster.
+ PCA was performed on the same data, and the first two principal components
+ were plotted, coloring each point by its K-means cluster identity (
+\begin_inset CommandInset ref
+LatexCommand ref
+reference "fig:H3K27me3-neighborhood-pca"
+plural "false"
+caps "false"
+noprefix "false"
+
+\end_inset
+
+).
+ For each cluster, the distribution of gene expression values was plotted
+ (
+\begin_inset CommandInset ref
+LatexCommand ref
+reference "fig:H3K27me3-neighborhood-expression"
+plural "false"
+caps "false"
+noprefix "false"
+
+\end_inset
+
+.
 \end_layout
 
 \end_inset