瀏覽代碼

Remove nomencl usage, add figure short captions, add TOC entries

Ryan C. Thompson 5 年之前
父節點
當前提交
80cc1557f1
共有 4 個文件被更改,包括 338 次插入475 次删除
  1. 2 6
      Snakefile
  2. 14 10
      abbrevs.tex
  3. 二進制
      graphics/CD4-csaw/RNA-seq/weights-vs-covars-nobcv.png
  4. 322 459
      thesis.lyx

+ 2 - 6
Snakefile

@@ -132,12 +132,8 @@ def lyx_input_deps(lyxfile):
     '''Return an iterator over all tex files included by a Lyx file.'''
     '''Return an iterator over all tex files included by a Lyx file.'''
     with open(lyxfile) as f:
     with open(lyxfile) as f:
         lyx_text = f.read()
         lyx_text = f.read()
-    tex_names = regex.search('\\\\input{(.*?[.]tex)}', lyx_text).group(1).split(',')
-    # Unfortunately LyX doesn't indicate which bib names refer to
-    # files in the current directory and which don't. Currently that's
-    # not a problem for me since all my refs are in bib files in the
-    # current directory.
-    yield from tex_names
+    for m in regex.finditer('\\\\(?:input|loadglsentries){(.*?[.]tex)}', lyx_text):
+        yield m.group(1)
 
 
 def lyx_bib_deps(lyxfile):
 def lyx_bib_deps(lyxfile):
     '''Return an iterator over all bib files referenced by a Lyx file.
     '''Return an iterator over all bib files referenced by a Lyx file.

+ 14 - 10
abbrevs.tex

@@ -1,6 +1,11 @@
-%% Methods
+%% Wet-lab methods
 \newabbreviation{RNA-seq}{RNA-seq}{high-throughput RNA sequencing}
 \newabbreviation{RNA-seq}{RNA-seq}{high-throughput RNA sequencing}
 \newabbreviation{ChIP-seq}{ChIP-seq}{chromatin immunoprecipitation followed by high-throughput DNA sequencing}
 \newabbreviation{ChIP-seq}{ChIP-seq}{chromatin immunoprecipitation followed by high-throughput DNA sequencing}
+\newabbreviation{oligo}{oligo}{oligonucleotide}
+\newabbreviation{GB}{GB}{globin blocking}
+\newabbreviation{PCR}{PCR}{polymerase chain reaction}
+
+%% Computational methods
 \newabbreviation{GLM}{GLM}{generalized linear model}
 \newabbreviation{GLM}{GLM}{generalized linear model}
 \newabbreviation{NB}{NB}{negative binomial}
 \newabbreviation{NB}{NB}{negative binomial}
 \newabbreviation{BCV}{BCV}{biological coefficient of variation}
 \newabbreviation{BCV}{BCV}{biological coefficient of variation}
@@ -10,13 +15,13 @@
 \newabbreviation{SVA}{SVA}{surrogate variable analysis}
 \newabbreviation{SVA}{SVA}{surrogate variable analysis}
 \newabbreviation{PCA}{PCA}{principal component analysis}
 \newabbreviation{PCA}{PCA}{principal component analysis}
 \newabbreviation{PC}{PC}{principal component}
 \newabbreviation{PC}{PC}{principal component}
-\newabbreviation{PCoA}{PCoA}{principal coordinate analysis} % AKA MDS?
-\newabbreviation{MOFA}{MOFA}{Multi-Omics Factor Analysis}
 \newabbreviation{LF}{LF}{latent factor}
 \newabbreviation{LF}{LF}{latent factor}
 %% Note: Can't start with math or else capitalization fails
 %% Note: Can't start with math or else capitalization fails
 \newabbreviation{logCPM}{logCPM}{log$_2$ counts per million}
 \newabbreviation{logCPM}{logCPM}{log$_2$ counts per million}
 \newabbreviation{CPM}{CPM}{counts per million}
 \newabbreviation{CPM}{CPM}{counts per million}
 \newabbreviation{logFC}{logFC}{log$_2$ fold change}
 \newabbreviation{logFC}{logFC}{log$_2$ fold change}
+\newabbreviation{FPKM}{FPKM}{fragments per kilobase per million fragments}
+
 \newabbreviation{RMA}{RMA}{Robust Multichip Average}
 \newabbreviation{RMA}{RMA}{Robust Multichip Average}
 \newabbreviation{fRMA}{fRMA}{frozen Robust Multichip Average}
 \newabbreviation{fRMA}{fRMA}{frozen Robust Multichip Average}
 \newabbreviation{GRSN}{GRSN}{Global Rank-invariant Set Normalization}
 \newabbreviation{GRSN}{GRSN}{Global Rank-invariant Set Normalization}
@@ -24,15 +29,13 @@
 \newabbreviation{MACS}{MACS}{Model-based Analysis of ChIP-seq}
 \newabbreviation{MACS}{MACS}{Model-based Analysis of ChIP-seq}
 \newabbreviation{SICER}{SICER}{Spatial Clustering for Identification of ChIP-Enriched Regions}
 \newabbreviation{SICER}{SICER}{Spatial Clustering for Identification of ChIP-Enriched Regions}
 \newabbreviation{TMM}{TMM}{trimmed mean of M-values}
 \newabbreviation{TMM}{TMM}{trimmed mean of M-values}
-\newabbreviation{FPKM}{FPKM}{fragments per kilobase per million fragments}
-\newabbreviation{CpGi}{CpGi}{CpG island}
-\newabbreviation{ROC}{ROC}{receiver operating characteristic}
-\newabbreviation{AUC}{AUC}{area under ROC curve}
-\newabbreviation{PCR}{PCR}{polymerase chain reaction}
+\newabbreviation{PCoA}{PCoA}{principal coordinate analysis} % AKA MDS?
+\newabbreviation{MOFA}{MOFA}{Multi-Omics Factor Analysis}
 \newabbreviation{SWAN}{SWAN}{subset-quantile within array normalization}
 \newabbreviation{SWAN}{SWAN}{subset-quantile within array normalization}
 \newabbreviation{BH}{BH}{Benjamini-Hochberg}
 \newabbreviation{BH}{BH}{Benjamini-Hochberg}
-\newabbreviation{oligo}{oligo}{oligonucleotide}
-\newabbreviation{GB}{GB}{globin blocking}
+
+\newabbreviation{ROC}{ROC}{receiver operating characteristic}
+\newabbreviation{AUC}{AUC}{area under ROC curve}
 
 
 %% Data sources
 %% Data sources
 \newabbreviation{GEO}{GEO}{Gene Expression Omnibus}
 \newabbreviation{GEO}{GEO}{Gene Expression Omnibus}
@@ -41,6 +44,7 @@
 
 
 %% Biology
 %% Biology
 \newabbreviation{TSS}{TSS}{transcription start site}
 \newabbreviation{TSS}{TSS}{transcription start site}
+\newabbreviation{CpGi}{CpGi}{CpG island}
 \newabbreviation{TX}{TX}{healthy transplant}
 \newabbreviation{TX}{TX}{healthy transplant}
 \newabbreviation{AR}{AR}{acute rejection}
 \newabbreviation{AR}{AR}{acute rejection}
 \newabbreviation{ADNR}{ADNR}{acute dysfunction with no rejection}
 \newabbreviation{ADNR}{ADNR}{acute dysfunction with no rejection}

二進制
graphics/CD4-csaw/RNA-seq/weights-vs-covars-nobcv.png


+ 322 - 459
thesis.lyx

@@ -9,6 +9,9 @@
 % List all used files in log output
 % List all used files in log output
 \listfiles
 \listfiles
 
 
+%% Add TOC, List of Figures, etc. to TOC
+\usepackage{tocbibind}
+
 % Add a DRAFT watermark
 % Add a DRAFT watermark
 \usepackage{draftwatermark}
 \usepackage{draftwatermark}
 \usepackage{accsupp}
 \usepackage{accsupp}
@@ -41,16 +44,9 @@
 % This one breaks subfigs so it's disabled
 % This one breaks subfigs so it's disabled
 % https://tex.stackexchange.com/questions/65680/automatically-bold-first-sentence-of-a-floats-caption
 % https://tex.stackexchange.com/questions/65680/automatically-bold-first-sentence-of-a-floats-caption
 
 
-% Bold all nomenclature entries
-\renewcommand{\nomlabel}[1]{\textsf{\textbf{#1}}}
-
-% https://tex.stackexchange.com/a/31083/5654
-%\let\nomenclOrig\nomenclature
-%\renewcommand*{\nomenclature}[3][]{#2\nomenclOrig[#1]{#2}{#3}}
-
-\usepackage[nohypertypes={abbreviation}]{glossaries-extra}
+\usepackage[automake,nonumberlist,nohypertypes={abbreviation}]{glossaries-extra}
 \setabbreviationstyle{long-short}
 \setabbreviationstyle{long-short}
-\input{abbrevs.tex}
+\loadglsentries{abbrevs.tex}
 \makeglossaries
 \makeglossaries
 \end_preamble
 \end_preamble
 \use_default_options true
 \use_default_options true
@@ -307,20 +303,84 @@ final
 \end_inset
 \end_inset
 
 
 
 
+\end_layout
+
+\begin_layout Standard
+\begin_inset ERT
+status open
+
+\begin_layout Plain Layout
+
+
+\backslash
+addcontentsline{toc}{chapter}{Copyright notice}
+\end_layout
+
+\end_inset
+
+
 \end_layout
 \end_layout
 
 
 \begin_layout Standard
 \begin_layout Standard
 [Copyright notice]
 [Copyright notice]
 \end_layout
 \end_layout
 
 
+\begin_layout Standard
+\begin_inset ERT
+status open
+
+\begin_layout Plain Layout
+
+
+\backslash
+addcontentsline{toc}{chapter}{Thesis acceptance form}
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
 \begin_layout Standard
 \begin_layout Standard
 [Thesis acceptance form]
 [Thesis acceptance form]
 \end_layout
 \end_layout
 
 
+\begin_layout Standard
+\begin_inset ERT
+status open
+
+\begin_layout Plain Layout
+
+
+\backslash
+addcontentsline{toc}{chapter}{Dedication}
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
 \begin_layout Standard
 \begin_layout Standard
 [Dedication]
 [Dedication]
 \end_layout
 \end_layout
 
 
+\begin_layout Standard
+\begin_inset ERT
+status open
+
+\begin_layout Plain Layout
+
+
+\backslash
+addcontentsline{toc}{chapter}{Acknowledgements}
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
 \begin_layout Standard
 \begin_layout Standard
 [Acknowledgements]
 [Acknowledgements]
 \end_layout
 \end_layout
@@ -355,7 +415,7 @@ LatexCommand tableofcontents
 status open
 status open
 
 
 \begin_layout Plain Layout
 \begin_layout Plain Layout
-To create a new nomenclature entry:
+To create a new abbreviation:
 \end_layout
 \end_layout
 
 
 \begin_layout Enumerate
 \begin_layout Enumerate
@@ -363,17 +423,9 @@ Add an entry to abbrevs.tex
 \end_layout
 \end_layout
 
 
 \begin_layout Enumerate
 \begin_layout Enumerate
-Find the first instance of the term, and wrap it in Insert -> Custom Insets
- -> Glossary Term (use Capital if starting a sentence)
-\end_layout
-
-\begin_layout Enumerate
-Add a nomenclature entry after the first instance
-\end_layout
-
-\begin_layout Enumerate
-Replace every relevant instance throughout the document with the Glossary
- Term wrapped version, using Edit -> Find & Replace (Advanced).
+Wrap every occurrence of the term in Insert -> Custom Insets -> Glossary
+ Term (use appropriate variants for caiptal, plural, etc.), using Edit ->
+ Find & Replace (Advanced).
  Skip section headers and floats.
  Skip section headers and floats.
 \end_layout
 \end_layout
 
 
@@ -386,12 +438,9 @@ literal "false"
 \end_inset
 \end_inset
 
 
 
 
-\end_layout
-
-\begin_layout Plain Layout
 \begin_inset CommandInset href
 \begin_inset CommandInset href
 LatexCommand href
 LatexCommand href
-target "https://wiki.lyx.org/Tips/Nomenclature"
+target "https://ctan.org/pkg/glossaries-extra"
 literal "false"
 literal "false"
 
 
 \end_inset
 \end_inset
@@ -405,66 +454,32 @@ literal "false"
 \end_layout
 \end_layout
 
 
 \begin_layout Standard
 \begin_layout Standard
-\begin_inset CommandInset nomencl_print
-LatexCommand printnomenclature
-set_width "auto"
-
-\end_inset
-
-
-\end_layout
-
-\begin_layout List of TODOs
-
-\end_layout
-
-\begin_layout Standard
-\begin_inset Flex TODO Note (inline)
+\align center
+\begin_inset ERT
 status open
 status open
 
 
 \begin_layout Plain Layout
 \begin_layout Plain Layout
-Check all figures to make sure they fit on the page with their legends.
-\end_layout
-
-\end_inset
 
 
 
 
+\backslash
+renewcommand*{
+\backslash
+glossaryname}{List of Abbreviations}%
 \end_layout
 \end_layout
 
 
-\begin_layout Standard
-\begin_inset Flex TODO Note (inline)
-status open
-
 \begin_layout Plain Layout
 \begin_layout Plain Layout
-Make all descriptions consistent in terms of 
-\begin_inset Quotes eld
-\end_inset
 
 
-we did X
-\begin_inset Quotes erd
-\end_inset
 
 
- vs 
-\begin_inset Quotes eld
-\end_inset
+\backslash
+printglossaries
+\end_layout
 
 
-I did X
-\begin_inset Quotes erd
 \end_inset
 \end_inset
 
 
- vs 
-\begin_inset Quotes eld
-\end_inset
 
 
-X was done
-\begin_inset Quotes erd
-\end_inset
-
-.
 \end_layout
 \end_layout
 
 
-\end_inset
-
+\begin_layout List of TODOs
 
 
 \end_layout
 \end_layout
 
 
@@ -1016,15 +1031,6 @@ MSC
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "MSC"
-description "mesenchymal stem cell"
-literal "true"
-
-\end_inset
-
 .
 .
 \end_layout
 \end_layout
 
 
@@ -1188,15 +1194,6 @@ status open
 RNA-seq
 RNA-seq
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "RNA-seq"
-description "High-throughput RNA sequencing"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  experiment, the dependent variables may be the count of 
  experiment, the dependent variables may be the count of 
@@ -1480,15 +1477,6 @@ ChIP-seq
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "ChIP-seq"
-description "Chromatin immunoprecipitation followed by high-throughput DNA sequencing"
-literal "false"
-
-\end_inset
-
 , which tend to be much smaller and therefore violate the assumption of
 , which tend to be much smaller and therefore violate the assumption of
  a normal distribution more severely.
  a normal distribution more severely.
  For all count-based data, the 
  For all count-based data, the 
@@ -1519,15 +1507,6 @@ status open
 GLM
 GLM
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "GLM"
-description "generalized linear model"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  instead of a linear model.
  instead of a linear model.
@@ -1571,15 +1550,6 @@ status open
 NB
 NB
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "NB"
-description "negative binomial"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  distribution rather than modeling the normalized log counts using a normal
  distribution rather than modeling the normalized log counts using a normal
@@ -1795,15 +1765,6 @@ status open
 MACS
 MACS
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "MACS"
-description "Model-based Analysis of ChIP-seq"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  exploit this pattern to identify specific loci at which such 
  exploit this pattern to identify specific loci at which such 
@@ -1868,15 +1829,6 @@ status open
 SICER
 SICER
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "SICER"
-description "Spatial Clustering for Identification of ChIP-Enriched Regions"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  assume that peaks are represented in the 
  assume that peaks are represented in the 
@@ -1924,15 +1876,6 @@ status open
 ENCODE
 ENCODE
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "ENCODE"
-description "Encyclopedia Of DNA Elements"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  project has developed a method called 
  project has developed a method called 
@@ -1943,15 +1886,6 @@ status open
 IDR
 IDR
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "IDR"
-description "irreproducible discovery rate"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  for this purpose 
  for this purpose 
@@ -2100,15 +2034,6 @@ RMA
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "RMA"
-description "robust multichip average"
-literal "false"
-
-\end_inset
-
  
  
 \begin_inset CommandInset citation
 \begin_inset CommandInset citation
 LatexCommand cite
 LatexCommand cite
@@ -2195,15 +2120,6 @@ GRSN
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "GRSN"
-description "global rank-invariant set normalization"
-literal "false"
-
-\end_inset
-
 , and 
 , and 
 \begin_inset Flex Glossary Term
 \begin_inset Flex Glossary Term
 status open
 status open
@@ -2214,15 +2130,6 @@ SCAN
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "SCAN"
-description "Single-Channel Array Normalization"
-literal "false"
-
-\end_inset
-
  
  
 \begin_inset CommandInset citation
 \begin_inset CommandInset citation
 LatexCommand cite
 LatexCommand cite
@@ -2283,15 +2190,6 @@ CPM
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "CPM"
-description "counts per million"
-literal "false"
-
-\end_inset
-
 .
 .
  Furthermore, if the abundance of a single gene increases, then in order
  Furthermore, if the abundance of a single gene increases, then in order
  for its fraction of the total reads to increase, all other genes' fractions
  for its fraction of the total reads to increase, all other genes' fractions
@@ -2406,15 +2304,6 @@ status open
 logFC
 logFC
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "logFC"
-description "$\\log_2$ fold change"
-literal "true"
-
 \end_inset
 \end_inset
 
 
  is zero across all abundance levels.
  is zero across all abundance levels.
@@ -2496,15 +2385,6 @@ status open
 SVD
 SVD
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "SVD"
-description "singular value decomposition"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  on the matrix of linear model residuals (which contain all the un-modeled
  on the matrix of linear model residuals (which contain all the un-modeled
@@ -2520,15 +2400,6 @@ status open
 SVA
 SVA
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "SVA"
-description "surrogate variable analysis"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  starts with this approach, but takes some additional steps to identify
  starts with this approach, but takes some additional steps to identify
@@ -2819,15 +2690,6 @@ status open
 TSS
 TSS
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "TSS"
-description "transcription start site"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  is an important factor, as opposed to simple proximity.
  is an important factor, as opposed to simple proximity.
@@ -3193,15 +3055,6 @@ SRA
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "SRA"
-description "Sequence Read Archive"
-literal "false"
-
-\end_inset
-
  
  
 \begin_inset CommandInset citation
 \begin_inset CommandInset citation
 LatexCommand cite
 LatexCommand cite
@@ -3350,6 +3203,16 @@ After batch correction with ComBat
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status open
+
+\begin_layout Plain Layout
+PCoA plots of RNA-seq data showing effect of batch correction.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:RNA-PCA"
 name "fig:RNA-PCA"
@@ -3421,23 +3284,10 @@ wide false
 sideways false
 sideways false
 status collapsed
 status collapsed
 
 
-\begin_layout Plain Layout
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-Just take the top row
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 \align center
 \align center
 \begin_inset Graphics
 \begin_inset Graphics
-	filename graphics/CD4-csaw/RNA-seq/weights-vs-covars-CROP.png
+	filename graphics/CD4-csaw/RNA-seq/weights-vs-covars-nobcv-CROP.png
 	lyxscale 25
 	lyxscale 25
 	width 100col%
 	width 100col%
 	groupId colwidth-raster
 	groupId colwidth-raster
@@ -3453,6 +3303,16 @@ Just take the top row
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+RNA-seq sample weights, grouped by experimental and technical covariates.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:RNA-seq-weights-vs-covars"
 name "fig:RNA-seq-weights-vs-covars"
@@ -3523,15 +3383,6 @@ TMM
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "TMM"
-description "trimmed mean of M-values"
-literal "false"
-
-\end_inset
-
  
  
 \begin_inset CommandInset citation
 \begin_inset CommandInset citation
 LatexCommand cite
 LatexCommand cite
@@ -3548,15 +3399,6 @@ status open
 logCPM
 logCPM
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "logCPM"
-description "$\\log_2$ counts per million"
-literal "true"
-
 \end_inset
 \end_inset
 
 
  with quality weights using 
  with quality weights using 
@@ -3620,15 +3462,6 @@ status open
 BH
 BH
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "BH"
-description "Benjamini-Hochberg"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  procedure for 
  procedure for 
@@ -3784,6 +3617,16 @@ bp.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Strand cross-correlation plots for ChIP-seq data, before and after blacklisting.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:CCF-master"
 name "fig:CCF-master"
@@ -4435,6 +4278,17 @@ H3K27me3, SVs subtracted
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+PCoA plots of ChIP-seq sliding window data, before and after subtracting
+ surrogate variables (SVs).
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:PCoA-ChIP"
 name "fig:PCoA-ChIP"
@@ -4768,13 +4622,23 @@ Scatter plots of specific pairs of MOFA latent factors.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status open
+
+\begin_layout Plain Layout
+MOFA latent factors identify shared patterns of variation.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:MOFA-master"
 name "fig:MOFA-master"
 
 
 \end_inset
 \end_inset
 
 
-MOFA latent factors separate technical confounders from 
+MOFA latent factors identify shared patterns of variation.
 \end_layout
 \end_layout
 
 
 \end_inset
 \end_inset
@@ -4816,15 +4680,6 @@ status open
 MOFA
 MOFA
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "MOFA"
-description "Multi-Omics Factor Analysis"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  was run on all the 
  was run on all the 
@@ -4877,15 +4732,6 @@ status open
 LF
 LF
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "LF"
-description "latent factor"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  1, 4, and 5 were determined to explain the most variation consistently
  1, 4, and 5 were determined to explain the most variation consistently
@@ -5583,6 +5429,16 @@ status collapsed
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+PCoA plot of RNA-seq samples after ComBat batch correction.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:rna-pca-final"
 name "fig:rna-pca-final"
@@ -6112,9 +5968,19 @@ literal "false"
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 \begin_inset Caption Standard
 \begin_inset Caption Standard
 
 
-\begin_layout Plain Layout
+\begin_layout Plain Layout
+
+\series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Enrichment of peaks in promoter neighborhoods.
+\end_layout
+
+\end_inset
+
 
 
-\series bold
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:near-promoter-peak-enrich"
 name "fig:near-promoter-peak-enrich"
@@ -6429,6 +6295,16 @@ This figure is generated from the old analysis.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Expression distributions of genes with and without promoter peaks.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:fpkm-by-peak"
 name "fig:fpkm-by-peak"
@@ -6506,15 +6382,6 @@ status open
 FPKM
 FPKM
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "FPKM"
-description "fragments per kilobase per million fragments"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  values when a peak overlaps the promoter is about 
  values when a peak overlaps the promoter is about 
@@ -7061,15 +6928,6 @@ PCoA
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "PCoA"
-description "principal coordinate analysis"
-literal "false"
-
-\end_inset
-
 .
 .
  All 3 marks show a noticeable convergence between the naïve and memory
  All 3 marks show a noticeable convergence between the naïve and memory
  samples at day 14, visible as an overlapping of the day 14 groups on each
  samples at day 14, visible as an overlapping of the day 14 groups on each
@@ -7354,6 +7212,16 @@ RNA-seq PCoA showing principal coordinates 2 and 3.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+PCoA plots for promoter ChIP-seq and expression RNA-seq data
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:PCoA-promoters"
 name "fig:PCoA-promoters"
@@ -7592,6 +7460,17 @@ Gene expression grouped by promoter coverage clusters.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+K-means clustering of promoter H3K4me2 relative coverage depth in naïve
+ day 0 samples.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:H3K4me2-neighborhood"
 name "fig:H3K4me2-neighborhood"
@@ -7798,15 +7677,6 @@ status open
 PCA
 PCA
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "PCA"
-description "principal component analysis"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  plot based on the same relative bin abundance data, and colored based on
  plot based on the same relative bin abundance data, and colored based on
@@ -8203,6 +8073,17 @@ Gene expression grouped by promoter coverage clusters.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+K-means clustering of promoter H3K4me3 relative coverage depth in naïve
+ day 0 samples.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:H3K4me3-neighborhood"
 name "fig:H3K4me3-neighborhood"
@@ -8213,7 +8094,7 @@ K-means clustering of promoter H3K4me3 relative coverage depth in naïve
  day 0 samples.
  day 0 samples.
  
  
 \series default
 \series default
-H3K4me2 ChIP-seq reads were binned into 500-bp windows tiled across each
+H3K4me3 ChIP-seq reads were binned into 500-bp windows tiled across each
  promoter from 5
  promoter from 5
 \begin_inset space ~
 \begin_inset space ~
 \end_inset
 \end_inset
@@ -8507,6 +8388,17 @@ Repeated figure legends are kind of an issue here.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+K-means clustering of promoter H3K27me3 relative coverage depth in naïve
+ day 0 samples.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:H3K27me3-neighborhood"
 name "fig:H3K27me3-neighborhood"
@@ -9148,7 +9040,7 @@ LF
 \begin_inset Float figure
 \begin_inset Float figure
 wide false
 wide false
 sideways false
 sideways false
-status collapsed
+status open
 
 
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 \align center
 \align center
@@ -9169,6 +9061,21 @@ status collapsed
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Lamere 2016 Figure 8 “Model for the role of H3K4 methylation during CD4
+ T-cell activation.
+\begin_inset Quotes erd
+\end_inset
+
+
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:Lamere2016-Fig8"
 name "fig:Lamere2016-Fig8"
@@ -9862,15 +9769,6 @@ status open
 CpGi
 CpGi
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "CpGi"
-description "CpG island"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  in the promoter was correlated with increases or decreases in gene expression
  in the promoter was correlated with increases or decreases in gene expression
@@ -10465,15 +10363,6 @@ status open
 glsdisp*{TX}{healthy transplants (TX)}
 glsdisp*{TX}{healthy transplants (TX)}
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "TX"
-description "healthy transplant"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  from transplants undergoing 
  from transplants undergoing 
@@ -10484,15 +10373,6 @@ status open
 AR
 AR
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "AR"
-description "acute rejection"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  or 
  or 
@@ -10505,15 +10385,6 @@ ADNR
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "ADNR"
-description "acute dysfunction with no rejection"
-literal "false"
-
-\end_inset
-
 .
 .
  However, the the standard normalization algorithm used for microarray data,
  However, the the standard normalization algorithm used for microarray data,
  
  
@@ -10631,15 +10502,6 @@ glsdisp*{GEO}{the Gene Expression Omnibus (GEO)}
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "GEO"
-description "Gene Expression Omnibus"
-literal "false"
-
-\end_inset
-
 .
 .
  Each array's probe intensity distribution is normalized against these pre-gener
  Each array's probe intensity distribution is normalized against these pre-gener
 ated quantiles.
 ated quantiles.
@@ -11007,15 +10869,6 @@ status open
 ROC
 ROC
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "ROC"
-description "receiver operating characteristic"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  curves and 
  curves and 
@@ -11026,15 +10879,6 @@ status open
 AUC
 AUC
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "AUC"
-description "area under ROC curve"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  values were generated 
  values were generated 
@@ -11553,15 +11397,6 @@ CAN
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "CAN"
-description "chronic allograft nephropathy"
-literal "false"
-
-\end_inset
-
 .
 .
  The data consisted of 33 TX, 9 AR, 8 ADNR, and 28 CAN samples.
  The data consisted of 33 TX, 9 AR, 8 ADNR, and 28 CAN samples.
  The uneven group sizes are a result of taking the biopsy samples before
  The uneven group sizes are a result of taking the biopsy samples before
@@ -11576,15 +11411,6 @@ status open
 T1D
 T1D
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "T1D"
-description "Type 1 diabetes"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  or 
  or 
@@ -11597,15 +11423,6 @@ T2D
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "T2D"
-description "Type 2 diabetes"
-literal "false"
-
-\end_inset
-
 ).
 ).
  
  
 \end_layout
 \end_layout
@@ -11621,15 +11438,6 @@ SWAN
 
 
 \end_inset
 \end_inset
 
 
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "SWAN"
-description "subset-quantile within array normalization"
-literal "false"
-
-\end_inset
-
  
  
 \begin_inset CommandInset citation
 \begin_inset CommandInset citation
 LatexCommand cite
 LatexCommand cite
@@ -12172,6 +11980,18 @@ status open
 \begin_inset Caption Standard
 \begin_inset Caption Standard
 
 
 \begin_layout Plain Layout
 \begin_layout Plain Layout
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Classifier probabilities on validation samples when normalized with RMA
+ together vs.
+ separately.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:Classifier-probabilities-RMA"
 name "fig:Classifier-probabilities-RMA"
@@ -12377,6 +12197,16 @@ ROC curves for PAM on external validation data
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+ROC curves for PAM using different normalization strategies.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:ROC-PAM-main"
 name "fig:ROC-PAM-main"
@@ -13443,6 +13273,17 @@ Number of samples usable in fRMA probe weight learning as a function of
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Effect of batch size selection on number of batches and number of samples
+ included in fRMA probe weight learning.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:frmatools-batch-size"
 name "fig:frmatools-batch-size"
@@ -13645,6 +13486,16 @@ Violin plot of inter-normalization log ratios for blood samples.
 \begin_inset Caption Standard
 \begin_inset Caption Standard
 
 
 \begin_layout Plain Layout
 \begin_layout Plain Layout
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Violin plot of log ratios between normalizations for 20 biopsy samples.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:frma-violin"
 name "fig:frma-violin"
@@ -13950,6 +13801,16 @@ fRMA vs fRMA for blood samples.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Representative MA plots comparing RMA and custom fRMA normalizations.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:Representative-MA-plots"
 name "fig:Representative-MA-plots"
@@ -14314,7 +14175,16 @@ Mean-variance trend after voom modeling in analysis C.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
 Mean-variance trend modeling in methylation array data.
 Mean-variance trend modeling in methylation array data.
+\end_layout
+
+\end_inset
+
+ Mean-variance trend modeling in methylation array data.
  
  
 \series default
 \series default
 The estimated 
 The estimated 
@@ -14737,6 +14607,16 @@ Redo the sample weight boxplot with notches, and remove fill colors
 \begin_inset Caption Standard
 \begin_inset Caption Standard
 
 
 \begin_layout Plain Layout
 \begin_layout Plain Layout
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Box-and-whiskers plot of sample quality weights grouped by diabetes diagnosis.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:diabetes-sample-weights"
 name "fig:diabetes-sample-weights"
@@ -15760,6 +15640,16 @@ CAN vs.
 \begin_layout Plain Layout
 \begin_layout Plain Layout
 
 
 \series bold
 \series bold
+\begin_inset Argument 1
+status collapsed
+
+\begin_layout Plain Layout
+Probe p-value histograms for each contrast in each analysis.
+\end_layout
+
+\end_inset
+
+
 \begin_inset CommandInset label
 \begin_inset CommandInset label
 LatexCommand label
 LatexCommand label
 name "fig:meth-p-value-histograms"
 name "fig:meth-p-value-histograms"
@@ -16872,15 +16762,6 @@ status open
 GB
 GB
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "GB"
-description "globin blocking"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  protocol approximately doubles the yield of informative (non-globin) reads
  protocol approximately doubles the yield of informative (non-globin) reads
@@ -17026,15 +16907,6 @@ status open
 mRNA
 mRNA
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "mRNA"
-description "messenger RNA"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  are naturally present in mammalian peripheral blood samples (up to 70%
  are naturally present in mammalian peripheral blood samples (up to 70%
@@ -17372,15 +17244,6 @@ status open
 PCR
 PCR
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "PCR"
-description "polymerase chain reaction"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  tube.
  tube.
@@ -17516,15 +17379,6 @@ status open
 ncRNA
 ncRNA
 \end_layout
 \end_layout
 
 
-\end_inset
-
-
-\begin_inset CommandInset nomenclature
-LatexCommand nomenclature
-symbol "ncRNA"
-description "non-coding RNA"
-literal "false"
-
 \end_inset
 \end_inset
 
 
  gene, resulting in significant undercounting of globin reads.
  gene, resulting in significant undercounting of globin reads.
@@ -20634,11 +20488,15 @@ GB
  method in place, the way is now clear for this experiment to proceed.
  method in place, the way is now clear for this experiment to proceed.
 \end_layout
 \end_layout
 
 
-\begin_layout Chapter
+\begin_layout Standard
+\begin_inset Note Note
+status open
+
+\begin_layout Chapter*
 Future Directions
 Future Directions
 \end_layout
 \end_layout
 
 
-\begin_layout Standard
+\begin_layout Plain Layout
 \begin_inset Flex TODO Note (inline)
 \begin_inset Flex TODO Note (inline)
 status open
 status open
 
 
@@ -20650,6 +20508,11 @@ If there are any chapter-independent future directions, put them here.
 \end_inset
 \end_inset
 
 
 
 
+\end_layout
+
+\end_inset
+
+
 \end_layout
 \end_layout
 
 
 \begin_layout Chapter
 \begin_layout Chapter