% 2017_fntir_tm_applications.tex

%\documentclass[openany]{now} % creates the journal version
\documentclass{now}  % creates the book pdf version

% the now document class sets various dimensions, so be sure to *not* set
% or alter dimensions in your latex code.
% be sure to remove all manual formatting commands such as \newpage, \clearpage.
% hack

%\usepackage[UTF8]{ctex}
\usepackage{CJK}
\usepackage{mathtools}
\usepackage{comment}
\usepackage{makeidx}
\usepackage{bm}
\usepackage{mdwlist}
\usepackage[table]{xcolor}
\usepackage{algorithm}
\usepackage[noend]{algorithmic}
\usepackage{amsfonts}
\usepackage{xcolor}
\usepackage{multirow}
\usepackage{amssymb}
\usepackage{dsfont}
\usepackage{microtype}
\usepackage[all]{nowidow}

\usepackage{caption}
\usepackage{subcaption}

% a few definitions that are *not* needed in general:
% ---- Math notation ----------------------------------------------------------
% Upright labels use \text (amsmath, loaded through mathtools) rather than
% \mbox: \mbox always typesets at the surrounding text size, whereas \text
% follows the current math style and so shrinks inside sub/superscripts.

% Indicator: a double-struck 1 followed by the bracketed condition #1.
\newcommand{\ind}[1]{\mathds{1}\left[ #1 \right]}
% N and V carrying the two-part subscript "#1,#2".
% NOTE(review): the names suggest document/topic counts -- confirm in the chapters.
\newcommand{\dc}[2]{N_{#1,#2}}
\newcommand{\tc}[2]{V_{#1,#2}}
% Inline fraction #1/#2 whose slash stretches to the height of its operands.
\newcommand{\slfrac}[2]{\left.#1\middle/#2\right.}
% Underbrace below #2, labelled with the text #1.  \footnotesize is a size
% switch, not a one-argument command, so it is written as a declaration here.
\newcommand{\explain}[2]{\underbrace{#2}_{\mbox{\footnotesize #1}}}
% Vertical bar with a thin space on either side.
\newcommand{\g}{\, | \,}
% D_KL( #1 || #2 ).  The separator is a single \| delimiter under \middle, so
% it grows together with the enclosing \left( ... \right) pair.
\newcommand{\kl}[2]{D_{\text{\textsc{KL}}} \left( #1 \,\middle\|\, #2 \right)}
% "Dir(#1)" and "Discrete(#1)" with the name set upright.
\newcommand{\dir}[1]{\text{Dir}(#1)}
\newcommand{\disc}[1]{\text{Discrete}( #1)}
% Blackboard-bold R.
\newcommand{\R}{\mathbb{R}}
% Blackboard-bold E with subscript #1, applied to the bracketed #2.
\newcommand{\e}[2]{\mathbb{E}_{#1}\left[ #2 \right]}

% ---- Text abbreviations -----------------------------------------------------
% \abr sets an acronym in small caps; every use in this file passes
% lower-case letters.
\newcommand{\abr}[1]{\textsc{#1}}
\newcommand{\etc}{\emph{etc}}
\newcommand{\now}{\textsc{now}}
% Model names built on \abr (the redundant [0] argument counts are dropped).
\newcommand{\lda}{\abr{lda}}
\newcommand{\tlda}{t\abr{lda}}
\newcommand{\plsa}{p\abr{lsa}}
\newcommand{\plda}{p\abr{lda}}
\newcommand{\ptlda}{pt\abr{lda}}
% Variants that append a hyphen and the italic suffix #1 to the model name.
\newcommand{\tldat}[1]{t\abr{lda}-\textit{#1}}
\newcommand{\ptldat}[1]{pt\abr{lda}-\textit{#1}}

% Inline colour helpers: each typesets its argument in the named colour.
% \providecommand only defines a name that is still free, so an existing
% definition of \red, \green or \blue is left untouched.  The outer brace
% pair confines the colour switch; the inner pair around #1 is kept on
% purpose so the argument reaches the page exactly as it was written.
\providecommand{\red}[1]{%
  {\color{red}{#1}}%
}
\providecommand{\green}[1]{%
  {\color{green}{#1}}%
}
\providecommand{\blue}[1]{%
  {\color{blue}{#1}}%
}


% Author-comment switch.  \newif creates \ifcomment together with the setters
% \commenttrue and \commentfalse; change \commentfalse to \commenttrue on the
% next line to render the authors' in-line notes.
\newif\ifcomment\commentfalse
\ifcomment
  % Enabled: each note is a coloured box wrapping a paragraph box that is 80%
  % of the line width, prefixed with the author's initials.
  % NOTE(review): DM shares green with YH -- possibly a copy-paste leftover;
  % pick a distinct colour if the two should be told apart at a glance.
  \newcommand{\jbgcomment}[1]{  \colorbox{red}{   \parbox{.8\linewidth}{ JBG: #1}  }}
  \newcommand{\yhcomment}[1]{  \colorbox{green}{  \parbox{.8\linewidth}{ YH:  #1}  }}
  \newcommand{\dmcomment}[1]{  \colorbox{green}{  \parbox{.8\linewidth}{ DM:  #1}  }}
\else
  % Disabled: swallow the argument and expand to nothing.  The bodies are
  % deliberately empty -- a body of "{ }" would emit a space token that adds
  % to the spaces already surrounding the call and widens the gap in the text.
  \newcommand{\jbgcomment}[1]{}
  \newcommand{\yhcomment}[1]{}
  \newcommand{\dmcomment}[1]{}
\fi


% Title and author block, typeset by \maketitle further down.
\title{Applications of Topic Models}

% Three authors separated by \and; within each entry, \\ ends a line of the
% affiliation.  \abr (defined in the preamble above) sets the acronym in small
% caps, and the \footnote calls record where the work was carried out.
\author{
Jordan Boyd-Graber \\
Department of Computer Science, \abr{umiacs}, Language Science \\
University of Maryland\footnote{Work completed while at University of Colorado} \\
\texttt{jbg@umiacs.umd.edu}
\and
Yuening Hu \\
Google, Inc.\footnote{Work completed while at Yahoo!} \\
\texttt{ynhu@google.com}
\and
David Mimno \\
Information Science \\
Cornell University \\
\texttt{mimno@cornell.edu}
}

% Turn on collection of index entries; the index itself is printed by
% \printindex at the end of this file.
\makeindex
\begin{document}

% Publication metadata handed to the now class.  The commands are defined by
% the class, not in this file, so see the class documentation for exactly how
% each value is used.
% The tie in "J.~Boyd-Graber" must not be followed by a space: "~ " yields a
% double gap and re-allows the line break the tie is meant to forbid.
\copyrightowner{J.~Boyd-Graber, Y.~Hu and D.~Mimno}
\volume{11}
\issue{2-3}
\pubyear{2017}
\copyrightyear{2017}
\isbn{978-1-68083-308-9}
\doi{10.1561/1500000030}
\firstpage{143} % correct page number coming asap.
\lastpage{296}

\frontmatter  % title page, contents, catalog information

\maketitle

\tableofcontents

\mainmatter

\begin{abstract}
\setcounter{page}{1}
  How can a single person understand what's going on in a collection
  of millions of documents?  This is an increasingly common problem:
  sifting through an organization's e-mails, understanding a decade's
  worth of newspapers, or characterizing a scientific field's
  research.  Topic models are a statistical framework that helps users
  understand large document collections: not just to find individual
  documents but to understand the general themes
  present in the collection.

  This survey describes the recent academic and industrial
  applications of topic models with the goal of launching a young
  researcher capable of building their own applications of topic
  models.  In addition to topic models' effective application to
  traditional problems like information retrieval, visualization,
  statistical inference, multilingual modeling, and linguistic
  understanding, this survey also reviews topic models' ability to
  unlock large text collections for qualitative analysis.  We review
  their successful use by researchers to help understand fiction,
  non-fiction, scientific publications, and political texts.
\end{abstract}

% Chapters, pulled in from the chapters/ directory in the order they appear
% in the document.
\input{chapters/introduction}
\input{chapters/ir}
\input{chapters/viz}
\input{chapters/nonfiction}
\input{chapters/science}
\input{chapters/fiction}
\input{chapters/css}
\input{chapters/multi_ling}
\input{chapters/building}
\input{chapters/conclusion}

\backmatter  % references

% Bibliography: plainnat style, with entries drawn from three .bib files
% under bib/.
\bibliographystyle{plainnat}
\bibliography{bib/journal-full,bib/clean,bib/alison}

% NOTE(review): the template comment near the top of this file asks for manual
% \newpage/\clearpage commands to be removed -- confirm this one is still
% needed ahead of the index.
\clearpage

% Print the index; entries are collected because \makeindex is issued in the
% preamble.
\printindex

\end{document}