@book{Marcu1,
  author = "Daniel Marcu",
  title = "The Theory and Practice of Discourse Parsing and Summarization",
  month = "November",
  year = "2000",
  isbn = "0-262-13372-5",
  publisher = "The MIT Press",
  note = "<A HREF=http://mitpress.mit.edu/book-home.tcl?isbn=0262133725>Order from publisher</A> ($39.95 plus shipping)",
  note = "<A HREF=http://www.amazon.com/exec/obidos/ASIN/0262133725/o/qid=974663607/sr=2-1/107-9153238-1898124>Order from Amazon</A> ($35.00 plus shipping)",
  abstract = "<P>
                 Until now, most discourse researchers have
                 assumed that full semantic understanding is
                 necessary to derive the discourse structure
                 of texts. This book documents the first
                 serious attempt to construct automatically
                 and use nonsemantic computational
                 structures for text summarization. Daniel
                 Marcu develops a semantics-free theoretical
                 framework that is both general enough to
                 be applicable to naturally occurring texts
                 and concise enough to facilitate an
                 algorithmic approach to discourse analysis.
                 He presents and evaluates two discourse
                 parsing methods: one uses manually written
                 rules that reflect common patterns of usage
                 of cue phrases such as ``however'' and ``in
                 addition to''; the other uses rules that are
                 learned automatically from a corpus of
                 discourse structures. By means of a
                 psycholinguistic experiment, Marcu
                 demonstrates how a discourse-based
                 summarizer identifies the most important
                 parts of texts at levels of performance that
                 are close to those of humans. </p>
                 <P>
                 Marcu also discusses how the automatic
                 derivation of discourse structures may be
                 used to improve the performance of current
                 natural language generation, machine
                 translation, summarization, question
                 answering, and information retrieval
                 systems. </p>"
}


