@article{Fazly2009,
   author = "Afsaneh Fazly and Paul Cook and Suzanne Stevenson",
   title = "Unsupervised type and token identification of idiomatic expressions",
   journal = "Computational Linguistics",
   year = "2009",
   volume = "35",
   number = "1",
   pages = "61--103",
   abstract = "Idiomatic expressions are plentiful in everyday language, yet they
               remain mysterious, as it is not clear exactly how people learn and
               understand them. They are of special interest to linguists,
               psycholinguists, and lexicographers, mainly because of their syntactic
               and semantic idiosyncrasies as well as their unclear lexical status.
               Despite a great deal of research on the properties of idioms in the
               linguistics literature, there is not much agreement on which
               properties are characteristic of these expressions. Because of their
               peculiarities, idiomatic expressions have mostly been overlooked by
               researchers in computational linguistics. In this article, we look
               into the usefulness of some of the identified linguistic properties of
               idioms for their automatic recognition. Specifically, we develop
               statistical measures that each model a specific property of idiomatic
               expressions by looking at their actual usage patterns in text. We use
               these statistical measures in a type-based classification task where
               we automatically separate idiomatic expressions (expressions with a
               possible idiomatic interpretation) from similar-on-the-surface literal
               phrases (for which no idiomatic interpretation is possible). In
               addition, we use some of the measures in a token identification task
               where we distinguish idiomatic and literal usages of potentially
               idiomatic expressions in context.",
   download = "http://www.mitpressjournals.org/doi/pdf/10.1162/coli.08-010-R1-07-048"
}



