      AUTHOR = {Müller, Karin},
      TITLE = {Evaluating Syllabification: One Category Shared by Many Grammars},
      YEAR = {2002},
      BOOKTITLE = {Proceedings of the Workshop of the Third International Conference on Language Resources and Evaluation (LREC2002), May 29-31},
      EDITOR = {Setzer, Andrea and Gaizauskas, Robert},
      ADDRESS = {Las Palmas, Canary Islands, Spain},
      URL = {},
      ABSTRACT = {We apply a series of context-free grammars to syllabification by using a supervised training method. In our experiments, we investigate various phonological grammars, which strongly differ in structure. A simple evaluation metric word accuracy supports grammar development by denoting an increasing performance for grammars enriched with linguistic structure. This evaluation, judging one single category shared by all grammars, is in strong contrast to PARSEVAL, which is designed for a single grammar evaluating (almost) all categories. Using a toy treebank, we show that the PARSEVAL measures are hard to interpret, since the results are inconsistent with one another. It turns out that evaluating only a limited number of categories (here only one single category) is a harder evaluation measure than measuring the precision of all occurring substructures of a grammar.},
      ANNOTE = {COLIURL : Muller:2002:ESO.pdf}
