#!/bin/sh
#
# Tokenize and tag German text with the TreeTagger tool chain.
#
# Usage: this-script [file ...]
#   Every file operand is concatenated in the order given; with no operands
#   the text is read from standard input. The output of the final filter
#   stage is written to standard output.
#
# The exit status is that of the last pipeline stage ($FILTER); failures of
# earlier stages are not propagated (plain sh has no portable pipefail).

# Set these paths appropriately
BIN=/Applications/tree-tagger-MacOSX-3.1/bin
CMD=/Applications/tree-tagger-MacOSX-3.1/tagger-scripts/cmd
LIB=/Applications/tree-tagger-MacOSX-3.1/tagger-scripts/lib

TOKENIZER="${BIN}/separate-punctuation"
TAGGER="${BIN}/tree-tagger"
ABBR_LIST="${LIB}/german-abbreviations"
PARFILE="${LIB}/german.par"
FILTER="${CMD}/filter-german-tags"

# Concatenate the inputs into one stream. "$@" (rather than an unquoted $*)
# keeps each file name intact even when it contains spaces or glob characters.
cat "$@" |
# do tokenization (options are passed to the tokenizer unchanged)
"$TOKENIZER" +1 +s +l "$ABBR_LIST" |
# remove empty lines
grep -v '^$' |
# tagging
"$TAGGER" "$PARFILE" -token -lemma -sgml |
# error correction
"$FILTER"