diff options
author | Patrick Simianer <p@simianer.de> | 2014-10-09 20:47:23 +0100 |
---|---|---|
committer | Patrick Simianer <p@simianer.de> | 2014-10-09 20:47:23 +0100 |
commit | e0b634754d1bef33dc8e72509c6990cccc32745a (patch) | |
tree | 95d77abef518a333830881dbbd661f14f94868c3 /stanford_parser_run | |
parent | 254c27ed4af938f0b9c4a21cb99b75f8cc1cd1b2 (diff) |
alles neu macht der mai
Diffstat (limited to 'stanford_parser_run')
-rwxr-xr-x | stanford_parser_run | 13 |
1 files changed, 13 insertions, 0 deletions
#!/bin/bash
#
# stanford_parser_run
#
# Runs the Stanford LexicalizedParser (englishPCFG model) on a text file and
# writes the post-processed parser output to "<text-file>.stp".
#
# Usage: stanford_parser_run text-file
#
# The parser is invoked with "-sentences newline -tokenized", so the input is
# presumably expected to be pre-tokenized with one sentence per line
# (NOTE(review): confirm against the Stanford Parser documentation).
#
# Post-processing done on the parser's stdout:
#   * every blank-line-separated group of lines is joined into one line,
#     with the former line breaks replaced by single spaces;
#   * trailing spaces are removed from each resulting line;
#   * every ", " is collapsed to ",".
#
# Exit status: 1 on wrong usage or unreadable input; otherwise the status of
# the parser/post-processing pipeline (non-zero if any stage failed).

# Fail on unset variables, and let a failing parser stage determine the
# pipeline's exit status instead of being masked by the final sed.
set -u -o pipefail

if (( $# != 1 )); then
  echo "$0 text-file" >&2
  exit 1
fi

# The leading ':' (an empty classpath entry) and the literal '*' (expanded by
# the JVM itself, not by the shell) are kept exactly as before.
export CLASSPATH=':/toolbox/stanfordparser_3_2_0/*'

IN=$1

# Bail out before starting a JVM with a 25000 MB heap on a missing input.
if [[ ! -r "$IN" ]]; then
  echo "$0: cannot read input file: $IN" >&2
  exit 1
fi

# Parser command line; the trailing "-" makes the parser read from stdin.
parser_cmd=(
  java -server -mx25000m
  edu.stanford.nlp.parser.lexparser.LexicalizedParser
  -nthreads 8
  -sentences newline
  -encoding utf-8
  -tokenized
  -outputFormat "typedDependencies"
  -outputFormatOptions "basicDependencies"
  edu/stanford/nlp/models/lexparser/englishPCFG.ser.gz
  -
)

# tr folds the whole output into a single tab-separated line; the first sed
# turns each double tab (a former blank line) back into a line break. It must
# stay a separate process so that the second sed sees the re-split lines and
# can strip trailing spaces from each of them.
"${parser_cmd[@]}" < "$IN" \
  | tr '\n' '\t' \
  | sed 's/\t\t/\n/g' \
  | sed -e 's/\t/ /g' -e 's/ *$//' -e 's/, /,/g' \
  > "${IN}.stp"