summaryrefslogtreecommitdiff
path: root/stanford_parser_run
blob: f8d4210e27f0f2db7c55dec2488f9af73f4c2750 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
#!/bin/bash
#
# Run the Stanford LexicalizedParser (englishPCFG model) over a text file and
# write the typed-dependency output, reshaped to one line per blank-line-
# separated group of parser output, to "<text-file>.stp".
#
# Usage:   stanford_parser_run text-file
# Input:   text-file is passed to the parser on stdin with the options
#          "-sentences newline -tokenized -encoding utf-8", i.e. it is
#          presumably expected to hold one pre-tokenized UTF-8 sentence per
#          line -- confirm against the parser documentation.
# Output:  <text-file>.stp (overwritten if it already exists).
# Exit:    1 on wrong argument count or unreadable input; otherwise the status
#          of the pipeline (non-zero if any stage, including java, fails).

# Fail on unset variables and make a failing parser stage fail the script
# instead of being masked by the exit status of the final sed.
set -euo pipefail

if [[ $# -ne 1 ]]; then
	# Usage goes to stderr so it never ends up in redirected output.
	printf '%s text-file\n' "$0" >&2
	exit 1
fi

# The leading ':' keeps an empty (current-directory) classpath entry; the
# trailing '*' is a Java classpath wildcard expanded by the JVM, so it is
# quoted to make clear the shell must not touch it.
export CLASSPATH=':/toolbox/stanfordparser_3_2_0/*'

IN=$1

# Refuse to start the (25 GB heap) JVM and create an output file when the
# input cannot be read.
if [[ ! -f "$IN" || ! -r "$IN" ]]; then
	printf '%s: cannot read input file: %s\n' "$0" "$IN" >&2
	exit 1
fi

# Post-processing of the parser output:
#   1. tr:  join everything onto a single tab-separated line;
#   2. sed: turn each double tab (originally a blank line) back into a
#           newline, so every group of dependency lines shares one line.
#           This must run as its own sed process: the later per-line
#           substitutions rely on the line breaks created here;
#   3. sed: replace remaining tabs with spaces, strip trailing spaces and
#           drop the space following each comma.
# NOTE: '\t' and '\n' inside sed expressions are GNU sed extensions.
java -server -mx25000m \
	edu.stanford.nlp.parser.lexparser.LexicalizedParser \
	-nthreads 8 \
	-sentences newline \
	-encoding utf-8 \
	-tokenized \
	-outputFormat "typedDependencies" \
	-outputFormatOptions "basicDependencies" \
	edu/stanford/nlp/models/lexparser/englishPCFG.ser.gz \
	- < "$IN" \
	| tr '\n' '\t' \
	| sed 's/\t\t/\n/g' \
	| sed -e 's/\t/ /g' -e 's/ *$//' -e 's/, /,/g' \
	> "${IN}.stp"