#!/usr/bin/env bash
#
# Installs SyntaxNet and its build dependencies (JDK 8, Bazel, SWIG, pip
# packages), runs the Bazel test suite, and finally parses a sample sentence.
#
# Assumptions visible from the commands below:
#   - apt-get and a PPA are used, so an Ubuntu-style system is expected.
#   - apt-get and the write to /etc/apt are invoked without sudo, so the
#     script has to be run with root privileges.
#   - The PPA and Oracle JDK steps are marked "need to confirm": they may
#     prompt interactively.
set -euo pipefail

# --- install dev env --------------------------------------------------------
apt-get update
apt-get install build-essential vim -y

# --- install jdk8 -----------------------------------------------------------
apt-get install software-properties-common -y
# need to confirm
add-apt-repository ppa:webupd8team/java
apt-get update
# need to confirm
apt-get install oracle-java8-installer -y

# --- install bazel ----------------------------------------------------------
echo "deb http://storage.googleapis.com/bazel-apt stable jdk1.8" \
  | tee /etc/apt/sources.list.d/bazel.list
apt-get install curl -y
# -f: fail on HTTP errors instead of piping an error page into apt-key.
curl -fsSL https://storage.googleapis.com/bazel-apt/doc/apt-key.pub.gpg \
  | apt-key add -
# Kept as separate statements so that a failing update aborts under `set -e`
# (a failure on the left side of `&&` would not).
apt-get update
apt-get install bazel -y
apt-get upgrade bazel -y

# --- install swig -----------------------------------------------------------
apt-get install swig -y

# --- install pip ------------------------------------------------------------
# The apt package is python-dev; python-devel is the RPM name and does not
# exist in apt repositories.
apt-get install python-pip python-dev python-numpy -y

# --- install protobuf, asciitree, numpy -------------------------------------
# Informational only: show any protobuf already installed. grep exits 1 when
# nothing matches, which must not abort the script.
pip freeze | grep protobuf || true
pip install -U protobuf==3.0.0b2
pip install asciitree

# --- install SyntaxNet ------------------------------------------------------
apt-get install git -y
git clone --recursive https://github.com/tensorflow/models.git
cd models/syntaxnet/tensorflow || {
  echo "error: cannot cd to models/syntaxnet/tensorflow" >&2
  exit 1
}
apt-get install libcurl3-dev -y
# we should check whether python path is right
./configure
cd .. || {
  echo "error: cannot cd back to models/syntaxnet" >&2
  exit 1
}
# need big memory (>=16G)
bazel test syntaxnet/... util/utf8/...

# --- test parse tree --------------------------------------------------------
echo 'Bob brought the pizza to Alice.' | syntaxnet/demo.sh
参考 1 和参考 2 介绍了在 SyntaxNet 中使用定制的 Universal Dependencies 英文语料重新训练 POS tagger 和 parser 的方法，有兴趣的读者可以继续下载定制语料，做进一步的深入测试。
参考:
1. https://github.com/tensorflow/models/tree/master/syntaxnet
2. https://github.com/dsindex/syntaxnet —— 使用定制韩语语料进行的测试，其方法可供借鉴。