#!/bin/bash
#
# Encode the verticalized corpus file into CWB binary format and build the
# index files for it.
#
# Steps:
#   1. Create the CWB data directory.
#   2. Run cwb-encode on the .vrt input, writing the data files and the
#      registry entry.
#   3. Run cwb-make on the corpus (registry ID "CORPUS") with validation.
#
# Requires cwb-encode and cwb-make on PATH. All paths are fixed below.

# Abort on the first failing step so that cwb-make never runs against a
# missing or partially encoded corpus.
set -euo pipefail

readonly DATA_DIR=/corpora/data/corpus
readonly VRT_FILE=/root/files/corpus.vrt
readonly REGISTRY_FILE=/usr/local/share/cwb/registry/corpus

mkdir -p "${DATA_DIR}"

# cwb-encode arguments, kept in an array so each group can be commented.
encode_args=(
  -c utf8                 # character encoding of the input
  -d "${DATA_DIR}"        # output directory for the binary data files
  -f "${VRT_FILE}"        # verticalized input text
  -R "${REGISTRY_FILE}"   # registry file to create

  # Positional (token-level) attributes, in addition to the default word form.
  -P lemma -P simple_pos -P pos -P ner

  # Structural attributes: <text> with its metadata annotations, and <s>.
  -S text:0+address+author+booktitle+chapter+editor+institution+journal+pages+publisher+publishing_year+school+title
  -S s

  # Declare <corpus> as a null structural attribute (per the cwb-encode
  # documentation, such tags are accepted but not stored).
  -0 corpus

  # -x: XML-aware input, -s: skip blank lines, -B: strip surrounding blanks.
  -xsB
)
cwb-encode "${encode_args[@]}"

# Build the index/compressed files for the encoded corpus; -V validates them.
cwb-make -V CORPUS