mirror of
https://gitlab.ub.uni-bielefeld.de/sfb1288inf/cqpserver.git
synced 2024-12-26 11:24:19 +00:00
27 lines
750 B
Bash
27 lines
750 B
Bash
|
#!/bin/bash
#
# Command dispatcher around cqpserver and the CWB corpus encoding tools.
#
# Usage:
#   <script>            Start cqpserver using /root/cqpserver.init.
#   <script> prepare    Encode /root/files/corpus.vrt into the corpus "CORPUS".
#
# Any other first argument prints "Unknown command" on stderr and yields
# exit status 2. The exit status of the script is the status of the selected
# action.

#######################################
# Start the CQP server with its init file.
# Returns: exit status of cqpserver.
#######################################
serve() {
  cqpserver -I /root/cqpserver.init
}

#######################################
# Encode and index the corpus.
# Input:
#   - Source file: "/root/files/corpus.vrt"
# Output:
#   - Corpus name: "CORPUS"
#   - Corpus data directory: "/corpora/data/corpus"
#   - Corpus registry file: "/usr/local/share/cwb/registry/corpus"
# Returns: 0 on success, otherwise the status of the first failing step.
#######################################
prepare() {
  local -a encode_args=(
    -c utf8                                   # character encoding of the input
    -d /corpora/data/corpus                   # corpus data directory
    -f /root/files/corpus.vrt                 # verticalized source file
    -R /usr/local/share/cwb/registry/corpus   # registry file to create
    # Positional (per-token) attributes.
    -P lemma -P simple_pos -P pos -P ner
    # Structural attributes: <text> with its XML attributes, and <s>.
    -S text:0+address+author+booktitle+chapter+editor+institution+journal+pages+publisher+publishing_year+school+title -S s
    # Per cwb-encode usage: -0 declares a null s-attribute (tags discarded).
    -0 corpus
    # Per cwb-encode usage: XML-aware, skip empty lines, strip blanks.
    -xsB
  )

  # Stop at the first failing step: indexing a corpus that was not encoded
  # successfully would only hide the original error.
  mkdir -p /corpora/data/corpus || return
  cwb-encode "${encode_args[@]}" || return
  cwb-make -V CORPUS
}

#######################################
# Select the action from the command line.
# Arguments: $1 - optional command; only "prepare" is recognised.
# Returns:   status of the selected action, or 2 for an unknown command.
#######################################
main() {
  if [[ $# -eq 0 ]]; then
    serve
    return
  fi

  # Quoted selector: empty or whitespace-containing arguments are compared
  # as plain strings instead of breaking the test.
  case "$1" in
    prepare)
      prepare
      ;;
    *)
      printf '%s\n' "Unknown command" >&2
      return 2
      ;;
  esac
}

main "$@"
|