diff --git a/NOS/txt2corpus.sh b/NOS/txt2corpus.sh index e9e2983..7e58cb2 100755 --- a/NOS/txt2corpus.sh +++ b/NOS/txt2corpus.sh @@ -59,8 +59,8 @@ cd xml alto -o $corpus.data.dz *.xml 2> /dev/null # telling per bericht, niet per zin -/net/corpora/nlnieuws/namen.sh -x 9 -s $corpus.data.dz > $corpus.cat.txt -/net/corpora/nlnieuws/namen.sh -x 10 -s $corpus.data.dz > $corpus.tag.txt +/net/corpora/nlnieuws/namen.sh -x C -s $corpus.data.dz > $corpus.cat.txt +/net/corpora/nlnieuws/namen.sh -x T -s $corpus.data.dz > $corpus.tag.txt cd ../.. rm -fr out diff --git a/NU/txt2corpus.sh b/NU/txt2corpus.sh index 9c9e538..0e21291 100755 --- a/NU/txt2corpus.sh +++ b/NU/txt2corpus.sh @@ -57,7 +57,7 @@ cd xml alto -o $corpus.data.dz *.xml 2> /dev/null # telling per bericht, niet per zin -/net/corpora/nlnieuws/namen.sh -x 10 -s $corpus.data.dz > $corpus.tag.txt +/net/corpora/nlnieuws/namen.sh -x T -s $corpus.data.dz > $corpus.tag.txt cd ../.. rm -fr out diff --git a/NieuwsNL/txt2corpus.sh b/NieuwsNL/txt2corpus.sh index 99ce671..193c969 100755 --- a/NieuwsNL/txt2corpus.sh +++ b/NieuwsNL/txt2corpus.sh @@ -59,7 +59,7 @@ cd xml alto -o $corpus.data.dz *.xml 2> /dev/null # telling per bericht, niet per zin -/net/corpora/nlnieuws/namen.sh -x 10 -s $corpus.data.dz > $corpus.tag.txt +/net/corpora/nlnieuws/namen.sh -x T -s $corpus.data.dz > $corpus.tag.txt cd ../.. rm -fr out diff --git a/RO/txt2corpus.sh b/RO/txt2corpus.sh index cb4c91c..afb4331 100755 --- a/RO/txt2corpus.sh +++ b/RO/txt2corpus.sh @@ -59,7 +59,7 @@ cd xml alto -o $corpus.data.dz *.xml 2> /dev/null # telling per bericht, niet per zin -/net/corpora/nlnieuws/namen.sh -x 10 -s $corpus.data.dz > $corpus.tag.txt +/net/corpora/nlnieuws/namen.sh -x T -s $corpus.data.dz > $corpus.tag.txt cd ../.. rm -fr out diff --git a/Sargasso/txt2corpus.sh b/Sargasso/txt2corpus.sh index eb84a1f..5391ce4 100755 --- a/Sargasso/txt2corpus.sh +++ b/Sargasso/txt2corpus.sh @@ -59,7 +59,7 @@ cd xml alto -o $corpus.data.dz *.xml 2> /dev/null # telling per bericht, niet per zin -/net/corpora/nlnieuws/namen.sh -x 10 -s $corpus.data.dz > $corpus.tag.txt +/net/corpora/nlnieuws/namen.sh -x T -s $corpus.data.dz > $corpus.tag.txt cd ../.. rm -fr out diff --git a/Tzum/txt2corpus.sh b/Tzum/txt2corpus.sh index 0ae1fb6..1bd4d6d 100755 --- a/Tzum/txt2corpus.sh +++ b/Tzum/txt2corpus.sh @@ -59,7 +59,7 @@ cd xml alto -o $corpus.data.dz *.xml 2> /dev/null # telling per bericht, niet per zin -/net/corpora/nlnieuws/namen.sh -x 10 -s $corpus.data.dz > $corpus.tag.txt +/net/corpora/nlnieuws/namen.sh -x T -s $corpus.data.dz > $corpus.tag.txt cd ../.. rm -fr out diff --git a/VRT/txt2corpus.sh b/VRT/txt2corpus.sh index faefee6..1b55734 100755 --- a/VRT/txt2corpus.sh +++ b/VRT/txt2corpus.sh @@ -57,8 +57,8 @@ cd xml alto -o $corpus.data.dz *.xml 2> /dev/null # telling per bericht, niet per zin -/net/corpora/nlnieuws/namen.sh -x 9 -s $corpus.data.dz > $corpus.cat.txt -/net/corpora/nlnieuws/namen.sh -x 10 -s $corpus.data.dz > $corpus.tag.txt +/net/corpora/nlnieuws/namen.sh -x C -s $corpus.data.dz > $corpus.cat.txt +/net/corpora/nlnieuws/namen.sh -x T -s $corpus.data.dz > $corpus.tag.txt cd ../.. rm -fr out diff --git a/namen.sh b/namen.sh index 1eaf408..a238067 100755 --- a/namen.sh +++ b/namen.sh @@ -7,8 +7,8 @@ usage() { echo " gebruik: - $PROGNAME [opties] -x 1..8 -i - $PROGNAME [opties] -x 1..8 corpusfile(s) en/of corpusdirectory(s) + $PROGNAME [opties] -x 1..10 -i + $PROGNAME [opties] -x 1..10 corpusfile(s) en/of corpusdirectory(s) -x : query @@ -116,13 +116,13 @@ case $XN in TEMPLATE='tt:%w\t%P' XVALID=1 ;; - 9) + 9|C) # categorieën EXPR='fp://meta[@name="cat"]/@value' TEMPLATE='tt:%m' XVALID=1 ;; - 10) + 10|T) # tags EXPR='fp://meta[@name="tag"]/@value' TEMPLATE='tt:%m'