Skip to content

Commit

Permalink
Generate and analyse failed verb lemmas.
Browse files Browse the repository at this point in the history
  • Loading branch information
Trondtr committed Nov 20, 2023
1 parent 00fd5f7 commit 2f861ca
Showing 1 changed file with 31 additions and 21 deletions.
52 changes: 31 additions & 21 deletions test/src/morphology/generate-verb-lemmas.sh.in
Original file line number Diff line number Diff line change
Expand Up @@ -101,30 +101,40 @@ for f in $fsttype; do
$lookup_tool $generator_file.$suffix | \
cut -f2 | grep -v "V+" | grep -v "^$" | LC_ALL=C sort -u > $generated_lemmas.$f.txt

# Sorter, unifiser
LC_ALL=no_NO.UTF-8 sort -u -o $lemmas $lemmas
LC_ALL=no_NO.UTF-8 sort -u -o $generated_lemmas.$f.txt $generated_lemmas.$f.txt

# Sammenlikne: Former som er i lemmalista men ikke i lista med genererte former,
# lagre i missingverbLemmas.txt. Formene genereres med +V+Inf for enklere debugging.
LC_ALL=no_NO.UTF-8 comm -23 $lemmas $generated_lemmas.$f.txt |\
grep -v '^$' | sed 's/$/+V+Inf/' |\
$lookup_tool $generator_file.$suffix > $result_file.$f.txt

# Open the diff file in SubEthaEdit (if there is a diff):
if [ -s $result_file.$f.txt ]; then
# Only open the failed lemmas in see if @SEE@ is defined:
if [ "$EXTEDITOR" ]; then
$EXTEDITOR $result_file.$f.txt
###### Collect results, and generate debug info if FAIL: #######
# Sort and compare original input with resulting output - the diff is
# used to generate lemmas which are opened in SEE:
sort -u -o $generated_lemmas.$f.txt $generated_lemmas.$f.txt
comm -23 $lemmas $generated_lemmas.$f.txt > $result_file.$f.txt

# Open the diff file in SubEthaEdit (if there is a diff):
if [ -s $result_file.$f.txt ]; then
grep -v '^$' $result_file.$f.txt \
| sed 's/$/+V+Inf/' \
| $lookup_tool $generator_file.$suffix \
> $gen_result_file.$f.txt
# If we have an analyser, analyse the missing lemmas as well:
if test -e $analyser_file.$suffix ; then
grep -v '^$' $result_file.$f.txt \
| $lookup_tool $analyser_file.$suffix \
> $ana_result_file.$f.txt
fi
# Only open the failed lemmas in see if @SEE@ is defined:
if [ "$EXTEDITOR" ]; then
$EXTEDITOR $result_file.$f.txt
$EXTEDITOR $gen_result_file.$f.txt
$EXTEDITOR $ana_result_file.$f.txt
else
echo "There were problem lemmas. Details in:"
echo "* $result_file.$f.txt "
fi
Fail=1
echo "$f - FAIL"
continue
fi
echo "$f - PASS"
echo "* $gen_result_file.$f.txt"
echo "* $ana_result_file.$f.txt"
fi
Fail=1
echo "$f - FAIL"
continue
fi
echo "$f - PASS"
fi
done

Expand Down

0 comments on commit 2f861ca

Please sign in to comment.