Skip to content

Commit

Permalink
Merge branch 'data' into data-UA
Browse files Browse the repository at this point in the history
  • Loading branch information
matyaskopp authored Sep 16, 2023
2 parents 5545d5f + ec9a10f commit b11cc46
Show file tree
Hide file tree
Showing 47 changed files with 1,872 additions and 115,214 deletions.
9 changes: 9 additions & 0 deletions .github/actions/ParlaMintValidate/validate.sh
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,11 @@ for parla in $(jq -r '.[]' <<< $1 ); do
# Delete old generated sample files (txt, tsv, conllu, vert) of this corpus.
echo "Cleaning old sample files [$parla]"
# The directory part is quoted so it is never word-split or globbed; the
# wildcard and the brace list stay outside the quotes so they still expand.
# `--` stops rm from treating a path that begins with '-' as an option.
rm -f -- "${DATADIR}/ParlaMint-$parla"/ParlaMint-*.{txt,tsv,conllu,vert}

# TMP: check whether the taxonomies of this corpus are translated.
echo "::warning:: TMP check whether are taxonomies translated"
# Every output line containing the whole word "error" (case-insensitive) is
# prefixed with ::error::; the output is printed and also saved to the log.
make "translateTaxonomies-$parla" \
  | sed "s/^\(.*\)\(\berror\b\)/::error::\1\2/i" \
  | tee "$DIR/taxonomies.log"
make "initTaxonomies4translation-$parla"
# Append (-a) here: a plain tee would truncate the log and throw away the
# translateTaxonomies output written just above.
make "validateTaxonomies-$parla" \
  | sed "s/^\(.*\)\(\berror\b\)/::error:: incomplete taxonomy translation \1\2/i" \
  | tee -a "$DIR/taxonomies.log"

if [ -f "${DATADIR}/ParlaMint-$parla/ParlaMint-$parla.xml" ] ; then

( Scripts/validate-parlamint.pl Schema ${DATADIR}/ParlaMint-$parla 2>&1 || echo "ERROR: validate-parlamint.pl exited with <> 0" ) \
Expand Down Expand Up @@ -55,6 +60,10 @@ for parla in $(jq -r '.[]' <<< $1 ); do
FAIL=1
echo "::error:: ParlaMint-$parla validation failed"
fi

# TMP: put the tracked taxonomy files back to their checked-out state.
echo "::warning:: TMP restore taxonomy"
# `--` tells git that everything after it is a path, so a taxonomy file name
# can never be mistaken for a branch or other ref.
git checkout -- Corpora/Taxonomies/ParlaMint-taxonomy*
# Quote the variable part of the path; leave the trailing wildcard unquoted.
git checkout -- "${DATADIR}/ParlaMint-$parla"/ParlaMint-taxonomy*
done

if [ $FAIL -eq 1 ] ; then
Expand Down
15 changes: 15 additions & 0 deletions Corpora/Taxonomies/ParlaMint-taxonomy-NER.ana.xml
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,9 @@
<term>Entidades Nombradas</term>
</desc>
<!--Corpus ParlaMint-EE is missing et translation of Named entities-->
<desc n="ParlaMint-FI" xml:lang="fi">
<term>nimetyt entiteetit</term>
</desc>
<!--Corpus ParlaMint-FR is missing fr translation of Named entities-->
<desc n="ParlaMint-ES-GA" xml:lang="gl">
<term>Entidades nomeadas</term>
Expand Down Expand Up @@ -87,6 +90,9 @@
<catDesc n="ParlaMint-EE" xml:lang="et">
<term>isik</term>
</catDesc>
<catDesc n="ParlaMint-FI" xml:lang="fi">
<term>henkilö</term>
</catDesc>
<catDesc n="ParlaMint-FR" xml:lang="fr">
<term>personne</term>
</catDesc>
Expand Down Expand Up @@ -158,6 +164,9 @@
<catDesc n="ParlaMint-EE" xml:lang="et">
<term>koht</term>
</catDesc>
<catDesc n="ParlaMint-FI" xml:lang="fi">
<term>paikka</term>
</catDesc>
<catDesc n="ParlaMint-FR" xml:lang="fr">
<term>lieu</term>
</catDesc>
Expand Down Expand Up @@ -229,6 +238,9 @@
<catDesc n="ParlaMint-EE" xml:lang="et">
<term>organisatsioon</term>
</catDesc>
<catDesc n="ParlaMint-FI" xml:lang="fi">
<term>organisaatio</term>
</catDesc>
<catDesc n="ParlaMint-FR" xml:lang="fr">
<term>organisation</term>
</catDesc>
Expand Down Expand Up @@ -300,6 +312,9 @@
<catDesc n="ParlaMint-EE" xml:lang="et">
<term>muu</term>
</catDesc>
<catDesc n="ParlaMint-FI" xml:lang="fi">
<term>Muu</term>
</catDesc>
<catDesc n="ParlaMint-FR" xml:lang="fr">
<term>divers</term>
</catDesc>
Expand Down
Loading

0 comments on commit b11cc46

Please sign in to comment.