From 13bbafc9b5fd1918959ad79a11d907165990faea Mon Sep 17 00:00:00 2001 From: Simon Zuberek Date: Mon, 3 Jun 2024 17:14:23 -0400 Subject: [PATCH] Normalizes the '%' sign Signed-off-by: Simon Zuberek --- Jenkinsfile | 2 +- .../text_normalization/it/data/measure/measurements.tsv | 3 ++- .../it/data_text_normalization/test_cases_measure.txt | 3 ++- .../nemo_text_processing/it/test_sparrowhawk_normalization.sh | 2 +- 4 files changed, 6 insertions(+), 4 deletions(-) diff --git a/Jenkinsfile b/Jenkinsfile index 6822ee055..da0815541 100644 --- a/Jenkinsfile +++ b/Jenkinsfile @@ -23,7 +23,7 @@ pipeline { VI_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/06-08-23-0' SV_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/06-08-23-0' ZH_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/04-30-24-0' - IT_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/10-26-23-0' + IT_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/06-03-24-0' HY_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/03-12-24-0' MR_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/03-12-24-1' DEFAULT_TN_CACHE='/home/jenkinsci/TestData/text_norm/ci/grammars/06-08-23-0' diff --git a/nemo_text_processing/text_normalization/it/data/measure/measurements.tsv b/nemo_text_processing/text_normalization/it/data/measure/measurements.tsv index 68b808dcd..bb359e6a0 100644 --- a/nemo_text_processing/text_normalization/it/data/measure/measurements.tsv +++ b/nemo_text_processing/text_normalization/it/data/measure/measurements.tsv @@ -60,4 +60,5 @@ l litro dl decilitro bar bar kcal chilocaloria -cal caloria \ No newline at end of file +cal caloria +% percento \ No newline at end of file diff --git a/tests/nemo_text_processing/it/data_text_normalization/test_cases_measure.txt b/tests/nemo_text_processing/it/data_text_normalization/test_cases_measure.txt index 6595ccd37..aa1e945d0 100644 --- a/tests/nemo_text_processing/it/data_text_normalization/test_cases_measure.txt +++ b/tests/nemo_text_processing/it/data_text_normalization/test_cases_measure.txt @@ -3,4 +3,5 @@ 4,3 l~quattro virgola tre litri 5 km/s~cinque chilometri per secondo 15 A~quindici ampere -155 d~cento cinquantacinque giorni \ No newline at end of file +155 d~cento cinquantacinque giorni +il 18% delle emissioni di carbonio~il diciotto percento delle emissioni di carbonio \ No newline at end of file diff --git a/tests/nemo_text_processing/it/test_sparrowhawk_normalization.sh b/tests/nemo_text_processing/it/test_sparrowhawk_normalization.sh index e43d90353..a49aa1d1d 100644 --- a/tests/nemo_text_processing/it/test_sparrowhawk_normalization.sh +++ b/tests/nemo_text_processing/it/test_sparrowhawk_normalization.sh @@ -1,7 +1,7 @@ #! /bin/sh PGRAMMARS_DIR=${1:-"/workspace/sparrowhawk/documentation/grammars"} -PROJECT_DIR=${2:-"/workspace/tests/en"} +PROJECT_DIR=${2:-"/workspace/tests/"} runtest () { input=$1