commit f4498ba9a0dd2540b022274f7850fe011ea26bf6
parent 3cf403bced54b5710e9925ad2ed77160d5f7c877
Author: Antoine Amarilli <a3nm@a3nm.net>
Date: Sun, 11 Aug 2019 21:23:40 +0200
document normal test output
Diffstat:
3 files changed, 46 insertions(+), 2 deletions(-)
diff --git a/TODO b/TODO
@@ -4,7 +4,6 @@
less than the one indicated in lexique? ("paon" en 1 mais "chaos" en 2)
- Adjust the diaeresis uncertainty threshold to assert that all verses are
correct (change your opinion about the syllable with least confidence)
-- Document expected errors of test.sh and commit necessary files
- remove kludge for invalid characters, split them in specific chunks
- Improve performance with profiling
- Only indicate hemistiche status when there is a problem with hemistiches
@@ -18,6 +17,14 @@
- When reporting hemistiche errors, highlight possible hemistiche positions
where a hemistiche could have been placed
+=== Diérèses/synérèses ===
+
+- When training, take into consideration the contexts where we haven't been able
+ to infer the number of syllables, and only learn at each step from the
+ contexts where we are the most certain (including the unknown occurrences),
+ instead of having a hardcoded default threshold
+- Formally evaluate the performance of the approach without additions
+
=== Other approaches ===
- Learn rhyme and gender agnostically by clustering: prepare an undirected graph
diff --git a/test.sh b/test.sh
@@ -3,7 +3,8 @@
# about the hiatus error found in malherbe, see:
# http://books.google.de/books?id=qpQGAAAAQAAJ&pg=PA40&lpg=PA40&dq=Et+que+pour+retarder+une+heure+seulement+%22Pour+ne+mourir+jamais%22,+meure+%C3%A9ternellement&source=bl&ots=G8VEFnXkmB&sig=qzmHRiloQpIp6Ebb-9aJrYOoIM0&hl=en&sa=X&ei=3oL8T9WiJ6aB4gTK8pWPBw&redir_esc=y#v=onepage&q=Et%20que%20pour%20retarder%20une%20heure%20seulement%20%22Pour%20ne%20mourir%20jamais%22%2C%20meure%20%C3%A9ternellement&f=false
-echo "It is normal that some errors occur when running this script"
+echo "It is normal that some errors occur when running this script" >/dev/stderr
+echo "See test_expected_output.out for the usual errors that are output" >/dev/stderr
for a in test/*.tpl; do
echo "$a"
if [[ $a == *cyrano_full* ]]
diff --git a/test_expected_output.out b/test_expected_output.out
@@ -0,0 +1,36 @@
+test/albatros.tpl
+test/andromaque.tpl
+stdin:1724: > Andromaque m’attend. Phœnix, garde son fils.
+stdin:1724: Bad rhyme sound for type B (expected "i"/"iz", inferred "is"/"il"/"iss"/"ils"/"ilz"/"isz")
+test/au_lecteur.tpl
+test/boileau.tpl
+stdin:1021: > Entouré à demi d'un vieux parchemin noir,
+stdin:1021: > HHHH
+stdin:1021: Illegal hiatus (see 'H' above)
+stdin:3479: > Va revoir ses billets et compter son argent ;
+stdin:3479: Bad rhyme ending for type B (expected "-nd", inferred "-nt")
+stdin:3741: > Il est vrai. Mais pourtant sans loi et sans police,
+stdin:3741: > HHHH
+stdin:3741: Illegal hiatus (see 'H' above)
+stdin:4285: > Le vice audacieux des hommes avoué
+stdin:4285: Bad rhyme ending for type B (expected "-oé", inferred "-ué")
+stdin:4423: > Suivre à front découvert Zouzou et Messaline ;
+stdin:4423: > HHHH
+stdin:4423: Illegal hiatus (see 'H' above)
+stdin:5697: > Que de savants plaideurs désormais inutiles !
+stdin:5697: Bad rhyme sound for type A (expected "ijz"/"ijs"/"ij", inferred "il"/"ilz"/"ils")
+stdin:6052: > Wurts... Ah ! quel nom, grand roi, quel Hector que ce Wurts !
+stdin:6052: Bad rhyme sound for type B (expected "yR"/"yRz"/"yRs", inferred "9Rs"/"uRts"/"uRtz"/"9Rz"/"9R"/"uRt"/"uRs"/"uRz"/"uR")
+test/cyrano_full.tpl
+test/cyrano.tpl
+test/desdichado.tpl
+test/fils.tpl
+test/letters.tpl
+test/mithridate.tpl
+test/nez.tpl
+stdin:52: > De la moitié du commencement d'une, car
+stdin:52: Bad rhyme ending for type B (expected "-t", inferred "-ar")
+test/prudhomme.tpl
+stdin:342: > Peu à peu les forçant à croître avec mesure,
+stdin:342: > HHHHH
+stdin:342: Illegal hiatus (see 'H' above)