sources.sh (591B)
#!/bin/bash
#
# Build the intermediate lexicon tables from the Dicollecte lexicon dump.
#
# Reads (current directory):
#   lexique-dicollecte-fr-v6.2.txt   tab-separated lexicon dump
#   ./fix_elision_dicollecte_1.sh    stdin -> stdout filter
# Writes (current directory):
#   dicollecte                       seven-column extract of the dump
#   dicollecte_elision_schwa         extract after five filter passes

# Abort on the first failing command or pipeline stage, so that a missing
# input file or a broken filter cannot leave a silently truncated output.
set -euo pipefail

# Skip the first 16 lines of the dump, then emit seven tab-separated columns:
# fields 2, 5 and 3; the first character of field 4; the three characters
# starting six from the end of field 4; the last two characters of field 4;
# and field 18.
awk '
  BEGIN { FS = OFS = "\t" }
  NR > 16 {
    f4 = $4
    n = length(f4)
    print $2, $5, $3, substr(f4, 1, 1), substr(f4, n - 5, 3), substr(f4, n - 1, 2), $18
  }
' lexique-dicollecte-fr-v6.2.txt > dicollecte

# Run the elision filter five times in a row, each pass consuming the output
# of the previous one.
# NOTE(review): presumably a single pass does not fix every occurrence on a
# line, hence the repetition -- confirm against fix_elision_dicollecte_1.sh.
./fix_elision_dicollecte_1.sh < dicollecte \
  | ./fix_elision_dicollecte_1.sh \
  | ./fix_elision_dicollecte_1.sh \
  | ./fix_elision_dicollecte_1.sh \
  | ./fix_elision_dicollecte_1.sh \
  > dicollecte_elision_schwa

# The homophones_* files were generated by a first pass of `dicollecte`
# and of the output of `cut -f 1-7 ~/git/lexique/lexique`
# through ./homophones.py, without using TLF definitions.