homophones

find homophones in French
git clone https://a3nm.net/git/homophones/
Log | Files | Refs

sources.sh (591B)


      1 #!/bin/bash
      2 
      3 
      4 cat lexique-dicollecte-fr-v6.2.txt | sed '1,16d' | awk -F "\t" '{printf("%s\t%s\t%s\t%s\t%s\t%s\t%s\n", $2, $5, $3, substr($4, 1, 1), substr($4, length($4)-5, 3), substr($4, length($4)-1, 2), $18);}' > dicollecte
      5 
      6 cat dicollecte | ./fix_elision_dicollecte_1.sh| ./fix_elision_dicollecte_1.sh|
      7   ./fix_elision_dicollecte_1.sh| ./fix_elision_dicollecte_1.sh |
      8   ./fix_elision_dicollecte_1.sh > dicollecte_elision_schwa
      9 
     10 # homophones_* were generated by a first pass of dicollecte
     11 # and of cut -f 1-7 ~/git/lexique/lexique
     12 # through ./homophones.py without using TLF definitions
     13