#!/bin/sh
# History: 28 January 2020; 10 and 16 February 2020.
#
# Pipeline (all working files live in the current directory):
#   1. write a sed script to tmp01.txt;
#   2. run it over $FRIABASE/fria.htm, producing tmp02.txt;
#   3. feed tmp02.txt to ./friatoia on stdin
#      (presumably friatoia itself writes tmp03.txt and tmp04.txt, since
#      nothing else in this script creates them -- TODO confirm);
#   4. run SlashExpander over tmp03.txt -> LISTA-fr.txt and
#      tmp04.txt -> THESAURO-fr.txt;
#   5. merge both lists, sorted and de-duplicated, into TOTO-fr.txt.

# Stop at the first failing step (or unset variable) instead of building
# output files from incomplete intermediate data.
set -eu

FRIABASE=/home/rudhar/d/rudhar.com/lingtics/intrlnga/cgi-grep/fria

# Remove the temporary files on every exit path, not only after success.
trap 'rm -f -- tmp01.txt tmp02.txt tmp03.txt tmp04.txt' EXIT

if [ ! -r "$FRIABASE/fria.htm" ]; then
  printf '%s: cannot read %s\n' "$0" "$FRIABASE/fria.htm" >&2
  exit 1
fi

# Remove stress (accentuation) and pronunciation indications.
# Change "prép." (French) to the more general "prep.".
#
# The delimiter is quoted so the shell copies the sed rules verbatim.
#
# NOTE(review): the first rule, s@@@g, has an empty pattern. It looks as if
# the original pattern was lost (possibly an HTML-like tag that was stripped
# from this file). sed has no previous regex to reuse at that point and will
# most likely reject the script -- restore the pattern from an intact copy.
cat <<'EOF' > tmp01.txt
s@@@g
s@ ?\[[A-Z][a-z]*\]@@g
s@ \[A, Ned\]@@g
s@ ?\[sanskrito\]@@g
s@ ?\[ʒ[ea]?(ia)?\]@@g
s@ \[fedʒiar\]@@g
s@ ?\[ʒ…ʒ\]@@g
s@ ?\{ch…ch\}@@g
s@ ?\[gi\]@@g
s@ \[emaljar\]@@g
s@ \[emaljator\]@@g
s@ \[alja\]@@g
s@ \{[eèou]\}@@g
s@ \{ts\}@@g
s@ \{ch\}@@g
s@ \{ch[ao]\}@@g
s@ \{tch\}@@g
s@ \{plwa\}@@g
s@ \{chich\}@@g
s@ \{chak\}@@g
s@ \{dja\}@@g
s@ \{gre\}@@g
s@ \{vudu\}@@g
s@ \{iglu\}@@g
s@ \{buge\}@@g
s@ \{aa\}@@g
s@ \{ija\}@@g
s@ \{ana\}@@g
s@ \{rel\}@@g
s@ \{ke\}@@g
s@ \{chokes\}@@g
s@ \{mozambik\}@@g
s@prép\.@prep.@
EOF

# -E selects extended regular expressions (the rules use "?" and "(...)").
sed -E -f tmp01.txt "$FRIABASE/fria.htm" > tmp02.txt

./friatoia < tmp02.txt

SlashExpander < tmp03.txt > LISTA-fr.txt
SlashExpander < tmp04.txt > THESAURO-fr.txt

sort -u LISTA-fr.txt THESAURO-fr.txt > TOTO-fr.txt