Blame view
tools/lia_ltbox/lia_phon/src/aphon/compile_exep.c
3.65 KB
e6be5137b reinitialized pro... |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 |
/* -------------------------------------------------------- LIA_PHON : Un systeme complet de phonetisation de textes -------------------------------------------------------- Copyright (C) 2001 FREDERIC BECHET .................................................................. This file is part of LIA_PHON LIA_PHON is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA .................................................................. For any publication related to scientific work using LIA_PHON, the following reference paper must be mentioned in the bibliography: Bechet F., 2001, "LIA_PHON - Un systeme complet de phonetisation de textes", revue Traitement Automatique des Langues (T.A.L.) volume 42, numero 1/2001, edition Hermes .................................................................. Contact : FREDERIC BECHET - LIA - UNIVERSITE D'AVIGNON AGROPARC BP1228 84911 AVIGNON CEDEX 09 FRANCE frederic.bechet@lia.univ-avignon.fr .................................................................. */ /* Compile une liste d'exceptions au format suivant: - 1 mot par ligne - pour chaque mot: graphie phonetisation exemple: # ddyyaizz $ ddoollaarr Produit un fichier .sirlex compilable avec 'compile_lexique' et un fichier .zonpho contenant les phonetisations */ /* FRED */ #include <stdio.h> #include <stdlib.h> #include <string.h> #include <strings.h> /*................................................................*/ #define TailleLigne 10000 #define True 1 #define False 0 #define max(a,b) ((a)>(b)?(a):(b)) #define min(a,b) ((a)<(b)?(a):(b)) void ERREUR(char *ch1,char *ch2) { fprintf(stderr,"ERREUR : %s %s ",ch1,ch2); exit(0); } /*................................................................*/ int main(int argc, char **argv) { char ch[TailleLigne],*zone,*graf,*phon; int nb,indice,taille; FILE *file,*filegraf,*filephon; if (argc<2) { fprintf(stderr,"Syntaxe : %s <list exceptions phonetisees> ",argv[0]); exit(0); } sprintf(ch,"%s.sirlex",argv[1]); if (!(filegraf=fopen(ch,"wt"))) ERREUR("can't write in:",ch); sprintf(ch,"%s.zonpho",argv[1]); if (!(filephon=fopen(ch,"wb"))) ERREUR("can't write in:",ch); /* calcul de la taille max des phonetisations */ if (!(file=fopen(argv[1],"rt"))) ERREUR("can't open :",argv[1]); fseek(file,0,SEEK_END); zone=(char*)malloc(sizeof(char)*(int)(taille=ftell(file)/sizeof(char))); fseek(file,0,SEEK_SET); for(zone[0]='\0',indice=0,nb=0;fgets(ch,TailleLigne,file);nb++) { if ((nb+1)%100000==0) fprintf(stderr,"En cours : %d ",nb+1); graf=strtok(ch," \t "); phon=strtok(NULL," \t "); fprintf(filegraf,"%d\t%s ",indice,graf); strcpy(zone+indice,phon); zone[indice+strlen(phon)]='\0'; indice+=strlen(phon)+1; if (indice>=taille-10) ERREUR("pourquoi 'taille' est-t-il trop petit ??",""); } fwrite(zone,sizeof(char),indice,filephon); fclose(file); fclose(filegraf); fclose(filephon); exit(0); } |