Annotation of src/usr.bin/spell/spellprog.c, Revision 1.1
1.1 ! millert 1: /* $OpenBSD$ */
! 2:
! 3: /*
! 4: * Copyright (c) 1991, 1993
! 5: * The Regents of the University of California. All rights reserved.
! 6: *
! 7: * Redistribution and use in source and binary forms, with or without
! 8: * modification, are permitted provided that the following conditions
! 9: * are met:
! 10: * 1. Redistributions of source code must retain the above copyright
! 11: * notice, this list of conditions and the following disclaimer.
! 12: * 2. Redistributions in binary form must reproduce the above copyright
! 13: * notice, this list of conditions and the following disclaimer in the
! 14: * documentation and/or other materials provided with the distribution.
! 15: * 3. All advertising materials mentioning features or use of this software
! 16: * must display the following acknowledgement:
! 17: * This product includes software developed by the University of
! 18: * California, Berkeley and its contributors.
! 19: * 4. Neither the name of the University nor the names of its contributors
! 20: * may be used to endorse or promote products derived from this software
! 21: * without specific prior written permission.
! 22: *
! 23: * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
! 24: * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
! 25: * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
! 26: * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
! 27: * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
! 28: * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
! 29: * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
! 30: * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
! 31: * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
! 32: * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
! 33: * SUCH DAMAGE.
! 34: *
! 35: * @(#)spell.h 8.1 (Berkeley) 6/6/93
! 36: */
! 37: /*
! 38: * Copyright (C) Caldera International Inc. 2001-2002.
! 39: * All rights reserved.
! 40: *
! 41: * Redistribution and use in source and binary forms, with or without
! 42: * modification, are permitted provided that the following conditions
! 43: * are met:
! 44: * 1. Redistributions of source code and documentation must retain the above
! 45: * copyright notice, this list of conditions and the following disclaimer.
! 46: * 2. Redistributions in binary form must reproduce the above copyright
! 47: * notice, this list of conditions and the following disclaimer in the
! 48: * documentation and/or other materials provided with the distribution.
! 49: * 3. All advertising materials mentioning features or use of this software
! 50: * must display the following acknowledgement:
! 51: * This product includes software developed or owned by Caldera
! 52: * International, Inc.
! 53: * 4. Neither the name of Caldera International, Inc. nor the names of other
! 54: * contributors may be used to endorse or promote products derived from
! 55: * this software without specific prior written permission.
! 56: *
! 57: * USE OF THE SOFTWARE PROVIDED FOR UNDER THIS LICENSE BY CALDERA
! 58: * INTERNATIONAL, INC. AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR
! 59: * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
! 60: * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
! 61: * IN NO EVENT SHALL CALDERA INTERNATIONAL, INC. BE LIABLE FOR ANY DIRECT,
! 62: * INDIRECT INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
! 63: * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
! 64: * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
! 65: * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
! 66: * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
! 67: * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
! 68: * POSSIBILITY OF SUCH DAMAGE.
! 69: */
! 70:
! 71: #ifndef lint
! 72: static const char copyright[] =
! 73: "@(#) Copyright (c) 1991, 1993\n\
! 74: The Regents of the University of California. All rights reserved.\n";
! 75: #endif /* not lint */
! 76:
! 77: #ifndef lint
! 78: #if 0
! 79: static const char sccsid[] = "@(#)spell.c 8.1 (Berkeley) 6/6/93";
! 80: #else
! 81: #endif
! 82: static const char rcsid[] = "$OpenBSD$";
! 83: #endif /* not lint */
! 84:
! 85: #include <sys/param.h>
! 86: #include <sys/mman.h>
! 87: #include <sys/stat.h>
! 88:
! 89: #include <ctype.h>
! 90: #include <err.h>
! 91: #include <errno.h>
! 92: #include <fcntl.h>
! 93: #include <limits.h>
! 94: #include <locale.h>
! 95: #include <stdio.h>
! 96: #include <stdlib.h>
! 97: #include <string.h>
! 98: #include <unistd.h>
! 99:
! 100: #define DLEV 2
! 101:
! 102: int an(char *, char *, char *, int);
! 103: int bility(char *, char *, char *, int);
! 104: int es(char *, char *, char *, int);
! 105: int dict(char *, char *);
! 106: int i_to_y(char *, char *, char *, int);
! 107: int ily(char *, char *, char *, int);
! 108: int ize(char *, char *, char *, int);
! 109: int metry(char *, char *, char *, int);
! 110: int monosyl(char *, char *);
! 111: int ncy(char *, char *, char *, int);
! 112: int nop(void);
! 113: int trypref(char *, char *, int);
! 114: int tryword(char *, char *, int);
! 115: int s(char *, char *, char *, int);
! 116: int strip(char *, char *, char *, int);
! 117: int suffix(char *, int);
! 118: int tion(char *, char *, char *, int);
! 119: int vowel(int);
! 120: int y_to_e(char *, char *, char *, int);
! 121: int CCe(char *, char *, char *, int);
! 122: int VCe(char *, char *, char *, int);
! 123: char *lookuppref(char **, char *);
! 124: char *skipv(char *);
! 125: void ise(void);
! 126: void print_word(FILE *);
! 127: void ztos(char *);
! 128: __dead void usage(void);
! 129:
! 130: /* from look.c */
! 131: int look(unsigned char *, unsigned char *, unsigned char *);
! 132:
! 133: struct suftab {
! 134: char *suf; /* XXX - needs to be writable for ise() */
! 135: int (*p1)(); /* XXX - variable args */
! 136: int n1;
! 137: char *d1;
! 138: char *a1;
! 139: int (*p2)(); /* XXX - variable args */
! 140: int n2;
! 141: char *d2;
! 142: char *a2;
! 143: } suftab[] = {
! 144: {"ssen", ily, 4, "-y+iness", "+ness" },
! 145: {"ssel", ily, 4, "-y+i+less", "+less" },
! 146: {"se", s, 1, "", "+s", es, 2, "-y+ies", "+es" },
! 147: {"s'", s, 2, "", "+'s"},
! 148: {"s", s, 1, "", "+s"},
! 149: {"ecn", ncy, 1, "", "-t+ce"},
! 150: {"ycn", ncy, 1, "", "-cy+t"},
! 151: {"ytilb", nop, 0, "", ""},
! 152: {"ytilib", bility, 5, "-le+ility", ""},
! 153: {"elbaif", i_to_y, 4, "-y+iable", ""},
! 154: {"elba", CCe, 4, "-e+able", "+able"},
! 155: {"yti", CCe, 3, "-e+ity", "+ity"},
! 156: {"ylb", y_to_e, 1, "-e+y", ""},
! 157: {"yl", ily, 2, "-y+ily", "+ly"},
! 158: {"laci", strip, 2, "", "+al"},
! 159: {"latnem", strip, 2, "", "+al"},
! 160: {"lanoi", strip, 2, "", "+al"},
! 161: {"tnem", strip, 4, "", "+ment"},
! 162: {"gni", CCe, 3, "-e+ing", "+ing"},
! 163: {"reta", nop, 0, "", ""},
! 164: {"re", strip, 1, "", "+r", i_to_y, 2, "-y+ier", "+er"},
! 165: {"de", strip, 1, "", "+d", i_to_y, 2, "-y+ied", "+ed"},
! 166: {"citsi", strip, 2, "", "+ic"},
! 167: {"cihparg", i_to_y, 1, "-y+ic", ""},
! 168: {"tse", strip, 2, "", "+st", i_to_y, 3, "-y+iest", "+est"},
! 169: {"cirtem", i_to_y, 1, "-y+ic", ""},
! 170: {"yrtem", metry, 0, "-ry+er", ""},
! 171: {"cigol", i_to_y, 1, "-y+ic", ""},
! 172: {"tsigol", i_to_y, 2, "-y+ist", ""},
! 173: {"tsi", VCe, 3, "-e+ist", "+ist"},
! 174: {"msi", VCe, 3, "-e+ism", "+ist"},
! 175: {"noitacif", i_to_y, 6, "-y+ication", ""},
! 176: {"noitazi", ize, 5, "-e+ation", ""},
! 177: {"rota", tion, 2, "-e+or", ""},
! 178: {"noit", tion, 3, "-e+ion", "+ion"},
! 179: {"naino", an, 3, "", "+ian"},
! 180: {"na", an, 1, "", "+n"},
! 181: {"evit", tion, 3, "-e+ive", "+ive"},
! 182: {"ezi", CCe, 3, "-e+ize", "+ize"},
! 183: {"pihs", strip, 4, "", "+ship"},
! 184: {"dooh", ily, 4, "-y+hood", "+hood"},
! 185: {"ekil", strip, 4, "", "+like"},
! 186: { NULL }
! 187: };
! 188:
! 189: char *preftab[] = {
! 190: "anti",
! 191: "bio",
! 192: "dis",
! 193: "electro",
! 194: "en",
! 195: "fore",
! 196: "hyper",
! 197: "intra",
! 198: "inter",
! 199: "iso",
! 200: "kilo",
! 201: "magneto",
! 202: "meta",
! 203: "micro",
! 204: "milli",
! 205: "mis",
! 206: "mono",
! 207: "multi",
! 208: "non",
! 209: "out",
! 210: "over",
! 211: "photo",
! 212: "poly",
! 213: "pre",
! 214: "pseudo",
! 215: "re",
! 216: "semi",
! 217: "stereo",
! 218: "sub",
! 219: "super",
! 220: "thermo",
! 221: "ultra",
! 222: "under", /* must precede un */
! 223: "un",
! 224: NULL
! 225: };
! 226:
! 227: struct wlist {
! 228: int fd;
! 229: unsigned char *front;
! 230: unsigned char *back;
! 231: } *wlists;
! 232:
! 233: int vflag;
! 234: int xflag;
! 235: char word[LINE_MAX];
! 236: char original[LINE_MAX];
! 237: char *deriv[40];
! 238: char affix[40];
! 239:
! 240: /*
! 241: * The spellprog utility accepts a newline-delimited list of words
! 242: * on stdin. For arguments it expects the path to a word list and
! 243: * the path to a file in which to store found words.
! 244: *
! 245: * In normal usage, spell is called twice. The first time it is
! 246: * called with a stop list to flag commonly mispelled words. The
! 247: * remaining words are then passed to spell again, this time with
! 248: * the dictionary file as the first (non-flag) argument.
! 249: *
! 250: * Unlike historic versions of spellprog, this one does not use
! 251: * hashed files. Instead it simply requires that files be sorted
! 252: * lexigraphically and uses the same algorithm as the look utility.
! 253: *
! 254: * Note that spellprog should be called via the spell shell script
! 255: * and is not meant to be invoked directly by the user.
! 256: */
! 257:
! 258: int
! 259: main(int argc, char **argv)
! 260: {
! 261: char *ep, *cp, *dp;
! 262: char *outfile;
! 263: int ch, fold, i;
! 264: struct stat sb;
! 265: FILE *file, *found;
! 266:
! 267: setlocale(LC_ALL, "");
! 268:
! 269: outfile = NULL;
! 270: while ((ch = getopt(argc, argv, "bvxo:")) != -1) {
! 271: switch (ch) {
! 272: case 'b':
! 273: /* Use British dictionary and convert ize -> ise. */
! 274: ise();
! 275: break;
! 276: case 'o':
! 277: outfile = optarg;
! 278: break;
! 279: case 'v':
! 280: /* Also write derivations to "found" file. */
! 281: vflag++;
! 282: break;
! 283: case 'x':
! 284: /* Print plausible stems to stdout. */
! 285: xflag++;
! 286: break;
! 287: default:
! 288: usage();
! 289: }
! 290:
! 291: }
! 292: argc -= optind;
! 293: argv += optind;
! 294: if (argc < 1)
! 295: usage();
! 296:
! 297: /* Open and mmap the word/stop lists. */
! 298: if ((wlists = malloc(sizeof(struct wlist) * (argc + 1))) == NULL)
! 299: err(1, "malloc");
! 300: for (i = 0; argc--; i++) {
! 301: wlists[i].fd = open(argv[i], O_RDONLY, 0);
! 302: if (wlists[i].fd == -1 || fstat(wlists[i].fd, &sb) != 0)
! 303: err(1, "%s", argv[i]);
! 304: if (sb.st_size > SIZE_T_MAX)
! 305: errx(1, "%s: %s", argv[i], strerror(EFBIG));
! 306: wlists[i].front = mmap(NULL, (size_t)sb.st_size, PROT_READ,
! 307: MAP_PRIVATE, wlists[i].fd, (off_t)0);
! 308: if (wlists[i].front == MAP_FAILED)
! 309: err(1, "%s", argv[i]);
! 310: wlists[i].back = wlists[i].front + sb.st_size;
! 311: }
! 312: wlists[i].fd = -1;
! 313:
! 314: /* Open file where found words are to be saved. */
! 315: if (outfile == NULL)
! 316: found = NULL;
! 317: else if ((found = fopen(outfile, "w")) == NULL)
! 318: err(1, "cannot open %s", outfile);
! 319:
! 320: /* XXX - this fprintf is for loop abuse */
! 321: for (;; print_word(file)) {
! 322: affix[0] = '\0';
! 323: file = found;
! 324: for (ep = word; (*ep = ch = getchar()) != '\n'; ep++) {
! 325: if (ep - word == sizeof(word) - 1) {
! 326: *ep = '\0';
! 327: warnx("word too long (%s)", word);
! 328: while ((ch = getchar()) != '\n')
! 329: ; /* slurp until EOL */
! 330: }
! 331: if (ch == EOF) {
! 332: if (found != NULL)
! 333: fclose(found);
! 334: exit(0);
! 335: }
! 336: }
! 337: for (cp = word, dp = original; cp < ep; )
! 338: *dp++ = *cp++;
! 339: *dp = '\0';
! 340: fold = 0;
! 341: for (cp = word; cp < ep; cp++)
! 342: if (islower(*cp))
! 343: goto lcase;
! 344: if (trypref(ep, ".", 0))
! 345: continue;
! 346: ++fold;
! 347: for (cp = original + 1, dp = word + 1; dp < ep; dp++, cp++)
! 348: *dp = tolower(*cp);
! 349: lcase:
! 350: if (trypref(ep, ".", 0) || suffix(ep, 0))
! 351: continue;
! 352: if (isupper(word[0])) {
! 353: for (cp = original, dp = word; (*dp = *cp++); dp++) {
! 354: if (fold)
! 355: *dp = tolower(*dp);
! 356: }
! 357: word[0] = tolower(word[0]);
! 358: goto lcase;
! 359: }
! 360: file = stdout;
! 361: }
! 362:
! 363: exit(0);
! 364: }
! 365:
! 366: void
! 367: print_word(FILE *f)
! 368: {
! 369:
! 370: if (f != NULL) {
! 371: if (vflag && affix[0] != '\0' && affix[0] != '.')
! 372: fprintf(f, "%s\t%s\n", affix, original);
! 373: else
! 374: fprintf(f, "%s\n", original);
! 375: }
! 376: }
! 377:
! 378: /*
! 379: * For each matching suffix in suftab, call the function associated
! 380: * with that suffix (p1 and p2).
! 381: */
! 382: int
! 383: suffix(char *ep, int lev)
! 384: {
! 385: struct suftab *t;
! 386: char *cp, *sp;
! 387:
! 388: lev += DLEV;
! 389: deriv[lev] = deriv[lev-1] = 0;
! 390: for (t = suftab; (sp = t->suf); t++) {
! 391: cp = ep;
! 392: while (*sp) {
! 393: if (*--cp != *sp++)
! 394: goto next;
! 395: }
! 396: for (sp = cp; --sp >= word && !vowel(*sp);)
! 397: ; /* nothing */
! 398: if (sp < word)
! 399: return(0);
! 400: if ((*t->p1)(ep-t->n1, t->d1, t->a1, lev+1))
! 401: return(1);
! 402: if (t->p2 != NULL) {
! 403: deriv[lev] = deriv[lev+1] = '\0';
! 404: return((*t->p2)(ep-t->n2, t->d2, t->a2, lev));
! 405: }
! 406: return(0);
! 407: next: ;
! 408: }
! 409: return(0);
! 410: }
! 411:
! 412: int
! 413: nop(void)
! 414: {
! 415:
! 416: return(0);
! 417: }
! 418:
! 419: int
! 420: strip(char *ep, char *d, char *a, int lev)
! 421: {
! 422:
! 423: return(trypref(ep, a, lev) || suffix(ep, lev));
! 424: }
! 425:
! 426: int
! 427: s(char *ep, char *d, char *a, int lev)
! 428: {
! 429:
! 430: if (lev > DLEV + 1)
! 431: return(0);
! 432: if (*ep == 's' && ep[-1] == 's')
! 433: return(0);
! 434: return(strip(ep, d, a, lev));
! 435: }
! 436:
! 437: int
! 438: an(char *ep, char *d, char *a, int lev)
! 439: {
! 440:
! 441: if (!isupper(*word)) /* must be proper name */
! 442: return(0);
! 443: return(trypref(ep,a,lev));
! 444: }
! 445:
! 446: int
! 447: ize(char *ep, char *d, char *a, int lev)
! 448: {
! 449:
! 450: *ep++ = 'e';
! 451: return(strip(ep ,"", d, lev));
! 452: }
! 453:
! 454: int
! 455: y_to_e(char *ep, char *d, char *a, int lev)
! 456: {
! 457: char c = *ep;
! 458:
! 459: *ep++ = 'e';
! 460: if (strip(ep, "", d, lev))
! 461: return (1);
! 462: ep[-1] = c;
! 463: return (0);
! 464: }
! 465:
! 466: int
! 467: ily(char *ep, char *d, char *a, int lev)
! 468: {
! 469:
! 470: if (ep[-1] == 'i')
! 471: return(i_to_y(ep, d, a, lev));
! 472: else
! 473: return(strip(ep, d, a, lev));
! 474: }
! 475:
! 476: int
! 477: ncy(char *ep, char *d, char *a, int lev)
! 478: {
! 479:
! 480: if (skipv(skipv(ep-1)) < word)
! 481: return(0);
! 482: ep[-1] = 't';
! 483: return(strip(ep, d, a, lev));
! 484: }
! 485:
! 486: int
! 487: bility(char *ep, char *d, char *a, int lev)
! 488: {
! 489:
! 490: *ep++ = 'l';
! 491: return(y_to_e(ep, d, a, lev));
! 492: }
! 493:
! 494: int
! 495: i_to_y(char *ep, char *d, char *a, int lev)
! 496: {
! 497:
! 498: if (ep[-1] == 'i') {
! 499: ep[-1] = 'y';
! 500: a = d;
! 501: }
! 502: return(strip(ep, "", a, lev));
! 503: }
! 504:
! 505: int
! 506: es(char *ep, char *d, char *a, int lev)
! 507: {
! 508:
! 509: if (lev > DLEV)
! 510: return(0);
! 511:
! 512: switch (ep[-1]) {
! 513: default:
! 514: return(0);
! 515: case 'i':
! 516: return(i_to_y(ep, d, a, lev));
! 517: case 's':
! 518: case 'h':
! 519: case 'z':
! 520: case 'x':
! 521: return(strip(ep, d, a, lev));
! 522: }
! 523: }
! 524:
! 525: int
! 526: metry(char *ep, char *d, char *a, int lev)
! 527: {
! 528:
! 529: ep[-2] = 'e';
! 530: ep[-1] = 'r';
! 531: return(strip(ep, d, a, lev));
! 532: }
! 533:
! 534: int
! 535: tion(char *ep, char *d, char *a, int lev)
! 536: {
! 537:
! 538: switch (ep[-2]) {
! 539: case 'c':
! 540: case 'r':
! 541: return(trypref(ep, a, lev));
! 542: case 'a':
! 543: return(y_to_e(ep, d, a, lev));
! 544: }
! 545: return(0);
! 546: }
! 547:
! 548: /*
! 549: * Possible consonant-consonant-e ending.
! 550: */
! 551: int
! 552: CCe(char *ep, char *d, char *a, int lev)
! 553: {
! 554:
! 555: switch (ep[-1]) {
! 556: case 'l':
! 557: if (vowel(ep[-2]))
! 558: break;
! 559: switch (ep[-2]) {
! 560: case 'l':
! 561: case 'r':
! 562: case 'w':
! 563: break;
! 564: default:
! 565: return(y_to_e(ep, d, a, lev));
! 566: }
! 567: break;
! 568: case 's':
! 569: if (ep[-2] == 's')
! 570: break;
! 571: case 'c':
! 572: case 'g':
! 573: if (*ep == 'a')
! 574: return(0);
! 575: case 'v':
! 576: case 'z':
! 577: if (vowel(ep[-2]))
! 578: break;
! 579: case 'u':
! 580: if (y_to_e(ep, d, a, lev))
! 581: return(1);
! 582: if (!(ep[-2] == 'n' && ep[-1] == 'g'))
! 583: return(0);
! 584: }
! 585: return(VCe(ep, d, a, lev));
! 586: }
! 587:
! 588: /*
! 589: * Possible consonant-vowel-consonant-e ending.
! 590: */
! 591: int
! 592: VCe(char *ep, char *d, char *a, int lev)
! 593: {
! 594: char c;
! 595:
! 596: c = ep[-1];
! 597: if (c == 'e')
! 598: return(0);
! 599: if (!vowel(c) && vowel(ep[-2])) {
! 600: c = *ep;
! 601: *ep++ = 'e';
! 602: if (trypref(ep, d, lev) || suffix(ep, lev))
! 603: return(1);
! 604: ep--;
! 605: *ep = c;
! 606: }
! 607: return(strip(ep, d, a, lev));
! 608: }
! 609:
! 610: char *
! 611: lookuppref(char **wp, char *ep)
! 612: {
! 613: char **sp;
! 614: char *bp,*cp;
! 615:
! 616: for (sp = preftab; *sp; sp++) {
! 617: bp = *wp;
! 618: for (cp = *sp; *cp; cp++, bp++) {
! 619: if (tolower(*bp) != *cp)
! 620: goto next;
! 621: }
! 622: for (cp = bp; cp < ep; cp++) {
! 623: if (vowel(*cp)) {
! 624: *wp = bp;
! 625: return(*sp);
! 626: }
! 627: }
! 628: next: ;
! 629: }
! 630: return(0);
! 631: }
! 632:
! 633: /*
! 634: * If the word is not in the dictionary, try stripping off prefixes
! 635: * until the word is found or we run out of prefixes to check.
! 636: */
! 637: int
! 638: trypref(char *ep, char *a, int lev)
! 639: {
! 640: char *cp;
! 641: char *bp;
! 642: char *pp;
! 643: int val = 0;
! 644: char space[20];
! 645:
! 646: deriv[lev] = a;
! 647: if (tryword(word, ep, lev))
! 648: return(1);
! 649: bp = word;
! 650: pp = space;
! 651: deriv[lev+1] = pp;
! 652: while ((cp = lookuppref(&bp, ep))) {
! 653: *pp++ = '+';
! 654: while ((*pp = *cp++))
! 655: pp++;
! 656: if (tryword(bp, ep, lev+1)) {
! 657: val = 1;
! 658: break;
! 659: }
! 660: if (pp - space >= sizeof(space))
! 661: return(0);
! 662: }
! 663: deriv[lev+1] = deriv[lev+2] = '\0';
! 664: return(val);
! 665: }
! 666:
! 667: int
! 668: tryword(char *bp, char *ep, int lev)
! 669: {
! 670: int i, j;
! 671: char duple[3];
! 672:
! 673: if (ep-bp <= 1)
! 674: return(0);
! 675: if (vowel(*ep) && monosyl(bp, ep))
! 676: return(0);
! 677:
! 678: i = dict(bp, ep);
! 679: if (i == 0 && vowel(*ep) && ep[-1] == ep[-2] && monosyl(bp, ep-1)) {
! 680: ep--;
! 681: deriv[++lev] = duple;
! 682: duple[0] = '+';
! 683: duple[1] = *ep;
! 684: duple[2] = '\0';
! 685: i = dict(bp, ep);
! 686: }
! 687: if (vflag == 0 || i == 0)
! 688: return(i);
! 689:
! 690: /* Also tack on possible derivations. (XXX - warn on truncation?) */
! 691: for (j = lev; j > 0; j--) {
! 692: if (deriv[j])
! 693: strlcat(affix, deriv[j], sizeof(affix));
! 694: }
! 695: return(i);
! 696: }
! 697:
! 698: int
! 699: monosyl(char *bp, char *ep)
! 700: {
! 701:
! 702: if (ep < bp + 2)
! 703: return(0);
! 704: if (vowel(*--ep) || !vowel(*--ep) || ep[1] == 'x' || ep[1] == 'w')
! 705: return(0);
! 706: while (--ep >= bp)
! 707: if (vowel(*ep))
! 708: return(0);
! 709: return(1);
! 710: }
! 711:
! 712: char *
! 713: skipv(char *s)
! 714: {
! 715:
! 716: if (s >= word && vowel(*s))
! 717: s--;
! 718: while (s >= word && !vowel(*s))
! 719: s--;
! 720: return(s);
! 721: }
! 722:
! 723: int
! 724: vowel(int c)
! 725: {
! 726:
! 727: switch (tolower(c)) {
! 728: case 'a':
! 729: case 'e':
! 730: case 'i':
! 731: case 'o':
! 732: case 'u':
! 733: case 'y':
! 734: return(1);
! 735: }
! 736: return(0);
! 737: }
! 738:
! 739: /*
! 740: * Crummy way to Britishise.
! 741: */
! 742: void
! 743: ise(void)
! 744: {
! 745: struct suftab *p;
! 746:
! 747: for (p = suftab; p->suf; p++) {
! 748: ztos(p->suf);
! 749: ztos(p->d1);
! 750: ztos(p->a1);
! 751: }
! 752: }
! 753:
! 754: void
! 755: ztos(char *s)
! 756: {
! 757:
! 758: for (; *s; s++)
! 759: if (*s == 'z')
! 760: *s = 's';
! 761: }
! 762:
! 763: /*
! 764: * Look up a word in the dictionary.
! 765: * Returns 1 if found, 0 if not.
! 766: */
! 767: int
! 768: dict(char *bp, char *ep)
! 769: {
! 770: char c;
! 771: int i, rval;
! 772:
! 773: c = *ep;
! 774: *ep = '\0';
! 775: if (xflag)
! 776: printf("=%s\n", bp);
! 777: for (i = rval = 0; wlists[i].fd != -1; i++) {
! 778: if ((rval = look((unsigned char *)bp, wlists[i].front,
! 779: wlists[i].back)) == 1)
! 780: break;
! 781: }
! 782: *ep = c;
! 783: return(rval);
! 784: }
! 785:
! 786: __dead void
! 787: usage(void)
! 788: {
! 789: extern char *__progname;
! 790:
! 791: fprintf(stderr, "usage: %s [-bvx] [-o found-words] word-list ...\n",
! 792: __progname);
! 793: exit(1);
! 794: }