Added MySpell library to project

2006-03-11 16:21:45 +00:00 · 2006-03-11 16:21:45 +00:00 · dbac4566d8
commit dbac4566d8
parent 6455734f3d
19 changed files with 7251 additions and 0 deletions
--- a/goldlib/myspell/affentry.cxx
+++ b/goldlib/myspell/affentry.cxx
@ -0,0 +1,393 @@
+#include "license.readme"
+
+
+#include <cctype>
+#include <cstring>
+#include <cstdlib>
+#include <cstdio>
+
+#include "affentry.hxx"
+
+#if !defined(_MSC_VER)
+using namespace std;
+#endif
+
+extern char * mystrdup(const char * s);
+extern char *  myrevstrdup(const char * s);
+
+PfxEntry::PfxEntry(AffixMgr* pmgr, affentry* dp)
+{
+  // register affix manager
+  pmyMgr = pmgr;
+
+  // set up its intial values
+  achar = dp->achar;         // char flag 
+  strip = dp->strip;         // string to strip
+  appnd = dp->appnd;         // string to append
+  stripl = dp->stripl;       // length of strip string
+  appndl = dp->appndl;       // length of append string
+  numconds = dp->numconds;   // number of conditions to match
+  xpflg = dp->xpflg;         // cross product flag
+  // then copy over all of the conditions
+  memcpy(&conds[0],&dp->conds[0],SETSIZE*sizeof(conds[0]));
+  next = NULL;
+  nextne = NULL;
+  nexteq = NULL;
+}
+
+
+PfxEntry::~PfxEntry()
+{
+    achar = '\0';
+    if (appnd) free(appnd);
+    if (strip)free(strip);
+    pmyMgr = NULL;
+    appnd = NULL;
+    strip = NULL;    
+}
+
+
+
+// add prefix to this word assuming conditions hold
+char * PfxEntry::add(const char * word, int len)
+{
+    int			cond;
+    char	        tword[MAXWORDLEN+1];
+
+     /* make sure all conditions match */
+     if ((len > stripl) && (len >= numconds)) {
+            unsigned char * cp = (unsigned char *) word;
+            for (cond = 0;  cond < numconds;  cond++) {
+	       if ((conds[*cp++] & (1 << cond)) == 0)
+	          break;
+            }
+            if (cond >= numconds) {
+	      /* we have a match so add prefix */
+              int tlen = 0;
+              if (appndl) {
+	          strcpy(tword,appnd);
+                  tlen += appndl;
+               } 
+               char * pp = tword + tlen;
+               strcpy(pp, (word + stripl));
+               return mystrdup(tword);
+	    }
+     }
+     return NULL;    
+}
+
+
+
+
+// check if this prefix entry matches 
+struct hentry * PfxEntry::check(const char * word, int len)
+{
+    int			cond;	// condition number being examined
+    int	                tmpl;   // length of tmpword
+    struct hentry *     he;     // hash entry of root word or NULL
+    unsigned char *	cp;		
+    char	        tmpword[MAXWORDLEN+1];
+
+
+    // on entry prefix is 0 length or already matches the beginning of the word.
+    // So if the remaining root word has positive length
+    // and if there are enough chars in root word and added back strip chars
+    // to meet the number of characters conditions, then test it
+
+     tmpl = len - appndl;
+
+     if ((tmpl > 0) &&  (tmpl + stripl >= numconds)) {
+
+	    // generate new root word by removing prefix and adding
+	    // back any characters that would have been stripped
+
+	    if (stripl) strcpy (tmpword, strip);
+	    strcpy ((tmpword + stripl), (word + appndl));
+
+            // now make sure all of the conditions on characters
+            // are met.  Please see the appendix at the end of
+            // this file for more info on exactly what is being
+            // tested
+
+	    cp = (unsigned char *)tmpword;
+	    for (cond = 0;  cond < numconds;  cond++) {
+		if ((conds[*cp++] & (1 << cond)) == 0) break;
+	    }
+
+            // if all conditions are met then check if resulting
+            // root word in the dictionary
+
+	    if (cond >= numconds) {
+		tmpl += stripl;
+		if ((he = pmyMgr->lookup(tmpword)) != NULL) {
+		   if (TESTAFF(he->astr, achar, he->alen)) return he;
+		}
+
+		// prefix matched but no root word was found 
+                // if XPRODUCT is allowed, try again but now 
+                // ross checked combined with a suffix
+
+		if (xpflg & XPRODUCT) {
+		   he = pmyMgr->suffix_check(tmpword, tmpl, XPRODUCT, (AffEntry *)this);
+                   if (he) return he;
+		}
+	    }
+     }
+    return NULL;
+}
+
+
+
+SfxEntry::SfxEntry(AffixMgr * pmgr, affentry* dp)
+{
+  // register affix manager
+  pmyMgr = pmgr;
+
+  // set up its intial values
+  achar = dp->achar;         // char flag 
+  strip = dp->strip;         // string to strip
+  appnd = dp->appnd;         // string to append
+  stripl = dp->stripl;       // length of strip string
+  appndl = dp->appndl;       // length of append string
+  numconds = dp->numconds;   // number of conditions to match
+  xpflg = dp->xpflg;         // cross product flag
+
+  // then copy over all of the conditions
+  memcpy(&conds[0],&dp->conds[0],SETSIZE*sizeof(conds[0]));
+
+  rappnd = myrevstrdup(appnd);
+}
+
+
+SfxEntry::~SfxEntry()
+{
+    achar = '\0';
+    if (appnd) free(appnd);
+    if (rappnd) free(rappnd);
+    if (strip) free(strip);
+    pmyMgr = NULL;
+    appnd = NULL;
+    strip = NULL;    
+}
+
+
+
+// add suffix to this word assuming conditions hold
+char * SfxEntry::add(const char * word, int len)
+{
+    int			cond;
+    char	        tword[MAXWORDLEN+1];
+
+     /* make sure all conditions match */
+     if ((len > stripl) && (len >= numconds)) {
+            unsigned char * cp = (unsigned char *) (word + len);
+            for (cond = numconds; --cond >=0; ) {
+	       if ((conds[*--cp] & (1 << cond)) == 0)
+	          break;
+            }
+            if (cond < 0) {
+	      /* we have a match so add suffix */
+              strcpy(tword,word);
+              int tlen = len;
+              if (stripl) {
+		 tlen -= stripl;
+              }
+              char * pp = (tword + tlen);
+              if (appndl) {
+	          strcpy(pp,appnd);
+                  tlen += appndl;
+	      } else *pp = '\0';
+               return mystrdup(tword);
+	    }
+     }
+     return NULL;
+}
+
+
+
+// see if this suffix is present in the word 
+struct hentry * SfxEntry::check(const char * word, int len, int optflags, AffEntry* ppfx)
+{
+    int	                tmpl;		 // length of tmpword 
+    int			cond;		 // condition beng examined
+    struct hentry *     he;              // hash entry pointer
+    unsigned char *	cp;
+    char	        tmpword[MAXWORDLEN+1];
+    PfxEntry* ep = (PfxEntry *) ppfx;
+
+
+    // if this suffix is being cross checked with a prefix
+    // but it does not support cross products skip it
+
+    if ((optflags & XPRODUCT) != 0 &&  (xpflg & XPRODUCT) == 0)
+        return NULL;
+
+    // upon entry suffix is 0 length or already matches the end of the word.
+    // So if the remaining root word has positive length
+    // and if there are enough chars in root word and added back strip chars
+    // to meet the number of characters conditions, then test it
+
+    tmpl = len - appndl;
+
+    if ((tmpl > 0)  &&  (tmpl + stripl >= numconds)) {
+
+	    // generate new root word by removing suffix and adding
+	    // back any characters that would have been stripped or
+	    // or null terminating the shorter string
+
+	    strcpy (tmpword, word);
+	    cp = (unsigned char *)(tmpword + tmpl);
+	    if (stripl) {
+		strcpy ((char *)cp, strip);
+		tmpl += stripl;
+		cp = (unsigned char *)(tmpword + tmpl);
+	    } else *cp = '\0';
+
+            // now make sure all of the conditions on characters
+            // are met.  Please see the appendix at the end of
+            // this file for more info on exactly what is being
+            // tested
+
+	    for (cond = numconds;  --cond >= 0; ) {
+		if ((conds[*--cp] & (1 << cond)) == 0) break;
+	    }
+
+            // if all conditions are met then check if resulting
+            // root word in the dictionary
+
+	    if (cond < 0) {
+	        if ((he = pmyMgr->lookup(tmpword)) != NULL) {
+                     if (TESTAFF(he->astr, achar , he->alen) && 
+                           ((optflags & XPRODUCT) == 0 || 
+                           TESTAFF(he->astr, ep->getFlag(), he->alen))) return he;
+	        }  
+	    }
+    }
+    return NULL;
+}
+
+
+
+
+#if 0
+
+Appendix:  Understanding Affix Code
+
+
+An affix is either a  prefix or a suffix attached to root words to make 
+other words.
+
+Basically a Prefix or a Suffix is set of AffEntry objects
+which store information about the prefix or suffix along 
+with supporting routines to check if a word has a particular 
+prefix or suffix or a combination.
+
+The structure affentry is defined as follows:
+
+struct affentry
+{
+   unsigned char achar;   // char used to represent the affix
+   char * strip;          // string to strip before adding affix
+   char * appnd;          // the affix string to add
+   short  stripl;         // length of the strip string
+   short  appndl;         // length of the affix string
+   short  numconds;       // the number of conditions that must be met
+   short  xpflg;          // flag: XPRODUCT- combine both prefix and suffix 
+   char   conds[SETSIZE]; // array which encodes the conditions to be met
+};
+
+
+Here is a suffix borrowed from the en_US.aff file.  This file 
+is whitespace delimited.
+
+SFX D Y 4 
+SFX D   0     e          d
+SFX D   y     ied        [^aeiou]y
+SFX D   0     ed         [^ey]
+SFX D   0     ed         [aeiou]y
+
+This information can be interpreted as follows:
+
+In the first line has 4 fields
+
+Field
+-----
+1     SFX - indicates this is a suffix
+2     D   - is the name of the character flag which represents this suffix
+3     Y   - indicates it can be combined with prefixes (cross product)
+4     4   - indicates that sequence of 4 affentry structures are needed to
+               properly store the affix information
+
+The remaining lines describe the unique information for the 4 SfxEntry 
+objects that make up this affix.  Each line can be interpreted
+as follows: (note fields 1 and 2 are as a check against line 1 info)
+
+Field
+-----
+1     SFX         - indicates this is a suffix
+2     D           - is the name of the character flag for this affix
+3     y           - the string of chars to strip off before adding affix
+                         (a 0 here indicates the NULL string)
+4     ied         - the string of affix characters to add
+5     [^aeiou]y   - the conditions which must be met before the affix
+                    can be applied
+
+Field 5 is interesting.  Since this is a suffix, field 5 tells us that
+there are 2 conditions that must be met.  The first condition is that 
+the next to the last character in the word must *NOT* be any of the 
+following "a", "e", "i", "o" or "u".  The second condition is that
+the last character of the word must end in "y".
+
+So how can we encode this information concisely and be able to 
+test for both conditions in a fast manner?  The answer is found
+but studying the wonderful ispell code of Geoff Kuenning, et.al. 
+(now available under a normal BSD license).
+
+If we set up a conds array of 256 bytes indexed (0 to 255) and access it
+using a character (cast to an unsigned char) of a string, we have 8 bits
+of information we can store about that character.  Specifically we
+could use each bit to say if that character is allowed in any of the 
+last (or first for prefixes) 8 characters of the word.
+
+Basically, each character at one end of the word (up to the number 
+of conditions) is used to index into the conds array and the resulting 
+value found there says whether the that character is valid for a 
+specific character position in the word.  
+
+For prefixes, it does this by setting bit 0 if that char is valid 
+in the first position, bit 1 if valid in the second position, and so on. 
+
+If a bit is not set, then that char is not valid for that postion in the
+word.
+
+If working with suffixes bit 0 is used for the character closest 
+to the front, bit 1 for the next character towards the end, ..., 
+with bit numconds-1 representing the last char at the end of the string. 
+
+Note: since entries in the conds[] are 8 bits, only 8 conditions 
+(read that only 8 character positions) can be examined at one
+end of a word (the beginning for prefixes and the end for suffixes.
+
+So to make this clearer, lets encode the conds array values for the 
+first two affentries for the suffix D described earlier.
+
+
+  For the first affentry:    
+     numconds = 1             (only examine the last character)
+
+     conds['e'] =  (1 << 0)   (the word must end in an E)
+     all others are all 0
+
+  For the second affentry:
+     numconds = 2             (only examine the last two characters)     
+
+     conds[X] = conds[X] | (1 << 0)     (aeiou are not allowed)
+         where X is all characters *but* a, e, i, o, or u
+         
+
+     conds['y'] = (1 << 1)     (the last char must be a y)
+     all other bits for all other entries in the conds array are zero
+
+
+#endif
+
--- a/goldlib/myspell/affentry.hxx
+++ b/goldlib/myspell/affentry.hxx
@ -0,0 +1,86 @@
+#ifndef _AFFIX_HXX_
+#define _AFFIX_HXX_
+
+#include "atypes.hxx"
+#include "baseaffix.hxx"
+#include "affixmgr.hxx"
+
+
+/* A Prefix Entry  */
+
+class PfxEntry : public AffEntry
+{
+       AffixMgr*    pmyMgr;
+
+       PfxEntry * next;
+       PfxEntry * nexteq;
+       PfxEntry * nextne;
+       PfxEntry * flgnxt;
+
+public:
+
+  PfxEntry(AffixMgr* pmgr, affentry* dp );
+  ~PfxEntry();
+
+  struct hentry *      check(const char * word, int len);
+
+  inline bool          allowCross() { return ((xpflg & XPRODUCT) != 0); }
+  inline unsigned char getFlag()   { return achar;   }
+  inline const char *  getKey()    { return appnd;  } 
+  char *               add(const char * word, int len);
+
+  inline PfxEntry *    getNext()   { return next;   }
+  inline PfxEntry *    getNextNE() { return nextne; }
+  inline PfxEntry *    getNextEQ() { return nexteq; }
+  inline PfxEntry *    getFlgNxt() { return flgnxt; }
+
+  inline void   setNext(PfxEntry * ptr)   { next = ptr;   }
+  inline void   setNextNE(PfxEntry * ptr) { nextne = ptr; }
+  inline void   setNextEQ(PfxEntry * ptr) { nexteq = ptr; }
+  inline void   setFlgNxt(PfxEntry * ptr) { flgnxt = ptr; }
+};
+
+
+
+
+/* A Suffix Entry */
+
+class SfxEntry : public AffEntry
+{
+       AffixMgr*    pmyMgr;
+       char *       rappnd;
+
+       SfxEntry *   next;
+       SfxEntry *   nexteq;
+       SfxEntry *   nextne;
+       SfxEntry *   flgnxt;
+
+public:
+
+  SfxEntry(AffixMgr* pmgr, affentry* dp );
+  ~SfxEntry();
+
+  struct hentry *   check(const char * word, int len, int optflags, 
+                                                       AffEntry* ppfx);
+
+  inline bool          allowCross() { return ((xpflg & XPRODUCT) != 0); }
+  inline unsigned char getFlag()   { return achar;   }
+  inline const char *  getKey()    { return rappnd; } 
+  char *               add(const char * word, int len);
+
+  inline SfxEntry *    getNext()   { return next;   }
+  inline SfxEntry *    getNextNE() { return nextne; }
+  inline SfxEntry *    getNextEQ() { return nexteq; }
+  inline SfxEntry *    getFlgNxt() { return flgnxt; }
+
+  inline void   setNext(SfxEntry * ptr)   { next = ptr;   }
+  inline void   setNextNE(SfxEntry * ptr) { nextne = ptr; }
+  inline void   setNextEQ(SfxEntry * ptr) { nexteq = ptr; }
+  inline void   setFlgNxt(SfxEntry * ptr) { flgnxt = ptr; }
+
+};
+
+
+#endif
+
+
--- a/goldlib/myspell/affixmgr.cxx
+++ b/goldlib/myspell/affixmgr.cxx
--- a/goldlib/myspell/affixmgr.hxx
+++ b/goldlib/myspell/affixmgr.hxx
@ -0,0 +1,66 @@
+#ifndef _AFFIXMGR_HXX_
+#define _AFFIXMGR_HXX_
+
+#include "atypes.hxx"
+#include "baseaffix.hxx"
+#include "hashmgr.hxx"
+#include <cstdio>
+
+class AffixMgr
+{
+
+  AffEntry *          pStart[SETSIZE];
+  AffEntry *          sStart[SETSIZE];
+  AffEntry *          pFlag[SETSIZE];
+  AffEntry *          sFlag[SETSIZE];
+  HashMgr *           pHMgr;
+  char *              trystring;
+  char *              encoding;
+  char *              compound;
+  int                 cpdmin;
+  int                 numrep;
+  replentry *         reptable;
+  int                 nummap;
+  mapentry *          maptable;
+  bool                nosplitsugs;
+
+
+public:
+ 
+  AffixMgr(const char * affpath, HashMgr * ptr);
+  ~AffixMgr();
+  struct hentry *     affix_check(const char * word, int len);
+  struct hentry *     prefix_check(const char * word, int len);
+  struct hentry *     suffix_check(const char * word, int len, int sfxopts, AffEntry* ppfx);
+  int                 expand_rootword(struct guessword * wlst, int maxn, 
+                             const char * ts, int wl, const char * ap, int al);
+  struct hentry *     compound_check(const char * word, int len, char compound_flag);
+  struct hentry *     lookup(const char * word);
+  int                 get_numrep();
+  struct replentry *  get_reptable();
+  int                 get_nummap();
+  struct mapentry *   get_maptable();
+  char *              get_encoding();
+  char *              get_try_string();
+  char *              get_compound();
+  bool                get_nosplitsugs();
+             
+private:
+  int  parse_file(const char * affpath);
+  int  parse_try(char * line);
+  int  parse_set(char * line);
+  int  parse_cpdflag(char * line);
+  int  parse_cpdmin(char * line);
+  int  parse_reptable(char * line, FILE * af);
+  int  parse_maptable(char * line, FILE * af);
+  int  parse_affix(char * line, const char at, FILE * af);
+
+  void encodeit(struct affentry * ptr, char * cs);
+  int build_pfxlist(AffEntry* pfxptr);
+  int build_sfxlist(AffEntry* sfxptr);
+  int process_pfx_order();
+  int process_sfx_order();
+};
+
+#endif
+
--- a/goldlib/myspell/atypes.hxx
+++ b/goldlib/myspell/atypes.hxx
@ -0,0 +1,45 @@
+#ifndef _ATYPES_HXX_
+#define _ATYPES_HXX_
+
+#define SETSIZE         256
+#define MAXAFFIXES      256
+#define MAXWORDLEN      100
+#define XPRODUCT        (1 << 0)
+
+#define MAXLNLEN        1024
+
+#define TESTAFF( a , b , c ) memchr((void *)(a), (int)(b), (size_t)(c) )
+
+struct affentry
+{
+   char * strip;
+   char * appnd;
+   short  stripl;
+   short  appndl;
+   short  numconds;
+   short  xpflg;
+   char   achar;
+   char   conds[SETSIZE];
+};
+
+struct replentry {
+  char * pattern;
+  char * replacement;
+};
+
+struct mapentry {
+  char * set;
+  int len;
+};
+
+struct guessword {
+  char * word;
+  bool allow;
+};
+
+#endif
+
+
+
+
+
--- a/goldlib/myspell/baseaffix.hxx
+++ b/goldlib/myspell/baseaffix.hxx
@ -0,0 +1,17 @@
+#ifndef _BASEAFF_HXX_
+#define _BASEAFF_HXX_
+
+class AffEntry
+{
+protected:
+       char *       appnd;
+       char *       strip;
+       short        appndl;
+       short        stripl;
+       short        numconds;
+       short        xpflg;
+       char         achar;
+       char         conds[SETSIZE];
+};
+
+#endif
--- a/goldlib/myspell/csutil.cxx
+++ b/goldlib/myspell/csutil.cxx
--- a/goldlib/myspell/csutil.hxx
+++ b/goldlib/myspell/csutil.hxx
@ -0,0 +1,67 @@
+#ifndef __CSUTILHXX__
+#define __CSUTILHXX__
+
+
+// First some base level utility routines
+
+// remove end of line char(s)
+void   mychomp(char * s);
+
+// duplicate string                          
+char * mystrdup(const char * s);
+
+// duplicate reverse of string                   
+char * myrevstrdup(const char * s);
+
+// parse into tokens with char delimiter                
+char * mystrsep(char ** sptr, const char delim);
+
+// is one string a leading subset of another   
+int    isSubset(const char * s1, const char * s2);
+
+
+// character encoding information
+
+struct cs_info {
+  unsigned char ccase;
+  unsigned char clower;
+  unsigned char cupper;
+};
+
+
+struct enc_entry {
+  const char * enc_name;
+  struct cs_info * cs_table;
+};
+
+// language to encoding default map
+
+struct lang_map {
+  const char * lang;
+  const char * def_enc;
+};
+
+struct cs_info * get_current_cs(const char * es);
+
+const char * get_default_enc(const char * lang);
+
+// convert null terminated string to all caps using encoding 
+void enmkallcap(char * d, const char * p, const char * encoding);
+
+// convert null terminated string to all little using encoding
+void enmkallsmall(char * d, const char * p, const char * encoding);
+
+// convert null terminated string to have intial capital using encoding
+void enmkinitcap(char * d, const char * p, const char * encoding);
+
+// convert null terminated string to all caps 
+void mkallcap(char * p, const struct cs_info * csconv);
+
+// convert null terminated string to all little
+void mkallsmall(char * p, const struct cs_info * csconv);
+
+// convert null terminated string to have intial capital
+void mkinitcap(char * p, const struct cs_info * csconv);
+
+
+#endif
--- a/goldlib/myspell/dictmgr.cxx
+++ b/goldlib/myspell/dictmgr.cxx
@ -0,0 +1,127 @@
+
+#include <cstdlib>
+#include <cstring>
+#include <cctype>
+#include <cstdio>
+
+#include "dictmgr.hxx"
+
+#if !defined(_MSC_VER)
+using namespace std;
+#endif
+
+// some utility functions
+extern void mychomp(char * s);
+extern char * mystrdup(const char * s);
+extern char * mystrsep(char ** stringp, const char delim);
+
+DictMgr::DictMgr(const char * dictpath, const char * etype) 
+{
+  // load list of etype entries
+  numdict = 0;
+  pdentry = (dictentry *)malloc(MAXDICTIONARIES*sizeof(struct dictentry));
+  if (pdentry) {
+     if (parse_file(dictpath, etype)) {
+        numdict = 0;
+        // no dictionary.lst found is okay
+     }
+  } else {
+     numdict = 0;
+  }
+}
+
+
+DictMgr::~DictMgr() 
+{
+  dictentry * pdict = NULL;
+  if (pdentry) {
+     pdict = pdentry;
+     for (int i=0;i<numdict;i++) {
+        if (pdict->lang) {
+            free(pdict->lang);
+            pdict->lang = NULL;
+        }
+        if (pdict->region) {
+            free(pdict->region);
+            pdict->region=NULL;
+        }
+        if (pdict->filename) {
+            free(pdict->filename);
+            pdict->filename = NULL;
+        }
+        pdict++;
+     }
+     free(pdentry);
+     pdentry = NULL;
+     pdict = NULL;
+  }
+  numdict = 0;
+}
+
+
+// read in list of etype entries and build up structure to describe them
+int  DictMgr::parse_file(const char * dictpath, const char * etype)
+{
+
+    int i;
+    char line[MAXDICTENTRYLEN+1];
+    dictentry * pdict = pdentry;
+
+    // open the dictionary list file
+    FILE * dictlst;
+    dictlst = fopen(dictpath,"r");
+    if (!dictlst) {
+      return 1;
+    }
+
+    // step one is to parse the dictionary list building up the 
+    // descriptive structures
+
+    // read in each line ignoring any that dont start with etype
+    while (fgets(line,MAXDICTENTRYLEN,dictlst)) {
+       mychomp(line);
+
+       /* parse in a dictionary entry */
+       if (strncmp(line,etype,4) == 0) {
+	  if (numdict < MAXDICTIONARIES) {
+             char * tp = line;
+             char * piece;
+             i = 0;
+             while ((piece=mystrsep(&tp,' '))) {
+                if (*piece != '\0') {
+                    switch(i) {
+                       case 0: break;
+		       case 1: pdict->lang = mystrdup(piece); break;
+                       case 2: if (strcmp (piece, "ANY") == 0)
+				 pdict->region = mystrdup("");
+			       else
+				 pdict->region = mystrdup(piece);
+			       break;
+                       case 3: pdict->filename = mystrdup(piece); break;
+		       default: break;
+                    }
+                    i++;
+                }
+                free(piece);
+	     }
+             if (i == 4) {
+                 numdict++;
+                 pdict++;
+	     } else {
+                 fprintf(stderr,"dictionary list corruption in line \"%s\"\n",line);
+                 fflush(stderr);
+	     }
+	  }
+       }
+    }
+    fclose(dictlst);
+    return 0;
+}
+
+// return text encoding of dictionary
+int DictMgr::get_list(dictentry ** ppentry)
+{
+  *ppentry = pdentry;
+  return numdict;
+}
+
--- a/goldlib/myspell/dictmgr.hxx
+++ b/goldlib/myspell/dictmgr.hxx
@ -0,0 +1,31 @@
+#ifndef _DICTMGR_HXX_
+#define _DICTMGR_HXX_
+
+#define MAXDICTIONARIES 100
+#define MAXDICTENTRYLEN 1024
+
+struct dictentry {
+  char * filename;
+  char * lang;
+  char * region;
+};
+
+
+class DictMgr
+{
+
+  int                 numdict;
+  dictentry *         pdentry;
+
+public:
+ 
+  DictMgr(const char * dictpath, const char * etype);
+  ~DictMgr();
+  int get_list(dictentry** ppentry);
+            
+private:
+  int  parse_file(const char * dictpath, const char * etype);
+
+};
+
+#endif
--- a/goldlib/myspell/example.cxx
+++ b/goldlib/myspell/example.cxx
@ -0,0 +1,89 @@
+#include <cstring>
+#include <cstdlib>
+#include <cstdio>
+
+#include "myspell.hxx"
+
+extern char * mystrdup(const char * s);
+
+using namespace std;
+
+int 
+main(int argc, char** argv)
+{
+
+    char * af;
+    char * df;
+    char * wtc;
+    FILE* wtclst;
+
+  /* first parse the command line options */
+  /* arg1 - affix file, arg2 dictionary file, arg3 - file of words to check */
+
+  if (argv[1]) {
+       af = mystrdup(argv[1]);
+  } else {
+    fprintf(stderr,"correct syntax is:\n"); 
+    fprintf(stderr,"example affix_file dictionary_file file_of_words_to_check\n");
+    exit(1);
+  }
+  if (argv[2]) {
+       df = mystrdup(argv[2]);
+  } else {
+    fprintf(stderr,"correct syntax is:\n"); 
+    fprintf(stderr,"example affix_file dictionary_file file_of_words_to_check\n");
+    exit(1);
+  }
+  if (argv[3]) {
+       wtc = mystrdup(argv[3]);
+  } else {
+    fprintf(stderr,"correct syntax is:\n"); 
+    fprintf(stderr,"example affix_file dictionary_file file_of_words_to_check\n");
+    exit(1);
+  }
+
+  
+  /* open the words to check list */
+  wtclst = fopen(wtc,"r");
+  if (!wtclst) {
+    fprintf(stderr,"Error - could not open file of words to check\n");
+    exit(1);
+  }
+
+   
+    MySpell * pMS= new MySpell(af,df);
+    
+    int k;
+    int dp;
+    char buf[101];
+
+    while(fgets(buf,100,wtclst)) {
+      k = strlen(buf);
+      *(buf + k - 1) = '\0';
+       dp = pMS->spell(buf);
+       if (dp) {
+          fprintf(stdout,"\"%s\" is okay\n",buf);
+          fprintf(stdout,"\n");
+       } else {
+          fprintf(stdout,"\"%s\" is incorrect!\n",buf);
+          fprintf(stdout,"   suggestions:\n");
+          char ** wlst;
+          int ns = pMS->suggest(&wlst,buf);
+          for (int i=0; i < ns; i++) {
+            fprintf(stdout,"    ...\"%s\"\n",wlst[i]);
+            free(wlst[i]);
+          }
+          fprintf(stdout,"\n");
+          free(wlst);
+       }
+    }
+
+    delete pMS;
+    fclose(wtclst);
+    free(wtc);
+    free(df);
+    free(af);
+
+    return 0;
+}
+
--- a/goldlib/myspell/hashmgr.cxx
+++ b/goldlib/myspell/hashmgr.cxx
@ -0,0 +1,213 @@
+#include "license.readme"
+
+#if !defined(_MSC_VER)
+#include <unistd.h>
+#endif
+#include <cstdlib>
+#include <cstring>
+#include <fcntl.h>
+#include <cstdio>
+
+#include "hashmgr.hxx"
+
+extern void mychomp(char * s);
+extern char * mystrdup(const char *);
+
+#if !defined(_MSC_VER)
+using namespace std;
+#endif
+
+
+// build a hash table from a munched word list
+
+HashMgr::HashMgr(const char * tpath)
+{
+  tablesize = 0;
+  tableptr = NULL;
+  int ec = load_tables(tpath);
+  if (ec) {
+    /* error condition - what should we do here */
+    fprintf(stderr,"Hash Manager Error : %d\n",ec);
+    fflush(stderr);
+    if (tableptr) {
+      free(tableptr);
+    }
+    tablesize = 0;
+  }
+}
+
+
+HashMgr::~HashMgr()
+{
+  if (tableptr) {
+    // now pass through hash table freeing up everything
+    // go through column by column of the table
+    for (int i=0; i < tablesize; i++) {
+      struct hentry * pt = &tableptr[i];
+      struct hentry * nt = NULL;
+      if (pt) {
+	if (pt->word) free(pt->word);
+        if (pt->astr) free(pt->astr);
+        pt = pt->next;
+      }
+      while(pt) {
+        nt = pt->next;
+	if (pt->word) free(pt->word);
+        if (pt->astr) free(pt->astr);
+        free(pt);
+	pt = nt;
+      }
+    }
+    free(tableptr);
+  }
+  tablesize = 0;
+}
+
+
+
+// lookup a root word in the hashtable
+
+struct hentry * HashMgr::lookup(const char *word) const
+{
+    struct hentry * dp;
+    if (tableptr) {
+       dp = &tableptr[hash(word)];
+       if (dp->word == NULL) return NULL;
+       for (  ;  dp != NULL;  dp = dp->next) {
+          if (strcmp(word,dp->word) == 0) return dp;
+       }
+    }
+    return NULL;
+}
+
+
+
+// add a word to the hash table (private)
+
+int HashMgr::add_word(const char * word, int wl, const char * aff, int al)
+{
+    int i = hash(word);
+    struct hentry * dp = &tableptr[i];
+    struct hentry* hp;
+    if (dp->word == NULL) {
+       dp->wlen = wl;
+       dp->alen = al;
+       dp->word = mystrdup(word);
+       dp->astr = mystrdup(aff);
+       dp->next = NULL;
+       if ((wl) && (dp->word == NULL)) return 1;
+       if ((al) && (dp->astr == NULL)) return 1;
+    } else {
+       hp = (struct hentry *) malloc (sizeof(struct hentry));
+       if (hp == NULL) return 1;
+       hp->wlen = wl;
+       hp->alen = al;
+       hp->word = mystrdup(word);
+       hp->astr = mystrdup(aff);
+       hp->next = NULL;      
+       while (dp->next != NULL) dp=dp->next; 
+       dp->next = hp;
+       if ((wl) && (hp->word == NULL)) return 1;
+       if ((al) && (hp->astr == NULL)) return 1;
+    }
+    return 0;
+}     
+
+
+
+// walk the hash table entry by entry - null at end
+struct hentry * HashMgr::walk_hashtable(int &col, struct hentry * hp) const
+{
+  //reset to start
+  if ((col < 0) || (hp == NULL)) {
+    col = -1;
+    hp = NULL;
+  }
+
+  if (hp && hp->next != NULL) {
+    hp = hp->next;
+  } else {
+    col++;
+    hp = (col < tablesize) ? &tableptr[col] : NULL;
+    // search for next non-blank column entry
+    while (hp && (hp->word == NULL)) {
+        col ++;
+        hp = (col < tablesize) ? &tableptr[col] : NULL;
+    }
+    if (col < tablesize) return hp;
+    hp = NULL;
+    col = -1;
+  }
+  return hp;
+}
+
+
+
+// load a munched word list and build a hash table on the fly
+
+int HashMgr::load_tables(const char * tpath)
+{
+  int wl, al;
+  char * ap;
+
+  // raw dictionary - munched file
+  FILE * rawdict = fopen(tpath, "r");
+  if (rawdict == NULL) return 1;
+
+  // first read the first line of file to get hash table size */
+  char ts[MAXDELEN];
+  if (! fgets(ts, MAXDELEN-1,rawdict)) return 2;
+  mychomp(ts);
+  tablesize = atoi(ts);
+  if (!tablesize) return 4; 
+  tablesize = tablesize + 5;
+  if ((tablesize %2) == 0) tablesize++;
+
+  // allocate the hash table
+  tableptr = (struct hentry *) calloc(tablesize, sizeof(struct hentry));
+  if (! tableptr) return 3;
+
+  // loop through all words on much list and add to hash
+  // table and create word and affix strings
+
+  while (fgets(ts,MAXDELEN-1,rawdict)) {
+    mychomp(ts);
+    // split each line into word and affix char strings
+    ap = strchr(ts,'/');
+    if (ap) {
+      *ap = '\0';
+      ap++;
+      al = strlen(ap);
+    } else {
+      al = 0;
+      ap = NULL;
+    }
+
+    wl = strlen(ts);
+
+    // add the word and its index
+    if (add_word(ts,wl,ap,al)) 
+      return 5;;
+
+  }
+
+  fclose(rawdict);
+  return 0;
+}
+
+
+// the hash function is a simple load and rotate
+// algorithm borrowed
+
+int HashMgr::hash(const char * word) const
+{
+    long  hv = 0;
+    for (int i=0; i < 4  &&  *word != 0; i++)
+	hv = (hv << 8) | (*word++);
+    while (*word != 0) {
+      ROTATE(hv,ROTATE_LEN);
+      hv ^= (*word++);
+    }
+    return (unsigned long) hv % tablesize;
+}
+
--- a/goldlib/myspell/hashmgr.hxx
+++ b/goldlib/myspell/hashmgr.hxx
@ -0,0 +1,27 @@
+#ifndef _HASHMGR_HXX_
+#define _HASHMGR_HXX_
+
+#include "htypes.hxx"
+
+class HashMgr
+{
+  int             tablesize;
+  struct hentry * tableptr;
+
+public:
+  HashMgr(const char * tpath);
+  ~HashMgr();
+
+  struct hentry * lookup(const char *) const;
+  int hash(const char *) const;
+  struct hentry * walk_hashtable(int & col, struct hentry * hp) const;
+
+private:
+  HashMgr( const HashMgr & ); // not implemented
+  HashMgr &operator=( const HashMgr & ); // not implemented
+  int load_tables(const char * tpath);
+  int add_word(const char * word, int wl, const char * ap, int al);
+
+};
+
+#endif
--- a/goldlib/myspell/htypes.hxx
+++ b/goldlib/myspell/htypes.hxx
@ -0,0 +1,20 @@
+#ifndef _HTYPES_HXX_
+#define _HTYPES_HXX_
+
+#define MAXDELEN    256
+
+#define ROTATE_LEN   5
+
+#define ROTATE(v,q) \
+   (v) = ((v) << (q)) | (((v) >> (32 - q)) & ((1 << (q))-1));
+
+struct hentry
+{
+  short    wlen;
+  short    alen;
+  char *   word;
+  char *   astr;
+  struct   hentry * next;
+}; 
+
+#endif
--- a/goldlib/myspell/license.readme
+++ b/goldlib/myspell/license.readme
@ -0,0 +1,61 @@
+/*
+ * Copyright 2002 Kevin B. Hendricks, Stratford, Ontario, Canada
+ * And Contributors.  All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ *
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ *
+ * 3. All modifications to the source code must be clearly marked as
+ *    such.  Binary redistributions based on modified source code
+ *    must be clearly marked as modified versions in the documentation
+ *    and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY KEVIN B. HENDRICKS AND CONTRIBUTORS 
+ * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 
+ * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS 
+ * FOR A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL 
+ * KEVIN B. HENDRICKS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, 
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, 
+ * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; 
+ * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ *
+ * NOTE: A special thanks and credit goes to Geoff Kuenning
+ * the creator of ispell.  MySpell's affix algorithms were
+ * based on those of ispell which should be noted is
+ * copyright Geoff Kuenning et.al. and now available
+ * under a BSD style license. For more information on ispell
+ * and affix compression in general, please see:
+ * http://www.cs.ucla.edu/ficus-members/geoff/ispell.html
+ * (the home page for ispell)
+ *
+ * An almost complete rewrite  of MySpell for use by  
+ * the Mozilla project has been developed by David Einstein 
+ * (Deinst@world.std.com).  David and I are now 
+ * working on parallel development tracks to help 
+ * our respective projects (Mozilla and OpenOffice.org 
+ * and we will maintain full affix file and dictionary 
+ * file compatibility and work on merging our versions 
+ * of MySpell back into a single tree. David has been 
+ * a significant help in improving MySpell.
+ * 
+ * Special thanks also go to La'szlo' Ne'meth 
+ * <nemethl@gyorsposta.hu> who is the author of the 
+ * Hungarian dictionary and who developed and contributed 
+ * the code to support compound words in MySpell 
+ * and fixed numerous problems with the encoding 
+ * case conversion tables.
+ *
+ */
--- a/goldlib/myspell/myspell.cxx
+++ b/goldlib/myspell/myspell.cxx
@ -0,0 +1,302 @@
+#include "license.readme"
+
+#include <cstring>
+#include <cstdlib>
+#include <cstdio>
+
+#include "myspell.hxx"
+
+#if !defined(_MSC_VER)
+using namespace std;
+#endif
+
+
+MySpell::MySpell(const char * affpath, const char * dpath)
+{
+    encoding = NULL;
+    csconv = NULL;
+
+    /* first set up the hash manager */
+    pHMgr = new HashMgr(dpath);
+
+    /* next set up the affix manager */
+    /* it needs access to the hash manager lookup methods */
+    pAMgr = new AffixMgr(affpath,pHMgr);
+
+    /* get the preferred try string and the dictionary */
+    /* encoding from the Affix Manager for that dictionary */
+    char * try_string = pAMgr->get_try_string();
+    encoding = pAMgr->get_encoding();
+    csconv = get_current_cs(encoding);
+
+    /* and finally set up the suggestion manager */
+    maxSug = 100;
+    pSMgr = new SuggestMgr(try_string, maxSug, pAMgr);
+    if (try_string) free(try_string);
+}
+
+
+MySpell::~MySpell()
+{
+    if (pSMgr) delete pSMgr;
+    if (pAMgr) delete pAMgr;
+    if (pHMgr) delete pHMgr;
+    pSMgr = NULL;
+    pAMgr = NULL;
+    pHMgr = NULL;
+    csconv= NULL;
+    if (encoding) free(encoding);
+    encoding = NULL;
+}
+
+
+// make a copy of src at destination while removing all leading
+// blanks and removing any trailing periods after recording
+// their presence with the abbreviation flag
+// also since already going through character by character, 
+// set the capitalization type
+// return the length of the "cleaned" word
+
+int MySpell::cleanword(char * dest, const char * src, int * pcaptype, int * pabbrev)
+{ 
+
+  // with the new breakiterator code this should not be needed anymore
+   const char * special_chars = "._#$%&()* +,-/:;<=>[]\\^`{|}~\t \x0a\x0d\x01\'\"";
+
+   unsigned char * p = (unsigned char *) dest;
+   const unsigned char * q = (const unsigned char * ) src;
+
+   // first skip over any leading special characters
+   while ((*q != '\0') && (strchr(special_chars,(int)(*q)))) q++;
+   
+   // now strip off any trailing special characters 
+   // if a period comes after a normal char record its presence
+   *pabbrev = 0;
+   int nl = strlen((const char *)q);
+   while ((nl > 0) && (strchr(special_chars,(int)(*(q+nl-1))))) {
+       nl--;
+   }
+   if ( *(q+nl) == '.' ) *pabbrev = 1;
+   
+   // if no characters are left it can't be an abbreviation and can't be capitalized
+   if (nl <= 0) { 
+       *pcaptype = NOCAP;
+       *pabbrev = 0;
+       *p = '\0';
+       return 0;
+   }
+
+   // now determine the capitalization type of the first nl letters
+   int ncap = 0;
+   int nneutral = 0;
+   int nc = 0;
+   while (nl > 0) {
+       nc++;
+       if (csconv[(*q)].ccase) ncap++;
+       if (csconv[(*q)].cupper == csconv[(*q)].clower) nneutral++;
+       *p++ = *q++;
+       nl--;
+   }
+   // remember to terminate the destination string
+   *p = '\0';
+
+   // now finally set the captype
+   if (ncap == 0) {
+        *pcaptype = NOCAP;
+   } else if ((ncap == 1) && csconv[(unsigned char)(*dest)].ccase) {
+        *pcaptype = INITCAP;
+  } else if ((ncap == nc) || ((ncap + nneutral) == nc)){
+        *pcaptype = ALLCAP;
+  } else {
+        *pcaptype = HUHCAP;
+  }
+  return nc;
+} 
+       
+
+int MySpell::spell(const char * word)
+{
+  char * rv=NULL;
+  char cw[MAXWORDLEN+1];
+  char wspace[MAXWORDLEN+1];
+
+  int wl = strlen(word);
+  if (wl > (MAXWORDLEN - 1)) return 0;
+  int captype = 0;
+  int abbv = 0;
+  wl = cleanword(cw, word, &captype, &abbv);
+  if (wl == 0) return 1;
+
+  switch(captype) {
+     case HUHCAP:
+     case NOCAP:   { 
+                     rv = check(cw); 
+                     if ((abbv) && !(rv)) {
+		         memcpy(wspace,cw,wl);
+                         *(wspace+wl) = '.';
+                         *(wspace+wl+1) = '\0';
+                         rv = check(wspace);
+                     }
+                     break;
+                   }
+
+     case ALLCAP:  {
+                     memcpy(wspace,cw,(wl+1));
+                     mkallsmall(wspace, csconv);
+                     rv = check(wspace);
+                     if (!rv) {
+                        mkinitcap(wspace, csconv);
+                        rv = check(wspace);
+                     }
+                     if (!rv) rv = check(cw);
+                     if ((abbv) && !(rv)) {
+		         memcpy(wspace,cw,wl);
+                         *(wspace+wl) = '.';
+                         *(wspace+wl+1) = '\0';
+                         rv = check(wspace);
+                     }
+                     break; 
+                   }
+     case INITCAP: { 
+                     memcpy(wspace,cw,(wl+1));
+                     mkallsmall(wspace, csconv);
+                     rv = check(wspace);
+                     if (!rv) rv = check(cw);
+                     if ((abbv) && !(rv)) {
+		         memcpy(wspace,cw,wl);
+                         *(wspace+wl) = '.';
+                         *(wspace+wl+1) = '\0';
+                         rv = check(wspace);
+                     }
+                     break; 
+                   }
+  }
+  if (rv) return 1;
+  return 0;
+}
+
+
+char * MySpell::check(const char * word)
+{
+  struct hentry * he = NULL;
+  if (pHMgr)
+     he = pHMgr->lookup (word);
+
+  if ((he == NULL) && (pAMgr)) {
+     // try stripping off affixes */
+     he = pAMgr->affix_check(word, strlen(word));
+
+     // try check compound word
+     if ((he == NULL) && (pAMgr->get_compound())) {
+          he = pAMgr->compound_check(word, strlen(word), (pAMgr->get_compound())[0]);
+     }
+
+  }
+
+  if (he) return he->word;
+  return NULL;
+}
+
+
+
+int MySpell::suggest(char*** slst, const char * word)
+{
+  char cw[MAXWORDLEN+1];
+  char wspace[MAXWORDLEN+1];
+  if (! pSMgr) return 0;
+  int wl = strlen(word);
+  if (wl > (MAXWORDLEN-1)) return 0;
+  int captype = 0;
+  int abbv = 0;
+  wl = cleanword(cw, word, &captype, &abbv);
+  if (wl == 0) return 0;
+
+  int ns = 0;
+  char ** wlst = (char **) calloc(maxSug, sizeof(char *));
+  if (wlst == NULL) return 0;
+
+  switch(captype) {
+     case NOCAP:   { 
+                     ns = pSMgr->suggest(wlst, ns, cw); 
+                     break;
+                   }
+
+     case INITCAP: { 
+
+                     memcpy(wspace,cw,(wl+1));
+                     mkallsmall(wspace, csconv);
+                     ns = pSMgr->suggest(wlst, ns, wspace);
+                     if (ns > 0) {
+                       for (int j=0; j < ns; j++)
+                         mkinitcap(wlst[j], csconv);
+                     }
+                     ns = pSMgr->suggest(wlst,ns,cw); 
+                     break;
+                   }
+
+     case HUHCAP: { 
+                     ns = pSMgr->suggest(wlst, ns, cw);
+                     if (ns != -1) {
+                       memcpy(wspace,cw,(wl+1));
+                       mkallsmall(wspace, csconv);
+                       ns = pSMgr->suggest(wlst, ns, wspace);
+                     } 
+                     break;
+                   }
+
+     case ALLCAP: { 
+                     memcpy(wspace,cw,(wl+1));
+                     mkallsmall(wspace, csconv);
+                     ns = pSMgr->suggest(wlst, ns, wspace);
+                     if (ns > 0) {
+                       for (int j=0; j < ns; j++)
+                         mkallcap(wlst[j], csconv);
+                     } 
+                     if (ns != -1) 
+                         ns = pSMgr->suggest(wlst, ns , cw);
+                     break;
+                   }
+  }
+  if (ns > 0) {
+       *slst = wlst;
+       return ns;
+  }
+  // try ngram approach since found nothing
+  if (ns == 0) { 
+     ns = pSMgr->ngsuggest(wlst, cw, pHMgr);
+     if (ns) {
+         switch(captype) {
+	    case NOCAP:  break;
+            case HUHCAP: break; 
+            case INITCAP: { 
+                            for (int j=0; j < ns; j++)
+                              mkinitcap(wlst[j], csconv);
+                          }
+                          break;
+
+            case ALLCAP: { 
+                            for (int j=0; j < ns; j++)
+                              mkallcap(wlst[j], csconv);
+                         } 
+                         break;
+	 }
+         *slst = wlst;
+         return ns;
+     }
+  }
+  if (ns < 0) {
+     // we ran out of memory - we should free up as much as possible
+     for (int i=0;i<maxSug; i++)
+	 if (wlst[i] != NULL) free(wlst[i]);
+  }
+  if (wlst) free(wlst);
+  *slst = NULL;
+  return 0;
+}
+
+
+char * MySpell::get_dic_encoding()
+{
+  return encoding;
+}
+
--- a/goldlib/myspell/myspell.hxx
+++ b/goldlib/myspell/myspell.hxx
@ -0,0 +1,37 @@
+#include "hashmgr.hxx"
+#include "affixmgr.hxx"
+#include "suggestmgr.hxx"
+#include "csutil.hxx"
+
+#define NOCAP   0
+#define INITCAP 1
+#define ALLCAP  2
+#define HUHCAP  3
+
+
+#ifndef _MYSPELLMGR_HXX_
+#define _MYSPELLMGR_HXX_
+
+class MySpell
+{
+  AffixMgr*       pAMgr;
+  HashMgr*        pHMgr;
+  SuggestMgr*     pSMgr;
+  char *          encoding;
+  struct cs_info * csconv;
+  int             maxSug;
+
+public:
+  MySpell(const char * affpath, const char * dpath);
+  ~MySpell();
+
+  int suggest(char*** slst, const char * word);
+  int spell(const char *);
+  char * get_dic_encoding();
+
+private:
+   int    cleanword(char *, const char *, int *, int *);
+   char * check(const char *);
+};
+
+#endif
--- a/goldlib/myspell/suggestmgr.cxx
+++ b/goldlib/myspell/suggestmgr.cxx
@ -0,0 +1,539 @@
+#include "license.readme"
+
+#include <cstdlib>
+#include <cctype>
+#include <cstring>
+#include <cstdio>
+
+#include "suggestmgr.hxx"
+
+#if !defined(_MSC_VER)
+using namespace std;
+#endif
+
+extern char * mystrdup(const char *);
+
+
+SuggestMgr::SuggestMgr(const char * tryme, int maxn, 
+                       AffixMgr * aptr)
+{
+
+  // register affix manager and check in string of chars to 
+  // try when building candidate suggestions
+  pAMgr = aptr;
+  ctry = mystrdup(tryme);
+  ctryl = 0;
+  if (ctry)
+    ctryl = strlen(ctry);
+  maxSug = maxn;
+  nosplitsugs=(0==1);
+  if (pAMgr) pAMgr->get_nosplitsugs();
+}
+
+
+SuggestMgr::~SuggestMgr()
+{
+  pAMgr = NULL;
+  if (ctry) free(ctry);
+  ctry = NULL;
+  ctryl = 0;
+  maxSug = 0;
+}
+
+
+
+// generate suggestions for a mispelled word
+//    pass in address of array of char * pointers
+
+int SuggestMgr::suggest(char** wlst, int ns, const char * word)
+{
+    
+    int nsug = ns;
+
+    // perhaps we made chose the wrong char from a related set
+    if ((nsug < maxSug) && (nsug > -1))
+      nsug = mapchars(wlst, word, nsug);
+
+    // perhaps we made a typical fault of spelling
+    if ((nsug < maxSug) && (nsug > -1))
+      nsug = replchars(wlst, word, nsug);
+
+    // did we forget to add a char
+    if ((nsug < maxSug) && (nsug > -1))
+      nsug = forgotchar(wlst, word, nsug);
+
+    // did we swap the order of chars by mistake
+    if ((nsug < maxSug) && (nsug > -1))
+      nsug = swapchar(wlst, word, nsug);
+
+    // did we add a char that should not be there
+    if ((nsug < maxSug) && (nsug > -1))
+      nsug = extrachar(wlst, word, nsug);
+   
+    // did we just hit the wrong key in place of a good char
+    if ((nsug < maxSug) && (nsug > -1))
+      nsug = badchar(wlst, word, nsug);
+
+    // perhaps we forgot to hit space and two words ran together
+    if (!nosplitsugs) {
+        if ((nsug < maxSug) && (nsug > -1))
+           nsug = twowords(wlst, word, nsug);
+    }
+    return nsug;
+}
+
+
+
+// suggestions for when chose the wrong char out of a related set
+int SuggestMgr::mapchars(char** wlst, const char * word, int ns)
+{
+  int wl = strlen(word);
+  if (wl < 2 || ! pAMgr) return ns;
+
+  int nummap = pAMgr->get_nummap();
+  struct mapentry* maptable = pAMgr->get_maptable();
+  if (maptable==NULL) return ns;
+  ns = map_related(word, 0, wlst, ns, maptable, nummap);
+  return ns;
+}
+
+
+int SuggestMgr::map_related(const char * word, int i, char** wlst, int ns, const mapentry* maptable, int nummap) 
+{
+  char c = *(word + i);
+  if (c == 0) {
+      int cwrd = 1;
+      for (int m=0; m < ns; m++)
+	  if (strcmp(word,wlst[m]) == 0) cwrd = 0;
+      if ((cwrd) && check(word,strlen(word))) {
+	  if (ns < maxSug) {
+	      wlst[ns] = mystrdup(word);
+	      if (wlst[ns] == NULL) return -1;
+	      ns++;
+	  }
+      }
+      return ns;
+  } 
+  int in_map = 0;
+  for (int j = 0; j < nummap; j++) {
+    if (strchr(maptable[j].set,c) != 0) {
+      in_map = 1;
+      char * newword = strdup(word);
+      for (int k = 0; k < maptable[j].len; k++) {
+	*(newword + i) = *(maptable[j].set + k);
+	ns = map_related(newword, (i+1), wlst, ns, maptable, nummap);
+      }
+      free(newword);
+    }
+  }
+  if (!in_map) {
+     i++;
+     ns = map_related(word, i, wlst, ns, maptable, nummap);
+  }
+  return ns;
+}
+
+
+
+// suggestions for a typical fault of spelling, that
+// differs with more, than 1 letter from the right form.
+int SuggestMgr::replchars(char** wlst, const char * word, int ns)
+{
+  char candidate[MAXSWL];
+  const char * r;
+  int lenr, lenp;
+  int cwrd;
+
+  int wl = strlen(word);
+  if (wl < 2 || ! pAMgr) return ns;
+
+  int numrep = pAMgr->get_numrep();
+  struct replentry* reptable = pAMgr->get_reptable();
+  if (reptable==NULL) return ns;
+
+  for (int i=0; i < numrep; i++ ) {
+      r = word;
+      lenr = strlen(reptable[i].replacement);
+      lenp = strlen(reptable[i].pattern);
+      // search every occurence of the pattern in the word
+      while ((r=strstr(r, reptable[i].pattern)) != NULL) {
+	  strcpy(candidate, word);
+	  if (r-word + lenr + strlen(r+lenp) >= MAXSWL) break;
+	  strcpy(candidate+(r-word),reptable[i].replacement);
+	  strcpy(candidate+(r-word)+lenr, r+lenp);
+          cwrd = 1;
+          for (int k=0; k < ns; k++)
+	      if (strcmp(candidate,wlst[k]) == 0) cwrd = 0;
+          if ((cwrd) && check(candidate,strlen(candidate))) {
+	      if (ns < maxSug) {
+		  wlst[ns] = mystrdup(candidate);
+		  if (wlst[ns] == NULL) return -1;
+		  ns++;
+	      } else return ns;
+	  }
+          r++; // search for the next letter
+      }
+   }
+   return ns;
+}
+
+
+// error is wrong char in place of correct one
+int SuggestMgr::badchar(char ** wlst, const char * word, int ns)
+{
+  char	tmpc;
+  char	candidate[MAXSWL];
+
+  int wl = strlen(word);
+  int cwrd;
+  strcpy (candidate, word);
+
+  // swap out each char one by one and try all the tryme
+  // chars in its place to see if that makes a good word
+  for (int i=0; i < wl; i++) {
+    tmpc = candidate[i];
+    for (int j=0; j < ctryl; j++) {
+       if (ctry[j] == tmpc) continue;
+       candidate[i] = ctry[j];
+       cwrd = 1;
+       for (int k=0; k < ns; k++)
+	 if (strcmp(candidate,wlst[k]) == 0) cwrd = 0;
+       if ((cwrd) && check(candidate,wl)) {
+	 if (ns < maxSug) {
+            wlst[ns] = mystrdup(candidate);
+            if (wlst[ns] == NULL) return -1;
+            ns++;
+         } else return ns;
+       }
+       candidate[i] = tmpc;
+    }
+  }
+  return ns;
+}
+
+
+// error is word has an extra letter it does not need 
+int SuggestMgr::extrachar(char** wlst, const char * word, int ns)
+{
+   char	   candidate[MAXSWL];
+   const char *  p;
+   char *  r;
+   int cwrd;
+
+   int wl = strlen(word);
+   if (wl < 2) return ns;
+
+   // try omitting one char of word at a time
+   strcpy (candidate, word + 1);
+   for (p = word, r = candidate;  *p != 0;  ) {
+       cwrd = 1;
+       for (int k=0; k < ns; k++)
+	 if (strcmp(candidate,wlst[k]) == 0) cwrd = 0;
+       if ((cwrd) && check(candidate,wl-1)) {
+	 if (ns < maxSug) {
+            wlst[ns] = mystrdup(candidate);
+            if (wlst[ns] == NULL) return -1;
+            ns++;
+         } else return ns; 
+       }
+       *r++ = *p++;
+   }
+   return ns;
+}
+
+
+// error is mising a letter it needs
+int SuggestMgr::forgotchar(char ** wlst, const char * word, int ns)
+{
+   char	candidate[MAXSWL];
+   const char *	p;
+   char *	q;
+   int cwrd;
+
+   int wl = strlen(word);
+
+   // try inserting a tryme character before every letter
+   strcpy(candidate + 1, word);
+   for (p = word, q = candidate;  *p != 0;  )  {
+      for (int i = 0;  i < ctryl;  i++) {
+	 *q = ctry[i];
+         cwrd = 1;
+         for (int k=0; k < ns; k++)
+	   if (strcmp(candidate,wlst[k]) == 0) cwrd = 0;
+         if ((cwrd) && check(candidate,wl+1)) {
+	    if (ns < maxSug) {
+                wlst[ns] = mystrdup(candidate);
+                if (wlst[ns] == NULL) return -1;
+                ns++;
+            } else return ns; 
+         }
+      }
+      *q++ = *p++;
+   }
+
+   // now try adding one to end */
+   for (int i = 0;  i < ctryl;  i++) {
+      *q = ctry[i];
+      cwrd = 1;
+      for (int k=0; k < ns; k++)
+	if (strcmp(candidate,wlst[k]) == 0) cwrd = 0;
+      if ((cwrd) && check(candidate,wl+1)) {
+	 if (ns < maxSug) {
+             wlst[ns] = mystrdup(candidate);
+             if (wlst[ns] == NULL) return -1;
+             ns++;
+         } else return ns;
+      }
+   }
+   return ns;
+}
+
+
+/* error is should have been two words */
+int SuggestMgr::twowords(char ** wlst, const char * word, int ns)
+{
+    char candidate[MAXSWL];
+    char * p;
+
+    int wl=strlen(word);
+    if (wl < 3) return ns;
+    strcpy(candidate + 1, word);
+
+    // split the string into two pieces after every char
+    // if both pieces are good words make them a suggestion
+    for (p = candidate + 1;  p[1] != '\0';  p++) {
+       p[-1] = *p;
+       *p = '\0';
+       if (check(candidate,strlen(candidate))) {
+	 if (check((p+1),strlen(p+1))) {
+	    *p = ' ';
+	    if (ns < maxSug) {
+                wlst[ns] = mystrdup(candidate);
+                if (wlst[ns] == NULL) return -1;
+                ns++;
+            } else return ns;
+         }
+       }
+    }
+    return ns;
+}
+
+
+// error is adjacent letter were swapped
+int SuggestMgr::swapchar(char ** wlst, const char * word, int ns)
+{
+   char	candidate[MAXSWL];
+   char * p;
+   char	tmpc;
+   int cwrd;
+
+   int wl = strlen(word);
+
+   // try swapping adjacent chars one by one
+   strcpy(candidate, word);
+   for (p = candidate;  p[1] != 0;  p++) {
+      tmpc = *p;
+      *p = p[1];
+      p[1] = tmpc;
+      cwrd = 1;
+      for (int k=0; k < ns; k++)
+	if (strcmp(candidate,wlst[k]) == 0) cwrd = 0;
+      if ((cwrd) && check(candidate,wl)) {
+	 if (ns < maxSug) {
+             wlst[ns] = mystrdup(candidate);
+             if (wlst[ns] == NULL) return -1;
+             ns++;
+         } else return ns;
+      }
+      tmpc = *p;
+      *p = p[1];
+      p[1] = tmpc;
+   }
+   return ns;
+}
+
+
+// generate a set of suggestions for very poorly spelled words
+int SuggestMgr::ngsuggest(char** wlst, char * word, HashMgr* pHMgr)
+{
+
+  int i, j;
+  int lval;
+  int sc;
+  int lp;
+
+  if (! pHMgr) return 0;
+
+  // exhaustively search through all root words
+  // keeping track of the MAX_ROOTS most similar root words
+  struct hentry * roots[MAX_ROOTS];
+  int scores[MAX_ROOTS];
+  for (i = 0; i < MAX_ROOTS; i++) {
+    roots[i] = NULL;
+    scores[i] = -100 * i;
+  }
+  lp = MAX_ROOTS - 1;
+
+  int n = strlen(word);
+
+  struct hentry* hp = NULL;
+  int col = -1;
+  while ((hp = pHMgr->walk_hashtable(col, hp))) {
+    sc = ngram(3, word, hp->word, NGRAM_LONGER_WORSE);
+    if (sc > scores[lp]) {
+      scores[lp] = sc;
+      roots[lp] = hp;
+      int lval = sc;
+      for (j=0; j < MAX_ROOTS; j++)
+	if (scores[j] < lval) {
+	  lp = j;
+          lval = scores[j];
+	}
+    }  
+  }
+
+  // find minimum threshhold for a passable suggestion
+  // mangle original word three differnt ways
+  // and score them to generate a minimum acceptable score
+  int thresh = 0;
+  char * mw = NULL;
+  for (int sp = 1; sp < 4; sp++) {
+     mw = strdup(word);
+     for (int k=sp; k < n; k+=4) *(mw + k) = '*';
+     thresh = thresh + ngram(n, word, mw, NGRAM_ANY_MISMATCH);
+     free(mw);
+  }
+  mw = NULL;
+  thresh = thresh / 3;
+  thresh--;
+
+  // now expand affixes on each of these root words and
+  // and use length adjusted ngram scores to select
+  // possible suggestions
+  char * guess[MAX_GUESS];
+  int gscore[MAX_GUESS];
+  for(i=0;i<MAX_GUESS;i++) {
+     guess[i] = NULL;
+     gscore[i] = -100 * i;
+  }
+
+  lp = MAX_GUESS - 1;
+
+  struct guessword * glst;
+  glst = (struct guessword *) calloc(MAX_WORDS,sizeof(struct guessword));
+  if (! glst) return 0;
+
+  for (i = 0; i < MAX_ROOTS; i++) {
+
+      if (roots[i]) {
+        struct hentry * rp = roots[i];
+	int nw = pAMgr->expand_rootword(glst, MAX_WORDS, rp->word, rp->wlen,
+                                        rp->astr, rp->alen);
+        for (int k = 0; k < nw; k++) {
+           sc = ngram(n, word, glst[k].word, NGRAM_ANY_MISMATCH);
+           if (sc > thresh) {
+              if (sc > gscore[lp]) {
+	         if (guess[lp]) free (guess[lp]);
+                 gscore[lp] = sc;
+                 guess[lp] = glst[k].word;
+                 lval = sc;
+                 for (j=0; j < MAX_GUESS; j++)
+	            if (gscore[j] < lval) {
+	               lp = j;
+                       lval = gscore[j];
+	            }
+	      } else {
+                 free (glst[k].word);  
+              }
+	   }            
+	}
+      }
+  }
+  if (glst) free(glst);
+
+  // now we are done generating guesses
+  // sort in order of decreasing score and copy over
+  
+  bubblesort(&guess[0], &gscore[0], MAX_GUESS);
+  int ns = 0;
+  for (i=0; i < MAX_GUESS; i++) {
+    if (guess[i]) {
+      int unique = 1;
+      for (j=i+1; j < MAX_GUESS; j++)
+	if (guess[j]) 
+	    if (!strcmp(guess[i], guess[j])) unique = 0;
+      if (unique) {
+         wlst[ns++] = guess[i];
+      } else {
+	 free(guess[i]);
+      }
+    }
+  }
+  return ns;
+}
+
+
+
+
+// see if a candidate suggestion is spelled correctly
+// needs to check both root words and words with affixes
+int SuggestMgr::check(const char * word, int len)
+{
+  struct hentry * rv=NULL;
+  if (pAMgr) { 
+    rv = pAMgr->lookup(word);
+    if (rv == NULL) rv = pAMgr->affix_check(word,len);
+  }
+  if (rv) return 1;
+  return 0;
+}
+
+
+
+// generate an n-gram score comparing s1 and s2
+int SuggestMgr::ngram(int n, char * s1, const char * s2, int uselen)
+{
+  int nscore = 0;
+  int l1 = strlen(s1);
+  int l2 = strlen(s2);
+  int ns;
+  for (int j=1;j<=n;j++) {
+    ns = 0;
+    for (int i=0;i<=(l1-j);i++) {
+      char c = *(s1 + i + j);
+      *(s1 + i + j) = '\0';
+      if (strstr(s2,(s1+i))) ns++;
+      *(s1 + i + j ) = c;
+    }
+    nscore = nscore + ns;
+    if (ns < 2) break;
+  }
+  ns = 0;
+  if (uselen == NGRAM_LONGER_WORSE) ns = (l2-l1)-2;
+  if (uselen == NGRAM_ANY_MISMATCH) ns = abs(l2-l1)-2;
+  return (nscore - ((ns > 0) ? ns : 0));
+}
+
+
+// sort in decreasing order of score
+void SuggestMgr::bubblesort(char** rword, int* rsc, int n )
+{
+      int m = 1;
+      while (m < n) {
+	  int j = m;
+	  while (j > 0) {
+	    if (rsc[j-1] < rsc[j]) {
+	        int sctmp = rsc[j-1];
+                char * wdtmp = rword[j-1];
+	        rsc[j-1] = rsc[j];
+                rword[j-1] = rword[j];
+                rsc[j] = sctmp;
+                rword[j] = wdtmp;
+	        j--;
+	    } else break;
+	  }
+          m++;
+      }
+      return;
+}
+
--- a/goldlib/myspell/suggestmgr.hxx
+++ b/goldlib/myspell/suggestmgr.hxx
@ -0,0 +1,48 @@
+#ifndef _SUGGESTMGR_HXX_
+#define _SUGGESTMGR_HXX_
+
+#define MAXSWL 100
+#define MAX_ROOTS 10
+#define MAX_WORDS 500
+#define MAX_GUESS 10
+
+#define NGRAM_IGNORE_LENGTH 0
+#define NGRAM_LONGER_WORSE  1
+#define NGRAM_ANY_MISMATCH  2
+
+
+#include "atypes.hxx"
+#include "affixmgr.hxx"
+#include "hashmgr.hxx"
+
+class SuggestMgr
+{
+  char *          ctry;
+  int             ctryl;
+  AffixMgr*       pAMgr;
+  int             maxSug;
+  bool            nosplitsugs;
+
+public:
+  SuggestMgr(const char * tryme, int maxn, AffixMgr *aptr);
+  ~SuggestMgr();
+
+  int suggest(char** wlst, int ns, const char * word);
+  int check(const char *, int);
+  int ngsuggest(char ** wlst, char * word, HashMgr* pHMgr);
+
+private:
+   int replchars(char**, const char *, int);
+   int mapchars(char**, const char *, int);
+   int map_related(const char *, int, char ** wlst, int, const mapentry*, int);
+   int forgotchar(char **, const char *, int);
+   int swapchar(char **, const char *, int);
+   int extrachar(char **, const char *, int);
+   int badchar(char **, const char *, int);
+   int twowords(char **, const char *, int);
+   int ngram(int n, char * s1, const char * s2, int uselen);
+   void bubblesort( char ** rwd, int * rsc, int n);
+};
+
+#endif
+