Blob Blame History Raw
diff -ru vim70.orig/src/Makefile vim70.hunspell/src/Makefile
--- vim70.orig/src/Makefile	2006-12-15 12:29:41.000000000 +0000
+++ vim70.hunspell/src/Makefile	2006-12-14 11:11:20.000000000 +0000
@@ -1287,7 +1287,7 @@
 PFLAGS = $(PROTO_FLAGS) -DPROTO $(LINT_CFLAGS)
 
 ALL_LIB_DIRS = $(GUI_LIBS_DIR) $(X_LIBS_DIR)
-ALL_LIBS = $(GUI_LIBS1) $(GUI_X_LIBS) $(GUI_LIBS2) $(X_PRE_LIBS) $(X_LIBS) $(X_EXTRA_LIBS) $(LIBS) $(EXTRA_LIBS) $(MZSCHEME_LIBS) $(PERL_LIBS) $(PYTHON_LIBS) $(TCL_LIBS) $(RUBY_LIBS) $(PROFILE_LIBS)
+ALL_LIBS = $(GUI_LIBS1) $(GUI_X_LIBS) $(GUI_LIBS2) $(X_PRE_LIBS) $(X_LIBS) $(X_EXTRA_LIBS) $(LIBS) $(EXTRA_LIBS) $(MZSCHEME_LIBS) $(PERL_LIBS) $(PYTHON_LIBS) $(TCL_LIBS) $(RUBY_LIBS) $(PROFILE_LIBS) -lhunspell-1.1
 
 # abbreviations
 DEST_BIN = $(DESTDIR)$(BINDIR)
diff -ru vim70.orig/src/spell.c vim70.hunspell/src/spell.c
--- vim70.orig/src/spell.c	2006-12-15 12:29:44.000000000 +0000
+++ vim70.hunspell/src/spell.c	2006-12-15 12:27:49.000000000 +0000
@@ -319,6 +319,8 @@
 # include <time.h>	/* for time_t */
 #endif
 
+#include "hunspell/hunspell.h"
+
 #define MAXWLEN 250		/* Assume max. word len is this many bytes.
 				   Some places assume a word length fits in a
 				   byte, thus it can't be above 255. */
@@ -428,6 +430,8 @@
 #define	SP_FORMERROR	-2	/* format error in spell file */
 #define SP_OTHERERROR	-3	/* other error while reading spell file */
 
+#define MAXREGIONS 20
+
 /*
  * Structure used to store words and other info for one language, loaded from
  * a .spl file.
@@ -450,6 +454,10 @@
     char_u	*sl_name;	/* language name "en", "en.rare", "nl", etc. */
     char_u	*sl_fname;	/* name of .spl file */
     int		sl_add;		/* TRUE if it's a .add file. */
+    int		sl_ishunspell;	/* TRUE if it's an unconverted hunspell aff/dic combination. */
+    Hunhandle	*sl_hunspell;
+    vimconv_T   sl_tohunconv;
+    vimconv_T   sl_fromhunconv;
 
     char_u	*sl_fbyts;	/* case-folded word bytes */
     idx_T	*sl_fidxs;	/* case-folded word indexes */
@@ -460,7 +468,7 @@
 
     char_u	*sl_info;	/* infotext string or NULL */
 
-    char_u	sl_regions[17];	/* table with up to 8 region names plus NUL */
+    char_u	sl_regions[MAXREGIONS * 2 + 1];	/* table with up to 8 region names plus NUL */
 
     char_u	*sl_midword;	/* MIDWORD string or NULL */
 
@@ -997,6 +1005,36 @@
 static char_u	*repl_from = NULL;
 static char_u	*repl_to = NULL;
 
+static void
+ensurehunspellinit(lp)
+    slang_T *lp;
+{
+    if (!lp->sl_hunspell)
+    {
+        char_u *dic = lp->sl_fname;
+        char_u *aff = vim_strnsave(dic, strlen(dic));
+    
+	vim_strncpy(aff + strlen(aff) - 3, "aff", 3);
+    
+	lp->sl_hunspell = Hunspell_create(aff, dic);
+
+	vim_free(aff);
+
+	if (convert_setup(&lp->sl_tohunconv, spell_enc(), 
+	    Hunspell_get_dic_encoding(lp->sl_hunspell)) == FAIL)
+	{
+	    lp->sl_tohunconv.vc_fail = TRUE;
+	}
+
+	if (convert_setup(&lp->sl_fromhunconv, 
+	    Hunspell_get_dic_encoding(lp->sl_hunspell), spell_enc()) == FAIL)
+	{
+	    lp->sl_fromhunconv.vc_fail = TRUE;
+	}
+    }
+}
+
+
 /*
  * Main spell-checking function.
  * "ptr" points to a character that could be the start of a word.
@@ -1101,27 +1139,70 @@
     {
 	mi.mi_lp = LANGP_ENTRY(wp->w_buffer->b_langp, lpi);
 
+	if (mi.mi_lp->lp_slang->sl_ishunspell)
+	{
+	    slang_T *lp = mi.mi_lp->lp_slang;
+	    char_u *converted = 0;
+	    char_u *thisword;
+	    char_u *mi_end = mi.mi_end;
+	    char_u *mi_final =  mi.mi_word + strlen(mi.mi_word);
+
+	    while (1)
+	    {
+		ensurehunspellinit(lp);
+		if ((lp->sl_tohunconv.vc_fail == TRUE) || (lp->sl_fromhunconv.vc_fail == TRUE))
+		    break;
+
+		if (mi_end != mi.mi_word)
+		{
+		    thisword = vim_strnsave(mi.mi_word, mi_end - mi.mi_word);
+		    converted = string_convert(&lp->sl_tohunconv, thisword, NULL);
+		    if (converted)
+		    {
+			if (Hunspell_spell(lp->sl_hunspell, converted) != 0)
+			{
+			    mi.mi_result = SP_OK;
+			    mi.mi_end = mi.mi_cend = mi.mi_word + strlen(thisword);
+			}
+			vim_free(converted);
+		    }
+		    vim_free(thisword);
+		}
+
+		if (mi_end == mi_final)
+		    break;
+
+		do
+		{
+		    mb_ptr_adv(mi_end);
+		} while (*mi_end != NUL && spell_iswordp(mi_end, wp->w_buffer));
+	    }
+	}
+
 	/* If reloading fails the language is still in the list but everything
 	 * has been cleared. */
-	if (mi.mi_lp->lp_slang->sl_fidxs == NULL)
+	if (!mi.mi_lp->lp_slang->sl_ishunspell && mi.mi_lp->lp_slang->sl_fidxs == NULL)
 	    continue;
 
-	/* Check for a matching word in case-folded words. */
-	find_word(&mi, FIND_FOLDWORD);
+	if (!mi.mi_lp->lp_slang->sl_ishunspell)
+	{
+	    /* Check for a matching word in case-folded words. */
+	    find_word(&mi, FIND_FOLDWORD);
 
-	/* Check for a matching word in keep-case words. */
-	find_word(&mi, FIND_KEEPWORD);
+	    /* Check for a matching word in keep-case words. */
+	    find_word(&mi, FIND_KEEPWORD);
 
-	/* Check for matching prefixes. */
-	find_prefix(&mi, FIND_FOLDWORD);
+	    /* Check for matching prefixes. */
+	    find_prefix(&mi, FIND_FOLDWORD);
 
-	/* For a NOBREAK language, may want to use a word without a following
-	 * word as a backup. */
-	if (mi.mi_lp->lp_slang->sl_nobreak && mi.mi_result == SP_BAD
-						   && mi.mi_result2 != SP_BAD)
-	{
-	    mi.mi_result = mi.mi_result2;
-	    mi.mi_end = mi.mi_end2;
+	    /* For a NOBREAK language, may want to use a word without a following
+	     * word as a backup. */
+	    if (mi.mi_lp->lp_slang->sl_nobreak && mi.mi_result == SP_BAD
+						       && mi.mi_result2 != SP_BAD)
+	    {
+		mi.mi_result = mi.mi_result2;
+		mi.mi_end = mi.mi_end2;
+	    }
 	}
 
 	/* Count the word in the first language where it's found to be OK. */
@@ -2359,6 +2440,80 @@
 
     if (r == FAIL)
     {
+#	define HUNSPELLDICT "/usr/share/myspell/"
+	DIR *dirp = opendir(HUNSPELLDICT);
+	if (dirp != NULL)
+	{
+	    slang_T* thislang[MAXREGIONS] = {0};
+	    slang_T *lp = 0;
+	    struct dirent *dp;
+	    int i = 0;
+
+	    while ((dp = readdir(dirp)) != NULL)
+	    {
+		char_u final_name[MAXPATHL];
+		char_u spf_name[MAXPATHL];
+		char_u thisregion[3] = {0};
+		char *resolvedlink = final_name;
+		int j, regionpos;
+
+		if (strncmp(dp->d_name, lang, strlen(lang)) != 0)
+		    continue;
+		
+		if ((strlen(dp->d_name) <= 4) || (dp->d_name[strlen(lang)] != '_'))
+		    continue;
+
+		if (strncmp(".dic", dp->d_name + strlen(dp->d_name) - 4, 4) != 0)
+		    continue;
+
+		vim_strncpy(spf_name, HUNSPELLDICT, strlen(HUNSPELLDICT));
+		vim_strncpy(spf_name + strlen(HUNSPELLDICT), dp->d_name, strlen(HUNSPELLDICT));
+
+		if (realpath(spf_name, resolvedlink) != resolvedlink)
+		    continue;
+
+		thisregion[0] = tolower(dp->d_name[strlen(lang)+1]);
+		thisregion[1] = tolower(dp->d_name[strlen(lang)+1+1]);
+
+		r = OK;
+
+		for (j = 0; j < MAXREGIONS; ++j)
+		{
+		    if (thislang[j] && (strcmp(thislang[j]->sl_fname, final_name) == 0))
+			break;
+		}
+
+		if (j < MAXREGIONS)
+		    lp = thislang[j];
+		else
+		{
+		    lp = slang_alloc(lang);
+		    lp->sl_ishunspell = TRUE;
+
+		    lp->sl_fname = vim_strsave(resolvedlink);
+
+		    lp->sl_next = first_lang;
+		    first_lang = lp;
+		    thislang[i] = lp;
+		}
+
+		regionpos = 0;
+		while (lp->sl_regions[regionpos] != 0) ++regionpos;
+
+		//silently lose regions which won't fit in
+		if (regionpos == MAXREGIONS * 2)
+		    continue;
+
+		vim_strncpy(lp->sl_regions + regionpos, thisregion, 2);
+
+		++i;
+	    }
+	    closedir(dirp);
+	}
+    }
+
+    if (r == FAIL)
+    {
 	smsg((char_u *)_("Warning: Cannot find word list \"%s.%s.spl\" or \"%s.ascii.spl\""),
 						     lang, spell_enc(), lang);
     }
@@ -2429,6 +2584,9 @@
 slang_free(lp)
     slang_T	*lp;
 {
+    Hunspell_destroy(lp->sl_hunspell);
+    convert_setup(&lp->sl_tohunconv, NULL, NULL);
+    convert_setup(&lp->sl_fromhunconv, NULL, NULL);
     vim_free(lp->sl_name);
     vim_free(lp->sl_fname);
     slang_clear(lp);
@@ -2974,7 +3132,7 @@
 {
     int		i;
 
-    if (len > 16)
+    if (len > MAXREGIONS*2)
 	return SP_FORMERROR;
     for (i = 0; i < len; ++i)
 	lp->sl_regions[i] = getc(fd);			/* <regionname> */
@@ -4112,6 +4270,7 @@
     /* loop over comma separated language names. */
     for (splp = buf->b_p_spl; *splp != NUL; )
     {
+	int hunspellregionunsupported;
 	/* Get one language name. */
 	copy_option_part(&splp, lang, MAXWLEN, ",");
 
@@ -4182,6 +4341,7 @@
 	/*
 	 * Loop over the languages, there can be several files for "lang".
 	 */
+	hunspellregionunsupported = 0;
 	for (slang = first_lang; slang != NULL; slang = slang->sl_next)
 	    if (filename ? fullpathcmp(lang, slang->sl_fname, FALSE) == FPC_SAME
 			 : STRICMP(lang, slang->sl_name) == 0)
@@ -4199,6 +4359,11 @@
 				/* This addition file is for other regions. */
 				region_mask = 0;
 			}
+			else if (slang->sl_ishunspell)
+			{
+			    region_mask = 0;
+			    hunspellregionunsupported++;
+			}
 			else
 			    /* This is probably an error.  Give a warning and
 			     * accept the words anyway. */
@@ -4207,7 +4372,10 @@
 								      region);
 		    }
 		    else
+		    {
+			hunspellregionunsupported--;
 			region_mask = 1 << c;
+		    }
 		}
 
 		if (region_mask != 0)
@@ -4225,6 +4393,9 @@
 			nobreak = TRUE;
 		}
 	    }
+
+	if (region && hunspellregionunsupported >= 1)
+	    smsg((char_u *) _("Warning: region %s not supported"), region);
     }
 
     /* round 0: load int_wordlist, if possible.
@@ -4832,7 +5003,7 @@
     char_u	*si_info;	/* info text chars or NULL  */
     int		si_region_count; /* number of regions supported (1 when there
 				    are no regions) */
-    char_u	si_region_name[16]; /* region names; used only if
+    char_u	si_region_name[MAXREGIONS*2]; /* region names; used only if
 				     * si_region_count > 1) */
 
     garray_T	si_rep;		/* list of fromto_T entries from REP lines */
@@ -7093,7 +7264,7 @@
 		else
 		{
 		    line += 8;
-		    if (STRLEN(line) > 16)
+		    if (STRLEN(line) > MAXREGIONS)
 			smsg((char_u *)_("Too many regions in %s line %d: %s"),
 						       fname, lnum, line);
 		    else
@@ -8973,7 +9144,7 @@
     char_u	wfname[MAXPATHL];
     char_u	**innames;
     int		incount;
-    afffile_T	*(afile[8]);
+    afffile_T	*(afile[MAXREGIONS]);
     int		i;
     int		len;
     struct stat	st;
@@ -9040,8 +9211,8 @@
 	EMSG(_(e_invarg));	/* need at least output and input names */
     else if (vim_strchr(gettail(wfname), '_') != NULL)
 	EMSG(_("E751: Output file name must not have region name"));
-    else if (incount > 8)
-	EMSG(_("E754: Only up to 8 regions supported"));
+    else if (incount > MAXREGIONS)
+	EMSG2(_("E754: Only up to %d regions supported"), MAXREGIONS);
     else
     {
 	/* Check for overwriting before doing things that may take a lot of
@@ -11097,6 +11268,36 @@
     {
 	lp = LANGP_ENTRY(curbuf->b_langp, lpi);
 
+	if (lp->lp_slang->sl_ishunspell)
+	{
+	    slang_T *slp = lp->lp_slang;
+	    char **slst;
+	    char_u *converted = 0;
+
+	    ensurehunspellinit(slp);
+
+	    converted = string_convert(&slp->sl_tohunconv, su->su_fbadword, NULL);
+	    if (converted)
+	    {
+		int suggests;
+		suggests = Hunspell_suggest(slp->sl_hunspell, &slst, converted);
+		if (suggests > 0)
+		{
+		    int i;
+		    char_u *suggest;
+		    for (i = 0; i < suggests; ++i)
+		    {
+			suggest = string_convert(&slp->sl_fromhunconv, slst[i], NULL);
+			add_suggestion(su, &su->su_ga, suggest, su->su_badlen, i, 0, FALSE,
+			    slp, FALSE);
+			vim_free(suggest);
+		    }
+		    free(slst);
+		}
+		vim_free(converted);
+	    }
+	}
+
 	/* If reloading a spell file fails it's still in the list but
 	 * everything has been cleared. */
 	if (lp->lp_slang->sl_fbyts == NULL)