/*
* $Id$
*
+ *
+ * Copyright (c) 2005-2009 by the citadel.org team
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*/
* later on, or even if we update this one, we can use a different ID so the
* system knows it needs to throw away the existing index and rebuild it.
*/
-#define FT_WORDBREAKER_ID 0x001f
+#define FT_WORDBREAKER_ID 0x0021
/*
* Minimum and maximum length of words to index
*/
-#define WB_MIN 3
+#define WB_MIN 4 // nothing with 3 or less chars
#define WB_MAX 40
void wordbreaker(char *text, int *num_tokens, int **tokens);
+void initialize_noise_words(void);
+void noise_word_cleanup(void);
+
+
+typedef struct noise_word noise_word;
+
+struct noise_word {
+ unsigned int len;
+ char *word;
+ noise_word *next;
+};