lucene-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From hoss...@apache.org
Subject svn commit: r1524848 - in /lucene/dev/branches/branch_4x: ./ dev-tools/ lucene/ lucene/analysis/ lucene/analysis/common/src/java/org/apache/lucene/analysis/core/ lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/ lucene/analysis/...
Date Thu, 19 Sep 2013 21:35:20 GMT
Author: hossman
Date: Thu Sep 19 21:35:18 2013
New Revision: 1524848

URL: http://svn.apache.org/r1524848
Log:
LUCENE-5211: Better javadocs and error checking of 'format' option in StopFilterFactory, as well as comments in all snowball formatted files about specifying format option (merge r1524809)

Modified:
    lucene/dev/branches/branch_4x/   (props changed)
    lucene/dev/branches/branch_4x/dev-tools/   (props changed)
    lucene/dev/branches/branch_4x/lucene/   (props changed)
    lucene/dev/branches/branch_4x/lucene/BUILD.txt   (props changed)
    lucene/dev/branches/branch_4x/lucene/CHANGES.txt   (contents, props changed)
    lucene/dev/branches/branch_4x/lucene/JRE_VERSION_MIGRATION.txt   (props changed)
    lucene/dev/branches/branch_4x/lucene/LICENSE.txt   (props changed)
    lucene/dev/branches/branch_4x/lucene/MIGRATE.txt   (props changed)
    lucene/dev/branches/branch_4x/lucene/NOTICE.txt   (props changed)
    lucene/dev/branches/branch_4x/lucene/README.txt   (props changed)
    lucene/dev/branches/branch_4x/lucene/SYSTEM_REQUIREMENTS.txt   (props changed)
    lucene/dev/branches/branch_4x/lucene/analysis/   (props changed)
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/java/org/apache/lucene/analysis/core/StopFilterFactory.java
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/danish_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/dutch_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/english_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/finnish_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/french_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/german_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/hungarian_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/italian_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/norwegian_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/portuguese_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/russian_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/spanish_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/swedish_stop.txt
    lucene/dev/branches/branch_4x/lucene/analysis/common/src/test/org/apache/lucene/analysis/core/TestStopFilterFactory.java
    lucene/dev/branches/branch_4x/lucene/analysis/icu/src/java/org/apache/lucene/collation/ICUCollationKeyFilterFactory.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/backwards/   (props changed)
    lucene/dev/branches/branch_4x/lucene/benchmark/   (props changed)
    lucene/dev/branches/branch_4x/lucene/build.xml   (props changed)
    lucene/dev/branches/branch_4x/lucene/classification/   (props changed)
    lucene/dev/branches/branch_4x/lucene/classification/build.xml   (props changed)
    lucene/dev/branches/branch_4x/lucene/classification/ivy.xml   (props changed)
    lucene/dev/branches/branch_4x/lucene/classification/src/   (props changed)
    lucene/dev/branches/branch_4x/lucene/codecs/   (props changed)
    lucene/dev/branches/branch_4x/lucene/common-build.xml   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/index/TestBackwardsCompatibility.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/index/index.40.cfs.zip   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/index/index.40.nocfs.zip   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/index/index.40.optimized.cfs.zip   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/index/index.40.optimized.nocfs.zip   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/search/TestSort.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/search/TestSortDocValues.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/search/TestSortRandom.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/search/TestTopFieldCollector.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/core/src/test/org/apache/lucene/search/TestTotalHitCountCollector.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/demo/   (props changed)
    lucene/dev/branches/branch_4x/lucene/expressions/   (props changed)
    lucene/dev/branches/branch_4x/lucene/facet/   (props changed)
    lucene/dev/branches/branch_4x/lucene/grouping/   (props changed)
    lucene/dev/branches/branch_4x/lucene/highlighter/   (props changed)
    lucene/dev/branches/branch_4x/lucene/ivy-settings.xml   (props changed)
    lucene/dev/branches/branch_4x/lucene/join/   (props changed)
    lucene/dev/branches/branch_4x/lucene/licenses/   (props changed)
    lucene/dev/branches/branch_4x/lucene/memory/   (props changed)
    lucene/dev/branches/branch_4x/lucene/misc/   (props changed)
    lucene/dev/branches/branch_4x/lucene/module-build.xml   (props changed)
    lucene/dev/branches/branch_4x/lucene/queries/   (props changed)
    lucene/dev/branches/branch_4x/lucene/queries/src/test/org/apache/lucene/queries/function/TestFunctionQuerySort.java   (props changed)
    lucene/dev/branches/branch_4x/lucene/queryparser/   (props changed)
    lucene/dev/branches/branch_4x/lucene/replicator/   (props changed)
    lucene/dev/branches/branch_4x/lucene/sandbox/   (props changed)
    lucene/dev/branches/branch_4x/lucene/site/   (props changed)
    lucene/dev/branches/branch_4x/lucene/spatial/   (props changed)
    lucene/dev/branches/branch_4x/lucene/suggest/   (props changed)
    lucene/dev/branches/branch_4x/lucene/test-framework/   (props changed)
    lucene/dev/branches/branch_4x/lucene/tools/   (props changed)
    lucene/dev/branches/branch_4x/solr/   (props changed)
    lucene/dev/branches/branch_4x/solr/CHANGES.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/LICENSE.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/NOTICE.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/README.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/SYSTEM_REQUIREMENTS.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/build.xml   (props changed)
    lucene/dev/branches/branch_4x/solr/cloud-dev/   (props changed)
    lucene/dev/branches/branch_4x/solr/common-build.xml   (props changed)
    lucene/dev/branches/branch_4x/solr/contrib/   (props changed)
    lucene/dev/branches/branch_4x/solr/core/   (props changed)
    lucene/dev/branches/branch_4x/solr/core/src/test/org/apache/solr/core/TestConfig.java   (props changed)
    lucene/dev/branches/branch_4x/solr/example/   (props changed)
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_da.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_de.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_es.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fi.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fr.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_hu.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_it.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_nl.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_no.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_pt.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_ru.txt
    lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_sv.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_da.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_de.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_es.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fi.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fr.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_hu.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_it.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_nl.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_no.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_pt.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_ru.txt
    lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_sv.txt
    lucene/dev/branches/branch_4x/solr/licenses/   (props changed)
    lucene/dev/branches/branch_4x/solr/licenses/httpclient-LICENSE-ASL.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/licenses/httpclient-NOTICE.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/licenses/httpcore-LICENSE-ASL.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/licenses/httpcore-NOTICE.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/licenses/httpmime-LICENSE-ASL.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/licenses/httpmime-NOTICE.txt   (props changed)
    lucene/dev/branches/branch_4x/solr/scripts/   (props changed)
    lucene/dev/branches/branch_4x/solr/site/   (props changed)
    lucene/dev/branches/branch_4x/solr/solrj/   (props changed)
    lucene/dev/branches/branch_4x/solr/test-framework/   (props changed)
    lucene/dev/branches/branch_4x/solr/webapp/   (props changed)

Modified: lucene/dev/branches/branch_4x/lucene/CHANGES.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/CHANGES.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/CHANGES.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/CHANGES.txt Thu Sep 19 21:35:18 2013
@@ -36,6 +36,12 @@ API Changes:
   with IndexSearcher when an ExecutorService is specified.
   (Ryan Ernst, Mike McCandless, Robert Muir)
 
+Documentation
+
+* LUCENE-5211: Better javadocs and error checking of 'format' option in 
+  StopFilterFactory, as well as comments in all snowball formatted files
+  about specifying format option.  (hossman)
+
 Changes in backwards compatibility policy
 
 * LUCENE-5204: Directory doesn't have default implementations for

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/java/org/apache/lucene/analysis/core/StopFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/java/org/apache/lucene/analysis/core/StopFilterFactory.java?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/java/org/apache/lucene/analysis/core/StopFilterFactory.java (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/java/org/apache/lucene/analysis/core/StopFilterFactory.java Thu Sep 19 21:35:18 2013
@@ -22,22 +22,57 @@ import org.apache.lucene.analysis.util.C
 import org.apache.lucene.analysis.util.ResourceLoader;
 import org.apache.lucene.analysis.util.ResourceLoaderAware;
 import org.apache.lucene.analysis.util.TokenFilterFactory;
+import org.apache.lucene.analysis.util.WordlistLoader; // jdocs
 
 import java.util.Map;
 import java.io.IOException;
 
 /**
  * Factory for {@link StopFilter}.
+ *
  * <pre class="prettyprint">
  * &lt;fieldType name="text_stop" class="solr.TextField" positionIncrementGap="100" autoGeneratePhraseQueries="true"&gt;
  *   &lt;analyzer&gt;
  *     &lt;tokenizer class="solr.WhitespaceTokenizerFactory"/&gt;
  *     &lt;filter class="solr.StopFilterFactory" ignoreCase="true"
- *             words="stopwords.txt" enablePositionIncrements="true"/&gt;
+ *             words="stopwords.txt" format="wordset" /&gt;
  *   &lt;/analyzer&gt;
  * &lt;/fieldType&gt;</pre>
+ *
+ * <p>
+ * All attributes are optional:
+ * </p>
+ * <ul>
+ *  <li><code>ignoreCase</code> defaults to <code>false</code></li>
+ *  <li><code>words</code> should be the name of a stopwords file to parse; if not 
+ *      specified, the factory will use {@link StopAnalyzer#ENGLISH_STOP_WORDS_SET}
+ *  </li>
+ *  <li><code>format</code> defines how the <code>words</code> file will be parsed, 
+ *      and defaults to <code>wordset</code>.  If <code>words</code> is not specified, 
+ *      then <code>format</code> must not be specified.
+ *  </li>
+ * </ul>
+ * <p>
+ * The valid values for the <code>format</code> option are:
+ * </p>
+ * <ul>
+ *  <li><code>wordset</code> - This is the default format, which supports one word per 
+ *      line (including any intra-word whitespace) and allows whole line comments 
+ *      beginning with the "#" character.  Blank lines are ignored.  See 
+ *      {@link WordlistLoader#getLines WordlistLoader.getLines} for details.
+ *  </li>
+ *  <li><code>snowball</code> - This format allows for multiple words specified on each 
+ *      line, and trailing comments may be specified using the vertical line ("&#124;"). 
+ *      Blank lines are ignored.  See 
+ *      {@link WordlistLoader#getSnowballWordSet WordlistLoader.getSnowballWordSet} 
+ *      for details.
+ *  </li>
+ * </ul>
  */
 public class StopFilterFactory extends TokenFilterFactory implements ResourceLoaderAware {
+  public static final String FORMAT_WORDSET = "wordset";
+  public static final String FORMAT_SNOWBALL = "snowball";
+  
   private CharArraySet stopWords;
   private final String stopWordFiles;
   private final String format;
@@ -49,7 +84,7 @@ public class StopFilterFactory extends T
     super(args);
     assureMatchVersion();
     stopWordFiles = get(args, "words");
-    format = get(args, "format");
+    format = get(args, "format", (null == stopWordFiles ? null : FORMAT_WORDSET));
     ignoreCase = getBoolean(args, "ignoreCase", false);
     enablePositionIncrements = getBoolean(args, "enablePositionIncrements", true);
     if (!args.isEmpty()) {
@@ -60,12 +95,17 @@ public class StopFilterFactory extends T
   @Override
   public void inform(ResourceLoader loader) throws IOException {
     if (stopWordFiles != null) {
-      if ("snowball".equalsIgnoreCase(format)) {
+      if (FORMAT_WORDSET.equalsIgnoreCase(format)) {
+        stopWords = getWordSet(loader, stopWordFiles, ignoreCase);
+      } else if (FORMAT_SNOWBALL.equalsIgnoreCase(format)) {
         stopWords = getSnowballWordSet(loader, stopWordFiles, ignoreCase);
       } else {
-        stopWords = getWordSet(loader, stopWordFiles, ignoreCase);
+        throw new IllegalArgumentException("Unknown 'format' specified for 'words' file: " + format);
       }
     } else {
+      if (null != format) {
+        throw new IllegalArgumentException("'format' can not be specified w/o an explicit 'words' file: " + format);
+      }
       stopWords = new CharArraySet(luceneMatchVersion, StopAnalyzer.ENGLISH_STOP_WORDS_SET, ignoreCase);
     }
   }

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/danish_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/danish_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/danish_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/danish_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Danish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/dutch_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/dutch_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/dutch_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/dutch_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Dutch stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/english_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/english_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/english_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/english_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
  
  | An English stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/finnish_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/finnish_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/finnish_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/finnish_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
  
 | forms of BE
 

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/french_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/french_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/french_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/french_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A French stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/german_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/german_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/german_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/german_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A German stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/hungarian_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/hungarian_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/hungarian_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/hungarian_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
  
 | Hungarian stop word list
 | prepared by Anna Tordai

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/italian_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/italian_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/italian_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/italian_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | An Italian stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/norwegian_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/norwegian_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/norwegian_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/norwegian_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Norwegian stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/portuguese_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/portuguese_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/portuguese_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/portuguese_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Portuguese stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/russian_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/russian_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/russian_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/russian_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | a russian stop word list. comments begin with vertical bar. each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/spanish_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/spanish_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/spanish_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/spanish_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Spanish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/swedish_stop.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/swedish_stop.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/swedish_stop.txt (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/swedish_stop.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Swedish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/lucene/analysis/common/src/test/org/apache/lucene/analysis/core/TestStopFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/lucene/analysis/common/src/test/org/apache/lucene/analysis/core/TestStopFilterFactory.java?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/lucene/analysis/common/src/test/org/apache/lucene/analysis/core/TestStopFilterFactory.java (original)
+++ lucene/dev/branches/branch_4x/lucene/analysis/common/src/test/org/apache/lucene/analysis/core/TestStopFilterFactory.java Thu Sep 19 21:35:18 2013
@@ -57,6 +57,11 @@ public class TestStopFilterFactory exten
     assertTrue(words.contains("her"));
     assertTrue(words.contains("hers"));
     assertTrue(words.contains("herself"));
+
+    // defaults
+    factory = (StopFilterFactory) tokenFilterFactory("Stop");
+    assertEquals(StopAnalyzer.ENGLISH_STOP_WORDS_SET, factory.getStopWords());
+    assertEquals(false, factory.isIgnoreCase());
   }
   
   /** Test that bogus arguments result in exception */
@@ -68,4 +73,30 @@ public class TestStopFilterFactory exten
       assertTrue(expected.getMessage().contains("Unknown parameters"));
     }
   }
+
+  /** Test that a bogus 'format' value results in an exception, both with an explicit words file and with the default stop words */
+  public void testBogusFormats() throws Exception {
+    try {
+      tokenFilterFactory("Stop", 
+                         "words", "stop-snowball.txt",
+                         "format", "bogus");
+      fail();
+    } catch (IllegalArgumentException expected) {
+      String msg = expected.getMessage();
+      assertTrue(msg, msg.contains("Unknown"));
+      assertTrue(msg, msg.contains("format"));
+      assertTrue(msg, msg.contains("bogus"));
+    }
+    try {
+      tokenFilterFactory("Stop", 
+                         // implicit default words file
+                         "format", "bogus");
+      fail();
+    } catch (IllegalArgumentException expected) {
+      String msg = expected.getMessage();
+      assertTrue(msg, msg.contains("can not be specified"));
+      assertTrue(msg, msg.contains("format"));
+      assertTrue(msg, msg.contains("bogus"));
+    }
+  }
 }

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_da.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_da.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_da.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_da.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Danish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_de.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_de.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_de.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_de.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A German stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_es.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_es.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_es.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_es.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Spanish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fi.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fi.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fi.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fi.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
  
 | forms of BE
 

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fr.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fr.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fr.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_fr.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A French stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_hu.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_hu.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_hu.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_hu.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
  
 | Hungarian stop word list
 | prepared by Anna Tordai

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_it.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_it.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_it.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_it.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | An Italian stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_nl.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_nl.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_nl.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_nl.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Dutch stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_no.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_no.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_no.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_no.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Norwegian stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_pt.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_pt.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_pt.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_pt.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Portuguese stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_ru.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_ru.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_ru.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_ru.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | a russian stop word list. comments begin with vertical bar. each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_sv.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_sv.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_sv.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/example-schemaless/solr/collection1/conf/lang/stopwords_sv.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Swedish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_da.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_da.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_da.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_da.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Danish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_de.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_de.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_de.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_de.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A German stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_es.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_es.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_es.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_es.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Spanish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fi.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fi.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fi.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fi.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
  
 | forms of BE
 

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fr.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fr.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fr.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_fr.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A French stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_hu.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_hu.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_hu.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_hu.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
  
 | Hungarian stop word list
 | prepared by Anna Tordai

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_it.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_it.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_it.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_it.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | An Italian stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_nl.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_nl.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_nl.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_nl.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Dutch stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_no.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_no.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_no.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_no.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Norwegian stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_pt.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_pt.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_pt.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_pt.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Portuguese stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_ru.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_ru.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_ru.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_ru.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | a russian stop word list. comments begin with vertical bar. each stop
  | word is at the start of a line.

Modified: lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_sv.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_sv.txt?rev=1524848&r1=1524847&r2=1524848&view=diff
==============================================================================
--- lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_sv.txt (original)
+++ lucene/dev/branches/branch_4x/solr/example/solr/collection1/conf/lang/stopwords_sv.txt Thu Sep 19 21:35:18 2013
@@ -4,6 +4,8 @@
  | Also see http://www.opensource.org/licenses/bsd-license.html
  |  - Encoding was converted to UTF-8.
  |  - This notice was added.
+ |
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
 
  | A Swedish stop word list. Comments begin with vertical bar. Each stop
  | word is at the start of a line.



Mime
View raw message