Here is the corresponding stopwords.txt file content: # Licensed to the Apache Software Foundation (ASF) under one or more # contributor license agreements. See the NOTICE file distributed with # this work for additional information regarding copyright ownership. # The ASF licenses this file to You under the Apache License, Version 2.0 # (the "License"); you may not use this file except in compliance with # the License. You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License.
# ----------------------------------------------------------------------- # a couple of test stopwords to test that the words are really being # configured from this file: stopworda stopwordb # Standard english stop words taken from Lucene's StopAnalyzer a an # and are as at be but by # for # if in into # is it no # not of on # or s such t that the their then there these they this to was will with On Mon, Jun 12, 2023 at 11:06 PM gnandre <arnoldbron...@gmail.com> wrote: > Hi, > > I am using Solr 9.2.1 (official docker image). > > When I try to index a document, I get the error shown at the bottom of > this email. > > Here is my corresponding filter setting > > <fieldType name="url_path_text" class="solr.TextField"> > <analyzer type="index"> > <tokenizer name="pattern" pattern= > "https?:\/\/((www[^\.]+)|(www.))?|\/([^/]\.[^/]$)?|\.?mat\.[^/]+|[?#].*$" > group="-1"/> > <filter name="wordDelimiterGraph" protected="protect.txt" > preserveOriginal="1" generateWordParts="1" generateNumberParts="1" > catenateWords="1" catenateNumbers="1" catenateAll="0" splitOnCaseChange= > "1"/> > <filter name="flattenGraph"/> > <filter name="stop" format="snowball" ignoreCase="true" words= > "stopwords.txt"/> > <filter name="lowercase"/> > <filter name="icuNormalizer2"/> > <filter name="snowballPorter" protected="protwords.txt" language= > "English"/> > <filter name="removeDuplicates"/> > </analyzer> > <analyzer type="query"> > <tokenizer name="whitespace"/> > <filter name="stop" format="snowball" ignoreCase="true" words= > "stopwords.txt"/> > <filter name="wordDelimiterGraph" protected="protect.txt" > preserveOriginal="1" generateWordParts="1" generateNumberParts="1" > catenateWords="1" catenateNumbers="1" catenateAll="0" splitOnCaseChange= > "1"/> > <filter name="lowercase"/> > <filter name="icuNormalizer2"/> > <filter name="snowballPorter" protected="protwords.txt" language= > "English"/> > <filter name="removeDuplicates"/> > </analyzer> > </fieldType> > > What am I 
missing? > > development-environment-solr-9-1 | 2023-06-13 02:58:09.441 ERROR > (qtp479459041-20) [ x:documentation] o.a.s.h.RequestHandlerBase > org.apache.solr.common.SolrException: Exception writing document id > doc:en:doc1 to the index; possible analysis error. => > org.apache.solr.common.SolrException: Exception writing document id > doc:en:doc1 to the index; possible analysis error. > development-environment-solr-9-1 | at > org.apache.solr.update.DirectUpdateHandler2.addDoc(DirectUpdateHandler2.java:323) > development-environment-solr-9-1 | org.apache.solr.common.SolrException: > Exception writing document id doc:en:doc1 to the index; possible analysis > error. > development-environment-solr-9-1 | at > org.apache.solr.update.DirectUpdateHandler2.addDoc(DirectUpdateHandler2.java:323) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.processor.RunUpdateProcessorFactory$RunUpdateProcessor.processAdd(RunUpdateProcessorFactory.java:76) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.processor.UpdateRequestProcessor.processAdd(UpdateRequestProcessor.java:55) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.processor.DistributedUpdateProcessor.doLocalAdd(DistributedUpdateProcessor.java:270) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.processor.DistributedUpdateProcessor.doVersionAdd(DistributedUpdateProcessor.java:545) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.processor.DistributedUpdateProcessor.lambda$versionAdd$0(DistributedUpdateProcessor.java:357) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.VersionBucket.runWithLock(VersionBucket.java:51) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.processor.DistributedUpdateProcessor.versionAdd(DistributedUpdateProcessor.java:354) > ~[?:?] 
> development-environment-solr-9-1 | at > org.apache.solr.update.processor.DistributedUpdateProcessor.processAdd(DistributedUpdateProcessor.java:236) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.processor.LogUpdateProcessorFactory$LogUpdateProcessor.processAdd(LogUpdateProcessorFactory.java:111) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.handler.loader.JavabinLoader$1.update(JavabinLoader.java:123) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.client.solrj.request.JavaBinUpdateRequestCodec$StreamingCodec.readOuterMostDocIterator(JavaBinUpdateRequestCodec.java:342) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.client.solrj.request.JavaBinUpdateRequestCodec$StreamingCodec.readIterator(JavaBinUpdateRequestCodec.java:286) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.common.util.JavaBinCodec.readObject(JavaBinCodec.java:338) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.common.util.JavaBinCodec.readVal(JavaBinCodec.java:283) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.client.solrj.request.JavaBinUpdateRequestCodec$StreamingCodec.readNamedList(JavaBinUpdateRequestCodec.java:236) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.common.util.JavaBinCodec.readObject(JavaBinCodec.java:303) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.common.util.JavaBinCodec.readVal(JavaBinCodec.java:283) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.common.util.JavaBinCodec.unmarshal(JavaBinCodec.java:193) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.client.solrj.request.JavaBinUpdateRequestCodec.unmarshal(JavaBinUpdateRequestCodec.java:126) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.handler.loader.JavabinLoader.parseAndLoadDocs(JavabinLoader.java:135) > ~[?:?] 
> development-environment-solr-9-1 | at > org.apache.solr.handler.loader.JavabinLoader.load(JavabinLoader.java:74) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.handler.UpdateRequestHandler$1.load(UpdateRequestHandler.java:101) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.handler.ContentStreamHandlerBase.handleRequestBody(ContentStreamHandlerBase.java:84) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.handler.RequestHandlerBase.handleRequest(RequestHandlerBase.java:224) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.core.SolrCore.execute(SolrCore.java:2890) ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.HttpSolrCall.executeCoreRequest(HttpSolrCall.java:872) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.HttpSolrCall.call(HttpSolrCall.java:568) ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.SolrDispatchFilter.dispatch(SolrDispatchFilter.java:252) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.SolrDispatchFilter.lambda$doFilter$0(SolrDispatchFilter.java:220) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.ServletUtils.traceHttpRequestExecution2(ServletUtils.java:257) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.ServletUtils.rateLimitRequest(ServletUtils.java:227) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.SolrDispatchFilter.doFilter(SolrDispatchFilter.java:215) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.servlet.SolrDispatchFilter.doFilter(SolrDispatchFilter.java:197) > ~[?:?] 
> development-environment-solr-9-1 | at > org.eclipse.jetty.servlet.FilterHolder.doFilter(FilterHolder.java:210) > ~[jetty-servlet-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.servlet.ServletHandler$Chain.doFilter(ServletHandler.java:1635) > ~[jetty-servlet-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.servlet.ServletHandler.doHandle(ServletHandler.java:527) > ~[jetty-servlet-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ScopedHandler.handle(ScopedHandler.java:131) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.security.SecurityHandler.handle(SecurityHandler.java:578) > ~[jetty-security-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.HandlerWrapper.handle(HandlerWrapper.java:122) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ScopedHandler.nextHandle(ScopedHandler.java:223) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.session.SessionHandler.doHandle(SessionHandler.java:1570) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ScopedHandler.nextHandle(ScopedHandler.java:221) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ContextHandler.doHandle(ContextHandler.java:1383) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ScopedHandler.nextScope(ScopedHandler.java:176) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.servlet.ServletHandler.doScope(ServletHandler.java:484) > ~[jetty-servlet-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > 
org.eclipse.jetty.server.session.SessionHandler.doScope(SessionHandler.java:1543) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ScopedHandler.nextScope(ScopedHandler.java:174) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ContextHandler.doScope(ContextHandler.java:1305) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ScopedHandler.handle(ScopedHandler.java:129) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.ContextHandlerCollection.handle(ContextHandlerCollection.java:149) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.InetAccessHandler.handle(InetAccessHandler.java:228) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.HandlerCollection.handle(HandlerCollection.java:141) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.HandlerWrapper.handle(HandlerWrapper.java:122) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.rewrite.handler.RewriteHandler.handle(RewriteHandler.java:301) > ~[jetty-rewrite-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.HandlerWrapper.handle(HandlerWrapper.java:122) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.gzip.GzipHandler.handle(GzipHandler.java:822) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.handler.HandlerWrapper.handle(HandlerWrapper.java:122) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > 
org.eclipse.jetty.server.Server.handle(Server.java:563) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.HttpChannel.lambda$handle$0(HttpChannel.java:505) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.HttpChannel.dispatch(HttpChannel.java:762) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.HttpChannel.handle(HttpChannel.java:497) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.server.HttpConnection.onFillable(HttpConnection.java:282) > ~[jetty-server-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.io.AbstractConnection$ReadCallback.succeeded(AbstractConnection.java:314) > ~[jetty-io-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.io.FillInterest.fillable(FillInterest.java:100) > ~[jetty-io-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.io.SelectableChannelEndPoint$1.run(SelectableChannelEndPoint.java:53) > ~[jetty-io-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.util.thread.strategy.AdaptiveExecutionStrategy.runTask(AdaptiveExecutionStrategy.java:416) > ~[jetty-util-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.util.thread.strategy.AdaptiveExecutionStrategy.consumeTask(AdaptiveExecutionStrategy.java:385) > ~[jetty-util-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.util.thread.strategy.AdaptiveExecutionStrategy.tryProduce(AdaptiveExecutionStrategy.java:272) > ~[jetty-util-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.util.thread.strategy.AdaptiveExecutionStrategy.lambda$new$0(AdaptiveExecutionStrategy.java:140) > ~[jetty-util-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > 
org.eclipse.jetty.util.thread.ReservedThreadExecutor$ReservedThread.run(ReservedThreadExecutor.java:411) > ~[jetty-util-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.util.thread.QueuedThreadPool.runJob(QueuedThreadPool.java:934) > ~[jetty-util-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at > org.eclipse.jetty.util.thread.QueuedThreadPool$Runner.run(QueuedThreadPool.java:1078) > ~[jetty-util-10.0.13.jar:10.0.13] > development-environment-solr-9-1 | at java.lang.Thread.run(Unknown > Source) [?:?] > development-environment-solr-9-1 | Caused by: > java.lang.NullPointerException: stopWords > development-environment-solr-9-1 | at > java.util.Objects.requireNonNull(Unknown Source) ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.analysis.StopFilter.<init>(StopFilter.java:39) ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.analysis.core.StopFilter.<init>(StopFilter.java:43) ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.analysis.core.StopFilterFactory.create(StopFilterFactory.java:91) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.analysis.TokenizerChain.createComponents(TokenizerChain.java:132) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.analysis.AnalyzerWrapper.createComponents(AnalyzerWrapper.java:120) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.analysis.AnalyzerWrapper.createComponents(AnalyzerWrapper.java:120) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.analysis.Analyzer.tokenStream(Analyzer.java:193) ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.document.Field.tokenStream(Field.java:486) ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.index.IndexingChain$PerField.invert(IndexingChain.java:1103) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.index.IndexingChain.processField(IndexingChain.java:681) > ~[?:?] 
> development-environment-solr-9-1 | at > org.apache.lucene.index.IndexingChain.processDocument(IndexingChain.java:566) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.index.DocumentsWriterPerThread.updateDocuments(DocumentsWriterPerThread.java:241) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.index.DocumentsWriter.updateDocuments(DocumentsWriter.java:432) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.index.IndexWriter.updateDocuments(IndexWriter.java:1533) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.lucene.index.IndexWriter.updateDocuments(IndexWriter.java:1522) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.DirectUpdateHandler2.updateDocOrDocValues(DirectUpdateHandler2.java:1050) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.DirectUpdateHandler2.doNormalUpdate(DirectUpdateHandler2.java:409) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.DirectUpdateHandler2.addDoc0(DirectUpdateHandler2.java:362) > ~[?:?] > development-environment-solr-9-1 | at > org.apache.solr.update.DirectUpdateHandler2.addDoc(DirectUpdateHandler2.java:299) > ~[?:?] > development-environment-solr-9-1 | ... 73 more >