On May 7, 2007, at 11:05 AM, Brian Whitman wrote:
Using resin 3.0.23 with a trunk solr war I am having a problem adding documents with utf-8 characters, including the utf8-example in exampledocs.

The document simply doesn't get added to Solr. Flat ascii documents work fine as does all non-update stuff.

To reproduce:
install resin 3 and set up solr according to the wiki for resin.
./post.sh utf8-example.xml

I also have a real world document that doesn't work (from our nutch crawls):
wget http://variogr.am/badfile.txt
./post.sh badfile.txt


A solr rock star advised me to try SOLR-214, which fixes the problem. Perhaps he'll illuminate us as to the reasons! But for now be careful with Resin.


-Brian







I get this in my resin logs.

[10:53:10.834] java.io.CharConversionException: illegal utf8 encoding at 0xc3, a [10:53:10.834] at com.caucho.vfs.i18n.UTF8Reader.read (UTF8Reader.java:97) [10:53:10.834] at com.caucho.vfs.i18n.UTF8Reader.read (UTF8Reader.java:178)
[10:53:10.834]  at com.caucho.vfs.ReadStream.read(ReadStream.java:499)
[10:53:10.834] at com.caucho.vfs.BufferedReaderAdapter.read (BufferedReaderAdapter.java:64) [10:53:10.834] at org.xmlpull.mxp1.MXParser.fillBuf(MXParser.java: 2972)
[10:53:10.834]  at org.xmlpull.mxp1.MXParser.more(MXParser.java:3026)
[10:53:10.834] at org.xmlpull.mxp1.MXParser.parseProlog (MXParser.java:1410) [10:53:10.834] at org.xmlpull.mxp1.MXParser.nextImpl(MXParser.java: 1395)
[10:53:10.834]  at org.xmlpull.mxp1.MXParser.next(MXParser.java:1093)
[10:53:10.834] at org.xmlpull.mxp1.MXParser.nextTag(MXParser.java: 1078) [10:53:10.834] at org.apache.solr.handler.XmlUpdateRequestHandler.update (XmlUpdateRequestHandler.java:111) [10:53:10.834] at org.apache.solr.handler.XmlUpdateRequestHandler.handleRequestBody (XmlUpdateRequestHandler.java:84) [10:53:10.834] at org.apache.solr.handler.RequestHandlerBase.handleRequest (RequestHandlerBase.java:77) [10:53:10.834] at org.apache.solr.core.SolrCore.execute (SolrCore.java:671) [10:53:10.834] at org.apache.solr.servlet.SolrDispatchFilter.execute (SolrDispatchFilter.java:188) [10:53:10.834] at org.apache.solr.servlet.SolrDispatchFilter.doFilter (SolrDispatchFilter.java:156) [10:53:10.834] at com.caucho.server.dispatch.FilterFilterChain.doFilter (FilterFilterChain.java:70) [10:53:10.834] at com.caucho.server.webapp.WebAppFilterChain.doFilter (WebAppFilterChain.java:173) [10:53:10.834] at com.caucho.server.dispatch.ServletInvocation.service (ServletInvocation.java:229) [10:53:10.834] at com.caucho.server.http.HttpRequest.handleRequest (HttpRequest.java:274) [10:53:10.834] at com.caucho.server.port.TcpConnection.run (TcpConnection.java:511) [10:53:10.834] at com.caucho.util.ThreadPool.runTasks (ThreadPool.java:520)
[10:53:10.834]  at com.caucho.util.ThreadPool.run(ThreadPool.java:442)
[10:53:10.834]  at java.lang.Thread.run(Thread.java:619)
[10:53:10.834]
[10:53:10.835] /update  0 2
[10:53:10.836] java.io.CharConversionException: illegal utf8 encoding at 0xc3, a [10:53:10.836] at com.caucho.vfs.i18n.UTF8Reader.read (UTF8Reader.java:97) [10:53:10.836] at com.caucho.vfs.i18n.UTF8Reader.read (UTF8Reader.java:178)
[10:53:10.836]  at com.caucho.vfs.ReadStream.read(ReadStream.java:499)
[10:53:10.836] at com.caucho.vfs.BufferedReaderAdapter.read (BufferedReaderAdapter.java:64) [10:53:10.836] at org.xmlpull.mxp1.MXParser.fillBuf(MXParser.java: 2972)
[10:53:10.836]  at org.xmlpull.mxp1.MXParser.more(MXParser.java:3026)
[10:53:10.836] at org.xmlpull.mxp1.MXParser.parseProlog (MXParser.java:1410) [10:53:10.836] at org.xmlpull.mxp1.MXParser.nextImpl(MXParser.java: 1395)
[10:53:10.836]  at org.xmlpull.mxp1.MXParser.next(MXParser.java:1093)
[10:53:10.836] at org.xmlpull.mxp1.MXParser.nextTag(MXParser.java: 1078) [10:53:10.836] at org.apache.solr.handler.XmlUpdateRequestHandler.update (XmlUpdateRequestHandler.java:111) [10:53:10.836] at org.apache.solr.handler.XmlUpdateRequestHandler.handleRequestBody (XmlUpdateRequestHandler.java:84) [10:53:10.836] at org.apache.solr.handler.RequestHandlerBase.handleRequest (RequestHandlerBase.java:77) [10:53:10.836] at org.apache.solr.core.SolrCore.execute (SolrCore.java:671) [10:53:10.836] at org.apache.solr.servlet.SolrDispatchFilter.execute (SolrDispatchFilter.java:188) [10:53:10.836] at org.apache.solr.servlet.SolrDispatchFilter.doFilter (SolrDispatchFilter.java:156) [10:53:10.836] at com.caucho.server.dispatch.FilterFilterChain.doFilter (FilterFilterChain.java:70) [10:53:10.836] at com.caucho.server.webapp.WebAppFilterChain.doFilter (WebAppFilterChain.java:173) [10:53:10.836] at com.caucho.server.dispatch.ServletInvocation.service (ServletInvocation.java:229) [10:53:10.836] at com.caucho.server.http.HttpRequest.handleRequest (HttpRequest.java:274) [10:53:10.836] at com.caucho.server.port.TcpConnection.run (TcpConnection.java:511) [10:53:10.836] at com.caucho.util.ThreadPool.runTasks (ThreadPool.java:520)
[10:53:10.836]  at com.caucho.util.ThreadPool.run(ThreadPool.java:442)
[10:53:10.836]  at java.lang.Thread.run(Thread.java:619)
[10:53:10.836]
[10:53:10.837] [2] HTTP/1.1 500 illegal utf8 encoding at 0xc3, a
[10:53:10.837]
[10:53:10.837] java.io.CharConversionException: illegal utf8 encoding at 0xc3, a [10:53:10.837] at com.caucho.vfs.i18n.UTF8Reader.read (UTF8Reader.java:97) [10:53:10.837] at com.caucho.vfs.i18n.UTF8Reader.read (UTF8Reader.java:178)
[10:53:10.837]  at com.caucho.vfs.ReadStream.read(ReadStream.java:499)
[10:53:10.837] at com.caucho.vfs.BufferedReaderAdapter.read (BufferedReaderAdapter.java:64) [10:53:10.837] at org.xmlpull.mxp1.MXParser.fillBuf(MXParser.java: 2972)
[10:53:10.837]  at org.xmlpull.mxp1.MXParser.more(MXParser.java:3026)
[10:53:10.837] at org.xmlpull.mxp1.MXParser.parseProlog (MXParser.java:1410) [10:53:10.837] at org.xmlpull.mxp1.MXParser.nextImpl(MXParser.java: 1395)
[10:53:10.837]  at org.xmlpull.mxp1.MXParser.next(MXParser.java:1093)
[10:53:10.837] at org.xmlpull.mxp1.MXParser.nextTag(MXParser.java: 1078) [10:53:10.837] at org.apache.solr.handler.XmlUpdateRequestHandler.update (XmlUpdateRequestHandler.java:111) [10:53:10.837] at org.apache.solr.handler.XmlUpdateRequestHandler.handleRequestBody (XmlUpdateRequestHandler.java:84) [10:53:10.837] at org.apache.solr.handler.RequestHandlerBase.handleRequest (RequestHandlerBase.java:77) [10:53:10.837] at org.apache.solr.core.SolrCore.execute (SolrCore.java:671) [10:53:10.837] at org.apache.solr.servlet.SolrDispatchFilter.execute (SolrDispatchFilter.java:188) [10:53:10.837] at org.apache.solr.servlet.SolrDispatchFilter.doFilter (SolrDispatchFilter.java:156) [10:53:10.837] at com.caucho.server.dispatch.FilterFilterChain.doFilter (FilterFilterChain.java:70) [10:53:10.837] at com.caucho.server.webapp.WebAppFilterChain.doFilter (WebAppFilterChain.java:173) [10:53:10.837] at com.caucho.server.dispatch.ServletInvocation.service (ServletInvocation.java:229) [10:53:10.837] at com.caucho.server.http.HttpRequest.handleRequest (HttpRequest.java:274) [10:53:10.837] at com.caucho.server.port.TcpConnection.run (TcpConnection.java:511) [10:53:10.837] at com.caucho.util.ThreadPool.runTasks (ThreadPool.java:520)
[10:53:10.837]  at com.caucho.util.ThreadPool.run(ThreadPool.java:442)
[10:53:10.837]  at java.lang.Thread.run(Thread.java:619)
[10:53:10.837]



--
http://variogr.am/
[EMAIL PROTECTED]




Reply via email to