Got it working with the updated config:

<!--
  Solr DataImportHandler configuration.
  For each row returned by the SQL query, the outer entity maps the row's
  columns to Solr fields, and the nested entity feeds the file named by the
  row's URL column through TikaEntityProcessor to extract title and text.
-->
<dataConfig>
  <!-- JDBC connection resolved through JNDI; referenced by entities as "db". -->
  <dataSource type="JdbcDataSource" name="db" jndiName="java:comp/env/jdbc/BuildDB" />
  <!-- Binary file source used by the Tika entity; referenced as "bin". -->
  <dataSource name="bin" type="BinFileDataSource" />
  <document>
    <!--
      One row per product attachment. The URL column is the lower-cased
      filesystem path built from manufacturer, manufacturer id and file name.
      The attribute was previously misspelled "datsource", so the entity was
      not explicitly bound to the "db" source; it is now "dataSource".
      The query is split across lines for readability; an XML parser turns
      the line breaks inside an attribute value into spaces.
      NOTE(review): the WHERE clause pins a single product id ('3551LF');
      presumably a test filter - confirm before running a full import.
    -->
    <entity name="productDocument"
            onError="skip"
            dataSource="db"
            query="SELECT pa.prdAttachmentID id, pa.productId, pa.manufacturer, pa.fileName, pa.attachmentType, pa.displayName,
                   lower('/mnt/shares/nasdev/mediabase/specifications/' + pa.manufacturer + '/' + CAST(pm.productid_manufacturer_id AS VARCHAR(50)) + '/' + pa.fileName) URL
                   FROM mmc.dbo.product_attachments pa WITH (NOLOCK)
                   INNER JOIN mmc.dbo.productid_manufacturer pm WITH (NOLOCK)
                   ON pa.productId = pm.productid and pa.manufacturer = pm.manufacturer
                   WHERE pa.productid = '3551LF'">
      <field column="id" name="id"/>
      <!-- NOTE(review): the query above selects no productCompositeid column; verify this mapping. -->
      <field column="productCompositeid" name="productCompositeid"/>
      <field column="productid" name="productid"/>
      <field column="manufacturer" name="manufacturer"/>
      <field column="filename" name="filename"/>
      <field column="displayname" name="displayname"/>
      <!-- NOTE(review): type/indexed/stored look like schema.xml field attributes rather than DIH ones; confirm they are intended here. -->
      <field column="attachmentType" type="text" indexed="true" stored="true" />

      <!-- Runs Tika on the file at the parent row's URL and emits plain text plus the title metadata. -->
      <entity name="extract"
              dataSource="bin"
              processor="TikaEntityProcessor"
              url="${productDocument.URL}"
              format="text">
        <field column="title" meta="true" name="title"/>
        <field column="text" name="text"/>
      </entity>
    </entity>
  </document>
</dataConfig>

-- View this message in context: http://lucene.472066.n3.nabble.com/Solr-DIH-using-JDBC-with-TIKA-tp4180737p4180742.html
Sent from the Solr - User mailing list archive at Nabble.com.