You are viewing a plain text version of this content. The canonical link for it is here.
Posted to solr-user@lucene.apache.org by "Ghorpade, Parinita" <pg...@library.ucla.edu> on 2017/06/29 22:17:11 UTC

SOLR 4.10 Data import error

Hi,


I am getting the following error when I index data using the DataImportHandler.


I am using a FileDataSource in the data config file.

Here is the config file:


<!--
  DataImportHandler configuration.

  Lists the XML files under a per-institution / per-collection directory and
  builds one Solr document for every /dc element found in each file.

  Request parameters read by this config (dataimporter.request.*):
    instkey, colkey   : used to build baseDir and copied into the document
    instname, colname : copied into the document

  NOTE(review): the import fails with FileNotFoundException for file names
  that contain non-ASCII characters (they are logged as "?"). This is
  presumably caused by the JVM running under a non-UTF-8 locale rather than
  by this file: the encoding attribute below governs how file CONTENT is
  read, not how file NAMES are resolved. Confirm that Solr's JVM is started
  with a UTF-8 locale (for example LANG / LC_ALL set to en_US.UTF-8).
-->
<dataConfig>
  <!-- Reads the content of each file as UTF-8 text. -->
  <dataSource name="myfilereader"
              type="FileDataSource"
              encoding="UTF-8"/>
  <document>
    <!--
      Outer entity "f": enumerates files, recursing into sub-directories.
      rootEntity="false" so that rows of the nested entity "x", not the
      files themselves, become Solr documents.
      dataSource="null" because this entity only lists files
      (assumed DIH convention for FileListEntityProcessor; verify).
      fileName is a regular expression. It is anchored to names ending in
      ".xml"; the earlier value ".*xml" also selected names that merely
      contain "xml", such as "foo.xml.bak".
    -->
    <entity name="f"
            rootEntity="false"
            dataSource="null"
            processor="FileListEntityProcessor"
            fileName=".*\.xml$"
            recursive="true"
            baseDir="/opt/xml_content/prrla/dc/${dataimporter.request.instkey}/${dataimporter.request.colkey}">
      <!--
        Inner entity "x": parses the file reported by "f" and emits one row
        per /dc element. Of the three transformers listed, only
        TemplateTransformer is exercised by the fields below (template=...);
        the other two are kept unchanged.
      -->
      <entity name="x"
              dataSource="myfilereader"
              processor="XPathEntityProcessor"
              url="${f.fileAbsolutePath}"
              stream="false"
              forEach="/dc"
              transformer="DateFormatTransformer,RegexTransformer,TemplateTransformer">
        <!-- Document id is the file name, so each file should hold a single /dc record. -->
        <field column="id" template="${f.file}"/>
        <field column="thumbnailExists" template="false"/>

        <!-- Values taken from the import request. -->
        <field column="collectionKey" template="${dataimporter.request.colkey}"/>
        <field column="collectionName" template="${dataimporter.request.colname}"/>
        <field column="institutionKey" template="${dataimporter.request.instkey}"/>
        <field column="institutionName" template="${dataimporter.request.instname}"/>

        <!-- File metadata supplied by the outer entity "f". -->
        <field column="fileAbsolutePath" template="${f.fileAbsolutePath}"/>
        <field column="fileName" template="${f.file}"/>
        <field column="fileSize" template="${f.fileSize}"/>
        <field column="fileLastModified" template="${f.fileLastModified}"/>

        <!-- Child elements of /dc, extracted by XPath. -->
        <field column="title_keyword" xpath="/dc/title"/>
        <field column="creator_keyword" xpath="/dc/creator"/>
        <field column="subject_keyword" xpath="/dc/subject"/>
        <field column="description_keyword" xpath="/dc/description"/>
        <field column="publisher_keyword" xpath="/dc/publisher"/>
        <field column="contributor_keyword" xpath="/dc/contributor"/>
        <field column="date_keyword" xpath="/dc/date"/>
        <field column="type_keyword" xpath="/dc/type"/>
        <field column="format_keyword" xpath="/dc/format"/>
        <field column="identifier_keyword" xpath="/dc/identifier"/>
        <field column="source_keyword" xpath="/dc/source"/>
        <field column="language_keyword" xpath="/dc/language"/>
        <field column="relation_keyword" xpath="/dc/relation"/>
        <field column="coverage_keyword" xpath="/dc/coverage"/>
        <field column="rights_keyword" xpath="/dc/rights"/>
      </entity>
    </entity>
  </document>
</dataConfig>




The error is:


ERROR org.apache.solr.handler.dataimport.DocBuilder: Exception while processing: f document : null:org.apache.solr.handler.dataimport.DataImportHandlerException: java.lang.RuntimeException: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.DataImportHandlerException.wrapAndThrow(DataImportHandlerException.java:63)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.initQuery(XPathEntityProcessor.java:286)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.fetchNextRow(XPathEntityProcessor.java:224)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.nextRow(XPathEntityProcessor.java:204)
        at org.apache.solr.handler.dataimport.EntityProcessorWrapper.nextRow(EntityProcessorWrapper.java:243)
        at org.apache.solr.handler.dataimport.DocBuilder.buildDocument(DocBuilder.java:476)
        at org.apache.solr.handler.dataimport.DocBuilder.buildDocument(DocBuilder.java:502)
        at org.apache.solr.handler.dataimport.DocBuilder.buildDocument(DocBuilder.java:415)
        at org.apache.solr.handler.dataimport.DocBuilder.doFullDump(DocBuilder.java:330)
        at org.apache.solr.handler.dataimport.DocBuilder.execute(DocBuilder.java:232)
        at org.apache.solr.handler.dataimport.DataImporter.doFullImport(DataImporter.java:416)
        at org.apache.solr.handler.dataimport.DataImporter.runCmd(DataImporter.java:480)
        at org.apache.solr.handler.dataimport.DataImporter$1.run(DataImporter.java:461)
Caused by: java.lang.RuntimeException: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.FileDataSource.getFile(FileDataSource.java:127)
        at org.apache.solr.handler.dataimport.FileDataSource.getData(FileDataSource.java:86)
        at org.apache.solr.handler.dataimport.FileDataSource.getData(FileDataSource.java:48)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.initQuery(XPathEntityProcessor.java:283)
        ... 11 more
Caused by: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.FileDataSource.getFile(FileDataSource.java:123)
        ... 14 more
ERROR org.apache.solr.handler.dataimport.DataImporter: Full Import failed:java.lang.RuntimeException: java.lang.RuntimeException: org.apache.solr.handler.dataimport.DataImportHandlerException: java.lang.RuntimeException: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.DocBuilder.execute(DocBuilder.java:271)
        at org.apache.solr.handler.dataimport.DataImporter.doFullImport(DataImporter.java:416)
        at org.apache.solr.handler.dataimport.DataImporter.runCmd(DataImporter.java:480)
        at org.apache.solr.handler.dataimport.DataImporter$1.run(DataImporter.java:461)
Caused by: java.lang.RuntimeException: org.apache.solr.handler.dataimport.DataImportHandlerException: java.lang.RuntimeException: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.DocBuilder.buildDocument(DocBuilder.java:417)
        at org.apache.solr.handler.dataimport.DocBuilder.doFullDump(DocBuilder.java:330)
        at org.apache.solr.handler.dataimport.DocBuilder.execute(DocBuilder.java:232)
        ... 3 more
Caused by: org.apache.solr.handler.dataimport.DataImportHandlerException: java.lang.RuntimeException: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.DataImportHandlerException.wrapAndThrow(DataImportHandlerException.java:63)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.initQuery(XPathEntityProcessor.java:286)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.fetchNextRow(XPathEntityProcessor.java:224)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.nextRow(XPathEntityProcessor.java:204)
        at org.apache.solr.handler.dataimport.EntityProcessorWrapper.nextRow(EntityProcessorWrapper.java:243)
        at org.apache.solr.handler.dataimport.DocBuilder.buildDocument(DocBuilder.java:476)
        at org.apache.solr.handler.dataimport.DocBuilder.buildDocument(DocBuilder.java:502)
        at org.apache.solr.handler.dataimport.DocBuilder.buildDocument(DocBuilder.java:415)
        ... 5 more
Caused by: java.lang.RuntimeException: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.FileDataSource.getFile(FileDataSource.java:127)
        at org.apache.solr.handler.dataimport.FileDataSource.getData(FileDataSource.java:86)
        at org.apache.solr.handler.dataimport.FileDataSource.getData(FileDataSource.java:48)
        at org.apache.solr.handler.dataimport.XPathEntityProcessor.initQuery(XPathEntityProcessor.java:283)
        ... 11 more
Caused by: java.io.FileNotFoundException: Could not find file: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml (resolved to: /opt/xml_content/prrla/dc/moana/lianhuanhua_storybook/oai_3ALianhuanhua-?????????_3A1.xml
        at org.apache.solr.handler.dataimport.FileDataSource.getFile(FileDataSource.java:123)
        ... 14 more



The file name has Chinese characters in it:

oai_3ALianhuanhua-连环画_3A1.xml



Please help me resolve this issue.


Thank you

P Mulak