You are viewing a plain text version of this content. The canonical link for it is here.
Posted to user@lenya.apache.org by Adam LIM <fu...@axidea.fr> on 2005/06/09 09:34:43 UTC

Lucene: problem while crawling

Hi!!!
I have a big problem with Lucene and I don't know how to resolve it.
Could someone explain how to make it work? I want to crawl my site, so I
executed the following command in my shell, as explained on the official
website:

/home/webapp/web_software/lenya-1.2.2/tools/bin/ant -f
usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
-Dcrawler.xconf=/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config
/search/lucene-live.xconf crawl

And this is the return:

Buildfile: /usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml

init:
     [echo] INFO: Init

crawl:
     [echo] INFO: Crawl and dump hypertext documents
(/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
live.xconf)
     [echo] INFO: Show configuration
     [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
     [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
     [java]     at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
     [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
     [java]     at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
     [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
     [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
     [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
     [java]     at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
     [java]     at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
     [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
     [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
     [java]     at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
     [java]     at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
     [java] Caused by: java.lang.NoClassDefFoundError:
org/apache/log4j/Category
     [java]     at
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
ration.java:37)
     [java]     at java.lang.Class.forName0(Native Method)
     [java]     at java.lang.Class.forName(Class.java:219)
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
     [java]     ... 13 more
     [java] --- Nested Exception ---
     [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
     [java]     at
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
ration.java:37)
     [java]     at java.lang.Class.forName0(Native Method)
     [java]     at java.lang.Class.forName(Class.java:219)
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
     [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
     [java]     at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
     [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
     [java]     at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
     [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
     [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
     [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
     [java]     at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
     [java]     at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
     [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
     [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
     [java]     at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
     [java]     at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
     [echo] INFO: Start crawling ...
     [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
     [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
     [java]     at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
     [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
     [java]     at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
     [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
     [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
     [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
     [java]     at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
     [java]     at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
     [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
     [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
     [java]     at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
     [java]     at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
     [java] Caused by: java.lang.NoClassDefFoundError:
org/apache/log4j/Category
     [java]     at
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
rawler.java:38)
     [java]     at java.lang.Class.forName0(Native Method)
     [java]     at java.lang.Class.forName(Class.java:219)
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
     [java]     ... 13 more
     [java] --- Nested Exception ---
     [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
     [java]     at
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
rawler.java:38)
     [java]     at java.lang.Class.forName0(Native Method)
     [java]     at java.lang.Class.forName(Class.java:219)
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
     [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
     [java]     at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
     [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
     [java]     at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
     [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
     [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
     [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
     [java]     at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
     [java]     at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
     [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
     [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
     [java]     at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
     [java]     at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
     [echo] INFO: Crawling finished


Thank you in advance

Adam LIM,



---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


Re: Lucene: problem while crawling

Posted by so...@gmail.com.
I am not certain it is relevant, but I documented one issue with
searching if installed from apache-lenya-1.2.2-src.tar.gz.  Maybe the
"bin" install has a similar problem?
http://solprovider.com/lenya/searchlinux

HTH,
solprovider

P.S: Thanks for letting me know about the URL.

---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


Re: Lucene: problem while crawling

Posted by Michael Wohlfart <mi...@zsw-bw.de>.
It seems this was fixed in the 1.2.3 release of Lenya, since
I can't reproduce the problem there.
However, I checked the 1.2.2-bin distribution and found a similar
issue. I will try to explain what is wrong, as far as I understand it:

The init target in the crawl_and_index.xml buildfile creates
a classpath which is used to run the crawl, index and
search targets. The classpath is a list of pathelements, each of
which points to a jar file in WEB-INF/lib. One of the pathelements
has a different version number (part of the filename) than the
corresponding jar file in WEB-INF/lib. So the wrong version of
the Java library is the cause of the java.lang.NoClassDefFoundError.

The 1.2.2-bin Distribution comes with
   xalan-2.6.1-dev-20041008T0304.jar
the pathelement in crawl_and_index.xml is referring to
  <pathelement path="${web-inf.dir}/lib/xalan-2.6.0.jar"/>

I am still fighting with Subversion, so maybe you can apply this
one-line patch for me ;-)

greetings

Michael


Gregor J. Rothfuss wrote:
> Michael Wohlfart wrote:
> 
>> I got a similar Error, in my case the problem was that some of the
>> pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
>> libraries in WEB-INF/lib.
>> Maybe you should take a look at the pathelement for the log4j
>> Library and verify that the referred file exists in your WEB-INF/lib.
> 
> 
> can you describe in detail what was wrong, or better yet, send a patch, 
> so that this can be fixed?
> 
> ---------------------------------------------------------------------
> To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
> For additional commands, e-mail: user-help@lenya.apache.org
> 
> 


---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


Re: Lucene: problem while crawling

Posted by "Gregor J. Rothfuss" <gr...@apache.org>.
Michael Wohlfart wrote:

> I got a similar Error, in my case the problem was that some of the
> pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
> libraries in WEB-INF/lib.
> Maybe you should take a look at the pathelement for the log4j
> Library and verify that the referred file exists in your WEB-INF/lib.

can you describe in detail what was wrong, or better yet, send a patch, 
so that this can be fixed?

---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


Re: Lucene: problem while crawling

Posted by Michael Wohlfart <mi...@zsw-bw.de>.
solprovider@gmail.com wrote:
[...]
> Michael,
> I was going to point to:
> http://lenya.apache.org/1_2_x/how-to/search.html
> when I noticed you already pointed to my site.  How did you get the
> long URL instead of http://solprovider.com/lenya/search  ?  Were you
> using an old bookmark, or did I miss translating a link?

The link was in one of your emails to the list.

best regards

Michael

---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


Re: Lucene: problem while crawling

Posted by so...@gmail.com.
On 6/9/05, Michael Wohlfart <mi...@zsw-bw.de> wrote:
> The log4j warning are caused by a missing log4j.properties file in your
> classpath. Solprovider wrote a nice article about searching in Lenya
> with an example log4j.properties file
> http://solprovider.com/solprovider/lenya.nsf/Home?readform&pg=search

Michael,
I was going to point to:
http://lenya.apache.org/1_2_x/how-to/search.html
when I noticed you already pointed to my site.  How did you get the
long URL instead of http://solprovider.com/lenya/search  ?  Were you
using an old bookmark, or did I miss translating a link?

Adam,
A usable log4j.properties is #4 under "Indexing on Windows".  You can
ignore the rest of the instructions.

solprovider

---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


Re: Lucene: problem while crawling

Posted by Michael Wohlfart <mi...@zsw-bw.de>.
Hi Adam,

The log4j warnings are caused by a missing log4j.properties file in your
classpath. Solprovider wrote a nice article about searching in Lenya,
with an example log4j.properties file:
[http://solprovider.com/solprovider/lenya.nsf/Home?readform&pg=search]

The four nulls in the error output should contain the crawler setup
(Base URL, Scope URL, User Agent and URI List) configured in the
file crawler-live.xconf.
So my guess is that your "-Dcrawler.xconf" parameter is wrong?


hope that helps

Michael


Adam LIM wrote:
> Hi!!!
> Thank you for ya help. I correct the errors about
> java.lang.NoClassDefFoundError I got but some new errors come up. This what
> the command line returned:
> 
>      [echo] INFO: Crawl and dump hypertext documents
> (/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
> live.xconf)
>      [echo] INFO: Show configuration
>      [java] log4j:WARN No appenders could be found for logger
> (org.apache.lenya.xml.DOMUtil).
>      [java] log4j:WARN Please initialize the log4j system properly.
>      [java] null
>      [java] null
>      [java] null
>      [java] null
>      [java] java.lang.NullPointerException
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)


---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


RE: Lucene: problem while crawling

Posted by Adam LIM <fu...@axidea.fr>.
Hi!!!
Thank you for your help. I corrected the java.lang.NoClassDefFoundError
errors I got, but some new errors have come up. This is what
the command line returned:

     [echo] INFO: Crawl and dump hypertext documents
(/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
live.xconf)
     [echo] INFO: Show configuration
     [java] log4j:WARN No appenders could be found for logger
(org.apache.lenya.xml.DOMUtil).
     [java] log4j:WARN Please initialize the log4j system properly.
     [java] null
     [java] null
     [java] null
     [java] null
     [java] java.lang.NullPointerException
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
     [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
     [java]     at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
     [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
     [java]     at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
     [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
     [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
     [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
     [java]     at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
     [java]     at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
     [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
     [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
     [java]     at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
     [java]     at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
     [java] Caused by: java.lang.NullPointerException
     [java]     at
org.apache.lenya.search.crawler.CrawlerConfiguration.resolvePath(CrawlerConf
iguration.java:235)
     [java]     at
org.apache.lenya.search.crawler.CrawlerConfiguration.main(CrawlerConfigurati
on.java:110)
     [java]     at sun.reflect.NativeMethodAccessorImpl.invoke0(Native
Method)
     [java]     at
sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:39
)
     [java]     at
sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl
.java:25)
     [java]     at java.lang.reflect.Method.invoke(Method.java:324)
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.run(ExecuteJava.java:193)
     [java]     at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:130)
     [java]     ... 13 more
     [java] --- Nested Exception ---
     [java] java.lang.NullPointerException
     [java]     at
org.apache.lenya.search.crawler.CrawlerConfiguration.resolvePath(CrawlerConf
iguration.java:235)
     [java]     at
org.apache.lenya.search.crawler.CrawlerConfiguration.main(CrawlerConfigurati
on.java:110)
     [java]     at sun.reflect.NativeMethodAccessorImpl.invoke0(Native
Method) ............
..........

Have you got these too? 

Thanks ya!

Adam LIM,



-----Message d'origine-----
De : Michael Wohlfart [mailto:michael.wohlfart@zsw-bw.de] 
Envoyé : jeudi 9 juin 2005 10:29
À : user@lenya.apache.org
Objet : Re: Lucene: problem while crawling

Hi Adam,
I got a similar Error, in my case the problem was that some of the
pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
libraries in WEB-INF/lib.
Maybe you should take a look at the pathelement for the log4j
Library and verify that the referred file exists in your WEB-INF/lib.

best regards

Michael



Adam LIM wrote:
> Hi!!!
> I got a big problem wit Lucene and I don't know how to resolve it.
> Could someone explain how to make it work. I wanna crawl my site so I
> executed the following command on my shell as explained in the official
> website:
> 
> /home/webapp/web_software/lenya-1.2.2/tools/bin/ant -f
> usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
>
-Dcrawler.xconf=/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config
> /search/lucene-live.xconf crawl
> 
> And this is the return:
> 
> Buildfile: /usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
> 
> init:
>      [echo] INFO: Init
> 
> crawl:
>      [echo] INFO: Crawl and dump hypertext documents
>
(/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
> live.xconf)
>      [echo] INFO: Show configuration
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at
org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
>      [java]     at
>
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     ... 13 more
>      [java] --- Nested Exception ---
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
>
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at
org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [echo] INFO: Start crawling ...
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at
org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
>      [java]     at
>
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     ... 13 more
>      [java] --- Nested Exception ---
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
>
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at
org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [echo] INFO: Crawling finished
> 
> 
> Thank you in advance
> 
> Adam LIM,
> 
> 
> 
> ---------------------------------------------------------------------
> To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
> For additional commands, e-mail: user-help@lenya.apache.org
> 
> 


---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org




---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org


Re: Lucene: problem while crawling

Posted by Michael Wohlfart <mi...@zsw-bw.de>.
Hi Adam,
I got a similar error. In my case the problem was that some of the
pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
libraries in WEB-INF/lib.
Maybe you should take a look at the pathelement for the log4j
library and verify that the file it refers to exists in your WEB-INF/lib.

best regards

Michael



Adam LIM wrote:
> Hi!!!
> I got a big problem wit Lucene and I don't know how to resolve it.
> Could someone explain how to make it work. I wanna crawl my site so I
> executed the following command on my shell as explained in the official
> website:
> 
> /home/webapp/web_software/lenya-1.2.2/tools/bin/ant -f
> usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
> -Dcrawler.xconf=/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config
> /search/lucene-live.xconf crawl
> 
> And this is the return:
> 
> Buildfile: /usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
> 
> init:
>      [echo] INFO: Init
> 
> crawl:
>      [echo] INFO: Crawl and dump hypertext documents
> (/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
> live.xconf)
>      [echo] INFO: Show configuration
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
>      [java]     at
> org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     ... 13 more
>      [java] --- Nested Exception ---
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
> org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [echo] INFO: Start crawling ...
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
>      [java]     at
> org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     ... 13 more
>      [java] --- Nested Exception ---
>      [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
>      [java]     at
> org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
>      [java]     at java.lang.Class.forName0(Native Method)
>      [java]     at java.lang.Class.forName(Class.java:219)
>      [java]     at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
>      [java]     at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
>      [java]     at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
>      [java]     at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
>      [java]     at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
>      [java]     at org.apache.tools.ant.Task.perform(Task.java:364)
>      [java]     at org.apache.tools.ant.Target.execute(Target.java:341)
>      [java]     at org.apache.tools.ant.Target.performTasks(Target.java:369)
>      [java]     at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
>      [java]     at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
>      [java]     at org.apache.tools.ant.Main.runBuild(Main.java:673)
>      [java]     at org.apache.tools.ant.Main.startAnt(Main.java:188)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
>      [java]     at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
>      [echo] INFO: Crawling finished
> 
> 
> Thank you in advance
> 
> Adam LIM,
> 
> 
> 
> ---------------------------------------------------------------------
> To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
> For additional commands, e-mail: user-help@lenya.apache.org
> 
> 


---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org