You are viewing a plain text version of this content. The canonical link for it is here.
Posted to user@lenya.apache.org by Adam LIM <fu...@axidea.fr> on 2005/06/09 09:34:43 UTC
Lucene: problem while crawling
Hi!!!
I have a big problem with Lucene and I don't know how to resolve it.
Could someone explain how to make it work? I want to crawl my site, so I
executed the following command in my shell, as explained on the official
website:
/home/webapp/web_software/lenya-1.2.2/tools/bin/ant -f
usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
-Dcrawler.xconf=/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config
/search/lucene-live.xconf crawl
And this is the return:
Buildfile: /usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
init:
[echo] INFO: Init
crawl:
[echo] INFO: Crawl and dump hypertext documents
(/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-live.xconf)
[echo] INFO: Show configuration
[java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
[java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
[java] at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
[java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
[java] at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
[java] at org.apache.tools.ant.Task.perform(Task.java:364)
[java] at org.apache.tools.ant.Target.execute(Target.java:341)
[java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
[java] at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
[java] at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
[java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
[java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
[java] at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
[java] at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
[java] Caused by: java.lang.NoClassDefFoundError:
org/apache/log4j/Category
[java] at
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfiguration.java:37)
[java] at java.lang.Class.forName0(Native Method)
[java] at java.lang.Class.forName(Class.java:219)
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
[java] ... 13 more
[java] --- Nested Exception ---
[java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
[java] at
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
ration.java:37)
[java] at java.lang.Class.forName0(Native Method)
[java] at java.lang.Class.forName(Class.java:219)
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
[java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
[java] at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
[java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
[java] at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
[java] at org.apache.tools.ant.Task.perform(Task.java:364)
[java] at org.apache.tools.ant.Target.execute(Target.java:341)
[java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
[java] at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
[java] at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
[java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
[java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
[java] at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
[java] at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
[echo] INFO: Start crawling ...
[java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
[java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
[java] at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
[java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
[java] at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
[java] at org.apache.tools.ant.Task.perform(Task.java:364)
[java] at org.apache.tools.ant.Target.execute(Target.java:341)
[java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
[java] at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
[java] at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
[java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
[java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
[java] at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
[java] at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
[java] Caused by: java.lang.NoClassDefFoundError:
org/apache/log4j/Category
[java] at
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
rawler.java:38)
[java] at java.lang.Class.forName0(Native Method)
[java] at java.lang.Class.forName(Class.java:219)
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
[java] ... 13 more
[java] --- Nested Exception ---
[java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
[java] at
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
rawler.java:38)
[java] at java.lang.Class.forName0(Native Method)
[java] at java.lang.Class.forName(Class.java:219)
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
[java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
[java] at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
[java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
[java] at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
[java] at org.apache.tools.ant.Task.perform(Task.java:364)
[java] at org.apache.tools.ant.Target.execute(Target.java:341)
[java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
[java] at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
[java] at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
[java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
[java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
[java] at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
[java] at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
[echo] INFO: Crawling finished
Thank you in advance
Adam LIM,
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
Re: Lucene: problem while crawling
Posted by so...@gmail.com.
I am not certain it is relevant, but I documented one issue with
searching if installed from apache-lenya-1.2.2-src.tar.gz. Maybe the
"bin" install has a similar problem?
http://solprovider.com/lenya/searchlinux
HTH,
solprovider
P.S: Thanks for letting me know about the URL.
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
Re: Lucene: problem while crawling
Posted by Michael Wohlfart <mi...@zsw-bw.de>.
It seems this was fixed in the 1.2.3 release of Lenya, since
I can't reproduce the problem there.
However, I checked the 1.2.2-bin distribution and found a similar
issue. I will try to explain what is wrong, as far as I understand it:
The init-target in the crawl_and_index.xml buildfile creates
a classpath which is used to run the crawl-, index- and
search-targets. The classpath is a list of pathelements, each of
which points to a jar-file in WEB-INF/lib. One of the pathelements
has a different version number (part of the filename) than the
corresponding jar-file in WEB-INF/lib. So the pathelement does not
resolve to the library, which causes the java.lang.NoClassDefFoundError.
The 1.2.2-bin Distribution comes with
xalan-2.6.1-dev-20041008T0304.jar
the pathelement in crawl_and_index.xml is referring to
<pathelement path="${web-inf.dir}/lib/xalan-2.6.0.jar"/>
I am still fighting with subversion so maybe you can do this
one-line-patch for me ;-)
greetings
Michael
Gregor J. Rothfuss wrote:
> Michael Wohlfart wrote:
>
>> I got a similar Error, in my case the problem was that some of the
>> pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
>> libraries in WEB-INF/lib.
>> Maybe you should take a look at the pathelement for the log4j
>> Library and verify that the referred file exists in your WEB-INF/lib.
>
>
> can you describe in detail what was wrong, or better yet, send a patch,
> so that this can be fixed?
>
> ---------------------------------------------------------------------
> To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
> For additional commands, e-mail: user-help@lenya.apache.org
>
>
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
Re: Lucene: problem while crawling
Posted by "Gregor J. Rothfuss" <gr...@apache.org>.
Michael Wohlfart wrote:
> I got a similar Error, in my case the problem was that some of the
> pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
> libraries in WEB-INF/lib.
> Maybe you should take a look at the pathelement for the log4j
> Library and verify that the referred file exists in your WEB-INF/lib.
can you describe in detail what was wrong, or better yet, send a patch,
so that this can be fixed?
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
Re: Lucene: problem while crawling
Posted by Michael Wohlfart <mi...@zsw-bw.de>.
solprovider@gmail.com wrote:
[...]
> Michael,
> I was going to point to:
> http://lenya.apache.org/1_2_x/how-to/search.html
> when I noticed you already pointed to my site. How did you get the
> long URL instead of http://solprovider.com/lenya/search ? Were you
> using an old bookmark, or did I miss translating a link?
The link was in one of your emails to the list.
best regards
Michael
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
Re: Lucene: problem while crawling
Posted by so...@gmail.com.
On 6/9/05, Michael Wohlfart <mi...@zsw-bw.de> wrote:
> The log4j warning are caused by a missing log4j.properties file in your
> classpath. Solprovider wrote a nice article about searching in Lenya
> with an example log4j.properties file
> http://solprovider.com/solprovider/lenya.nsf/Home?readform&pg=search
Michael,
I was going to point to:
http://lenya.apache.org/1_2_x/how-to/search.html
when I noticed you already pointed to my site. How did you get the
long URL instead of http://solprovider.com/lenya/search ? Were you
using an old bookmark, or did I miss translating a link?
Adam,
A usable log4j.properties is #4 under "Indexing on Windows". You can
ignore the rest of the instructions.
solprovider
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
Re: Lucene: problem while crawling
Posted by Michael Wohlfart <mi...@zsw-bw.de>.
Hi Adam,
The log4j warnings are caused by a missing log4j.properties file in your
classpath. Solprovider wrote a nice article about searching in Lenya
with an example log4j.properties file:
[http://solprovider.com/solprovider/lenya.nsf/Home?readform&pg=search]
The four nulls in the Error output should contain the crawler setup
(Base URL, Scope URL, User Agent and URI List) configured in the
file crawler-live.xconf.
So my guess is that your "-Dcrawler.xconf" parameter is wrong ?
hope that helps
Michael
Adam LIM wrote:
> Hi!!!
> Thank you for ya help. I correct the errors about
> java.lang.NoClassDefFoundError I got but some new errors come up. This what
> the command line returned:
>
> [echo] INFO: Crawl and dump hypertext documents
> (/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
> live.xconf)
> [echo] INFO: Show configuration
> [java] log4j:WARN No appenders could be found for logger
> (org.apache.lenya.xml.DOMUtil).
> [java] log4j:WARN Please initialize the log4j system properly.
> [java] null
> [java] null
> [java] null
> [java] null
> [java] java.lang.NullPointerException
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
RE: Lucene: problem while crawling
Posted by Adam LIM <fu...@axidea.fr>.
Hi!!!
Thank you for your help. I corrected the java.lang.NoClassDefFoundError
errors I got, but some new errors have come up. This is what
the command line returned:
[echo] INFO: Crawl and dump hypertext documents
(/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
live.xconf)
[echo] INFO: Show configuration
[java] log4j:WARN No appenders could be found for logger
(org.apache.lenya.xml.DOMUtil).
[java] log4j:WARN Please initialize the log4j system properly.
[java] null
[java] null
[java] null
[java] null
[java] java.lang.NullPointerException
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
[java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
[java] at
org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
[java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
[java] at
org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
[java] at org.apache.tools.ant.Task.perform(Task.java:364)
[java] at org.apache.tools.ant.Target.execute(Target.java:341)
[java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
[java] at
org.apache.tools.ant.Project.executeTarget(Project.java:1214)
[java] at
org.apache.tools.ant.Project.executeTargets(Project.java:1062)
[java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
[java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
[java] at
org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
[java] at
org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
[java] Caused by: java.lang.NullPointerException
[java] at
org.apache.lenya.search.crawler.CrawlerConfiguration.resolvePath(CrawlerConfiguration.java:235)
[java] at
org.apache.lenya.search.crawler.CrawlerConfiguration.main(CrawlerConfiguration.java:110)
[java] at sun.reflect.NativeMethodAccessorImpl.invoke0(Native
Method)
[java] at
sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:39
)
[java] at
sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl
.java:25)
[java] at java.lang.reflect.Method.invoke(Method.java:324)
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.run(ExecuteJava.java:193)
[java] at
org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:130)
[java] ... 13 more
[java] --- Nested Exception ---
[java] java.lang.NullPointerException
[java] at
org.apache.lenya.search.crawler.CrawlerConfiguration.resolvePath(CrawlerConf
iguration.java:235)
[java] at
org.apache.lenya.search.crawler.CrawlerConfiguration.main(CrawlerConfigurati
on.java:110)
[java] at sun.reflect.NativeMethodAccessorImpl.invoke0(Native
Method) ............
..........
Have you got these too?
Thanks ya!
Adam LIM,
-----Message d'origine-----
De : Michael Wohlfart [mailto:michael.wohlfart@zsw-bw.de]
Envoyé : jeudi 9 juin 2005 10:29
À : user@lenya.apache.org
Objet : Re: Lucene: problem while crawling
Hi Adam,
I got a similar Error, in my case the problem was that some of the
pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
libraries in WEB-INF/lib.
Maybe you should take a look at the pathelement for the log4j
Library and verify that the referred file exists in your WEB-INF/lib.
best regards
Michael
Adam LIM wrote:
> Hi!!!
> I got a big problem wit Lucene and I don't know how to resolve it.
> Could someone explain how to make it work. I wanna crawl my site so I
> executed the following command on my shell as explained in the official
> website:
>
> /home/webapp/web_software/lenya-1.2.2/tools/bin/ant -f
> usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
>
-Dcrawler.xconf=/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config
> /search/lucene-live.xconf crawl
>
> And this is the return:
>
> Buildfile: /usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
>
> init:
> [echo] INFO: Init
>
> crawl:
> [echo] INFO: Crawl and dump hypertext documents
>
(/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
> live.xconf)
> [echo] INFO: Show configuration
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at
org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
> [java] at
>
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] ... 13 more
> [java] --- Nested Exception ---
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
>
org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at
org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [echo] INFO: Start crawling ...
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at
org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
> [java] at
>
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] ... 13 more
> [java] --- Nested Exception ---
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
>
org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at
org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at
org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [echo] INFO: Crawling finished
>
>
> Thank you in advance
>
> Adam LIM,
>
>
>
> ---------------------------------------------------------------------
> To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
> For additional commands, e-mail: user-help@lenya.apache.org
>
>
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org
Re: Lucene: problem while crawling
Posted by Michael Wohlfart <mi...@zsw-bw.de>.
Hi Adam,
I got a similar error. In my case the problem was that some of the
pathelements in webapp/lenya/bin/crawl_and_index.xml didn't match the
libraries in WEB-INF/lib.
Maybe you should take a look at the pathelement for the log4j
library and verify that the referenced file exists in your WEB-INF/lib.
best regards
Michael
Adam LIM wrote:
> Hi!!!
> I got a big problem wit Lucene and I don't know how to resolve it.
> Could someone explain how to make it work. I wanna crawl my site so I
> executed the following command on my shell as explained in the official
> website:
>
> /home/webapp/web_software/lenya-1.2.2/tools/bin/ant -f
> usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
> -Dcrawler.xconf=/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config
> /search/lucene-live.xconf crawl
>
> And this is the return:
>
> Buildfile: /usr/local/tomcat/webapps/lenya/lenya/bin/crawl_and_index.xml
>
> init:
> [echo] INFO: Init
>
> crawl:
> [echo] INFO: Crawl and dump hypertext documents
> (/usr/local/tomcat/webapps/lenya/lenya/pubs/AML-REGION/config/search/lucene-
> live.xconf)
> [echo] INFO: Show configuration
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
> [java] at
> org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] ... 13 more
> [java] --- Nested Exception ---
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
> org.apache.lenya.search.crawler.CrawlerConfiguration.<clinit>(CrawlerConfigu
> ration.java:37)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [echo] INFO: Start crawling ...
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:172)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [java] Caused by: java.lang.NoClassDefFoundError:
> org/apache/log4j/Category
> [java] at
> org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] ... 13 more
> [java] --- Nested Exception ---
> [java] java.lang.NoClassDefFoundError: org/apache/log4j/Category
> [java] at
> org.apache.lenya.search.crawler.IterativeHTMLCrawler.<clinit>(IterativeHTMLC
> rawler.java:38)
> [java] at java.lang.Class.forName0(Native Method)
> [java] at java.lang.Class.forName(Class.java:219)
> [java] at
> org.apache.tools.ant.taskdefs.ExecuteJava.execute(ExecuteJava.java:115)
> [java] at org.apache.tools.ant.taskdefs.Java.run(Java.java:705)
> [java] at
> org.apache.tools.ant.taskdefs.Java.executeJava(Java.java:177)
> [java] at org.apache.tools.ant.taskdefs.Java.execute(Java.java:83)
> [java] at
> org.apache.tools.ant.UnknownElement.execute(UnknownElement.java:275)
> [java] at org.apache.tools.ant.Task.perform(Task.java:364)
> [java] at org.apache.tools.ant.Target.execute(Target.java:341)
> [java] at org.apache.tools.ant.Target.performTasks(Target.java:369)
> [java] at
> org.apache.tools.ant.Project.executeTarget(Project.java:1214)
> [java] at
> org.apache.tools.ant.Project.executeTargets(Project.java:1062)
> [java] at org.apache.tools.ant.Main.runBuild(Main.java:673)
> [java] at org.apache.tools.ant.Main.startAnt(Main.java:188)
> [java] at
> org.apache.tools.ant.launch.Launcher.run(Launcher.java:196)
> [java] at
> org.apache.tools.ant.launch.Launcher.main(Launcher.java:55)
> [echo] INFO: Crawling finished
>
>
> Thank you in advance
>
> Adam LIM,
>
>
>
> ---------------------------------------------------------------------
> To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
> For additional commands, e-mail: user-help@lenya.apache.org
>
>
---------------------------------------------------------------------
To unsubscribe, e-mail: user-unsubscribe@lenya.apache.org
For additional commands, e-mail: user-help@lenya.apache.org