You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@pdfbox.apache.org by ju...@apache.org on 2010/06/20 22:38:00 UTC

svn commit: r956412 - in /pdfbox/site: publish/references.html src/site/xdoc/references.xml

Author: jukka
Date: Sun Jun 20 20:37:59 2010
New Revision: 956412

URL: http://svn.apache.org/viewvc?rev=956412&view=rev
Log:
site: Add Apache Tika to the list of projects that use PDFBox

Modified:
    pdfbox/site/publish/references.html
    pdfbox/site/src/site/xdoc/references.xml

Modified: pdfbox/site/publish/references.html
URL: http://svn.apache.org/viewvc/pdfbox/site/publish/references.html?rev=956412&r1=956411&r2=956412&view=diff
==============================================================================
--- pdfbox/site/publish/references.html (original)
+++ pdfbox/site/publish/references.html Sun Jun 20 20:37:59 2010
@@ -185,11 +185,12 @@
     <div class="section"><h2>PDFBox References<a name="PDFBox_References"></a></h2>
       <p>
         This page lists projects that utilize PDFBox and articles that
-        have been written about PDFBox.
+        have been written about PDFBox. Please file an
+        <a class="externalLink" href="https://issues.apache.org/jira/browse/PDFBOX">improvement issue</a> to get new projects or articles added
+        to this page, or to update the information on existing links.
       </p>
     </div>
     <div class="section"><h2>Projects<a name="Projects"></a></h2>
-      <p><br /></p>
       <table align="center" border="1" class="bodyTable">
       	<tr class="a">
       		<th align="left">Project Name</th>
@@ -201,114 +202,121 @@
       		<td align="left">LGPL - commercial services/support/training is available</td>
       		<td align="left">Alfresco is an open source, open-standards content repository built by the most experienced content management team that includes the co-founder of Documentum.</td>
       	</tr>
-      	<tr class="a">
+        <tr class="a">
+          <td align="left"><a class="externalLink" href="http://tika.apache.org/">Apache Tika</a></td>
+          <td align="left"><a class="externalLink" href="http://www.apache.org/licenses/LICENSE-2.0">ALv2</a></td>
+          <td align="left">Apache Tika is a toolkit for detecting and extracting metadata
+          and structured text content from various documents using existing
+          parser libraries.</td>
+        </tr>
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://www.centriccrm.com">Centric CRM</a></td>
       		<td align="left">Free To Use But Restricted/Commercial</td>
       		<td align="left">The Most Advanced Open Source CRM Software.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://webtest.canoo.com/webtest/manual/WebTestHome.html">Canoo Webtest</a></td>
       		<td align="left"><a class="externalLink" href="http://webtest.canoo.com/webtest/manual/license.html">BSD Like</a></td>
       		<td align="left">Free OpenSource tool for XP-style acceptance testing of Java-based Web applications.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://webtest.canoo.com/webtest/manual/WebTestHome.html">contineo</a></td>
       		<td align="left">GPL</td>
       		<td align="left">Contineo is a web based document management system.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://forms.pjc.bean.over-blog.com">DirectPrint</a></td>
       		<td align="left">BSD</td>
       		<td align="left">JavaBean used to get back print features lost in Oracle Reports </td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://www.jahia.org/">Jahia</a></td>
       		<td align="left"><a class="externalLink" href="http://www.jahia.org/jahia/Jahia/pricing">collaborative source license</a></td>
       		<td align="left">The Jahia product is currently the most powerful, ready-to-use and affordable integrated midrange Java Content Management and Corporate Portal Server.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://jlibrary.sourceforge.net/">jLibrary</a></td>
       		<td align="left">BSD</td>
       		<td align="left">jLibrary is a Document Management System, oriented for personal and enterprise use.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://jomic.sourceforge.net/">Jomic</a></td>
       		<td align="left">GPL</td>
       		<td align="left">Jomic is a viewer for comic book archives.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://jpdfunit.sourceforge.net/">JpdfUnit</a></td>
       		<td align="left">Apache License V2.0</td>
       		<td align="left">JpdfUnit is a framework for testing a generated pdf document with the JUnit Test Framework.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://www.liferay.com/">Liferay Portal</a></td>
       		<td align="left">MIT</td>
       		<td align="left">Liferay Portal is an open source portal that helps organizations collaborate more efficiently by providing a consolidated view of disparate applications.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://www.bibl.ulaval.ca/lius/index.en.html">LIUS</a></td>
       		<td align="left">GPL</td>
       		<td align="left">LIUS is an indexing Java framework based on the Jakarta Lucene project. The LIUS framework adds to Lucene many files format indexing fonctionalities as: Ms World, Ms Excel, Ms PowerPoint, RTF, PDF, XML, HTML, TXT, Open Office suite and JavaBeans.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://www.gmod.org/lucegene/">LuceGene</a></td>
       		<td align="left">Artistic License</td>
       		<td align="left">LuceGene is an open-source document/object search and retrieval system specially tuned for bioinformatics text databases and documents.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://www.lutece.paris.fr/">Lutece</a></td>
       		<td align="left">BSD-like</td>
       		<td align="left">Lutece is a portal engine which allows you to easily create your websites or intranets based upon HTML,XML content.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://mmapps.sourceforge.net/lucenemodule/">MMBase Lucene Module</a></td>
       		<td align="left">MPL</td>
       		<td align="left">Lucenemodule is a plugin (module) for the MMBase content management system that enables Lucene full text search through it's content, and thanks to PDFBox also PDF content.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://lucene.apache.org/nutch/">Nutch</a></td>
       		<td align="left">ASL</td>
       		<td align="left">Nutch is open source web-search software. It builds on Lucene, adding web-specifics, such as a crawler, a link-graph database, parsers for HTML and other document formats, etc.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://www.opencms.org/">OpenCms</a></td>
       		<td align="left"><a class="externalLink" href="http://www.opencms.org/opencms/en/terms.html">Custom</a></td>
       		<td align="left">OpenCms is a professional level Open Source Website Content Management System.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://forge.objectweb.org/projects/ops">Orbeon PresentationServer</a></td>
       		<td align="left">LGPL</td>
       		<td align="left">Orbeon PresentationServer (OPS) is an open source J2EE-based platform for XML-centric web applications. OPS is built around XHTML, XForms, XSLT, XML pipelines, and Web Services, which makes it ideal for applications that capture, process and present XML data.
       		    Commercial consulting/training/support is available through <a class="externalLink" href="http://www.orbeon.com/">orbeon</a>.
       		</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://pdfcat.sourceforge.net">PDFcat</a></td>
       		<td align="left">LGPL</td>
       		<td align="left">PDFcat is multi-platform catalog manager that provides searching capability over documents among virtual catalogs.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://homepage.mac.com/ptwobrussell/podreader.html">PodReader</a></td>
       		<td align="left">GPL</td>
       		<td align="left">PodReader is an application that facilitates making electronic documents like eBooks readable on your iPod.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://www.searchblox.com">SearchBlox</a></td>
       		<td align="left">Commercial</td>
       		<td align="left">SearchBlox is a high-performance corporate search software designed for the Java 2 Enterprise Edition (J2EE) platform.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://ir.dcs.gla.ac.uk/terrier/">Terrier</a></td>
       		<td align="left">MPL</td>
       		<td align="left">Terrier is software for the rapid development of Web, intranet and desktop search engines.</td>
       	</tr>
-      	<tr class="a">
+      	<tr class="b">
       		<td align="left"><a class="externalLink" href="http://www.triboni.com">Triboni GinkGO</a></td>
       		<td align="left">Commercial</td>
       		<td align="left">Triboni GinkGO is a highly scalable J2EE services platform that is based on a simple XML business object defintion and scripting language. Toghether with XSLT content centric web applications can be configured in a very short time.</td>
       	</tr>
-      	<tr class="b">
+      	<tr class="a">
       		<td align="left"><a class="externalLink" href="http://www.zilverline.org/">Zilverline</a></td>
       		<td align="left"><a class="externalLink" href="http://www.zilverline.org/zilverlineweb/space/license">Collaborative Source License</a></td>
       		<td align="left">Zilverline is a search engine that offers web access to your personal or intranet content.</td>
@@ -317,7 +325,6 @@
     </div>
 
     <div class="section"><h2>Articles/Books<a name="ArticlesBooks"></a></h2>
-      <p><br /></p>
       <table align="center" border="1" class="bodyTable">
       	<tr class="a">
       		<th align="left" width="30%">Article Name</th>

Modified: pdfbox/site/src/site/xdoc/references.xml
URL: http://svn.apache.org/viewvc/pdfbox/site/src/site/xdoc/references.xml?rev=956412&r1=956411&r2=956412&view=diff
==============================================================================
--- pdfbox/site/src/site/xdoc/references.xml (original)
+++ pdfbox/site/src/site/xdoc/references.xml Sun Jun 20 20:37:59 2010
@@ -25,11 +25,13 @@
     <section name="PDFBox References">
       <p>
         This page lists projects that utilize PDFBox and articles that
-        have been written about PDFBox.
+        have been written about PDFBox. Please file an
+        <a href="https://issues.apache.org/jira/browse/PDFBOX"
+          >improvement issue</a> to get new projects or articles added
+        to this page, or to update the information on existing links.
       </p>
     </section>
     <section name="Projects">
-      <p><br/></p>
       <table>
       	<tr>
       		<th>Project Name</th>
@@ -41,6 +43,13 @@
       		<td>LGPL - commercial services/support/training is available</td>
       		<td>Alfresco is an open source, open-standards content repository built by the most experienced content management team that includes the co-founder of Documentum.</td>
       	</tr>
+        <tr>
+          <td><a href="http://tika.apache.org/">Apache Tika</a></td>
+          <td><a href="http://www.apache.org/licenses/LICENSE-2.0">ALv2</a></td>
+          <td>Apache Tika is a toolkit for detecting and extracting metadata
+          and structured text content from various documents using existing
+          parser libraries.</td>
+        </tr>
       	<tr>
       		<td><a href="http://www.centriccrm.com">Centric CRM</a></td>
       		<td>Free To Use But Restricted/Commercial</td>
@@ -157,7 +166,6 @@
     </section>
 
     <section name="Articles/Books">
-      <p><br/></p>
       <table>
       	<tr>
       		<th width="30%">Article Name</th>