You are viewing a plain text version of this content. The canonical link for it was not preserved in this plain-text copy.
Posted to commits@stanbol.apache.org by og...@apache.org on 2011/09/21 18:48:36 UTC

svn commit: r1173754 - /incubator/stanbol/trunk/entityhub/indexing/dbpedia/fetch_prepare.sh

Author: ogrisel
Date: Wed Sep 21 16:48:36 2011
New Revision: 1173754

URL: http://svn.apache.org/viewvc?rev=1173754&view=rev
Log:
STANBOL-323: correct fix for double backslash escaping instead of skipping

Modified:
    incubator/stanbol/trunk/entityhub/indexing/dbpedia/fetch_prepare.sh

Modified: incubator/stanbol/trunk/entityhub/indexing/dbpedia/fetch_prepare.sh
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/entityhub/indexing/dbpedia/fetch_prepare.sh?rev=1173754&r1=1173753&r2=1173754&view=diff
==============================================================================
--- incubator/stanbol/trunk/entityhub/indexing/dbpedia/fetch_prepare.sh (original)
+++ incubator/stanbol/trunk/entityhub/indexing/dbpedia/fetch_prepare.sh Wed Sep 21 16:48:36 2011
@@ -50,7 +50,8 @@ wget -c $DBPEDIA/en/short_abstracts_en.n
 if [ ! -f images_en.nt ]
 then
     wget -c $DBPEDIA/en/images_en.nt.bz2
-    bzcat images_en.nt.bz2 | sed 's/\\\\/\\u005c/g' > images_en.nt
+    bzcat images_en.nt.bz2 \
+      | sed 's/\\\\/\\u005c\\u005c/g;s/\\\([^u"]\)/\\u005c\1/g' > images_en.nt
     rm -f images_en.nt.bz2
 fi
 
@@ -58,7 +59,8 @@ fi
 if [ ! -f labels_de.nt ]
 then
     wget -c $DBPEDIA/de/labels_de.nt.bz2
-    bzcat labels_de.nt.bz2 | sed 's/\\\\/\\u005c/g' > labels_de.nt
+    bzcat labels_de.nt.bz2 \
+      | sed 's/\\\\/\\u005c\\u005c/g;s/\\\([^u"]\)/\\u005c\1/g' > labels_de.nt
     rm -f labels_de.nt.bz2
 fi