gitweb.fluxo.info Git - httruta.git/commitdiff
Fix entities on httracker_iterate
author Silvio Rhatto <rhatto@riseup.net>
Tue, 27 Aug 2013 16:19:58 +0000 (13:19 -0300)
committer Silvio Rhatto <rhatto@riseup.net>
Tue, 27 Aug 2013 16:19:58 +0000 (13:19 -0300)
httracker
lib/httracker/functions

index 59fcfa90385890a779b60d4f1fd5dbe82cc2e19c..7fc33c17b656d7f0e29f4987cc489afced022e54 100755 (executable)
--- a/httracker
+++ b/httracker
@@ -8,8 +8,7 @@ source `dirname $0`/lib/httracker/functions || exit 1
 
 # Get URLs from feed
 # Thanks http://stackoverflow.com/questions/443991/how-to-parse-rss-feeds-xml-in-a-shell-script
-curl -s "$FEED" | grep -o '<link>[^<]*' | grep -o "[^>]*$" \
-     | `dirname $0`/lib/httracker/html.sed > $URLS
+curl -s "$FEED" | grep -o '<link>[^<]*' | grep -o "[^>]*$" > $URLS
 
 if [ "$?" != "0" ]; then
   echo "Error downloading feed $FEED, aborting."
index 7a66bc7ed93ad660dfc821f311cdaee064e9bd12..6e5c81b9089a9da6a0785836c9348bb26d548658 100644 (file)
--- a/lib/httracker/functions
+++ b/lib/httracker/functions
@@ -100,6 +100,8 @@ function httracker_sqlquery {
 # Iterate over all URLs
 function httracker_iterate {
   for link in `cat $URLS | xargs`; do
+    # Fix entities
+    link="`echo $link | `dirname $0`/lib/httracker/html.sed`"
     httracker_get "$link"
   done
 }