about summary refs log tree commit diff
diff options
context:
space:
mode:
-rw-r--r-- lib/httracker/functions 2
-rwxr-xr-x lib/httracker/html.sed 2
2 files changed, 3 insertions, 1 deletion
diff --git a/lib/httracker/functions b/lib/httracker/functions
index f2dde7f..929d917 100644
--- a/lib/httracker/functions
+++ b/lib/httracker/functions
@@ -101,7 +101,7 @@ function httracker_sqlquery {
function httracker_iterate {
for link in `cat $URLS | xargs`; do
# Fix entities
- link="`echo $link | $BASE/lib/httracker/html.sed`"
+ link="`echo $link | sed -f $BASE/lib/httracker/html.sed`"
httracker_get "$link"
done
}
diff --git a/lib/httracker/html.sed b/lib/httracker/html.sed
index d12f602..859bc25 100755
--- a/lib/httracker/html.sed
+++ b/lib/httracker/html.sed
@@ -481,6 +481,8 @@ s/&#60;/</g
s/&lt;/</g
s/&#62;/>/g
s/&gt;/>/g
+# TODO: Looks like some RSS feeds convert links to entities twice
+s/&amp;amp/\&/g
s/&#38;/\&/g
s/&amp;/\&/g
# http://www.w3schools.com/tags/ref_entities.asp