From 9244037c034569972d24e68702605292161d106d Mon Sep 17 00:00:00 2001 From: Ian Jackson Date: Sun, 30 Oct 2011 13:29:41 +0000 Subject: [PATCH] yoweb-scrape: add a markup massager to cope with broken html from yoweb --- yoweb-scrape | 21 ++++++++++++++++----- 1 file changed, 16 insertions(+), 5 deletions(-) diff --git a/yoweb-scrape b/yoweb-scrape index db5dc13..2bcd518 100755 --- a/yoweb-scrape +++ b/yoweb-scrape @@ -45,6 +45,7 @@ import curses import termios import random import subprocess +import copy from optparse import OptionParser from StringIO import StringIO @@ -107,6 +108,18 @@ def yppsc_dir(): os.environ["YPPSC_YARRG_SRCBASE"] = lib return lib +soup_massage = copy.copy(BeautifulSoup.MARKUP_MASSAGE) +soup_massage.append( + (regexp.compile('(\