X-Git-Url: http://www.chiark.greenend.org.uk/ucgi/~yarrgweb/git?p=ypp-sc-tools.main.git;a=blobdiff_plain;f=yarrg%2Fyppedia-ocean-scraper;fp=yarrg%2Fyppedia-ocean-scraper;h=a85403504aae52764a1a6d96f7202f6444c005ed;hp=ad35c4d708a432566941542156e10339d5ed421f;hb=714a62245610bd19b4056878b808f3d6e59e88c6;hpb=170049a6777baa9d15678e0f13804157bf6c02b0 diff --git a/yarrg/yppedia-ocean-scraper b/yarrg/yppedia-ocean-scraper index ad35c4d..a854035 100755 --- a/yarrg/yppedia-ocean-scraper +++ b/yarrg/yppedia-ocean-scraper @@ -95,8 +95,7 @@ def parse_chart(): return s def parse_ocean(): - firstarch = soup.find('a', attrs = {'title': title_arch_ok}) - debug('fa',firstarch) + content = soup.find('div', attrs = {'id': 'content'}) def findall_title_arch_ok(t): return t.findAll('a', attrs = {'title': title_arch_ok}) @@ -105,7 +104,7 @@ def parse_ocean(): if u.name != 'table': return False return len(findall_title_arch_ok(u)) > 1 - archestable = firstarch.findParent('table', attrs={'border':'1'}) + archestable = content.findChild('table', attrs={'border':'1'}) debug('at',archestable) archsoups = []