chiark / gitweb /
More robust way to find arch/islands table
[ypp-sc-tools.db-live.git] / yarrg / yppedia-ocean-scraper
index ad35c4d708a432566941542156e10339d5ed421f..a85403504aae52764a1a6d96f7202f6444c005ed 100755 (executable)
@@ -95,8 +95,7 @@ def parse_chart():
        return s
 
 def parse_ocean():
-       firstarch = soup.find('a', attrs = {'title': title_arch_ok})
-       debug('fa',firstarch)
+       content = soup.find('div', attrs = {'id': 'content'})
 
        def findall_title_arch_ok(t):
                return t.findAll('a', attrs = {'title': title_arch_ok})
@@ -105,7 +104,7 @@ def parse_ocean():
                if u.name != 'table': return False
                return len(findall_title_arch_ok(u)) > 1
 
-       archestable = firstarch.findParent('table', attrs={'border':'1'})
+       archestable = content.findChild('table', attrs={'border':'1'})
        debug('at',archestable)
 
        archsoups = []