import-feeds: Handle blogs without <link> tags.

This commit is contained in:
Nelson Elhage 2010-02-09 17:23:57 -05:00
parent a7da50b1ff
commit 8ae4ec8890
1 changed file with 10 additions and 4 deletions

View File

@@ -1,6 +1,7 @@
#!/usr/bin/python
from lxml import html
import yaml
import sys
import urllib2
import urlparse
@@ -18,7 +19,11 @@ def fetch_links(url):
'comments' not in l.attrib.get('title','')]
if candidates:
return candidates[0].attrib['href']
return links[0].attrib['href']
elif links:
return links[0].attrib['href']
else:
print >>sys.stderr, "No link found for %s" % (url,)
return None
for (name, u) in users.items():
for e in u['links']:
@@ -27,9 +32,10 @@ for (name, u) in users.items():
if len(e) == 3:
continue
link = fetch_links(url)
if not link.startswith('http:'):
link = urlparse.urljoin(url, link)
e.append(link)
if link:
if not link.startswith('http:'):
link = urlparse.urljoin(url, link)
e.append(link)
with open('bloggers.yml', 'w') as f:
yaml.safe_dump(users, f)