return None
assert response.charset == 'utf-8'
document = response.content.decode(response.charset)
- lxml.etree.fromstring(document)
+ print 'For url %s got page:\n%s' % (url, document)
+ lxml.etree.fromstring(document.replace('<br>', '<br/>'))
assert '<script>' not in document
return document