from urllib.error import HTTPError, URLError
from urllib.request import urlopen

from bs4 import BeautifulSoup


def getTitle(url):
    """Download *url* and return the ``<h1>`` found under its ``<body>``.

    Args:
        url: Address of the page to fetch.

    Returns:
        The value of ``body.h1`` from the parsed document, or ``None`` when
        the page cannot be fetched or the ``body.h1`` lookup raises
        ``AttributeError`` (e.g. the parsed document has no ``<body>``).
    """
    try:
        # The context manager closes the response even if read() fails.
        with urlopen(url) as response:
            markup = response.read()
    except URLError:
        # HTTPError is a subclass of URLError, so this covers both an HTTP
        # error status and a server/resource that cannot be reached.
        return None

    try:
        # Name the parser explicitly so the result does not depend on which
        # optional parsers happen to be installed.
        document = BeautifulSoup(markup, "html.parser")
        return document.body.h1
    except AttributeError:
        # Attribute lookup failed somewhere along body -> h1.
        return None


# Fetch the sample page and report its heading.
title = getTitle("http://www.pythonscraping.com/pages/page1.html")
# Test for None by identity: this is the idiomatic check and does not depend
# on how the returned object implements equality.
if title is None:
    print("Title could not be found")
else:
    print(title)