# strip tags function
def striptags(string):
	"""Replace markup in *string* with single spaces and return the result.

	Each of the following is replaced by one space character:

	* a whole ``<head>...</head>`` section, including its contents;
	* any remaining ``<...>`` tag;
	* any entity-escaped tag of the form ``&lt;...&gt;``;
	* the ``&nbsp;`` entity.

	Text outside those spans is returned unchanged; runs of spaces left
	behind by adjacent replacements are not collapsed.
	"""
	# The head section must match *any* character, newlines and "^" included
	# (inline CSS/JS often contains carets), so "." is used with re.DOTALL
	# rather than a negated character class. DOTALL only affects ".", which
	# appears solely in the <head> alternative.
	pattern = (
		u"<head>.*?</head>"
		u"|<[^>]*?>"
		u"|&lt;[^>]*?&gt;"
		u"|&nbsp;"
	)
	return re.sub(pattern, u" ", string, flags=re.DOTALL)