', 1)[1]
desc=TAG_RE.sub('', desc)
desc=desc.replace('\n', ' ')
desc=desc[:144]
articleArr[i].description=desc
return articleArr
def buildBlaze():
url='http://theblaze.com'
name='The Blaze'
#DOWNLOAD HOMEPAGE CONTENT
content=urlToContent(url)
#get main headline
h1=content
h1=h1.split('', 1)[1]
h1=h1.split('', 1)[1]
h2=h2.split('', 1)[0]
while '' in h2:
h2=h2.split('', 1)[1]
#h2=h2.split('href="', 1)[1]
x=h2.split('"', 1)[0]
if h1 not in x:
h2s.append(url+x)
#GET TERTIARY HEADLINES
h3=content
h3s=[]
h3=h3.split('', 1)[1]
#this story section goes on forever; just grab the first 5
while len(h3s)<5:
h3=h3.split('' in content:
h1=h1.split('', 1)[1]
h1=h1.split('