From 233eb048a9bc2c4b84e1ae6a47de6b088779ee4e Mon Sep 17 00:00:00 2001 From: sstvinc2 Date: Wed, 15 Feb 2017 23:33:56 -0600 Subject: Fixed NYT, plus other parsing fixes and a minor visual tweak --- parser.py | 19 ++++++++++++++----- 1 file changed, 14 insertions(+), 5 deletions(-) (limited to 'parser.py') diff --git a/parser.py b/parser.py index 53b3261..ef90eee 100644 --- a/parser.py +++ b/parser.py @@ -225,6 +225,8 @@ def buildBlaze(): h1s, h2s, h3s = removeDuplicates(h1s, h2s, h3s) blz=buildNewsSource2(name, url, h1s, h2s, h3s) + blz=removeBadStories(blz, None, ['Tomi Lahren'], None) + #The Blaze has dumb, short description fields, so we need to grab #the first x characters of actual article text instead blz.h1Arr=blazeFixDesc(blz.h1Arr) @@ -502,10 +504,17 @@ def buildNYT(): #this will likely need if/else logic h1=content - #This is with a large headline over a and b columns - h1=h1.split('story theme-summary banner', 1)[1] - h1=h1.split('', 1)[1] + h1=h1.split('