7
7
8
8
import datetime
9
9
from dateutil .relativedelta import relativedelta
10
-
10
+ import logging
11
11
### METHODS
12
12
13
13
def lexical_date_parser (date_to_check ):
@@ -82,7 +82,7 @@ def __init__(self,lang="en",period="",start="",end="",encode="utf-8",region=None
82
82
self .__end = end
83
83
self .__encode = encode
84
84
self .__exception = False
85
- self .__version = '1.6.8 '
85
+ self .__version = '1.6.9 '
86
86
87
87
def getVersion(self):
    """Return the version string held in this object's ``__version`` attribute."""
    return self.__version
@@ -141,7 +141,8 @@ def build_response(self):
141
141
self .__totalcount = int (stats .group ().replace (',' , '' ))
142
142
else :
143
143
#TODO might want to add output for user to know no data was found
144
- return
144
+ self .__totalcount = None
145
+ logging .debug ('Total count is not available when sort by date' )
145
146
result = self .content .find_all ("a" ,{"jsname" : re .compile (r".*" )})[3 :- 1 ]
146
147
return result
147
148
@@ -165,29 +166,29 @@ def page_at(self, page=1):
165
166
result = self .build_response ()
166
167
for item in result :
167
168
try :
168
- tmp_text = item .find ("div" , { "role" : "heading" } ).text .replace ("\n " ,"" )
169
+ tmp_text = item .find ("h3" ).text .replace ("\n " ,"" )
169
170
except Exception :
170
171
tmp_text = ''
171
172
try :
172
173
tmp_link = item .get ("href" )
173
174
except Exception :
174
175
tmp_link = ''
175
176
try :
176
- tmp_media = item .findAll ( "g-img" )[ 0 ]. parent .text
177
+ tmp_media = item .find ( 'div' ). find ( 'div' ). find ( 'div' ). find_next_sibling ( 'div' ) .text
177
178
except Exception :
178
179
tmp_media = ''
179
180
try :
180
- tmp_date = item .find (" div" , { "role" : "heading" }). next_sibling . findNext ('div' ).text
181
+ tmp_date = item .find (' div' ). find_next_sibling ('div' ). find ( 'span ' ).text
181
182
tmp_date ,tmp_datetime = lexical_date_parser (tmp_date )
182
183
except Exception :
183
184
tmp_date = ''
184
185
tmp_datetime = None
185
186
try :
186
- tmp_desc = item .find (" div" , { "role" : "heading" }). next_sibling . text
187
+ tmp_desc = item .find_next_sibling ( 'div' ). find (' div' ). find_next_sibling ( 'div' ). find ( 'div' ). find ( 'div' ). find ( 'div' ). contents [ 0 ]. replace ( ' \n ' , '' )
187
188
except Exception :
188
189
tmp_desc = ''
189
190
try :
190
- tmp_img = item .findAll ( "g-img" )[ 0 ]. find ("img" ).get ("src" )
191
+ tmp_img = item .find ("img" ).get ("src" )
191
192
except Exception :
192
193
tmp_img = ''
193
194
self .__texts .append (tmp_text )
@@ -221,29 +222,29 @@ def get_page(self, page=1):
221
222
result = self .build_response ()
222
223
for item in result :
223
224
try :
224
- tmp_text = item .find ("div" , { "role" : "heading" } ).text .replace ("\n " ,"" )
225
+ tmp_text = item .find ("h3" ).text .replace ("\n " ,"" )
225
226
except Exception :
226
227
tmp_text = ''
227
228
try :
228
229
tmp_link = item .get ("href" )
229
230
except Exception :
230
231
tmp_link = ''
231
232
try :
232
- tmp_media = item .findAll ( "g-img" )[ 0 ]. parent .text
233
+ tmp_media = item .find ( 'div' ). find ( 'div' ). find ( 'div' ). find_next_sibling ( 'div' ) .text
233
234
except Exception :
234
235
tmp_media = ''
235
236
try :
236
- tmp_date = item .find (" div" , { "role" : "heading" }). next_sibling . findNext ('div' ).text
237
+ tmp_date = item .find (' div' ). find_next_sibling ('div' ). find ( 'span ' ).text
237
238
tmp_date ,tmp_datetime = lexical_date_parser (tmp_date )
238
239
except Exception :
239
240
tmp_date = ''
240
241
tmp_datetime = None
241
242
try :
242
- tmp_desc = item .find (" div" , { "role" : "heading" }). next_sibling . text .replace ('\n ' ,'' )
243
+ tmp_desc = item .find_next_sibling ( 'div' ). find (' div' ). find_next_sibling ( 'div' ). find ( 'div' ). find ( 'div' ). find ( 'div' ). contents [ 0 ] .replace ('\n ' ,'' )
243
244
except Exception :
244
245
tmp_desc = ''
245
246
try :
246
- tmp_img = item .findAll ( "g-img" )[ 0 ]. find ("img" ).get ("src" )
247
+ tmp_img = item .find ("img" ).get ("src" )
247
248
except Exception :
248
249
tmp_img = ''
249
250
self .__texts .append (tmp_text )
0 commit comments