|
@@ -79,7 +79,13 @@ class OrientalDailyPure(BasicNewsRecipe):
|
|
|
|
|
|
|
|
urlRoot = 'https://orientaldaily.on.cc'
|
|
urlRoot = 'https://orientaldaily.on.cc'
|
|
|
url = urlRoot
|
|
url = urlRoot
|
|
|
|
|
+
|
|
|
|
|
+ print ('############ before soup')
|
|
|
|
|
+
|
|
|
soup = self.index_to_soup(url)
|
|
soup = self.index_to_soup(url)
|
|
|
|
|
+
|
|
|
|
|
+ print ('############ after soup')
|
|
|
|
|
+
|
|
|
#lookups = ['news', 'china_world', 'finance', 'lifestyle', 'sport']
|
|
#lookups = ['news', 'china_world', 'finance', 'lifestyle', 'sport']
|
|
|
lookups = ['news', 'china_world', 'finance', 'entertainment', 'lifestyle', 'adult', 'sport']
|
|
lookups = ['news', 'china_world', 'finance', 'entertainment', 'lifestyle', 'adult', 'sport']
|
|
|
# no financial news on Sunday
|
|
# no financial news on Sunday
|
|
@@ -131,5 +137,8 @@ class OrientalDailyPure(BasicNewsRecipe):
|
|
|
|
|
|
|
|
def get_browser(self, *args, **kwargs):
    """Return the base recipe browser with custom request headers set.

    All positional and keyword arguments are forwarded unchanged to
    ``BasicNewsRecipe.get_browser`` so that options supplied by the
    caller are not silently dropped.

    Returns:
        The browser object produced by ``BasicNewsRecipe.get_browser``,
        after ``User-Agent``, ``Accept`` and ``Accept-Language`` headers
        have been set on it.
    """
    br = BasicNewsRecipe.get_browser(self, *args, **kwargs)
    # NOTE(review): presumably the site serves different or no content to
    # the default client headers, hence the browser-like values — confirm.
    br.set_header('User-Agent', 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36')
    br.set_header('Accept', 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8')
    br.set_header('Accept-Language', 'en-US,en;q=0.5')
    return br
|