Permanently removed TotallyCoolPix and NewYorkTimesLens

idleloop-github · idleloop-github · commit f51155749fd7 · 2021-04-05T15:03:25.000+02:00
diff --git a/lib/scrapers.py b/lib/scrapers.py
@@ -44,8 +44,6 @@
     'TimePhotography',
     'ReadingthePictures',
     'Reddit',
-    'TotallyCoolPix',
-    'NewYorkTimesLens',
 )
 
 
@@ -352,147 +350,6 @@ def _get_photos(self, album_url):
         return self._photos[album_url]
 
 
-class TotallyCoolPix(BasePlugin):
-
-    _title = 'TotallyCoolPix.com'
-
-    def _get_albums(self):
-        self._albums = []
-        url = 'https://totallycoolpix.com'
-        html = self._get_html(url)
-        albums = parseDOM( html, 'div', {'class': 'item'} )
-        for id, album in enumerate(albums):
-            if not parseDOM( album, 'a', {'class': 'open'} ):
-                continue
-            title = parseDOM( album, 'h2' )[0]
-            album_url = parseDOM( album, 'a', ret='href' )[0]
-            p = parseDOM( album, 'p' )
-            description = p[0].replace( '<br />', '' ) if p else ''
-            # add date to description:
-            description = stripTags( parseDOM( parseDOM( album, 'li' ), 'a')[0] ) + "\n" + description
-            pic = parseDOM( album, 'img', ret='src' )[0]
-            self._albums.append({
-                'title': title,
-                'album_id': id,
-                'pic': pic,
-                'description': description,
-                'album_url': album_url}
-            )
-        return self._albums
-
-    def _get_photos(self, album_url):
-        self._photos[album_url] = []
-
-        html = self._get_html(album_url)
-        for id, photo in enumerate( parseDOM( html, 'div', attrs={'class': 'image'}) ):
-            img = parseDOM( photo, 'img', ret='src' )[0]
-            if not img:
-                continue
-            if id == 0:
-                album_title = parseDOM( photo, 'h2' )[0]
-                # jump first entry as it is a repetition of the album description
-                continue
-                description = stripTags(self._parser.unescape(parseDOM( html, 'p', attrs={'class': 'desc'} )[0]))
-            else:
-                try:
-                    description = self._parser.unescape(parseDOM( photo, 'p', {'class': 'info-txt'} )[0])
-                except:
-                    description = ''
-            self._photos[album_url].append({
-                'title': '%d - %s' % (id + 1, album_title),
-                'album_title': album_title,
-                'photo_id': id,
-                'pic': img,
-                'description': description,
-                'album_url': album_url
-            })
-        if (id==0):
-            # possibly a video:
-            video = parseDOM( html, 'iframe', ret='src' )[0]
-            self.log('possible video = ' + video)
-            if re.match(r'.+youtube.com/.+', video):
-                video_id = re.sub('.+/', '', video)
-                self.log('youtube video = ' + video_id)
-                xbmc.executebuiltin('PlayMedia(plugin://plugin.video.youtube/play/?video_id=' + video_id + ')')
-            elif re.match(r'.+vimeo.com/.+', video):
-                video_id = re.sub('.+/', '', video)
-                self.log('vimeo video = ' + video_id)
-                xbmc.executebuiltin('PlayMedia(plugin://plugin.video.vimeo/play/?video_id=' + video_id + ')')
-            # if no match: previous processing have retrieved images
-        return self._photos[album_url]
-
-
-class NewYorkTimesLens(BasePlugin):
-
-    _title = 'NewYorkTimes.com: Lens Blog'
-
-    def _get_albums(self):
-        self._albums = []
-        home_url = 'https://www.nytimes.com'
-        url = home_url + '/section/lens'
-        html = self._get_html(url)
-        for id, album in enumerate( parseDOM( html, 'li', attrs={ 'class': 'css-[^"\']+' } ) ):
-            title = parseDOM( album, 'h2' )
-            if not title:
-                continue
-
-            album_url = parseDOM( album, 'a', ret='href' )[0]
-            picture = parseDOM( album, 'img', ret='src' )[0]
-            image = parseDOM( album, 'img', ret='srcSet' )[0]
-            if re.search( r'Medium', image ):
-                image = image.split(',')
-                for picture in image:
-                    if re.search( r'Medium', picture ):
-                        picture = re.search( r'^[^\?]+', picture).group()
-                        break
-            description = parseDOM( album, 'p' )[0].encode('utf-8', 'ignore')
-            date = re.search( r'/(20\d{2}/\d{2}/\d{2})/' ,  album_url )
-            if ( date ):
-                description = date.group(1).encode('utf-8', 'ignore') + "\n" + description
-            self._albums.append({
-               'title': stripTags( title[0] ),
-               'album_id': id,
-               'pic': picture,
-               'description': description,
-               'album_url': home_url + album_url
-               })
-
-        return self._albums
-
-    def _get_photos(self, album_url):
-        self._photos[album_url] = []
-
-        html = self._get_html(album_url)
-        slide_html = parseDOM( html, 'figure', attrs={ 'class': '[^\'"]*?css-[^\'"]+' }, ret='item[IDid]{2}' )
-        summaries = parseDOM( html, 'div', attrs={ 'class': '[^\'"]*?StoryBodyCompanionColumn[^\'"]*' } )
-        for id, slide in enumerate( parseDOM( html, 'figure', attrs={ 'class': '[^\'"]*?css-[^\'"]+' } ) ):
-            picture = slide_html[id]
-            if not picture:
-                continue
-            description = ''
-            for desc in enumerate( parseDOM( parseDOM( slide, 'figcaption' ), 'span', attrs={'class':'[^\'"]*'} ) ):
-                description = description + "\n" + stripTags( desc[1].replace( '</span>', "\n" ) )
-            title = parseDOM( parseDOM( html, 'h1' ), 'span' )[0]
-            self.log( str( len(summaries)/len(slide_html) ) )
-            self.log( str( (1 if len(summaries)/len(slide_html)<1 else int(len(summaries)/len(slide_html))) ) )
-            try:
-                summary = stripTags( u''.join( parseDOM( 
-                        summaries[id*(1 if len(summaries)/len(slide_html)<1 else int(len(summaries)/len(slide_html)))+1], 
-                            'p', attrs={'class': 'css-1ygdjhk e2kc3sl0'} ) ) )
-            except:
-                summary = ''
-            self._photos[album_url].append({
-               'title': title,
-               'album_title': title,
-               'photo_id': id,
-               'pic': picture,
-               'description': description[1:] + summary,
-               'album_url': album_url
-               })
-
-        return self._photos[album_url]
-
-
 class Reddit(BasePlugin):
 
     _title = 'Reddit'
diff --git a/resources/settings.xml b/resources/settings.xml
@@ -24,7 +24,5 @@
         <setting id="enable_TimePhotography" type="bool" label="32405" default="true"/>
         <setting id="enable_ReadingthePictures" type="bool" label="32408" default="true"/>
         <setting id="enable_Reddit" type="bool" label="32407" default="true"/>
-        <setting id="enable_TotallyCoolPix" type="bool" label="32404" default="false"/>
-        <setting id="enable_NewYorkTimesLens" type="bool" label="32406" default="false"/>
     </category>
 </settings>