git.nbdom.net Git - nb.git/commitdiff
bin/rss-feedparser
author Nicolas Boisselier <nicolas.boisselier@gmail.com>
Thu, 19 Jul 2018 02:37:40 +0000 (03:37 +0100)
committer Nicolas Boisselier <nicolas.boisselier@gmail.com>
Thu, 19 Jul 2018 02:37:40 +0000 (03:37 +0100)
bin/rss-feedparser

index 81e72561eaae2e310d49e759fc921da79a1360e6..cd1a4fb9675dcf6b1539c15acd05d21f1b97044f 100755 (executable)
@@ -74,6 +74,8 @@ def getHeadlines( rss_url ):
 
         if not content:
             content = html
+            content = content[:10000]
+            ##content = content.strsub(1,10000)
             #soup = BeautifulSoup(content,"html.parser")
             #content = soup.get_text()
             content = re.sub(r'\s*\n',' ',content)
@@ -96,8 +98,9 @@ urls = [
     #'https://www.youtube.com/feeds/videos.xml?channel_id=UCUIjs9R044OjAxKzk0xhGoQ',
 ]
 
-for url in sys.argv[1:]:
-    getHeadlines( url )
+if __name__ == '__main__':
+    for url in sys.argv[1:]:
+        getHeadlines( url )
 # NB 25.06.18 for url in urls:
 # NB 25.06.18     getHeadlines( url )
 # NB 25.06.18