scraper now can translate atom feeds too

This commit is contained in:
Martin Rotter 2021-08-26 08:50:46 +02:00
parent 45ee6909ce
commit 4df20e70ed

View File

@ -1,14 +1,15 @@
# Translates entries of RSS 2.0 feed into different locale.
#
# Make sure to have all dependencies installed:
# pip3 install googletrans==4.0.0-rc1
# pip3 install googletrans
# pip3 install asyncio (if using parallel version of the script)
# pip3 install hyper (for HTTP/2 support, much faster than default)
#
# You must provide raw RSS 2.0 UTF-8 feed XML data as input, for example with curl:
# curl 'https://phys.org/rss-feed/' | python ./translate-rss2.py "en" "pt_BR" "true"
# curl 'https://phys.org/rss-feed/' | python ./translate-feed.py "en" "pt_BR" "true"
#
# You must provide three command line arguments:
# translate-rss2.py [FROM-LANGUAGE] [TO-LANGUAGE] [RUN-PARALLEL]
# translate-feed.py [FROM-LANGUAGE] [TO-LANGUAGE] [RUN-PARALLEL]
import json
import re