151 lines
4.1 KiB
C++
Executable File
151 lines
4.1 KiB
C++
Executable File
// For license of this file, see <project-root-folder>/LICENSE.md.
|
|
|
|
#include "services/standard/feedparser.h"
|
|
|
|
#include "exceptions/applicationexception.h"
|
|
#include "miscellaneous/application.h"
|
|
#include "network-web/webfactory.h"
|
|
|
|
#include <QDebug>
|
|
#include <QRegularExpression>
|
|
|
|
#include <utility>
|
|
|
|
FeedParser::FeedParser(QString data) : m_xmlData(std::move(data)), m_mrssNamespace(QSL("http://search.yahoo.com/mrss/")) {
|
|
QString error;
|
|
|
|
if (!m_xml.setContent(m_xmlData, true, &error)) {
|
|
throw ApplicationException(QObject::tr("XML problem: %1").arg(error));
|
|
}
|
|
}
|
|
|
|
QList<Message> FeedParser::messages() {
|
|
QString feed_author = feedAuthor();
|
|
QList<Message> messages;
|
|
QDateTime current_time = QDateTime::currentDateTime();
|
|
|
|
// Pull out all messages.
|
|
QDomNodeList messages_in_xml = messageElements();
|
|
|
|
for (int i = 0; i < messages_in_xml.size(); i++) {
|
|
QDomNode message_item = messages_in_xml.item(i);
|
|
|
|
try {
|
|
Message new_message = extractMessage(message_item.toElement(), current_time);
|
|
|
|
if (new_message.m_author.isEmpty() && !feed_author.isEmpty()) {
|
|
new_message.m_author = feed_author;
|
|
}
|
|
|
|
new_message.m_url = new_message.m_url.replace(QRegularExpression("[\\t\\n]"), QString());
|
|
|
|
messages.append(new_message);
|
|
}
|
|
catch (const ApplicationException& ex) {
|
|
qDebugNN << LOGSEC_CORE
|
|
<< "Problem when extracting message: "
|
|
<< ex.message();
|
|
}
|
|
}
|
|
|
|
return messages;
|
|
}
|
|
|
|
QList<Enclosure> FeedParser::mrssGetEnclosures(const QDomElement& msg_element) const {
|
|
QList<Enclosure> enclosures;
|
|
auto content_list = msg_element.elementsByTagNameNS(m_mrssNamespace, "content");
|
|
|
|
for (int i = 0; i < content_list.size(); i++) {
|
|
QDomElement elem_content = content_list.at(i).toElement();
|
|
QString url = elem_content.attribute(QSL("url"));
|
|
QString type = elem_content.attribute(QSL("type"));
|
|
|
|
if (!url.isEmpty() && !type.isEmpty()) {
|
|
enclosures.append(Enclosure(url, type));
|
|
}
|
|
}
|
|
|
|
auto thumbnail_list = msg_element.elementsByTagNameNS(m_mrssNamespace, "thumbnail");
|
|
|
|
for (int i = 0; i < thumbnail_list.size(); i++) {
|
|
QDomElement elem_content = thumbnail_list.at(i).toElement();
|
|
QString url = elem_content.attribute(QSL("url"));
|
|
|
|
if (!url.isEmpty()) {
|
|
enclosures.append(Enclosure(url, QSL("image/png")));
|
|
}
|
|
}
|
|
|
|
return enclosures;
|
|
}
|
|
|
|
QString FeedParser::mrssTextFromPath(const QDomElement& msg_element, const QString& xml_path) const {
|
|
QString text = msg_element.elementsByTagNameNS(m_mrssNamespace, xml_path).at(0).toElement().text();
|
|
|
|
return text;
|
|
}
|
|
|
|
QString FeedParser::rawXmlChild(const QDomElement& container) const {
|
|
QString raw;
|
|
auto children = container.childNodes();
|
|
|
|
for (int i = 0; i < children.size(); i++) {
|
|
if (children.at(i).isCDATASection()) {
|
|
raw += children.at(i).toCDATASection().data();
|
|
}
|
|
else {
|
|
QString raw_ch;
|
|
QTextStream str(&raw_ch);
|
|
|
|
children.at(i).save(str, 0);
|
|
raw += qApp->web()->unescapeHtml(raw_ch);
|
|
}
|
|
}
|
|
|
|
return raw;
|
|
}
|
|
|
|
QStringList FeedParser::textsFromPath(const QDomElement& element, const QString& namespace_uri,
|
|
const QString& xml_path, bool only_first) const {
|
|
QStringList paths = xml_path.split('/');
|
|
QStringList result;
|
|
QList<QDomElement> current_elements;
|
|
|
|
current_elements.append(element);
|
|
|
|
while (!paths.isEmpty()) {
|
|
QList<QDomElement> next_elements;
|
|
QString next_local_name = paths.takeFirst();
|
|
|
|
for (const QDomElement& elem : current_elements) {
|
|
QDomNodeList elements = elem.elementsByTagNameNS(namespace_uri, next_local_name);
|
|
|
|
for (int i = 0; i < elements.size(); i++) {
|
|
next_elements.append(elements.at(i).toElement());
|
|
|
|
if (only_first) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (next_elements.size() == 1 && only_first) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
current_elements = next_elements;
|
|
}
|
|
|
|
if (!current_elements.isEmpty()) {
|
|
for (const QDomElement& elem : qAsConst(current_elements)) {
|
|
result.append(elem.text());
|
|
}
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
QString FeedParser::feedAuthor() const {
|
|
return "";
|
|
}
|