2022-05-10 10:06:48 +00:00
|
|
|
// Copyright (C) 2016 The Qt Company Ltd.
|
|
|
|
// SPDX-License-Identifier: LicenseRef-Qt-Commercial OR BSD-3-Clause
|
2011-04-27 10:05:43 +00:00
|
|
|
|
|
|
|
#include <QtCore>
|
|
|
|
|
2019-01-01 14:18:57 +00:00
|
|
|
void parseHtmlFile(QTextStream &out, const QString &fileName)
|
|
|
|
{
|
2011-04-27 10:05:43 +00:00
|
|
|
QFile file(fileName);
|
|
|
|
|
2019-04-30 10:51:36 +00:00
|
|
|
out << "Analysis of HTML file: " << fileName << Qt::endl;
|
2011-04-27 10:05:43 +00:00
|
|
|
|
|
|
|
if (!file.open(QIODevice::ReadOnly)) {
|
2019-04-30 10:51:36 +00:00
|
|
|
out << " Couldn't open the file." << Qt::endl << Qt::endl << Qt::endl;
|
2011-04-27 10:05:43 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
//! [0]
|
|
|
|
QXmlStreamReader reader(&file);
|
|
|
|
//! [0]
|
|
|
|
|
|
|
|
//! [1]
|
|
|
|
int paragraphCount = 0;
|
|
|
|
QStringList links;
|
|
|
|
QString title;
|
|
|
|
while (!reader.atEnd()) {
|
|
|
|
reader.readNext();
|
|
|
|
if (reader.isStartElement()) {
|
2019-01-01 14:18:57 +00:00
|
|
|
if (reader.name() == QLatin1String("title"))
|
2011-04-27 10:05:43 +00:00
|
|
|
title = reader.readElementText();
|
2019-01-01 14:18:57 +00:00
|
|
|
else if (reader.name() == QLatin1String("a"))
|
|
|
|
links.append(reader.attributes().value(QLatin1String("href")).toString());
|
|
|
|
else if (reader.name() == QLatin1String("p"))
|
2011-04-27 10:05:43 +00:00
|
|
|
++paragraphCount;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
//! [1]
|
|
|
|
|
|
|
|
//! [2]
|
|
|
|
if (reader.hasError()) {
|
|
|
|
out << " The HTML file isn't well-formed: " << reader.errorString()
|
2019-04-30 10:51:36 +00:00
|
|
|
<< Qt::endl << Qt::endl << Qt::endl;
|
2011-04-27 10:05:43 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
//! [2]
|
|
|
|
|
2019-04-30 10:51:36 +00:00
|
|
|
out << " Title: \"" << title << '"' << Qt::endl
|
|
|
|
<< " Number of paragraphs: " << paragraphCount << Qt::endl
|
|
|
|
<< " Number of links: " << links.size() << Qt::endl
|
|
|
|
<< " Showing first few links:" << Qt::endl;
|
2011-04-27 10:05:43 +00:00
|
|
|
|
2019-01-01 14:18:57 +00:00
|
|
|
while (links.size() > 5)
|
2011-04-27 10:05:43 +00:00
|
|
|
links.removeLast();
|
|
|
|
|
2022-10-06 09:08:21 +00:00
|
|
|
for (const QString &link : std::as_const(links))
|
2019-04-30 10:51:36 +00:00
|
|
|
out << " " << link << Qt::endl;
|
|
|
|
out << Qt::endl << Qt::endl;
|
2011-04-27 10:05:43 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
int main(int argc, char **argv)
|
|
|
|
{
|
2012-12-28 18:09:39 +00:00
|
|
|
// initialize Qt Core application
|
2011-04-27 10:05:43 +00:00
|
|
|
QCoreApplication app(argc, argv);
|
|
|
|
|
|
|
|
// get a list of all html files in the current directory
|
2019-01-01 14:18:57 +00:00
|
|
|
const QStringList filter = { QStringLiteral("*.htm"),
|
|
|
|
QStringLiteral("*.html") };
|
2011-04-27 17:16:41 +00:00
|
|
|
|
2019-01-01 14:18:57 +00:00
|
|
|
const QStringList htmlFiles = QDir(QStringLiteral(":/")).entryList(filter, QDir::Files);
|
2011-04-27 10:05:43 +00:00
|
|
|
|
|
|
|
QTextStream out(stdout);
|
|
|
|
|
|
|
|
if (htmlFiles.isEmpty()) {
|
|
|
|
out << "No html files available.";
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
// parse each html file and write the result to file/stream
|
2019-01-01 14:18:57 +00:00
|
|
|
for (const QString &file : htmlFiles)
|
|
|
|
parseHtmlFile(out, QStringLiteral(":/") + file);
|
2011-04-27 10:05:43 +00:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|