2011-04-27 10:05:43 +00:00
|
|
|
/****************************************************************************
|
|
|
|
**
|
2016-01-22 12:24:00 +00:00
|
|
|
** Copyright (C) 2016 The Qt Company Ltd.
|
|
|
|
** Contact: https://www.qt.io/licensing/
|
2011-04-27 10:05:43 +00:00
|
|
|
**
|
|
|
|
** This file is part of the examples of the Qt Toolkit.
|
|
|
|
**
|
|
|
|
** $QT_BEGIN_LICENSE:BSD$
|
2016-01-22 12:24:00 +00:00
|
|
|
** Commercial License Usage
|
|
|
|
** Licensees holding valid commercial Qt licenses may use this file in
|
|
|
|
** accordance with the commercial license agreement provided with the
|
|
|
|
** Software or, alternatively, in accordance with the terms contained in
|
|
|
|
** a written agreement between you and The Qt Company. For licensing terms
|
|
|
|
** and conditions see https://www.qt.io/terms-conditions. For further
|
|
|
|
** information use the contact form at https://www.qt.io/contact-us.
|
|
|
|
**
|
|
|
|
** BSD License Usage
|
|
|
|
** Alternatively, you may use this file under the terms of the BSD license
|
|
|
|
** as follows:
|
2011-04-27 10:05:43 +00:00
|
|
|
**
|
|
|
|
** "Redistribution and use in source and binary forms, with or without
|
|
|
|
** modification, are permitted provided that the following conditions are
|
|
|
|
** met:
|
|
|
|
** * Redistributions of source code must retain the above copyright
|
|
|
|
** notice, this list of conditions and the following disclaimer.
|
|
|
|
** * Redistributions in binary form must reproduce the above copyright
|
|
|
|
** notice, this list of conditions and the following disclaimer in
|
|
|
|
** the documentation and/or other materials provided with the
|
|
|
|
** distribution.
|
2015-02-13 11:15:33 +00:00
|
|
|
** * Neither the name of The Qt Company Ltd nor the names of its
|
|
|
|
** contributors may be used to endorse or promote products derived
|
|
|
|
** from this software without specific prior written permission.
|
2012-09-19 12:28:29 +00:00
|
|
|
**
|
2011-04-27 10:05:43 +00:00
|
|
|
**
|
|
|
|
** THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
|
|
** "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
|
|
** LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
|
|
** A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
|
|
** OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
|
|
** SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
|
|
** LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
|
|
** DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
|
|
** THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
|
|
** (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
|
|
** OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE."
|
2012-01-24 06:17:24 +00:00
|
|
|
**
|
2011-04-27 10:05:43 +00:00
|
|
|
** $QT_END_LICENSE$
|
|
|
|
**
|
|
|
|
****************************************************************************/
|
|
|
|
|
|
|
|
#include <QtCore>
|
|
|
|
|
|
|
|
// Writes a short report about the file named fileName to out.
//
// The file is opened read-only and fed to a QXmlStreamReader. While reading,
// the text of "title" elements is captured, the "href" attribute of every
// "a" element is collected, and "p" start elements are counted.
//
// If the file cannot be opened, or the reader reports an error once reading
// has stopped, a message is written to out and the function returns without
// printing the summary. Otherwise the title, the paragraph count, the total
// link count and at most the first five collected links are written.
void parseHtmlFile(QTextStream &out, const QString &fileName)
{
    QFile file(fileName);

    out << "Analysis of HTML file: " << fileName << endl;

    if (!file.open(QIODevice::ReadOnly)) {
        out << " Couldn't open the file." << endl << endl << endl;
        return;
    }

//! [0]
    QXmlStreamReader reader(&file);
//! [0]

//! [1]
    int paragraphs = 0;
    QStringList hrefs;
    QString title;
    while (!reader.atEnd()) {
        reader.readNext();

        // Only start tags are of interest; skip every other token kind.
        if (!reader.isStartElement())
            continue;

        if (reader.name() == "title") {
            title = reader.readElementText();
        } else if (reader.name() == "a") {
            hrefs.append(reader.attributes().value("href").toString());
        } else if (reader.name() == "p") {
            ++paragraphs;
        }
    }
//! [1]

//! [2]
    if (reader.hasError()) {
        out << " The HTML file isn't well-formed: " << reader.errorString()
            << endl << endl << endl;
        return;
    }
//! [2]

    out << " Title: \"" << title << '"' << endl;
    out << " Number of paragraphs: " << paragraphs << endl;
    out << " Number of links: " << hrefs.size() << endl;
    out << " Showing first few links:" << endl;

    // The total above counts every link; only the first five are listed.
    for (int i = 0; i < hrefs.size() && i < 5; ++i)
        out << " " << hrefs.at(i) << endl;

    out << endl << endl;
}
|
|
|
|
|
|
|
|
int main(int argc, char **argv)
|
|
|
|
{
|
2012-12-28 18:09:39 +00:00
|
|
|
// initialize Qt Core application
|
2011-04-27 10:05:43 +00:00
|
|
|
QCoreApplication app(argc, argv);
|
|
|
|
|
|
|
|
// get a list of all html files in the current directory
|
|
|
|
QStringList filter;
|
|
|
|
filter << "*.htm";
|
|
|
|
filter << "*.html";
|
2011-04-27 17:16:41 +00:00
|
|
|
|
|
|
|
QStringList htmlFiles = QDir(":/").entryList(filter, QDir::Files);
|
2011-04-27 10:05:43 +00:00
|
|
|
|
|
|
|
QTextStream out(stdout);
|
|
|
|
|
|
|
|
if (htmlFiles.isEmpty()) {
|
|
|
|
out << "No html files available.";
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
// parse each html file and write the result to file/stream
|
|
|
|
foreach(QString file, htmlFiles)
|
2011-04-27 17:16:41 +00:00
|
|
|
parseHtmlFile(out, ":/" + file);
|
2011-04-27 10:05:43 +00:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|