1
mirror of https://invent.kde.org/network/falkon.git synced 2024-11-14 19:12:11 +01:00
falkonOfficial/src/lib/bookmarksimport/htmlimporter.cpp

155 lines
4.2 KiB
C++
Raw Normal View History

/* ============================================================
* QupZilla - WebKit based browser
* Copyright (C) 2010-2012 David Rosca <nowrep@gmail.com>
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
* ============================================================ */
#include "htmlimporter.h"
#include "bookmarksimportdialog.h"
#include <QRegExp>
HtmlImporter::HtmlImporter(QObject* parent)
: QObject(parent)
, m_error(false)
, m_errorString(BookmarksImportDialog::tr("No Error"))
{
}
void HtmlImporter::setFile(const QString &path)
{
m_path = path;
}
bool HtmlImporter::openFile()
{
m_file.setFileName(m_path);
if (!m_file.open(QFile::ReadOnly)) {
m_error = true;
m_errorString = BookmarksImportDialog::tr("Unable to open file.");
return false;
}
return true;
}
int qzMin(int a, int b)
{
if (a > -1 && b > -1) {
return qMin(a, b);
}
if (a > -1) {
return a;
}
else {
return b;
}
}
QList<BookmarksModel::Bookmark> HtmlImporter::exportBookmarks()
{
QList<BookmarksModel::Bookmark> list;
QString bookmarks = QString::fromUtf8(m_file.readAll());
m_file.close();
// Converting tags to lower case -,-
// For some reason Qt::CaseInsensitive is not everytime insensitive :-D
bookmarks.replace("<DL", "<dl");
bookmarks.replace("</DL", "</dl");
bookmarks.replace("<DT", "<dt");
bookmarks.replace("</DT", "</dt");
bookmarks.replace("<P", "<p");
bookmarks.replace("</P", "</p");
bookmarks.replace("<A", "<a");
bookmarks.replace("</A", "</a");
bookmarks.replace("HREF=", "href=");
bookmarks.replace("<H3", "<h3");
bookmarks.replace("</H3", "</h3");
bookmarks = bookmarks.mid(0, bookmarks.lastIndexOf("</dl><p>"));
int start = bookmarks.indexOf("<dl><p>");
QStringList folders("Html Import");
while (start > 0) {
QString string = bookmarks.mid(start);
int posOfFolder = string.indexOf("<dt><h3");
int posOfEndFolder = string.indexOf("</dl><p>");
int posOfLink = string.indexOf("<dt><a");
int nearest = qzMin(posOfLink, qzMin(posOfFolder, posOfEndFolder));
if (nearest == -1) {
break;
}
if (nearest == posOfFolder) {
// Next is folder
QRegExp rx("<dt><h3(.*)>(.*)</h3>");
rx.setMinimal(true);
rx.indexIn(string);
// QString arguments = rx.cap(1);
QString folderName = rx.cap(2);
folders.append(folderName);
start += posOfFolder + rx.cap(0).size();
}
else if (nearest == posOfEndFolder) {
// Next is end of folder
if (!folders.isEmpty()) {
folders.removeLast();
}
start += posOfEndFolder + 8;
}
else {
// Next is link
QRegExp rx("<dt><a(.*)>(.*)</a>");
rx.setMinimal(true);
rx.indexIn(string);
QString arguments = rx.cap(1);
QString linkName = rx.cap(2);
QRegExp rx2("href=\"(.*)\"");
rx2.setMinimal(true);
rx2.indexIn(arguments);
QUrl url = QUrl::fromEncoded(rx2.cap(1).toUtf8());
start += posOfLink + rx.cap(0).size();
if (linkName.isEmpty() || url.isEmpty() || url.scheme() == "place" || url.scheme() == "about") {
continue;
}
BookmarksModel::Bookmark b;
b.folder = folders.last();
b.title = linkName;
b.url = url;
list.append(b);
}
}
return list;
}