2012-02-29 18:33:50 +01:00
|
|
|
/* ============================================================
* QupZilla - WebKit based browser
* Copyright (C) 2010-2012 David Rosca <nowrep@gmail.com>
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
* ============================================================ */
|
2011-12-08 21:52:03 +01:00
|
|
|
#include "htmlimporter.h"
|
2012-01-21 20:27:45 +01:00
|
|
|
#include "bookmarksimportdialog.h"
|
2011-12-08 21:52:03 +01:00
|
|
|
|
2012-02-29 18:33:50 +01:00
|
|
|
#include <QRegExp>
|
|
|
|
|
2011-12-08 21:52:03 +01:00
|
|
|
// Constructs the importer as a child of `parent`, with the error flag cleared
// and the error text set to the translated "No Error" message.
HtmlImporter::HtmlImporter(QObject* parent)
    : QObject(parent), m_error(false), m_errorString(BookmarksImportDialog::tr("No Error"))
{
}
|
|
|
|
|
|
|
|
void HtmlImporter::setFile(const QString &path)
|
|
|
|
{
|
|
|
|
m_path = path;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool HtmlImporter::openFile()
|
|
|
|
{
|
|
|
|
m_file.setFileName(m_path);
|
|
|
|
|
|
|
|
if (!m_file.open(QFile::ReadOnly)) {
|
|
|
|
m_error = true;
|
2012-01-21 20:27:45 +01:00
|
|
|
m_errorString = BookmarksImportDialog::tr("Unable to open file.");
|
2011-12-08 21:52:03 +01:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2012-03-06 15:28:52 +01:00
|
|
|
// Minimum of two search positions where any value below 0 means "not found".
//
// When both values are non-negative the smaller one is returned. When only
// `a` is non-negative, `a` is returned. In every other case `b` is returned
// unchanged (so the result is negative only if `b` is).
int qzMin(int a, int b)
{
    const bool aFound = a > -1;
    const bool bFound = b > -1;

    if (!aFound) {
        return b;
    }

    if (!bFound) {
        return a;
    }

    return (a < b) ? a : b;
}
|
|
|
|
|
2011-12-08 21:52:03 +01:00
|
|
|
// Reads the whole content of m_file as UTF-8, closes the file and extracts
// bookmarks from the Netscape-style bookmark markup (<dl> / <dt> / <h3> / <a>).
//
// Every <dt><h3 ...>name</h3> opens a folder and every </dl><p> closes the
// innermost open one. Each <dt><a ... href="...">title</a> becomes a bookmark
// stored in the innermost open folder ("Html Import" at the top level).
// Links with an empty title, an empty url, or a "place" / "about" scheme are
// skipped.
//
// Returns the bookmarks in document order; the list is empty when the
// document contains no <dl><p>.
QList<BookmarksModel::Bookmark> HtmlImporter::exportBookmarks()
{
    QList<BookmarksModel::Bookmark> list;

    QString bookmarks = QString::fromUtf8(m_file.readAll());
    m_file.close();

    // Converting tags to lower case -,-
    // For some reason Qt::CaseInsensitive is not everytime insensitive :-D

    bookmarks.replace("<DL", "<dl");
    bookmarks.replace("</DL", "</dl");
    bookmarks.replace("<DT", "<dt");
    bookmarks.replace("</DT", "</dt");
    bookmarks.replace("<P", "<p");
    bookmarks.replace("</P", "</p");
    bookmarks.replace("<A", "<a");
    bookmarks.replace("</A", "</a");
    bookmarks.replace("HREF=", "href=");
    bookmarks.replace("<H3", "<h3");
    bookmarks.replace("</H3", "</h3");

    const QString folderTag("<dt><h3");
    const QString endFolderTag("</dl><p>");
    const QString linkTag("<dt><a");
    const QString rootFolder("Html Import");

    // Drop the last list terminator (and everything after it) so that it does
    // not close the root folder.
    bookmarks = bookmarks.left(bookmarks.lastIndexOf(endFolderTag));
    int start = bookmarks.indexOf("<dl><p>");

    // Stack of currently open folders; the innermost one is last.
    QStringList folders(rootFolder);

    // The patterns do not change between iterations, so build them once.
    QRegExp folderRx("<dt><h3(.*)>(.*)</h3>");
    folderRx.setMinimal(true);

    QRegExp linkRx("<dt><a(.*)>(.*)</a>");
    linkRx.setMinimal(true);

    QRegExp hrefRx("href=\"(.*)\"");
    hrefRx.setMinimal(true);

    // indexOf() reports "not found" as -1; offset 0 is a valid position.
    while (start >= 0) {
        // Search from the current offset instead of copying the remaining
        // text on every iteration. All positions are absolute.
        const int posOfFolder = bookmarks.indexOf(folderTag, start);
        const int posOfEndFolder = bookmarks.indexOf(endFolderTag, start);
        const int posOfLink = bookmarks.indexOf(linkTag, start);

        const int nearest = qzMin(posOfLink, qzMin(posOfFolder, posOfEndFolder));
        if (nearest == -1) {
            break;
        }

        if (nearest == posOfFolder) {
            // Next is folder
            if (folderRx.indexIn(bookmarks, posOfFolder) == -1) {
                // Heading without closing </h3>: step over the opening tag,
                // otherwise the offset would never advance again.
                start = posOfFolder + folderTag.size();
                continue;
            }

            const QString folderName = folderRx.cap(2).trimmed();
            folders.append(folderName);

            start = posOfFolder + folderRx.cap(0).size();
        }
        else if (nearest == posOfEndFolder) {
            // Next is end of folder
            if (!folders.isEmpty()) {
                folders.removeLast();
            }

            start = posOfEndFolder + endFolderTag.size();
        }
        else {
            // Next is link
            if (linkRx.indexIn(bookmarks, posOfLink) == -1) {
                // Link without closing </a>: step over the opening tag,
                // otherwise the offset would never advance again.
                start = posOfLink + linkTag.size();
                continue;
            }

            const QString arguments = linkRx.cap(1);
            const QString linkName = linkRx.cap(2).trimmed();

            // A link without href yields an empty url and is skipped below.
            QString href;
            if (hrefRx.indexIn(arguments) != -1) {
                href = hrefRx.cap(1);
            }

            const QUrl url = QUrl::fromEncoded(href.trimmed().toUtf8());

            start = posOfLink + linkRx.cap(0).size();

            if (linkName.isEmpty() || url.isEmpty() || url.scheme() == "place" || url.scheme() == "about") {
                continue;
            }

            BookmarksModel::Bookmark b;
            // Surplus </dl><p> tags can empty the folder stack, and last()
            // must not be called on an empty list; use the root folder then.
            b.folder = folders.isEmpty() ? rootFolder : folders.last();
            b.title = linkName;
            b.url = url;

            list.append(b);
        }
    }

    return list;
}
|