2019-07-07 15:29:11 -04:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2019 KeePassXC Team <team@keepassxc.org>
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation, either version 2 or (at your option)
|
|
|
|
* version 3 of the License.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "IconDownloader.h"
|
|
|
|
#include "core/Config.h"
|
|
|
|
#include "core/NetworkManager.h"
|
|
|
|
|
2021-07-11 22:10:29 -04:00
|
|
|
#include <QBuffer>
|
2019-07-07 15:29:11 -04:00
|
|
|
#include <QHostInfo>
|
2020-05-27 11:53:42 -04:00
|
|
|
#include <QImageReader>
|
2021-07-11 22:10:29 -04:00
|
|
|
#include <QNetworkReply>
|
2019-07-07 15:29:11 -04:00
|
|
|
|
|
|
|
#define MAX_REDIRECTS 5
|
|
|
|
|
|
|
|
IconDownloader::IconDownloader(QObject* parent)
|
|
|
|
: QObject(parent)
|
|
|
|
, m_reply(nullptr)
|
|
|
|
, m_redirects(0)
|
|
|
|
{
|
|
|
|
m_timeout.setSingleShot(true);
|
|
|
|
connect(&m_timeout, SIGNAL(timeout()), SLOT(abortDownload()));
|
|
|
|
}
|
|
|
|
|
|
|
|
IconDownloader::~IconDownloader()
|
|
|
|
{
|
|
|
|
abortDownload();
|
|
|
|
}
|
|
|
|
|
|
|
|
namespace
|
|
|
|
{
|
|
|
|
// Try to get the 2nd level domain of the host part of a QUrl. For example,
|
|
|
|
// "foo.bar.example.com" would become "example.com", and "foo.bar.example.co.uk"
|
|
|
|
// would become "example.co.uk".
|
|
|
|
QString getSecondLevelDomain(const QUrl& url)
|
|
|
|
{
|
|
|
|
QString fqdn = url.host();
|
|
|
|
fqdn.truncate(fqdn.length() - url.topLevelDomain().length());
|
|
|
|
QStringList parts = fqdn.split('.');
|
|
|
|
QString newdom = parts.takeLast() + url.topLevelDomain();
|
|
|
|
return newdom;
|
|
|
|
}
|
|
|
|
|
|
|
|
QUrl convertVariantToUrl(const QVariant& var)
|
|
|
|
{
|
|
|
|
QUrl url;
|
|
|
|
if (var.canConvert<QUrl>()) {
|
|
|
|
url = var.toUrl();
|
|
|
|
}
|
|
|
|
return url;
|
|
|
|
}
|
|
|
|
|
|
|
|
QUrl getRedirectTarget(QNetworkReply* reply)
|
|
|
|
{
|
|
|
|
QVariant var = reply->attribute(QNetworkRequest::RedirectionTargetAttribute);
|
|
|
|
QUrl url = convertVariantToUrl(var);
|
|
|
|
return url;
|
|
|
|
}
|
|
|
|
} // namespace
|
|
|
|
|
|
|
|
void IconDownloader::setUrl(const QString& entryUrl)
|
|
|
|
{
|
|
|
|
m_url = entryUrl;
|
2020-10-04 14:27:02 -04:00
|
|
|
QUrl url = QUrl::fromUserInput(m_url);
|
|
|
|
if (!url.isValid() || url.host().isEmpty()) {
|
2019-07-07 15:29:11 -04:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
m_redirects = 0;
|
|
|
|
m_urlsToTry.clear();
|
|
|
|
|
2020-10-04 14:27:02 -04:00
|
|
|
// Fall back to https if no scheme is specified
|
|
|
|
// fromUserInput defaults to http. Hence, we need to replace the default scheme should we detect that it has
|
|
|
|
// been added by fromUserInput
|
|
|
|
if (!entryUrl.startsWith(url.scheme())) {
|
|
|
|
url.setScheme("https");
|
|
|
|
} else if (url.scheme() != "https" && url.scheme() != "http") {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Remove query string - if any
|
|
|
|
if (url.hasQuery()) {
|
|
|
|
url.setQuery(QString());
|
|
|
|
}
|
|
|
|
// Remove fragment - if any
|
|
|
|
if (url.hasFragment()) {
|
|
|
|
url.setFragment(QString());
|
2019-07-07 15:29:11 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
QString fullyQualifiedDomain = url.host();
|
|
|
|
|
|
|
|
// Determine if host portion of URL is an IP address by resolving it and
|
|
|
|
// searching for a match with the returned address(es).
|
|
|
|
bool hostIsIp = false;
|
|
|
|
QList<QHostAddress> hostAddressess = QHostInfo::fromName(fullyQualifiedDomain).addresses();
|
2020-10-04 14:27:02 -04:00
|
|
|
hostIsIp =
|
|
|
|
std::any_of(hostAddressess.begin(), hostAddressess.end(), [&fullyQualifiedDomain](const QHostAddress& addr) {
|
|
|
|
return addr.toString() == fullyQualifiedDomain;
|
|
|
|
});
|
2019-07-07 15:29:11 -04:00
|
|
|
|
|
|
|
// Determine the second-level domain, if available
|
|
|
|
QString secondLevelDomain;
|
|
|
|
if (!hostIsIp) {
|
2020-10-04 14:27:02 -04:00
|
|
|
secondLevelDomain = getSecondLevelDomain(url);
|
2019-07-07 15:29:11 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
// Start with the "fallback" url (if enabled) to try to get the best favicon
|
2020-04-25 19:31:38 -04:00
|
|
|
if (config()->get(Config::Security_IconDownloadFallback).toBool()) {
|
2019-07-07 15:29:11 -04:00
|
|
|
QUrl fallbackUrl = QUrl("https://icons.duckduckgo.com");
|
|
|
|
fallbackUrl.setPath("/ip3/" + QUrl::toPercentEncoding(fullyQualifiedDomain) + ".ico");
|
|
|
|
m_urlsToTry.append(fallbackUrl);
|
|
|
|
|
|
|
|
// Also try a direct pull of the second-level domain (if possible)
|
|
|
|
if (!hostIsIp && fullyQualifiedDomain != secondLevelDomain) {
|
|
|
|
fallbackUrl.setPath("/ip3/" + QUrl::toPercentEncoding(secondLevelDomain) + ".ico");
|
|
|
|
m_urlsToTry.append(fallbackUrl);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Add a direct pull of the website's own favicon.ico file
|
2020-10-04 14:27:02 -04:00
|
|
|
QUrl favicon_url = url;
|
|
|
|
favicon_url.setPath("/favicon.ico");
|
|
|
|
m_urlsToTry.append(favicon_url);
|
2019-07-07 15:29:11 -04:00
|
|
|
|
|
|
|
// Also try a direct pull of the second-level domain (if possible)
|
2020-10-04 14:27:02 -04:00
|
|
|
if (!hostIsIp && fullyQualifiedDomain != secondLevelDomain && !secondLevelDomain.isEmpty()) {
|
|
|
|
favicon_url.setHost(secondLevelDomain);
|
|
|
|
m_urlsToTry.append(favicon_url);
|
|
|
|
if (!favicon_url.userInfo().isEmpty() || favicon_url.port() != -1) {
|
|
|
|
// Remove additional fields from the URL as a fallback. Keep only host and scheme
|
|
|
|
// Fragment and query have been removed earlier
|
|
|
|
favicon_url.setPort(-1);
|
|
|
|
favicon_url.setUserInfo(QString());
|
|
|
|
m_urlsToTry.append(favicon_url);
|
|
|
|
}
|
2019-07-07 15:29:11 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void IconDownloader::download()
|
|
|
|
{
|
2020-02-20 13:38:07 -05:00
|
|
|
if (m_urlsToTry.isEmpty()) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2019-07-07 15:29:11 -04:00
|
|
|
if (!m_timeout.isActive()) {
|
2020-04-25 19:31:38 -04:00
|
|
|
int timeout = config()->get(Config::FaviconDownloadTimeout).toInt();
|
2019-07-07 15:29:11 -04:00
|
|
|
m_timeout.start(timeout * 1000);
|
|
|
|
|
|
|
|
// Use the first URL to start the download process
|
|
|
|
// If a favicon is not found, the next URL will be tried
|
|
|
|
fetchFavicon(m_urlsToTry.takeFirst());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void IconDownloader::abortDownload()
|
|
|
|
{
|
|
|
|
if (m_reply) {
|
|
|
|
m_reply->abort();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void IconDownloader::fetchFavicon(const QUrl& url)
|
|
|
|
{
|
|
|
|
m_bytesReceived.clear();
|
|
|
|
m_fetchUrl = url;
|
|
|
|
|
|
|
|
QNetworkRequest request(url);
|
|
|
|
m_reply = getNetMgr()->get(request);
|
|
|
|
|
|
|
|
connect(m_reply, &QNetworkReply::finished, this, &IconDownloader::fetchFinished);
|
|
|
|
connect(m_reply, &QIODevice::readyRead, this, &IconDownloader::fetchReadyRead);
|
|
|
|
}
|
|
|
|
|
|
|
|
void IconDownloader::fetchReadyRead()
|
|
|
|
{
|
|
|
|
m_bytesReceived += m_reply->readAll();
|
|
|
|
}
|
|
|
|
|
|
|
|
void IconDownloader::fetchFinished()
|
|
|
|
{
|
|
|
|
QImage image;
|
|
|
|
QString url = m_url;
|
|
|
|
|
|
|
|
bool error = (m_reply->error() != QNetworkReply::NoError);
|
|
|
|
QUrl redirectTarget = getRedirectTarget(m_reply);
|
|
|
|
|
|
|
|
m_reply->deleteLater();
|
|
|
|
m_reply = nullptr;
|
|
|
|
|
|
|
|
if (!error) {
|
|
|
|
if (redirectTarget.isValid()) {
|
|
|
|
// Redirected, we need to follow it, or fall through if we have
|
|
|
|
// done too many redirects already.
|
|
|
|
if (m_redirects < MAX_REDIRECTS) {
|
|
|
|
m_redirects++;
|
|
|
|
if (redirectTarget.isRelative()) {
|
|
|
|
redirectTarget = m_fetchUrl.resolved(redirectTarget);
|
|
|
|
}
|
|
|
|
m_urlsToTry.prepend(redirectTarget);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// No redirect, and we theoretically have some icon data now.
|
2020-05-27 11:53:42 -04:00
|
|
|
image = parseImage(m_bytesReceived);
|
2019-07-07 15:29:11 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!image.isNull()) {
|
|
|
|
// Valid icon received
|
|
|
|
m_timeout.stop();
|
|
|
|
emit finished(url, image);
|
|
|
|
} else if (!m_urlsToTry.empty()) {
|
|
|
|
// Try the next url
|
|
|
|
m_redirects = 0;
|
|
|
|
fetchFavicon(m_urlsToTry.takeFirst());
|
|
|
|
} else {
|
|
|
|
// No icon found
|
|
|
|
m_timeout.stop();
|
|
|
|
emit finished(url, image);
|
|
|
|
}
|
|
|
|
}
|
2020-05-27 11:53:42 -04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Parse fetched image bytes.
|
|
|
|
*
|
|
|
|
* Parses the given byte array into a QImage. Unlike QImage::loadFromData(), this method
|
|
|
|
* tries to extract the highest resolution image from .ICO files.
|
|
|
|
*
|
|
|
|
* @param imageBytes raw image bytes
|
|
|
|
* @return parsed image
|
|
|
|
*/
|
|
|
|
QImage IconDownloader::parseImage(QByteArray& imageBytes) const
|
|
|
|
{
|
|
|
|
QBuffer buff(&imageBytes);
|
|
|
|
buff.open(QIODevice::ReadOnly);
|
|
|
|
QImageReader reader(&buff);
|
|
|
|
|
|
|
|
if (reader.imageCount() <= 0) {
|
|
|
|
return reader.read();
|
|
|
|
}
|
|
|
|
|
|
|
|
QImage img;
|
|
|
|
for (int i = 0; i < reader.imageCount(); ++i) {
|
|
|
|
if (img.isNull() || reader.size().width() > img.size().width()) {
|
|
|
|
img = reader.read();
|
|
|
|
}
|
|
|
|
reader.jumpToNextImage();
|
|
|
|
}
|
|
|
|
|
|
|
|
return img;
|
|
|
|
}
|