1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
|
/* ============================================================
*
* This file is a part of the rekonq project
*
* Copyright (C) 2010 by Benjamin Poulain <ikipou at gmail dot com>
*
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation; either version 2 of
* the License or (at your option) version 3 or any later version
* accepted by the membership of KDE e.V. (or its successor approved
* by the membership of KDE e.V.), which shall act as a proxy
* defined in Section 14 of version 3 of the license.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*
* ============================================================ */
// Self Includes
#include "adblockrulefallbackimpl.h"
// Rekonq Includes
#include "rekonq_defines.h"
// Qt Includes
#include <QStringList>
static inline bool isRegExpFilter(const QString &filter)
{
return filter.startsWith(QL1C('/')) && filter.endsWith(QL1C('/'));
}
// Builds the regular expression used by match() from a single filter line.
//
// For filters that are not '/'-delimited regular expressions, everything
// after the last '$' is treated as a comma separated option list and is
// stripped from the rule; the only option honoured here is "match-case",
// which switches the matching from case insensitive to case sensitive.
// The remaining text is then either used verbatim (regular expression
// filters, with the surrounding slashes removed) or translated through
// convertPatternToRegExp().
AdBlockRuleFallbackImpl::AdBlockRuleFallbackImpl(const QString &filter)
    : AdBlockRuleImpl(filter)
{
    QString rule = filter;
    Qt::CaseSensitivity sensitivity = Qt::CaseInsensitive;

    // A '$' inside a '/.../' filter belongs to the expression itself,
    // so options are only looked for in non-regexp filters.
    if (!isRegExpFilter(rule)) {
        const int optionsStart = rule.lastIndexOf(QL1C('$'));
        if (optionsStart >= 0) {
            const QStringList options = rule.mid(optionsStart + 1).split(QL1C(','));
            if (options.contains(QL1S("match-case")))
                sensitivity = Qt::CaseSensitive;

            // Drop the '$' and the option list, keep only the rule text.
            rule.truncate(optionsStart);
        }
    }

    m_regExp.setPatternSyntax(QRegExp::RegExp2);
    m_regExp.setCaseSensitivity(sensitivity);

    // The check is repeated on purpose: stripping the options may have
    // left a text that is itself delimited by slashes.
    const QString pattern = isRegExpFilter(rule)
                            ? rule.mid(1, rule.length() - 2)
                            : convertPatternToRegExp(rule);

    m_regExp.setPattern(pattern);
}
// Returns true when the rule's regular expression matches anywhere
// inside the given (already encoded) URL string.
bool AdBlockRuleFallbackImpl::match(const QString &encodedUrl) const
{
    const int firstMatch = m_regExp.indexIn(encodedUrl);
    return firstMatch != -1;
}
// Translates a wildcard style filter into a regular expression string.
//
// The translation is a fixed sequence of textual rewrites and their order
// matters: the first group works on the raw filter text, then every
// non-word character gets a backslash prefix, and the last group looks for
// the *escaped* forms of the filter's special characters ('|', '^', '*')
// and swaps them for their regular expression equivalent.
QString AdBlockRuleFallbackImpl::convertPatternToRegExp(const QString &wildcardPattern)
{
    // --- expressions applied to the raw filter text ---
    const QRegExp repeatedWildcards(QL1S("\\*+"));
    const QRegExp anchorAfterSeparator(QL1S("\\^\\|$"));
    const QRegExp leadingWildcard(QL1S("^(\\*)"));
    const QRegExp trailingWildcard(QL1S("(\\*)$"));

    // --- escaping of every non-word character ---
    const QRegExp nonWordCharacter(QL1S("(\\W)"));

    // --- expressions applied to the escaped text ---
    const QRegExp escapedExtendedAnchor(QL1S("^\\\\\\|\\\\\\|"));
    const QRegExp escapedSeparator(QL1S("\\\\\\^"));
    const QRegExp escapedStartAnchor(QL1S("^\\\\\\|"));
    const QRegExp escapedEndAnchor(QL1S("\\\\\\|$"));
    const QRegExp escapedWildcard(QL1S("\\\\\\*"));

    QString result = wildcardPattern;

    // Normalise the filter: collapse runs of '*', drop a '|' that directly
    // follows a '^' at the very end, and strip a '*' at either end.
    result.replace(repeatedWildcards, QL1S("*"))
          .replace(anchorAfterSeparator, QL1S("^"))
          .replace(leadingWildcard, QL1S(""))
          .replace(trailingWildcard, QL1S(""));

    // Put a backslash in front of each non-word character (the \1 in the
    // replacement text is the back-reference to the captured character).
    result.replace(nonWordCharacter, QL1S("\\\\1"));

    // "||" at the start: scheme, slashes and an optional sub-domain part.
    result.replace(escapedExtendedAnchor, QL1S("^[\\w\\-]+:\\/+(?!\\/)(?:[^\\/]+\\.)?"));

    // '^' separator placeholder: a character outside the word/digit/-.%
    // set, or the end of the string.
    result.replace(escapedSeparator, QL1S("(?:[^\\w\\d\\-.%]|$)"));

    // Single '|' at the start / at the end become the regexp anchors,
    // and the remaining '*' wildcards become ".*".
    result.replace(escapedStartAnchor, QL1S("^"))
          .replace(escapedEndAnchor, QL1S("$"))
          .replace(escapedWildcard, QL1S(".*"));

    return result;
}
|