mirror of
https://github.com/d47081/qBittorrent.git
synced 2025-01-25 22:14:32 +00:00
Merge pull request #6344 from magao/issue6337
Fix regex RSS matching. Closes #6337.
This commit is contained in:
commit
c39056f1a8
@ -50,48 +50,51 @@ DownloadRule::DownloadRule()
|
|||||||
{
|
{
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool DownloadRule::matches(const QString &articleTitle, const QString &expression) const
|
||||||
|
{
|
||||||
|
static QRegExp whitespace("\\s+");
|
||||||
|
|
||||||
|
if (expression.isEmpty()) {
|
||||||
|
// A regex of the form "expr|" will always match, so do the same for wildcards
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
else if (m_useRegex) {
|
||||||
|
QRegExp reg(expression, Qt::CaseInsensitive, QRegExp::RegExp);
|
||||||
|
return reg.indexIn(articleTitle) > -1;
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
// Only match if every wildcard token (separated by spaces) is present in the article name.
|
||||||
|
// Order of wildcard tokens is unimportant (if order is important, they should have used *).
|
||||||
|
foreach (const QString &wildcard, expression.split(whitespace, QString::SplitBehavior::SkipEmptyParts)) {
|
||||||
|
QRegExp reg(wildcard, Qt::CaseInsensitive, QRegExp::Wildcard);
|
||||||
|
|
||||||
|
if (reg.indexIn(articleTitle) == -1)
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
bool DownloadRule::matches(const QString &articleTitle) const
|
bool DownloadRule::matches(const QString &articleTitle) const
|
||||||
{
|
{
|
||||||
QRegExp whitespace("\\s+");
|
|
||||||
|
|
||||||
if (!m_mustContain.empty()) {
|
if (!m_mustContain.empty()) {
|
||||||
bool logged = false;
|
bool logged = false;
|
||||||
bool foundMustContain = true;
|
bool foundMustContain = false;
|
||||||
|
|
||||||
// Each expression is either a regex, or a set of wildcards separated by whitespace.
|
// Each expression is either a regex, or a set of wildcards separated by whitespace.
|
||||||
// Accept if any complete expression matches.
|
// Accept if any complete expression matches.
|
||||||
foreach (const QString &expression, m_mustContain) {
|
foreach (const QString &expression, m_mustContain) {
|
||||||
if (expression.isEmpty())
|
|
||||||
continue;
|
|
||||||
|
|
||||||
if (!logged) {
|
if (!logged) {
|
||||||
qDebug() << "Checking matching expressions:" << m_mustContain.join("|");
|
qDebug() << "Checking matching" << (m_useRegex ? "regex:" : "wildcard expressions:") << m_mustContain.join("|");
|
||||||
logged = true;
|
logged = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (m_useRegex) {
|
// A regex of the form "expr|" will always match, so do the same for wildcards
|
||||||
QRegExp reg(expression, Qt::CaseInsensitive, QRegExp::RegExp);
|
foundMustContain = matches(articleTitle, expression);
|
||||||
|
|
||||||
if (reg.indexIn(articleTitle) > -1)
|
|
||||||
foundMustContain = true;
|
|
||||||
}
|
|
||||||
else {
|
|
||||||
// Only accept if every wildcard token (separated by spaces) is present in the article name.
|
|
||||||
// Order of wildcard tokens is unimportant (if order is important, they should have used *).
|
|
||||||
foundMustContain = true;
|
|
||||||
|
|
||||||
foreach (const QString &wildcard, expression.split(whitespace, QString::SplitBehavior::SkipEmptyParts)) {
|
|
||||||
QRegExp reg(wildcard, Qt::CaseInsensitive, QRegExp::Wildcard);
|
|
||||||
|
|
||||||
if (reg.indexIn(articleTitle) == -1) {
|
|
||||||
foundMustContain = false;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
if (foundMustContain) {
|
if (foundMustContain) {
|
||||||
qDebug() << "Found matching expression:" << expression;
|
qDebug() << "Found matching" << (m_useRegex ? "regex:" : "wildcard expression:") << expression;
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -106,38 +109,14 @@ bool DownloadRule::matches(const QString &articleTitle) const
|
|||||||
// Each expression is either a regex, or a set of wildcards separated by whitespace.
|
// Each expression is either a regex, or a set of wildcards separated by whitespace.
|
||||||
// Reject if any complete expression matches.
|
// Reject if any complete expression matches.
|
||||||
foreach (const QString &expression, m_mustNotContain) {
|
foreach (const QString &expression, m_mustNotContain) {
|
||||||
if (expression.isEmpty())
|
|
||||||
continue;
|
|
||||||
|
|
||||||
if (!logged) {
|
if (!logged) {
|
||||||
qDebug() << "Checking not matching expressions:" << m_mustNotContain.join("|");
|
qDebug() << "Checking not matching" << (m_useRegex ? "regex:" : "wildcard expressions:") << m_mustNotContain.join("|");
|
||||||
logged = true;
|
logged = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (m_useRegex) {
|
// A regex of the form "expr|" will always match, so do the same for wildcards
|
||||||
QRegExp reg(expression, Qt::CaseInsensitive, QRegExp::RegExp);
|
if (matches(articleTitle, expression)) {
|
||||||
|
qDebug() << "Found not matching" << (m_useRegex ? "regex:" : "wildcard expression:") << expression;
|
||||||
if (reg.indexIn(articleTitle) > -1) {
|
|
||||||
qDebug() << "Found not matching expression:" << expression;
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Only reject if every wildcard token (separated by spaces) is present in the article name.
|
|
||||||
// Order of wildcard tokens is unimportant (if order is important, they should have used *).
|
|
||||||
bool foundMustNotContain = true;
|
|
||||||
|
|
||||||
foreach (const QString &wildcard, expression.split(whitespace, QString::SplitBehavior::SkipEmptyParts)) {
|
|
||||||
QRegExp reg(wildcard, Qt::CaseInsensitive, QRegExp::Wildcard);
|
|
||||||
|
|
||||||
if (reg.indexIn(articleTitle) == -1) {
|
|
||||||
foundMustNotContain = false;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
if (foundMustNotContain) {
|
|
||||||
qDebug()<< "Found not matching expression:" << expression;
|
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -241,6 +220,10 @@ void DownloadRule::setMustContain(const QString &tokens)
|
|||||||
m_mustContain = QStringList() << tokens;
|
m_mustContain = QStringList() << tokens;
|
||||||
else
|
else
|
||||||
m_mustContain = tokens.split("|");
|
m_mustContain = tokens.split("|");
|
||||||
|
|
||||||
|
// Check for single empty string - if so, no condition
|
||||||
|
if ((m_mustContain.size() == 1) && m_mustContain[0].isEmpty())
|
||||||
|
m_mustContain.clear();
|
||||||
}
|
}
|
||||||
|
|
||||||
void DownloadRule::setMustNotContain(const QString &tokens)
|
void DownloadRule::setMustNotContain(const QString &tokens)
|
||||||
@ -249,6 +232,10 @@ void DownloadRule::setMustNotContain(const QString &tokens)
|
|||||||
m_mustNotContain = QStringList() << tokens;
|
m_mustNotContain = QStringList() << tokens;
|
||||||
else
|
else
|
||||||
m_mustNotContain = tokens.split("|");
|
m_mustNotContain = tokens.split("|");
|
||||||
|
|
||||||
|
// Check for single empty string - if so, no condition
|
||||||
|
if ((m_mustNotContain.size() == 1) && m_mustNotContain[0].isEmpty())
|
||||||
|
m_mustNotContain.clear();
|
||||||
}
|
}
|
||||||
|
|
||||||
QStringList DownloadRule::rssFeeds() const
|
QStringList DownloadRule::rssFeeds() const
|
||||||
|
@ -88,6 +88,8 @@ namespace Rss
|
|||||||
bool operator==(const DownloadRule &other) const;
|
bool operator==(const DownloadRule &other) const;
|
||||||
|
|
||||||
private:
|
private:
|
||||||
|
bool matches(const QString &articleTitle, const QString &expression) const;
|
||||||
|
|
||||||
QString m_name;
|
QString m_name;
|
||||||
QStringList m_mustContain;
|
QStringList m_mustContain;
|
||||||
QStringList m_mustNotContain;
|
QStringList m_mustNotContain;
|
||||||
|
@ -673,8 +673,6 @@ void AutomatedRssDownloader::updateFieldsToolTips(bool regex)
|
|||||||
QString tip;
|
QString tip;
|
||||||
if (regex) {
|
if (regex) {
|
||||||
tip = "<p>" + tr("Regex mode: use Perl-like regular expressions") + "</p>";
|
tip = "<p>" + tr("Regex mode: use Perl-like regular expressions") + "</p>";
|
||||||
ui->lineContains->setToolTip(tip);
|
|
||||||
ui->lineNotContains->setToolTip(tip);
|
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
tip = "<p>" + tr("Wildcard mode: you can use") + "<ul>"
|
tip = "<p>" + tr("Wildcard mode: you can use") + "<ul>"
|
||||||
@ -683,9 +681,18 @@ void AutomatedRssDownloader::updateFieldsToolTips(bool regex)
|
|||||||
+ "<li>" + tr("Whitespaces count as AND operators (all words, any order)") + "</li>"
|
+ "<li>" + tr("Whitespaces count as AND operators (all words, any order)") + "</li>"
|
||||||
+ "<li>" + tr("| is used as OR operator") + "</li></ul></p>"
|
+ "<li>" + tr("| is used as OR operator") + "</li></ul></p>"
|
||||||
+ "<p>" + tr("If word order is important use * instead of whitespace.") + "</p>";
|
+ "<p>" + tr("If word order is important use * instead of whitespace.") + "</p>";
|
||||||
ui->lineContains->setToolTip(tip);
|
|
||||||
ui->lineNotContains->setToolTip(tip);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Whether regex or wildcard, warn about a potential gotcha for users.
|
||||||
|
// Explanatory string broken over multiple lines for readability (and multiple
|
||||||
|
// statements to prevent uncrustify indenting excessively.
|
||||||
|
tip += "<p>";
|
||||||
|
tip += tr("An expression with an empty %1 clause (e.g. %2)",
|
||||||
|
"We talk about regex/wildcards in the RSS filters section here."
|
||||||
|
" So a valid sentence would be: An expression with an empty | clause (e.g. expr|)"
|
||||||
|
).arg("<tt>|</tt>").arg("<tt>expr|</tt>");
|
||||||
|
ui->lineContains->setToolTip(tip + tr(" will match all articles.") + "</p>");
|
||||||
|
ui->lineNotContains->setToolTip(tip + tr(" will exclude all articles.") + "</p>");
|
||||||
}
|
}
|
||||||
|
|
||||||
void AutomatedRssDownloader::updateMustLineValidity()
|
void AutomatedRssDownloader::updateMustLineValidity()
|
||||||
|
Loading…
x
Reference in New Issue
Block a user