UsenetSearch/include/usenetsearch/Filter.h

52 lines
1.4 KiB
C
Raw Normal View History

2021-10-08 22:31:23 +00:00
/*
Copyright© 2021 John Sennesael
UsenetSearch is Free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
UsenetSearch is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with UsenetSearch. If not, see <https://www.gnu.org/licenses/>.
*/
#pragma once
#include <codecvt>
#include <locale>
#include <regex>
2021-10-08 22:31:23 +00:00
#include <string>
#include <unordered_map>
#include "usenetsearch/Configuration.h"
2021-10-08 22:31:23 +00:00
namespace usenetsearch {
class Filter
{
Configuration& m_config;
2021-10-08 22:31:23 +00:00
std::wstring_convert<std::codecvt_utf8_utf16<wchar_t>> m_conv;
std::vector<std::string> m_noSubtokenWords;
std::unordered_map<std::unique_ptr<std::wregex>, std::wstring>
m_eraseTokenRegexes;
2021-10-08 22:31:23 +00:00
public:
explicit Filter(Configuration& config);
void Init();
2021-10-08 22:31:23 +00:00
std::string ProcessSearchString(const std::string& searchString);
std::string ProcessToken(
const std::string& token,
const std::string& searchString
);
2021-10-08 22:31:23 +00:00
};
} // namespace usenetsearch