2021-12-05 17:54:36 +00:00
|
|
|
#include "dChatFilter.h"
|
|
|
|
#include "BinaryIO.h"
|
|
|
|
#include <fstream>
|
|
|
|
#include <string>
|
|
|
|
#include <functional>
|
|
|
|
#include <algorithm>
|
|
|
|
#include <sstream>
|
|
|
|
#include <regex>
|
|
|
|
|
|
|
|
#include "dCommonVars.h"
|
|
|
|
#include "dLogger.h"
|
2022-07-17 06:54:36 +00:00
|
|
|
#include "dConfig.h"
|
|
|
|
#include "Database.h"
|
2021-12-05 17:54:36 +00:00
|
|
|
#include "Game.h"
|
2023-03-24 23:16:45 +00:00
|
|
|
#include "eGameMasterLevel.h"
|
2021-12-05 17:54:36 +00:00
|
|
|
|
|
|
|
using namespace dChatFilterDCF;
|
|
|
|
|
|
|
|
// Builds the filter's word lists.
//
// filepath        - base path of the approved-word list, without extension;
//                   ".dcf" (binary cache) and ".txt" (plaintext) are appended.
// dontGenerateDCF - when true the binary cache is neither read nor written and
//                   the plaintext list is always used.
//
// After the approved list is loaded, "blacklist.dcf" is read into the denied
// list if it exists, and every character name found in the charinfo table is
// added to the approved list.
dChatFilter::dChatFilter(const std::string& filepath, bool dontGenerateDCF) {
	m_DontGenerateDCF = dontGenerateDCF;

	const std::string dcfPath = filepath + ".dcf";
	const std::string txtPath = filepath + ".txt";

	if (!BinaryIO::DoesFileExist(dcfPath) || m_DontGenerateDCF) {
		// No usable cache (or caching disabled): parse the plaintext list and,
		// if allowed, write the cache for the next start.
		ReadWordlistPlaintext(txtPath, true);
		if (!m_DontGenerateDCF) ExportWordlistToDCF(dcfPath, true);
	} else if (!ReadWordlistDCF(dcfPath, true)) {
		// The cache exists but was rejected: rebuild it from the plaintext list.
		ReadWordlistPlaintext(txtPath, true);
		ExportWordlistToDCF(dcfPath, true);
	}

	if (BinaryIO::DoesFileExist("blacklist.dcf")) {
		ReadWordlistDCF("blacklist.dcf", false);
	}

	//Read player names that are ok as well:
	auto stmt = Database::CreatePreppedStmt("select name from charinfo;");
	auto res = stmt->executeQuery();
	while (res->next()) {
		std::string line = res->getString(1).c_str();

		// tolower() has undefined behaviour for negative arguments other than EOF,
		// so every byte is routed through unsigned char before lowercasing.
		std::transform(line.begin(), line.end(), line.begin(),
			[](unsigned char c) { return static_cast<char>(::tolower(c)); });

		m_ApprovedWords.push_back(CalculateHash(line));
	}

	delete res;
	delete stmt;
}
|
|
|
|
|
|
|
|
// Empties both hash lists when the filter is destroyed.
dChatFilter::~dChatFilter() {
	m_DeniedWords.clear();
	m_ApprovedWords.clear();
}
|
|
|
|
|
2022-07-17 08:40:34 +00:00
|
|
|
void dChatFilter::ReadWordlistPlaintext(const std::string& filepath, bool whiteList) {
|
2021-12-05 17:54:36 +00:00
|
|
|
std::ifstream file(filepath);
|
|
|
|
if (file) {
|
|
|
|
std::string line;
|
|
|
|
while (std::getline(file, line)) {
|
2021-12-07 20:03:55 +00:00
|
|
|
line.erase(std::remove(line.begin(), line.end(), '\r'), line.end());
|
2021-12-05 17:54:36 +00:00
|
|
|
std::transform(line.begin(), line.end(), line.begin(), ::tolower); //Transform to lowercase
|
2022-07-18 09:01:43 +00:00
|
|
|
if (whiteList) m_ApprovedWords.push_back(CalculateHash(line));
|
|
|
|
else m_DeniedWords.push_back(CalculateHash(line));
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-07-17 06:54:36 +00:00
|
|
|
bool dChatFilter::ReadWordlistDCF(const std::string& filepath, bool whiteList) {
|
2021-12-05 17:54:36 +00:00
|
|
|
std::ifstream file(filepath, std::ios::binary);
|
|
|
|
if (file) {
|
|
|
|
fileHeader hdr;
|
|
|
|
BinaryIO::BinaryRead(file, hdr);
|
|
|
|
if (hdr.header != header) {
|
|
|
|
file.close();
|
2021-12-07 20:03:55 +00:00
|
|
|
return false;
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
|
|
|
|
2021-12-07 20:03:55 +00:00
|
|
|
if (hdr.formatVersion == formatVersion) {
|
2021-12-05 17:54:36 +00:00
|
|
|
size_t wordsToRead = 0;
|
|
|
|
BinaryIO::BinaryRead(file, wordsToRead);
|
2022-07-18 09:01:43 +00:00
|
|
|
if (whiteList) m_ApprovedWords.reserve(wordsToRead);
|
|
|
|
else m_DeniedWords.reserve(wordsToRead);
|
2021-12-05 17:54:36 +00:00
|
|
|
|
|
|
|
size_t word = 0;
|
|
|
|
for (size_t i = 0; i < wordsToRead; ++i) {
|
|
|
|
BinaryIO::BinaryRead(file, word);
|
2022-07-18 09:01:43 +00:00
|
|
|
if (whiteList) m_ApprovedWords.push_back(word);
|
|
|
|
else m_DeniedWords.push_back(word);
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
2021-12-07 20:03:55 +00:00
|
|
|
|
|
|
|
return true;
|
2021-12-05 17:54:36 +00:00
|
|
|
} else {
|
|
|
|
file.close();
|
2021-12-07 20:03:55 +00:00
|
|
|
return false;
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
|
|
|
}
|
2021-12-07 20:03:55 +00:00
|
|
|
|
|
|
|
return false;
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
|
|
|
|
2022-07-17 08:40:34 +00:00
|
|
|
void dChatFilter::ExportWordlistToDCF(const std::string& filepath, bool whiteList) {
|
2021-12-07 20:03:55 +00:00
|
|
|
std::ofstream file(filepath, std::ios::binary | std::ios_base::out);
|
2021-12-05 17:54:36 +00:00
|
|
|
if (file) {
|
|
|
|
BinaryIO::BinaryWrite(file, uint32_t(dChatFilterDCF::header));
|
|
|
|
BinaryIO::BinaryWrite(file, uint32_t(dChatFilterDCF::formatVersion));
|
2022-07-18 09:01:43 +00:00
|
|
|
BinaryIO::BinaryWrite(file, size_t(whiteList ? m_ApprovedWords.size() : m_DeniedWords.size()));
|
2021-12-05 17:54:36 +00:00
|
|
|
|
2022-07-18 09:01:43 +00:00
|
|
|
for (size_t word : whiteList ? m_ApprovedWords : m_DeniedWords) {
|
2021-12-05 17:54:36 +00:00
|
|
|
BinaryIO::BinaryWrite(file, word);
|
|
|
|
}
|
|
|
|
|
|
|
|
file.close();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-03-24 23:16:45 +00:00
|
|
|
std::vector<std::pair<uint8_t, uint8_t>> dChatFilter::IsSentenceOkay(const std::string& message, eGameMasterLevel gmLevel, bool whiteList) {
|
|
|
|
if (gmLevel > eGameMasterLevel::FORUM_MODERATOR) return { }; //If anything but a forum mod, return true.
|
2022-07-17 06:54:36 +00:00
|
|
|
if (message.empty()) return { };
|
2022-07-18 09:01:43 +00:00
|
|
|
if (!whiteList && m_DeniedWords.empty()) return { { 0, message.length() } };
|
2021-12-05 17:54:36 +00:00
|
|
|
|
|
|
|
std::stringstream sMessage(message);
|
2021-12-07 20:03:55 +00:00
|
|
|
std::string segment;
|
2021-12-05 17:54:36 +00:00
|
|
|
std::regex reg("(!*|\\?*|\\;*|\\.*|\\,*)");
|
|
|
|
|
2022-07-18 09:01:43 +00:00
|
|
|
std::vector<std::pair<uint8_t, uint8_t>> listOfBadSegments = std::vector<std::pair<uint8_t, uint8_t>>();
|
|
|
|
|
|
|
|
uint32_t position = 0;
|
2022-07-17 06:54:36 +00:00
|
|
|
|
2021-12-07 20:03:55 +00:00
|
|
|
while (std::getline(sMessage, segment, ' ')) {
|
2022-07-17 06:54:36 +00:00
|
|
|
std::string originalSegment = segment;
|
|
|
|
|
2021-12-07 20:03:55 +00:00
|
|
|
std::transform(segment.begin(), segment.end(), segment.begin(), ::tolower); //Transform to lowercase
|
|
|
|
segment = std::regex_replace(segment, reg, "");
|
|
|
|
|
|
|
|
size_t hash = CalculateHash(segment);
|
2021-12-05 17:54:36 +00:00
|
|
|
|
2022-07-17 08:40:34 +00:00
|
|
|
if (std::find(m_UserUnapprovedWordCache.begin(), m_UserUnapprovedWordCache.end(), hash) != m_UserUnapprovedWordCache.end() && whiteList) {
|
2022-07-18 09:01:43 +00:00
|
|
|
listOfBadSegments.emplace_back(position, originalSegment.length());
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
|
|
|
|
2022-07-18 09:01:43 +00:00
|
|
|
if (std::find(m_ApprovedWords.begin(), m_ApprovedWords.end(), hash) == m_ApprovedWords.end() && whiteList) {
|
2022-07-17 08:40:34 +00:00
|
|
|
m_UserUnapprovedWordCache.push_back(hash);
|
2022-07-18 09:01:43 +00:00
|
|
|
listOfBadSegments.emplace_back(position, originalSegment.length());
|
2022-07-17 06:54:36 +00:00
|
|
|
}
|
2022-07-28 13:39:57 +00:00
|
|
|
|
2022-07-18 09:01:43 +00:00
|
|
|
if (std::find(m_DeniedWords.begin(), m_DeniedWords.end(), hash) != m_DeniedWords.end() && !whiteList) {
|
2022-07-17 08:40:34 +00:00
|
|
|
m_UserUnapprovedWordCache.push_back(hash);
|
2022-07-18 09:01:43 +00:00
|
|
|
listOfBadSegments.emplace_back(position, originalSegment.length());
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
2022-07-18 09:01:43 +00:00
|
|
|
|
|
|
|
position += segment.length() + 1;
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
|
|
|
|
2022-07-17 06:54:36 +00:00
|
|
|
return listOfBadSegments;
|
2021-12-05 17:54:36 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Returns the std::hash<std::string> value of the given word.
size_t dChatFilter::CalculateHash(const std::string& word) {
	return std::hash<std::string>{}(word);
}
|