// FxCheckSpam.h
//
// Copyright (C) 2017 Privacore ApS - https://www.privacore.com
//
// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU Affero General Public License as
// published by the Free Software Foundation, either version 3 of the
// License, or (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Affero General Public License for more details.
//
// You should have received a copy of the GNU Affero General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>.
//
// License TL;DR: If you change this file, you must publish your changes.
//
#ifndef FXCHECKSPAM_H_
#define FXCHECKSPAM_H_
#include <inttypes.h>
#include <stddef.h>
#include <string>
#include "FxTermCheckList.h"
class CheckSpam {
2017-10-26 12:20:04 +02:00
public:
CheckSpam(XmlDoc *xd, bool debug=false);
~CheckSpam();
2017-10-26 12:20:04 +02:00
bool init();
bool isDocSpam();
2017-10-26 12:20:04 +02:00
int32_t getScore();
int32_t getNumUniqueMatchedWords();
int32_t getNumUniqueMatchedPhrases();
2017-10-26 12:20:04 +02:00
int32_t getNumWordsChecked();
bool hasEmptyDocumentBody();
const char *getReason();
const char *getDebugInfo();
private:
Url *m_url;
Xml *m_xml;
Words *m_words;
Phrases *m_phrases;
char *m_debbuf;
int m_debbufUsed;
int m_debbufSize;
std::string m_reason;
int32_t m_docMatchScore;
int32_t m_numUniqueMatchedWords;
int32_t m_numUniqueMatchedPhrases;
2017-10-26 12:20:04 +02:00
int32_t m_numWordsChecked;
bool m_emptyDocumentBody;
bool m_resultValid;
bool m_result;
};
// Global TermCheckList instance. Only declared here (extern); the
// definition lives in another translation unit.
// NOTE(review): presumably the term list CheckSpam matches documents
// against -- confirm.
extern TermCheckList g_checkSpamList;
#endif