51 lines
1.5 KiB
C++
51 lines
1.5 KiB
C++
//
|
|
// Copyright (C) 2017 Privacore ApS - https://www.privacore.com
|
|
//
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Affero General Public License as
|
|
// published by the Free Software Foundation, either version 3 of the
|
|
// License, or (at your option) any later version.
|
|
//
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Affero General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
//
|
|
// License TL;DR: If you change this file, you must publish your changes.
|
|
//
|
|
#ifndef FXTERMCHECKLIST_H_
|
|
#define FXTERMCHECKLIST_H_
|
|
|
|
#include <inttypes.h>
|
|
#include <stddef.h>
|
|
#include <string>
|
|
#include "HashTableX.h"
|
|
|
|
class Phrases;
|
|
class TokenizerResult;
|
|
class Xml;
|
|
class XmlDoc;
|
|
class Url;
|
|
|
|
class TermCheckList {
|
|
public:
|
|
TermCheckList();
|
|
~TermCheckList();
|
|
bool init(const char *fname1, const char *fname2=NULL);
|
|
|
|
bool getScore(const TokenizerResult &tr, Phrases *p, HashTableX *uniqueTermIds, int32_t *docScore, int32_t *numUniqueWords, int32_t *numUniquePhrases, char *debbuf, int32_t &debbuf_used, int32_t debbuf_size);
|
|
|
|
private:
|
|
bool loadScoredTermList(HashTableX *ht, const char *filename);
|
|
|
|
HashTableX m_terms;
|
|
|
|
bool m_initialized;
|
|
};
|
|
|
|
|
|
#endif
|