Fix a couple of core dumps.

This commit is contained in:
Matt Wells
2013-10-07 11:59:07 -07:00
parent 3780789201
commit 0b338161e4
3 changed files with 20 additions and 4 deletions

@ -1080,7 +1080,7 @@ bool printDiffbotDropDown ( SafeBuf *sb,char *name,char *THIS , SafeBuf *sx) {
//char *p = cr->m_diffbotApiList.getBufStart();
char *p =
"None|none,"
"All|http://www.diffbot.com/api/analzye?mode=auto&url=,"
"All|http://www.diffbot.com/api/analyze?mode=auto,"
"Article (autodetect)|http://www.diffbot.com/api/analyze?mode=article,"
"Article (force)|http://www.diffbot.com/api/article?,"
"Product (autodetect)|http://www.diffbot.com/api/analyze?mode=product,"

@ -185,6 +185,13 @@ void RdbDump::doneDumping ( ) {
"db: Dumped %li positive and %li negative recs. Total = %li.",
m_totalPosDumped , m_totalNegDumped ,
m_totalPosDumped + m_totalNegDumped );
// map verify
log("db: map # pos=%lli neg=%lli",
m_map->getNumPositiveRecs(),
m_map->getNumNegativeRecs()
);
// free the list's memory
if ( m_list ) m_list->freeList();
// reset verify buffer
@ -567,6 +574,10 @@ bool RdbDump::dumpList ( RdbList *list , long niceness , bool recall ) {
// write thread is out
m_writing = true;
//m_bytesWritten = 0;
// sanity check
log("dump: writing %li bytes at offset %lli",m_bytesToWrite,offset);
// . if we're called by RdbMerge directly use m_callback/m_state
// . otherwise, use doneWritingWrapper() which will call dumpTree()
// . BigFile::write() returns 0 if blocked, -1 on error, >0 on completion

@ -11836,10 +11836,13 @@ void gotDiffbotReplyWrapper ( void *state , TcpSocket *s ) {
XmlDoc *THIS = (XmlDoc *)state;
bool hadError = false;
// wha?
if ( g_errno ) {
log("diffbot: http error2 %s",mstrerror(g_errno));
THIS->m_diffbotReplyError = g_errno;
hadError = true;
}
//char *buf = s->m_readBuf;
@ -11847,8 +11850,6 @@ void gotDiffbotReplyWrapper ( void *state , TcpSocket *s ) {
// is now responsible for that
//s->m_readBuf = NULL;
bool hadError = false;
// set the mime
HttpMime mime;
if ( s->m_readOffset>0 &&
@ -11859,6 +11860,7 @@ void gotDiffbotReplyWrapper ( void *state , TcpSocket *s ) {
// note it
log("xmldoc: error setting diffbot mime");
THIS->m_diffbotReplyError = EDIFFBOTMIMEERROR;
hadError = true;
}
// check the status
@ -11866,6 +11868,7 @@ void gotDiffbotReplyWrapper ( void *state , TcpSocket *s ) {
THIS->m_diffbotReplyError = EDIFFBOTBADHTTPSTATUS;
log("xmldoc: diffbot reply mime was %li",
mime.getHttpStatus());
hadError = true;
}
@ -11894,7 +11897,9 @@ void gotDiffbotReplyWrapper ( void *state , TcpSocket *s ) {
// count it for stats
THIS->m_cr->m_localCrawlInfo.m_pageProcessSuccesses++;
// log it
log("build: processed page %s",THIS->m_firstUrl.m_url);
log("build: processed page %s (pageLen=%li)",
THIS->m_firstUrl.m_url,
pageLen);
// sanity!
// crap, this can happen if we try to get the metalist
// of an old page for purposes of incremental indexing or