Merge branch 'diffbot' into diffbot-testing

This commit is contained in:
Matt Wells
2014-05-28 09:59:39 -07:00
2 changed files with 8 additions and 3 deletions

@ -468,14 +468,17 @@ geo_ip_table.o: geo_ip_table.cpp geo_ip_table.h
# move this tarball into ~/rpmbuild/SOURCES/
# then run rpmbuild -ba gb-1.0.spec to build the rpms
# rpm --nodeps --ignorearch -ivh gb-1.0-... to install the pkg
# rpm -ivh gb-1.0-... to install the pkg
tarball-testing:
# git archive --format=tar master | gzip > gb.tar
git archive --format=tar --prefix=gb-1.0/ testing > gb-1.0.tar
tarball-master:
master-rpm:
# git archive --format=tar master | gzip > gb.tar
git archive --format=tar --prefix=gb-1.0/ master > gb-1.0.tar
mv gb-1.0.tar /home/mwells/rpmbuild/SOURCES/
rpmbuild -ba gb-1.0.spec
scp /home/mwells/rpmbuild/RPMS/x86_64/gb-*rpm www.gigablast.com:/w/html/
install:
# gigablast will copy over the necessary files. it has a list of the

@ -1300,7 +1300,9 @@ bool XmlDoc::set4 ( SpiderRequest *sreq ,
// now we can have url-based page reindex requests, because when we
// get a reindex request for a diffbot json object's fake url we add
// a spider request for its PARENT url as a page reindex
if ( is_digit ( sreq->m_url[0] ) ) {
//if ( is_digit ( sreq->m_url[0] ) ) {
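// watch out for 0.r.msn.com!! a real url can start with a digit too,
// so checking only the first char is not enough to tell it is a docid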
if ( sreq->m_urlIsDocId ) {
m_docId = atoll(sreq->m_url);
// assume it's good
m_docIdValid = true;