HCE Project: Python-language Distributed Tasks Manager application, Distributed Crawler application, and client API bindings.
2.0.0-chaika
Hierarchical Cluster Engine Python language binding
|
Public Member Functions | |
def | __init__ (self, keyValueStorageDir, rawDataDir, dBDataTask, siteTask=None) |
def | newSiteCreate (self, initUrl, queryCallback) |
def | fillSiteRelatedFields (self, urlObj, queryCallback) |
def | resolveSiteIdByURL (self, url, queryCallback) |
def | calcSiteIdByUrl (self, url) |
def | siteTableOperation (self, urlObj, queryCallback) |
def | process (self, urls, queryCallback) |
def | urlInsertWithGoodSietId (self, urlObj, statusInit, queryCallback) |
def | selectURL (self, urlObject, queryCallback) |
def | addURL (self, urlObject, queryCallback) |
def | attributesSet (self, attributes, queryCallback) |
Public Member Functions inherited from dc_db.BaseTask.BaseTask | |
def | isSiteExist (self, siteId, queryCallback, userId=None) |
def | generateCriterionSQL (self, criterions, additionWhere=None, siteId=None) |
def | fetchByCriterions (self, criterions, queryCallback) |
def | dbLock (self, mutexName, queryCallback, sleepTime=1, mutexLockTTL=Constants.DEFAULT_LOCK_TTL) |
def | dbUnlock (self, mutexName, queryCallback) |
def | createUrlsInsertQuery (self, siteId, localKeys, localValues) |
def | copyUrlsToDcUrls (self, siteId, queryCallback) |
def | statisticLogUpdate (self, localObj, urlMd5, siteId, status, queryCallback, isInsert=False) |
def | calculateMd5FormUrl (self, url, urlType, useNormilize=False) |
Public Attributes | |
siteTask | |
recalculator | |
urlMd5 | |
urlUpdateTask | |
Static Public Attributes | |
int | CODE_GOOD_INSERT = 0 |
int | CODE_BAD_INSERT = 1 |
int | CODE_ALREADY_EXIST = 2 |
Additional Inherited Members | |
Static Public Member Functions inherited from dc_db.BaseTask.BaseTask | |
def | readValueFromSiteProp (siteId, propName, queryCallback, urlMd5=None) |
Definition at line 24 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.__init__(self, keyValueStorageDir, rawDataDir, dBDataTask, siteTask=None)
Definition at line 32 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.addURL(self, urlObject, queryCallback)
Definition at line 210 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.attributesSet(self, attributes, queryCallback)
Definition at line 229 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.calcSiteIdByUrl(self, url)
def dc_db.URLNewTask.URLNewTask.fillSiteRelatedFields(self, urlObj, queryCallback)
Definition at line 55 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.newSiteCreate(self, initUrl, queryCallback)
Definition at line 44 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.process(self, urls, queryCallback)
Definition at line 134 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.resolveSiteIdByURL(self, url, queryCallback)
def dc_db.URLNewTask.URLNewTask.selectURL(self, urlObject, queryCallback)
def dc_db.URLNewTask.URLNewTask.siteTableOperation(self, urlObj, queryCallback)
Definition at line 96 of file URLNewTask.py.
def dc_db.URLNewTask.URLNewTask.urlInsertWithGoodSietId(self, urlObj, statusInit, queryCallback)
Definition at line 165 of file URLNewTask.py.
int dc_db.URLNewTask.URLNewTask.CODE_ALREADY_EXIST = 2 [static]
Definition at line 28 of file URLNewTask.py.
int dc_db.URLNewTask.URLNewTask.CODE_BAD_INSERT = 1 [static]
Definition at line 27 of file URLNewTask.py.
int dc_db.URLNewTask.URLNewTask.CODE_GOOD_INSERT = 0 [static]
Definition at line 26 of file URLNewTask.py.
dc_db.URLNewTask.URLNewTask.recalculator |
Definition at line 35 of file URLNewTask.py.
dc_db.URLNewTask.URLNewTask.siteTask |
Definition at line 34 of file URLNewTask.py.
dc_db.URLNewTask.URLNewTask.urlMd5 |
Definition at line 36 of file URLNewTask.py.
dc_db.URLNewTask.URLNewTask.urlUpdateTask |
Definition at line 37 of file URLNewTask.py.