HCE Project Python language Distributed Tasks Manager Application, Distributed Crawler Application and client API bindings.
2.0.0-chaika
Hierarchical Cluster Engine Python language binding
|
Classes | |
class | StatFreqConstants |
Functions | |
def | readDataTimeField (fName, row) |
def | stripSymbol (incomeStr, symbol=None) |
def | getFieldsValuesTuple (obj, inputDict, excludeList=None) |
def | cleateFieldsValuesLists (fields, values) |
def | createFieldsValuesString (fields, values, excludeList=None) |
Variables | |
string | APP_NAME = "db-task" |
int | DEFAULT_LOCK_TTL = 600 |
int | DB_DATA_KVDB = 0 |
int | DB_DATA_MYSQL = 1 |
int | TASK_DUPLICATE_ERR = 2020 |
string | TASK_DUPLICATE_ERR_MSG = "Duplicate site" |
int | TASK_SQL_ERR = 2021 |
string | TASK_SQL_ERR_MSG = "Some SQL error, look log file for details" |
int | EXEC_INDEX = 0 |
int | EXEC_NAME = 1 |
string | PRIMARY_DB_ID = "primaryDB" |
string | SECONDARY_DB_ID = "secondaryDB" |
string | THIRD_DB_ID = "thirdDB" |
string | FOURTH_DB_ID = "fourthDB" |
string | FIFTH_DB_ID = "fifthDB" |
string | STAT_DB_ID = "statDB" |
string | LOG_DB_ID = "logDB" |
string | ATT_DB_ID = "attDB" |
string | STAT_DOMAINS_DB_ID = "statDomainsDB" |
string | DB_STORAGE_TABLE_NAME = "articles" |
int | DB_LOCK_APPLICATION_ID = 0 |
string | FETCH_LOCK_NAME = "SELECT_LOCK" |
string | COMA_SEPARATOR = "," |
string | FIELD_QUOTE_SEPARATOR = "`" |
int | EXIT_CODE_OK = 0 |
int | EXIT_CODE_CONFIG_ERROR = 1 |
int | EXIT_CODE_GLOBAL_ERROR = 2 |
int | EXIT_CODE_MYSQL_ERROR = 3 |
LOGGER_NAME = APP_CONSTS.LOGGER_NAME | |
string | DC_SITES = "dc_sites" |
string | DC_URLS = "dc_urls" |
string | DC_URLS_TABLE_NAME_TEMPLATE = "urls_%s" |
string | URL_URL_SQL_UPDATE = 'UPDATE ' + DC_URLS_TABLE_NAME_TEMPLATE + ' SET %s WHERE' |
string | URL_URL_SQL_SELECT_COUNT = 'SELECT COUNT(*) FROM ' + DC_URLS_TABLE_NAME_TEMPLATE + ' WHERE ' |
string | DC_CONTENTS_TABLE_NAME_TEMPLATE = "contents_%s" |
string | DC_FREQ_TABLE_NAME_TEMPLATE = "freq_%s" |
string | DC_LOG_TABLE_NAME_TEMPLATE = "log_%s" |
string | DC_ATT_TABLE_NAME_TEMPLATE = "att_%s" |
string | USE_SQL_TEMPLATE = "USE `%s`" |
string | SELECT_DB_STORAGE = "SELECT * FROM `%s` WHERE Id = '%s'" |
string | INSERT_COMMON_TEMPLATE = "INSERT INTO `%s` SET %s" |
string | SITE_SQL_TEMPLATE = "INSERT INTO `sites` %s VALUES %s" |
string | SITE_FILTER_SQL_TEMPLATE |
string | SITE_FILTER_SQL_UPDATE |
string | SITE_PROP_SQL_TEMPLATE = "INSERT INTO `sites_properties` SET `Site_Id`='%s', `Name`='%s', `Value`='%s'" |
string | SITE_PROP_SQL_ADDITIONS = ", `URLMD5`='%s'" |
string | SITE_PROP_SQL_SHOT = "INSERT INTO `sites_properties` SET %s" |
string | SITE_PROP_SQL_UPDATE = "UPDATE `sites_properties` SET %s WHERE `Site_Id`='%s' AND `Name`='%s'" |
string | SITE_URL_SQL_TEMPLATE = "INSERT INTO `sites_urls` SET %s" |
string | SITE_URL_SQL_UPDATE = "UPDATE `sites_urls` SET %s WHERE `Site_Id`='%s'" |
string | SITE_URL_SQL_SELECT_COUNT = 'SELECT COUNT(*) FROM `sites_urls` WHERE ' |
string | DEL_BY_ID_QUERY_TEMPLATE = "DELETE FROM `%s` WHERE `Site_Id` = '%s'" |
string | SQL_CHECK_TABLE_EXIST_TEMPLATE |
string | DC_SITE_URL_SQL_TEMPLATE = "INSERT INTO `%s` (`Site_Id`, `URL`) VALUES('%s', '%s')" |
string | SELECT_SQL_TEMPLATE = """ SELECT * FROM `%s` WHERE %s""" |
string | SELECT_SQL_TEMPLATE_SIMPLE = """ SELECT %s FROM `%s`""" |
string | SELECT_SITE_ID_BY_URL |
string | CHECK_TABLE_SQL_ADDITION = "`User_Id` = %s" |
string | SQL_CREATE_QUERY_TEMPLATE = "CREATE TABLE IF NOT EXISTS `%s` LIKE dc_urls.%s" |
string | CHECK_TABLE_SQL_TEMPLATE = " SELECT COUNT(*) FROM sites WHERE `Id` = '%s'" |
string | KEY_VALUE_FILE_NAME_TEMPLATE = "%s.db" |
logOperationsDict | |
siteDict | |
list | siteExcludeList = ["Id"] |
propDict | |
filterDict | |
URLTableDict | |
ProxyTableDict | |
AttrTableDict | |
list | urlExcludeList = ["URL", "URLMd5"] |
list | proxyExcludeList = ["Id", "Site_Id", "Host", "CDate"] |
SiteURLTableDitct = dict(URLTableDict.items() + {"userId": "User_Id"}.items()) | |
dictionary | DbContentFields |
string | SITE_ID_NAME = "SITE_ID" |
@package: dc @author igor @link: http://hierarchical-cluster-engine.com/ @copyright: Copyright © 2013-2014 IOIX Ukraine @license: http://hierarchical-cluster-engine.com/license/ @since: 0.1
def dc_db.Constants.cleateFieldsValuesLists(fields, values)
Definition at line 337 of file Constants.py.
def dc_db.Constants.createFieldsValuesString(fields, values, excludeList=None)
Definition at line 357 of file Constants.py.
def dc_db.Constants.getFieldsValuesTuple(obj, inputDict, excludeList=None)
Definition at line 307 of file Constants.py.
def dc_db.Constants.readDataTimeField(fName, row)
Definition at line 282 of file Constants.py.
def dc_db.Constants.stripSymbol(incomeStr, symbol=None)
string dc_db.Constants.APP_NAME = "db-task" |
Definition at line 13 of file Constants.py.
string dc_db.Constants.ATT_DB_ID = "attDB" |
Definition at line 34 of file Constants.py.
dc_db.Constants.AttrTableDict |
Definition at line 260 of file Constants.py.
string dc_db.Constants.CHECK_TABLE_SQL_ADDITION = "`User_Id` = %s" |
Definition at line 95 of file Constants.py.
string dc_db.Constants.CHECK_TABLE_SQL_TEMPLATE = " SELECT COUNT(*) FROM sites WHERE `Id` = '%s'" |
Definition at line 99 of file Constants.py.
string dc_db.Constants.COMA_SEPARATOR = "," |
Definition at line 42 of file Constants.py.
int dc_db.Constants.DB_DATA_KVDB = 0 |
Definition at line 16 of file Constants.py.
int dc_db.Constants.DB_DATA_MYSQL = 1 |
Definition at line 17 of file Constants.py.
int dc_db.Constants.DB_LOCK_APPLICATION_ID = 0 |
Definition at line 39 of file Constants.py.
string dc_db.Constants.DB_STORAGE_TABLE_NAME = "articles" |
Definition at line 37 of file Constants.py.
dictionary dc_db.Constants.DbContentFields |
Definition at line 271 of file Constants.py.
string dc_db.Constants.DC_ATT_TABLE_NAME_TEMPLATE = "att_%s" |
Definition at line 64 of file Constants.py.
string dc_db.Constants.DC_CONTENTS_TABLE_NAME_TEMPLATE = "contents_%s" |
Definition at line 61 of file Constants.py.
string dc_db.Constants.DC_FREQ_TABLE_NAME_TEMPLATE = "freq_%s" |
Definition at line 62 of file Constants.py.
string dc_db.Constants.DC_LOG_TABLE_NAME_TEMPLATE = "log_%s" |
Definition at line 63 of file Constants.py.
string dc_db.Constants.DC_SITE_URL_SQL_TEMPLATE = "INSERT INTO `%s` (`Site_Id`, `URL`) VALUES('%s', '%s')" |
Definition at line 89 of file Constants.py.
string dc_db.Constants.DC_SITES = "dc_sites" |
Definition at line 54 of file Constants.py.
string dc_db.Constants.DC_URLS = "dc_urls" |
Definition at line 55 of file Constants.py.
string dc_db.Constants.DC_URLS_TABLE_NAME_TEMPLATE = "urls_%s" |
Definition at line 58 of file Constants.py.
int dc_db.Constants.DEFAULT_LOCK_TTL = 600 |
Definition at line 14 of file Constants.py.
string dc_db.Constants.DEL_BY_ID_QUERY_TEMPLATE = "DELETE FROM `%s` WHERE `Site_Id` = '%s'" |
Definition at line 85 of file Constants.py.
int dc_db.Constants.EXEC_INDEX = 0 |
Definition at line 24 of file Constants.py.
int dc_db.Constants.EXEC_NAME = 1 |
Definition at line 25 of file Constants.py.
int dc_db.Constants.EXIT_CODE_CONFIG_ERROR = 1 |
Definition at line 46 of file Constants.py.
int dc_db.Constants.EXIT_CODE_GLOBAL_ERROR = 2 |
Definition at line 47 of file Constants.py.
int dc_db.Constants.EXIT_CODE_MYSQL_ERROR = 3 |
Definition at line 48 of file Constants.py.
int dc_db.Constants.EXIT_CODE_OK = 0 |
Definition at line 45 of file Constants.py.
string dc_db.Constants.FETCH_LOCK_NAME = "SELECT_LOCK" |
Definition at line 40 of file Constants.py.
string dc_db.Constants.FIELD_QUOTE_SEPARATOR = "`" |
Definition at line 43 of file Constants.py.
string dc_db.Constants.FIFTH_DB_ID = "fifthDB" |
Definition at line 31 of file Constants.py.
dc_db.Constants.filterDict |
Definition at line 177 of file Constants.py.
string dc_db.Constants.FOURTH_DB_ID = "fourthDB" |
Definition at line 30 of file Constants.py.
string dc_db.Constants.INSERT_COMMON_TEMPLATE = "INSERT INTO `%s` SET %s" |
Definition at line 70 of file Constants.py.
string dc_db.Constants.KEY_VALUE_FILE_NAME_TEMPLATE = "%s.db" |
Definition at line 103 of file Constants.py.
string dc_db.Constants.LOG_DB_ID = "logDB" |
Definition at line 33 of file Constants.py.
dc_db.Constants.LOGGER_NAME = APP_CONSTS.LOGGER_NAME |
Definition at line 51 of file Constants.py.
dc_db.Constants.logOperationsDict |
Definition at line 117 of file Constants.py.
string dc_db.Constants.PRIMARY_DB_ID = "primaryDB" |
Definition at line 27 of file Constants.py.
dc_db.Constants.propDict |
Definition at line 168 of file Constants.py.
list dc_db.Constants.proxyExcludeList = ["Id", "Site_Id", "Host", "CDate"] |
Definition at line 267 of file Constants.py.
dc_db.Constants.ProxyTableDict |
Definition at line 235 of file Constants.py.
string dc_db.Constants.SECONDARY_DB_ID = "secondaryDB" |
Definition at line 28 of file Constants.py.
string dc_db.Constants.SELECT_DB_STORAGE = "SELECT * FROM `%s` WHERE Id = '%s'" |
Definition at line 68 of file Constants.py.
string dc_db.Constants.SELECT_SITE_ID_BY_URL |
Definition at line 93 of file Constants.py.
string dc_db.Constants.SELECT_SQL_TEMPLATE = """ SELECT * FROM `%s` WHERE %s""" |
Definition at line 91 of file Constants.py.
string dc_db.Constants.SELECT_SQL_TEMPLATE_SIMPLE = """ SELECT %s FROM `%s`""" |
Definition at line 92 of file Constants.py.
string dc_db.Constants.SITE_FILTER_SQL_TEMPLATE |
Definition at line 73 of file Constants.py.
string dc_db.Constants.SITE_FILTER_SQL_UPDATE |
Definition at line 75 of file Constants.py.
string dc_db.Constants.SITE_ID_NAME = "SITE_ID" |
Definition at line 274 of file Constants.py.
string dc_db.Constants.SITE_PROP_SQL_ADDITIONS = ", `URLMD5`='%s'" |
Definition at line 78 of file Constants.py.
string dc_db.Constants.SITE_PROP_SQL_SHOT = "INSERT INTO `sites_properties` SET %s" |
Definition at line 79 of file Constants.py.
string dc_db.Constants.SITE_PROP_SQL_TEMPLATE = "INSERT INTO `sites_properties` SET `Site_Id`='%s', `Name`='%s', `Value`='%s'" |
Definition at line 77 of file Constants.py.
string dc_db.Constants.SITE_PROP_SQL_UPDATE = "UPDATE `sites_properties` SET %s WHERE `Site_Id`='%s' AND `Name`='%s'" |
Definition at line 80 of file Constants.py.
string dc_db.Constants.SITE_SQL_TEMPLATE = "INSERT INTO `sites` %s VALUES %s" |
Definition at line 71 of file Constants.py.
string dc_db.Constants.SITE_URL_SQL_SELECT_COUNT = 'SELECT COUNT(*) FROM `sites_urls` WHERE ' |
Definition at line 83 of file Constants.py.
string dc_db.Constants.SITE_URL_SQL_TEMPLATE = "INSERT INTO `sites_urls` SET %s" |
Definition at line 81 of file Constants.py.
string dc_db.Constants.SITE_URL_SQL_UPDATE = "UPDATE `sites_urls` SET %s WHERE `Site_Id`='%s'" |
Definition at line 82 of file Constants.py.
dc_db.Constants.siteDict |
Definition at line 131 of file Constants.py.
list dc_db.Constants.siteExcludeList = ["Id"] |
Definition at line 166 of file Constants.py.
dc_db.Constants.SiteURLTableDitct = dict(URLTableDict.items() + {"userId": "User_Id"}.items()) |
Definition at line 269 of file Constants.py.
string dc_db.Constants.SQL_CHECK_TABLE_EXIST_TEMPLATE |
Definition at line 87 of file Constants.py.
string dc_db.Constants.SQL_CREATE_QUERY_TEMPLATE = "CREATE TABLE IF NOT EXISTS `%s` LIKE dc_urls.%s" |
Definition at line 96 of file Constants.py.
string dc_db.Constants.STAT_DB_ID = "statDB" |
Definition at line 32 of file Constants.py.
string dc_db.Constants.STAT_DOMAINS_DB_ID = "statDomainsDB" |
Definition at line 35 of file Constants.py.
int dc_db.Constants.TASK_DUPLICATE_ERR = 2020 |
Definition at line 19 of file Constants.py.
string dc_db.Constants.TASK_DUPLICATE_ERR_MSG = "Duplicate site" |
Definition at line 20 of file Constants.py.
int dc_db.Constants.TASK_SQL_ERR = 2021 |
Definition at line 21 of file Constants.py.
string dc_db.Constants.TASK_SQL_ERR_MSG = "Some SQL error, look log file for details" |
Definition at line 22 of file Constants.py.
string dc_db.Constants.THIRD_DB_ID = "thirdDB" |
Definition at line 29 of file Constants.py.
string dc_db.Constants.URL_URL_SQL_SELECT_COUNT = 'SELECT COUNT(*) FROM ' + DC_URLS_TABLE_NAME_TEMPLATE + ' WHERE ' |
Definition at line 60 of file Constants.py.
string dc_db.Constants.URL_URL_SQL_UPDATE = 'UPDATE ' + DC_URLS_TABLE_NAME_TEMPLATE + ' SET %s WHERE' |
Definition at line 59 of file Constants.py.
list dc_db.Constants.urlExcludeList = ["URL", "URLMd5"] |
Definition at line 266 of file Constants.py.
dc_db.Constants.URLTableDict |
Definition at line 192 of file Constants.py.
string dc_db.Constants.USE_SQL_TEMPLATE = "USE `%s`" |
Definition at line 67 of file Constants.py.