HCE Project Python language Distributed Tasks Manager Application, Distributed Crawler Application and client API bindings.
2.0.0-chaika
Hierarchical Cluster Engine Python language binding
Public Member Functions
def __init__(self, config, templ=None, domain=None, processorProperties=None)
def __str__(self)
def __repr__(self)
def loadScraperProperties(self, scraperPropFileName)
def isTagNotFilled(self, result, tagName)
def isTagValueNotEmpty(self, tagValue)
def tagValueElemValidate(self, tagValueElem, conditionElem)
def tagValueValidate(self, tagName, tagValue)
def addTag(self, result, tag_name, tag_value, xpath="", isDefaultTag=False, callAdjustment=True, tagType=None, allowNotFilled=False)
def calculateMetrics(self, response)
def rankReading(self, exctractorName)
Public Attributes
config
processorProperties
name
rank
process_mode
modules
data
db_dc_scraper_db
DBConnector
imgDelimiter
tagsValidator
Static Public Attributes
properties = None
dictionary tag
dictionary tagsMask
Definition at line 101 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.__init__(self, config, templ=None, domain=None, processorProperties=None)
Definition at line 161 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.__repr__(self)
Definition at line 197 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.__str__(self)
Definition at line 193 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.addTag(self, result, tag_name, tag_value, xpath="", isDefaultTag=False, callAdjustment=True, tagType=None, allowNotFilled=False)
Definition at line 291 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.calculateMetrics(self, response)
Definition at line 331 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.isTagNotFilled(self, result, tagName)
def dc_processor.base_extractor.BaseExtractor.isTagValueNotEmpty(self, tagValue)
def dc_processor.base_extractor.BaseExtractor.loadScraperProperties(self, scraperPropFileName)
Definition at line 205 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.rankReading(self, exctractorName)
Definition at line 343 of file base_extractor.py.
def dc_processor.base_extractor.BaseExtractor.tagValueElemValidate(self, tagValueElem, conditionElem)
def dc_processor.base_extractor.BaseExtractor.tagValueValidate(self, tagName, tagValue)
Definition at line 268 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.config |
Definition at line 162 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.data |
Definition at line 177 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.db_dc_scraper_db |
Definition at line 178 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.DBConnector |
Definition at line 179 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.imgDelimiter |
Definition at line 181 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.modules |
Definition at line 175 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.name |
Definition at line 170 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.process_mode |
Definition at line 174 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.processorProperties |
Definition at line 163 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.properties = None [static]
Definition at line 103 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.rank |
Definition at line 171 of file base_extractor.py.
dictionary dc_processor.base_extractor.BaseExtractor.tag [static]
Definition at line 105 of file base_extractor.py.
dictionary dc_processor.base_extractor.BaseExtractor.tagsMask [static]
Definition at line 124 of file base_extractor.py.
dc_processor.base_extractor.BaseExtractor.tagsValidator |
Definition at line 184 of file base_extractor.py.