__init__(self, config, templ=None, domain=None, processorProperties=None) | dc_processor.scrapy_extractor.ScrapyExtractor | |
__repr__(self) | dc_processor.base_extractor.BaseExtractor | |
__str__(self) | dc_processor.base_extractor.BaseExtractor | |
addTag(self, result, tag_name, tag_value, xpath="", isDefaultTag=False, callAdjustment=True, tagType=None, allowNotFilled=False) | dc_processor.base_extractor.BaseExtractor | |
blockedByXpathTags | dc_processor.scrapy_extractor.ScrapyExtractor | |
calculateMetrics(self, response) | dc_processor.base_extractor.BaseExtractor | |
closeVoid | dc_processor.scrapy_extractor.ScrapyExtractor | |
config | dc_processor.base_extractor.BaseExtractor | |
data | dc_processor.base_extractor.BaseExtractor | |
db_dc_scraper_db | dc_processor.base_extractor.BaseExtractor | |
DBConnector | dc_processor.base_extractor.BaseExtractor | |
DISABLE_XPATH_CHARS_LIST | dc_processor.scrapy_extractor.ScrapyExtractor | static |
extractTag(self, tagName, result, template, textHandler=None, delimiter=' ') | dc_processor.scrapy_extractor.ScrapyExtractor | |
extractTags(self, resource, result) | dc_processor.scrapy_extractor.ScrapyExtractor | |
extractTagsForOneTemplate(self, resource, result, template) | dc_processor.scrapy_extractor.ScrapyExtractor | |
generateTemplatesFromRowTemplates(self, rowTemplates, domain=None) | dc_processor.scrapy_extractor.ScrapyExtractor | |
imgDelimiter | dc_processor.base_extractor.BaseExtractor | |
innerTextTagReplacers | dc_processor.scrapy_extractor.ScrapyExtractor | |
isTagNotFilled(self, result, tagName) | dc_processor.base_extractor.BaseExtractor | |
isTagValueNotEmpty(self, tagValue) | dc_processor.base_extractor.BaseExtractor | |
keepAttributes | dc_processor.scrapy_extractor.ScrapyExtractor | |
loadScraperProperties(self, scraperPropFileName) | dc_processor.base_extractor.BaseExtractor | |
modules | dc_processor.base_extractor.BaseExtractor | |
name | dc_processor.scrapy_extractor.ScrapyExtractor | |
pasteLists(self, lhs, rhs) | dc_processor.scrapy_extractor.ScrapyExtractor | |
postExclude | dc_processor.scrapy_extractor.ScrapyExtractor | |
postReplace | dc_processor.scrapy_extractor.ScrapyExtractor | |
process_mode | dc_processor.base_extractor.BaseExtractor | |
processorProperties | dc_processor.base_extractor.BaseExtractor | |
properties | dc_processor.base_extractor.BaseExtractor | static |
rank | dc_processor.base_extractor.BaseExtractor | |
rankReading(self, exctractorName) | dc_processor.base_extractor.BaseExtractor | |
resource | dc_processor.scrapy_extractor.ScrapyExtractor | |
sel | dc_processor.scrapy_extractor.ScrapyExtractor | |
SELF_NAME | dc_processor.scrapy_extractor.ScrapyExtractor | static |
tag | dc_processor.base_extractor.BaseExtractor | static |
tagsMask | dc_processor.base_extractor.BaseExtractor | static |
tagsValidator | dc_processor.base_extractor.BaseExtractor | |
tagValueElemValidate(self, tagValueElem, conditionElem) | dc_processor.base_extractor.BaseExtractor | |
tagValueValidate(self, tagName, tagValue) | dc_processor.base_extractor.BaseExtractor | |
TEMPLATE_FILE_RULE_EXCLUDE | dc_processor.scrapy_extractor.ScrapyExtractor | static |
TEMPLATE_FILE_RULE_REPLACE | dc_processor.scrapy_extractor.ScrapyExtractor | static |
TEMPLATE_FILE_RULE_XPATH | dc_processor.scrapy_extractor.ScrapyExtractor | static |
templateLoad(self, config, templ=None, domain=None) | dc_processor.scrapy_extractor.ScrapyExtractor | |
templatePreparer(self, jsonBuf, domains, globalTemplate) | dc_processor.scrapy_extractor.ScrapyExtractor | |
templates | dc_processor.scrapy_extractor.ScrapyExtractor | |