class documentation

class FilteringLinkExtractor:

Known subclasses: scrapy.linkextractors.lxmlhtml.LxmlLinkExtractor

View In Hierarchy

Undocumented

Method __init__ Undocumented
Method __new__ Undocumented
Method _extract_links Undocumented
Method _link_allowed Undocumented
Method _process_links Undocumented
Method matches Undocumented
Class Variable _csstranslator Undocumented
Instance Variable allow_domains Undocumented
Instance Variable allow_res Undocumented
Instance Variable canonicalize Undocumented
Instance Variable deny_domains Undocumented
Instance Variable deny_extensions Undocumented
Instance Variable deny_res Undocumented
Instance Variable link_extractor Undocumented
Instance Variable restrict_text Undocumented
Instance Variable restrict_xpaths Undocumented
def __init__(self, link_extractor, allow, deny, allow_domains, deny_domains, restrict_xpaths, canonicalize, deny_extensions, restrict_css, restrict_text):

Undocumented

def __new__(cls, *args, **kwargs):

Undocumented

def _extract_links(self, *args, **kwargs):

Undocumented

def _link_allowed(self, link):

Undocumented

def _process_links(self, links):

Undocumented

def matches(self, url):

Undocumented

_csstranslator =

Undocumented

allow_domains =

Undocumented

allow_res =

Undocumented

canonicalize =

Undocumented

deny_domains =

Undocumented

deny_extensions =

Undocumented

deny_res =

Undocumented

link_extractor =

Undocumented

restrict_text =

Undocumented

restrict_xpaths =

Undocumented