Python Examples of HTMLParser.HTMLParser.__init_

Source File: scraping.py From cryptocurrency_arbitrage with GNU General Public License v3.0

6 votes

def __init__(self):
        HTMLParser.__init__(self)
        self.messageId = None
        self.messageTime = None
        self.messageUser = None
        self.messageText = None
        self.messages = []
        self.reserves24change = None
        self.reservesALFAcashier = None
        self.usersOnline = None
        self.botsOnline = None

        self.inMessageA = False
        self.inMessageSpan = False
        self.in24changeSpan = False
        self.inALFAcashierSpan = False
        self.inUsersOnlineDiv = False

        self.devOnline = False
        self.supportOnline = False
        self.adminOnline = False

Source File: build_perf.py From fplutil with Apache License 2.0

6 votes

def __init__(self, error, command, returnstatus, stdout=None, stderr=None):
    """Initialize this instance.

    Args:
      error: Error message.
      command: Command that failed.
      returnstatus: Status of the command that failed.
      stdout: Standard output stream of the failed command.
      stderr: Standard error stream of the failed command.
    """
    super(CommandError, self).__init__(error)
    self.command = command
    self.returnstatus = returnstatus
    self.stdout = stdout
    self.stderr = stderr
    self.error = error

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

6 votes

def __init__(self, data):
        """
        The data holds the characters.

        Example:

        html = Html()
        data = '<body><em>alpha</em></body>'
        dom = html.feed(data)
        x = dom.fst('em')
        x.append(Data('\nbeta'))

        It outputs.

        <body ><em >alpha
        beta</em></body>
        """

        Root.__init__(self, DATA)
        self.data = data

Source File: Formatter.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

6 votes

def __init__(self, *args, **kwargs):
        '''
            __init__ - Create an AdvancedTagSlim object.

                @see AdvancedTag

                Extra arguments:

                  slimSelfClosing <bool> default False - If True, will use slim-endings on self-closing tags,

                    i.e. <br/> instead of <br />

                    This may break xhtml compatibility but modern browsers are okay with it.
        '''
        if 'slimSelfClosing' in kwargs:
            slimSelfClosing = kwargs.pop('slimSelfClosing')
        else:
            slimSelfClosing = False
        AdvancedTag.__init__(self, *args, **kwargs)

        object.__setattr__(self, 'slimSelfClosing', slimSelfClosing)

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

5 votes

def __init__(self, data):
        Root.__init__(self, META)
        self.data = data

Source File: scraping.py From cryptocurrency_arbitrage with GNU General Public License v3.0

5 votes

def __init__(self):
        self.messages = None
        self.reserves24change = None
        self.reservesALFAcashier = None
        self.usersOnline = None
        self.botsOnline = None
        self.devOnline = False
        self.supportOnline = False
        self.adminOnline = False

Source File: prettytable.py From smod-1 with GNU General Public License v2.0

5 votes

def __init__(self, **kwargs):
        HTMLParser.__init__(self)
        self.kwargs = kwargs
        self.tables = []
        self.last_row = []
        self.rows = []
        self.max_row_width = 0
        self.active = None
        self.last_content = ""
        self.is_last_row_header = False

Source File: paraparser.py From Fluid-Designer with GNU General Public License v3.0

5 votes

def __init__(self,v):
        self._value = v*0.01

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

5 votes

def __init__(self, data):
        Root.__init__(self, COMMENT)
        self.data = data

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

5 votes

def __init__(self, name, attr=None):
        """
        See help(Tag).
        """
        if attr is None:
            attr = {}
        Root.__init__(self, name, attr)

Source File: gencon-hotel-check.py From gencon-hotel-check with GNU General Public License v3.0

5 votes

def __init__(self, resp):
		HTMLParser.__init__(self)
		self.json = None
		self.feed(resp.read().decode('utf8'))
		self.close()

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

5 votes

def __init__(self, data):
        Root.__init__(self, AMP)
        self.data = data

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

5 votes

def __init__(self, data):
        Root.__init__(self, PI)
        self.data = data

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

5 votes

def __init__(self):
        HTMLParser.__init__(self)
        self.structure = Tree()

Source File: recipe-576884.py From code with MIT License

5 votes

def __init__(self, starting_url, depth, max_span):
        HTMLParser.__init__(self)
        self.url = starting_url
        self.db = {self.url: 1}
        self.node = [self.url]

        self.depth = depth # recursion depth max
        self.max_span = max_span # max links obtained per url
        self.links_found = 0

Source File: build_perf.py From fplutil with Apache License 2.0

5 votes

def __init__(self):
    """Initialize this instance."""
    HTMLParser.__init__(self)
    self.tables = collections.defaultdict(list)
    self.reset_parse_state()

Source File: ehp.py From script.elementum.burst with Do What The F*ck You Want To Public License

5 votes

def __init__(self, name, attr=None):
        """
        The parameter name is the xml/html tag's name.

        Example:

        d = {'style': 'background:blue;'}
        x = Tag('p', d)
        """
        if attr is None:
            attr = {}
        Root.__init__(self, name, attr)

Source File: prettytable.py From Hatkey with GNU General Public License v3.0

5 votes

def __init__(self, **kwargs):
        HTMLParser.__init__(self)
        self.kwargs = kwargs
        self.tables = []
        self.last_row = []
        self.rows = []
        self.max_row_width = 0
        self.active = None
        self.last_content = ""
        self.is_last_row_header = False

Source File: parser.py From webtech with GNU Lesser General Public License v3.0

5 votes

def __init__(self):
        HTMLParser.__init__(self)
        self.meta = {}
        self.scripts = []

Source File: gsearch.py From Google-Alfred3-Workflow with MIT License

5 votes

def __init__(self):
        HTMLParser.__init__(self)
        self.result_info = []
        self.link = ''
        self.title = ''

Source File: gsearch.py From Google-Alfred3-Workflow with MIT License

5 votes

def __init__(self, query, port):

        self.query = query.encode('utf-8')
        self.url = u"http://www.google.com/search?" + \
            urlencode({'q': self.query}) + u"&pws=0&gl=us&gws_rd=cr"
        self.header = 'Mozilla/5.001 (windows; U; NT4.0; en-US; rv:1.0) Gecko/25250101'
        self.SOCKS5_PROXY_HOST = '127.0.0.1'
        self.SOCKS5_PROXY_PORT = port

Source File: Formatter.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

5 votes

def __init__(self, encoding='utf-8', slimSelfClosing=False):
        '''
            __init__ - Create an AdvancedHTMLSlimTagMiniFormatter

                @see AdvancedHTMLMiniFormatter

                @param slimSelfClosing <bool> Default False - If True, will use slim self-closing tags,

                    e.x. <br /> becomes <br/>
        '''

        AdvancedHTMLMiniFormatter.__init__(self, encoding=encoding)

        self.slimSelfClosing = slimSelfClosing

Source File: Formatter.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

5 votes

def __init__(self, indent='    ', encoding='utf-8', slimSelfClosing=False):
        '''
            __init__ - Construct an AdvancedHTMLSlimTagFormatter

                @see AdvancedHTMLFormatter

                @param slimSelfClosing <bool> Default False - If True, will use slim self-closing tags,

                    e.x. <br /> becomes <br/>
        '''

        AdvancedHTMLFormatter.__init__(self, indent=indent, encoding=encoding)

        self.slimSelfClosing = slimSelfClosing

Source File: Formatter.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

5 votes

def __init__(self, indent='  ', encoding='utf-8'):
        '''
            Create a pretty formatter.

            @param indent <str/int>, Default '    ' [4 spaces] - Either a space/tab/newline that represents one level of indent, or an integer to use that number of spaces

            @param encoding <str/None>, Default 'utf-8', - Use this encoding for the document. None to not mess with encoding
        '''
        HTMLParser.__init__(self)

        # Do not automatically convert charrefs in python3
        self.convert_charrefs = False

        self.parsedData = []
        self.reset = self._reset
        self.decl = None
        self.currentIndentLevel = 0
        self.indent = indent
        self.encoding = encoding

        self.inPreformatted = 0

        self.root = None

        self._inTag = []
        self.doctype = None

Source File: Parser.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

5 votes

def _reset(self):
        '''
            _reset - reset this object. Assigned to .reset after __init__ call.
        '''
        AdvancedHTMLParser.reset(self)

        self._resetIndexInternal()

#vim: set ts=4 sw=4 expandtab

Source File: Parser.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

5 votes

def __init__(self, filename=None, encoding='utf-8', indexIDs=True, indexNames=True, indexClassNames=True, indexTagNames=True):
        '''
            __init__ - Creates an Advanced HTML parser object, with specific indexing settings.

                For the various index* arguments, if True the index will be collected and use (if useIndex=True [default] on get* function)

                @param filename <str>         - Optional filename to parse. Otherwise use parseFile or parseStr methods.
                @param encoding <str> - Specifies the document encoding. Default utf-8
                @param indexIDs <bool>        - True to create an index for getElementByID method.  <default True>
                @param indexNames <bool>      - True to create an index for getElementsByName method  <default True>
                @param indexClassNames <bool> - True to create an index for getElementsByClassName method. <default True>
                @param indexTagNames <bool>   - True to create an index for tag names. <default True>

                For indexing other attributes, see the more generic addIndexOnAttribute

        '''
        self.indexFunctions = []
        self.otherAttributeIndexFunctions = {}
        self._otherAttributeIndexes = {}
        self.indexIDs = indexIDs
        self.indexNames = indexNames
        self.indexClassNames = indexClassNames
        self.indexTagNames = indexTagNames

        self._resetIndexInternal()

        AdvancedHTMLParser.__init__(self, filename, encoding)

        if filename is not None:
            self.parseFile(filename)

###########################################
#####        INTERNAL               #######
###########################################

Source File: Parser.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

5 votes

def _reset(self):
        '''
            _reset - reset this object. Assigned to .reset after __init__ call.
        '''
        HTMLParser.reset(self)

        self.root = None
        self.doctype = None
        self._inTag = []

Source File: Parser.py From AdvancedHTMLParser with GNU Lesser General Public License v3.0

5 votes

def __init__(self, filename=None, encoding='utf-8'):
        '''
            __init__ - Creates an Advanced HTML parser object. For read-only parsing, consider IndexedAdvancedHTMLParser for faster searching.

                @param filename <str>         - Optional filename to parse. Otherwise use parseFile or parseStr methods.
                @param encoding <str>         - Specifies the document encoding. Default utf-8

        '''
        HTMLParser.__init__(self)
        # Do not automatically convert charrefs in python3
        self.convert_charrefs = False

        # Encoding to use for this document
        self.encoding = encoding

        self._inTag = []
        self.root = None
        self.doctype = None

        self.reset = self._reset # Must assign after first call, otherwise members won't yet be present

        if filename is not None:
            self.parseFile(filename)

###########################################
#####        INTERNAL               #######
###########################################

Source File: prettytable.py From paper.io.sessdsa with GNU General Public License v3.0

5 votes

def __init__(self, **kwargs):
        HTMLParser.__init__(self)
        self.kwargs = kwargs
        self.tables = []
        self.last_row = []
        self.rows = []
        self.max_row_width = 0
        self.active = None
        self.last_content = ""
        self.is_last_row_header = False

Source File: fb_parser.py From facebook-discussion-tk with MIT License

5 votes

def __init__(self, callback_found_name, callback_found_fb_id):
        HTMLParser.__init__(self)
        self.callback_found_name = callback_found_name
        self.callback_found_fb_id = callback_found_fb_id
        self.tag_level_a = 0
        self.tag_level_a_target = None

Python HTMLParser.HTMLParser.__init__() Examples

Python HTMLParser.HTMLParser.init() Examples