#!/usr/bin/python
#
# Copyright 2011 Google Inc. All Rights Reserved.
#
#  Licensed under the Apache License, Version 2.0 (the "License");
#  you may not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.

"""HTMLStripper based on HTMLParser."""


__author__ = 'wclarkso@google.com (Will Clarkson)'

import html.parser


class HTMLStripper(html.parser.HTMLParser):
  """Collects the text content of HTML, discarding the markup.

  Feed markup with the inherited `feed()` method; every chunk of text the
  parser reports is appended to `self.fed`. Retrieve the accumulated text
  with `GetFedData()` and discard it with `ClearFedData()`.

  Note: per the html.parser documentation, `close()` forces processing of
  any data the parser is still buffering, so call it before `GetFedData()`
  if the input may end in the middle of a token.
  """

  def __init__(self) -> None:
    """Initializes the parser with an empty text buffer."""
    # HTMLParser.__init__ already calls reset(), so no explicit second
    # reset is needed here.
    super().__init__()
    # Text chunks in the order handle_data() received them.
    self.fed = []

  def handle_data(self, d: str) -> None:
    """Stores a chunk of text reported by the parser.

    Args:
      d: The text chunk passed in by HTMLParser.
    """
    self.fed.append(d)

  def GetFedData(self) -> str:
    """Returns all text collected so far, concatenated in arrival order."""
    return ''.join(self.fed)

  def ClearFedData(self) -> None:
    """Discards the collected text; the parser state itself is untouched."""
    # Rebind rather than clear in place so that any list a caller obtained
    # earlier through `self.fed` is left unmodified.
    self.fed = []
