src/third_party/blink/Tools/Scripts/webkitpy/layout_tests/reftests/extract_reference_link.py - cobalt - Git at Google

 # Copyright (C) 2011 Google Inc. All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions are
 # met:
 #
 #     * Redistributions of source code must retain the above copyright
 # notice, this list of conditions and the following disclaimer.
 #     * Redistributions in binary form must reproduce the above
 # copyright notice, this list of conditions and the following disclaimer
 # in the documentation and/or other materials provided with the
 # distribution.

 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 """Utility module for reftests."""


 from HTMLParser import HTMLParser


 class ExtractReferenceLinkParser(HTMLParser):

     def __init__(self):
         HTMLParser.__init__(self)
         self.matches = []
         self.mismatches = []

     def handle_starttag(self, tag, attrs):
         if tag != "link":
             return
         attrs = dict(attrs)
         if not "rel" in attrs:
             return
         if not "href" in attrs:
             return
         if attrs["rel"] == "match":
             self.matches.append(attrs["href"])
         if attrs["rel"] == "mismatch":
             self.mismatches.append(attrs["href"])


 def get_reference_link(html_string):
     """Returns reference links in the given html_string.

     Returns:
         a tuple of two URL lists, (matches, mismatches).
     """
     parser = ExtractReferenceLinkParser()
     parser.feed(html_string)
     parser.close()

     return parser.matches, parser.mismatches
	# Copyright (C) 2011 Google Inc. All rights reserved.
	#
	# Redistribution and use in source and binary forms, with or without
	# modification, are permitted provided that the following conditions are
	# met:
	#
	# * Redistributions of source code must retain the above copyright
	# notice, this list of conditions and the following disclaimer.
	# * Redistributions in binary form must reproduce the above
	# copyright notice, this list of conditions and the following disclaimer
	# in the documentation and/or other materials provided with the
	# distribution.

	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	"""Utility module for reftests."""


	from HTMLParser import HTMLParser


	class ExtractReferenceLinkParser(HTMLParser):

	def __init__(self):
	HTMLParser.__init__(self)
	self.matches = []
	self.mismatches = []

	def handle_starttag(self, tag, attrs):
	if tag != "link":
	return
	attrs = dict(attrs)
	if not "rel" in attrs:
	return
	if not "href" in attrs:
	return
	if attrs["rel"] == "match":
	self.matches.append(attrs["href"])
	if attrs["rel"] == "mismatch":
	self.mismatches.append(attrs["href"])


	def get_reference_link(html_string):
	"""Returns reference links in the given html_string.

	Returns:
	a tuple of two URL lists, (matches, mismatches).
	"""
	parser = ExtractReferenceLinkParser()
	parser.feed(html_string)
	parser.close()

	return parser.matches, parser.mismatches