本文整理汇总了Python中translate.storage.html.htmlfile函数的典型用法代码示例。如果您正苦于以下问题：Python htmlfile函数的具体用法？Python htmlfile怎么用？Python htmlfile使用的例子？那么恭喜您，这里精选的函数代码示例或许可以为您提供帮助。
在下文中一共展示了htmlfile函数的11个代码示例，这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞，您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: test_escaping_script_and_pre
def test_escaping_script_and_pre(self):
    """Check that tag-like text inside <script> is not parsed as markup.

    <script> and <pre> can contain < and > and these should not be
    interpreted as tags. The sample below only exercises <script>: it
    embeds a stray ``</tag>`` inside the script body and expects the whole
    input to produce exactly one unit.
    """
    h = html.htmlfile()
    store = h.parsestring("<p>We are here</p><script>Some </tag>like data<script></p>")
    # print is called as a function so this line is valid on Python 3 too
    # (the statement form is a syntax error there).
    print(store.units[0].source)
    assert len(store.units) == 1
示例2: mergestore
def mergestore(self, inputstore, templatetext, includefuzzy):
    """Produce output source from an HTML template and an input store.

    The input store is kept on the instance and indexed with
    ``makeindex()``; ``includefuzzy`` is recorded on the instance as well.
    The template is then handed to ``html.htmlfile`` with ``self.lookup``
    as its callback.

    Returns the ``filesrc`` attribute of the resulting HTML store.
    """
    self.inputstore = inputstore
    self.inputstore.makeindex()
    self.includefuzzy = includefuzzy
    return html.htmlfile(
        inputfile=templatetext,
        callback=self.lookup,
    ).filesrc
示例3: test_extraction_attr_title
def test_extraction_attr_title(self):
    """Verify that ``title`` attribute values are extracted as units."""
    parser = html.htmlfile()

    # Sample from http://www.w3schools.com/tags/att_global_title.asp
    store = parser.parsestring("""
<p><abbr title="World Health Organization">WHO</abbr> was founded in 1948.</p>
<p title="Free Web tutorials">W3Schools.com</p>""")
    sources = [unit.source for unit in store.units]
    print(sources[0])
    assert len(sources) == 4
    assert sources[0] == "World Health Organization"
    # FIXME: not ideal -- the title= attribute is still present in this unit
    # even though it was already extracted as its own unit above; either drop
    # it here or do not extract it earlier.
    assert sources[1] == '<abbr title="World Health Organization">WHO</abbr> was founded in 1948.'
    assert sources[2] == "Free Web tutorials"
    assert sources[3] == "W3Schools.com"

    # Sample from http://www.netmechanic.com/news/vol6/html_no1.htm
    store = parser.parsestring("""
<table width="100" border="2" title="Henry Jacobs Camp summer 2003 schedule">
""")
    sources = [unit.source for unit in store.units]
    assert sources == ["Henry Jacobs Camp summer 2003 schedule"]

    # FIXME: this case does not extract as expected, so it stays disabled.
    #store = parser.parsestring("""
    # <a href="page1.html" title="HS Jacobs - a UAHC camp in Utica, MS">Henry S. Jacobs Camp</a>
    #""")
    #assert len(store.units) == 2
    #assert store.units[0].source == "HS Jacobs - a UAHC camp in Utica, MS"
    #assert store.units[1].source == "Henry S. Jacobs Camp"

    store = parser.parsestring("""
<form name="application" title="Henry Jacobs camper application" method=" " action=" ">
""")
    sources = [unit.source for unit in store.units]
    assert sources == ["Henry Jacobs camper application"]
示例4: test_extraction_attr_alt
def test_extraction_attr_alt(self):
    """Verify that the ``alt`` attribute of an <img> is extracted as a unit."""
    parser = html.htmlfile()
    # Sample from http://www.netmechanic.com/news/vol6/html_no1.htm
    store = parser.parsestring("""
<img src="cafeteria.jpg" height="200" width="200" alt="UAHC campers enjoy a meal in the camp cafeteria">
""")
    sources = [unit.source for unit in store.units]
    # Exactly one unit is expected, holding the alt text.
    assert sources == ["UAHC campers enjoy a meal in the camp cafeteria"]
示例5: convertfile
def convertfile(self, inputfile, filename, includeuntagged=False,
                duplicatestyle="msgctxt", keepcomments=False):
    """Convert the units of an HTML input into a PO store.

    ``inputfile`` is parsed by ``html.htmlfile`` (``includeuntagged`` is
    forwarded as ``includeuntaggeddata``). Each parsed unit becomes a source
    unit in a new ``po.pofile`` carrying the HTML unit's locations; when
    ``keepcomments`` is true its notes are added as "developer" notes.
    Duplicates are then removed using ``duplicatestyle``.

    ``filename`` is accepted but not used by this body.

    Returns the populated PO store.
    """
    po_store = po.pofile()
    parsed = html.htmlfile(
        includeuntaggeddata=includeuntagged,
        inputfile=inputfile,
    )
    for unit in parsed.units:
        entry = po_store.addsourceunit(unit.source)
        entry.addlocations(unit.getlocations())
        if not keepcomments:
            continue
        entry.addnote(unit.getnotes(), "developer")
    po_store.removeduplicates(duplicatestyle)
    return po_store
示例6: test_extraction_tag_figcaption
def test_extraction_tag_figcaption(self):
    """Verify that <figcaption> text is extracted next to the image alt text."""
    parser = html.htmlfile()
    # Sample from http://www.w3schools.com/tags/tag_figcaption.asp
    store = parser.parsestring("""
<figure>
<img src="img_pulpit.jpg" alt="The Pulpit Rock" width="304" height="228">
<figcaption>Fig1. - A view of the pulpit rock in Norway.</figcaption>
</figure>""")
    sources = [unit.source for unit in store.units]
    print(sources[0])
    # The alt text comes first, followed by the caption.
    assert sources == [
        "The Pulpit Rock",
        "Fig1. - A view of the pulpit rock in Norway.",
    ]
示例7: test_extraction_tag_caption_td_th
def test_extraction_tag_caption_td_th(self):
    """Verify extraction of table text: <caption>, <th> and <td> cells."""
    parser = html.htmlfile()
    # Sample from http://www.w3schools.com/tags/tag_caption.asp
    store = parser.parsestring("""
<table>
<caption>Monthly savings</caption>
<tr>
<th>Month</th>
<th>Savings</th>
</tr>
<tr>
<td>January</td>
<td>$100</td>
</tr>
</table>""")
    sources = [unit.source for unit in store.units]
    print(sources[0])
    # One unit per caption/header/cell, in document order.
    assert sources == [
        "Monthly savings",
        "Month",
        "Savings",
        "January",
        "$100",
    ]
示例8: test_self_closing_tags
def test_self_closing_tags(self):
    """A heading containing unclosed <img> and <br> tags yields one unit."""
    markup = "<h3>Some text <img><br><img></h3>"
    store = html.htmlfile().parsestring(markup)
    assert len(store.units) == 1
示例9: test_pi_escaping
def test_pi_escaping():
    """Check ``pi_escape`` on an attribute that embeds a ``<?= ... ?>`` block.

    The expected output has the ``<`` and ``>`` inside the block replaced by
    ``%lt;`` and ``%gt;``, with the surrounding tag left as it was.
    """
    raw = '<a href="<?=($a < $b ? $foo : ($b > c ? $bar : $cat))?>">'
    escaped = '<a href="<?=($a %lt; $b ? $foo : ($b %gt; c ? $bar : $cat))?>">'
    parser = html.htmlfile()
    assert parser.pi_escape(raw) == escaped
示例10: test_strip_html_with_pi
def test_strip_html_with_pi():
    """``strip_html`` on ``pi_escape``d links should leave only the link text."""
    parser = html.htmlfile()
    samples = (
        '<a href="<?$var?>">Something</a>',
        '<a href="<?=($a < $b ? $foo : ($b > c ? $bar : $cat))?>">Something</a>',
    )
    # Both samples wrap the same visible text in an <a> whose href holds a
    # <? ... ?> block.
    for sample in samples:
        assert html.strip_html(parser.pi_escape(sample)) == "Something"
示例11: test_guess_encoding
def test_guess_encoding():
    """Check that ``guess_encoding`` reads the charset from a meta header."""
    parser = html.htmlfile()

    # A lone upper-case META tag.
    meta_only = '''<META HTTP-EQUIV="CONTENT-TYPE" CONTENT="text/html; charset=UTF-8">'''
    assert parser.guess_encoding(meta_only) == "UTF-8"

    # A fuller document head that declares the charset twice with different
    # capitalisation; the expected result is the lower-case spelling.
    document_head = '''<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN" "http://www.w3.org/TR/REC-html40/loose.dtd"><html><head><meta http-equiv="Content-Type" content="text/html; charset=ISO-8859-1"><!-- base href="http://home.online.no/~rut-aane/linux.html" --><link rel="shortcut icon" href="http://home.online.no/~rut-aane/peng16x16a.gif"><meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1"><meta name="Description" content="Linux newbie stuff and a little about Watching TV under Linux"><meta name="MSSmartTagsPreventParsing" content="TRUE"><meta name="GENERATOR" content="Mozilla/4.7 [en] (X11; I; Linux 2.2.5-15 i586) [Netscape]"><title>Some Linux for beginners</title><style type="text/css">'''
    assert parser.guess_encoding(document_head) == "iso-8859-1"