html5lib/html5lib-pythonPublic

NotificationsYou must be signed in to change notification settings
Fork302
Star1.2k

Commitf1d1d0a

committed

Merge remote-tracking branch 'origin/master' into escape-characters-serializer

2 parents9dac020 +f130676 commitf1d1d0aCopy full SHA for f1d1d0a

File tree

6 files changed

+60

-38

lines changed

CHANGES.rst
README.rst
html5lib
- __init__.py
- tests
  - test_treewalkers.py
- treewalkers
  - _base.py
setup.py

6 files changed

+60

-38

lines changed

`‎CHANGES.rst‎`

Lines changed: 25 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,31 @@`
`1`	`1`	`Change Log`
`2`	`2`	`----------`
`3`	`3`
	`4`	`+0.99`
	`5`	`+~~~~`
	`6`	`+`
	`7`	`+Released on September 10, 2013`
	`8`	`+`
	`9`	`+* No library changes from 1.0b3; released as 0.99 as pip has changed`
	`10`	`+ behaviour from 1.4 to avoid installing pre-release versions per`
	`11`	`+ PEP 440.`
	`12`	`+`
	`13`	`+`
	`14`	`+1.0b3`
	`15`	`+~~~~~`
	`16`	`+`
	`17`	`+Released on July 24, 2013`
	`18`	`+`
	`19`	+* Removed ``RecursiveTreeWalker`` from ``treewalkers._base``. Any
	`20`	`+ implementation using it should be moved to`
	`21`	+ ``NonRecursiveTreeWalker``, as everything bundled with html5lib has
	`22`	`+ for years.`
	`23`	`+`
	`24`	+* Fix #67 so that ``BufferedStream`` correctly returns a bytes
	`25`	`+ object, thereby fixing any case where html5lib is passed a`
	`26`	`+ non-seekable RawIOBase-like object.`
	`27`	`+`
	`28`	`+`
`4`	`29`	`1.0b2`
`5`	`30`	`~~~~~`
`6`	`31`

`‎README.rst‎`

Lines changed: 23 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -41,6 +41,29 @@ a treebuilder:`
`41`	`41`	`with open("mydocument.html", "rb") as f:`
`42`	`42`	`    lxml_etree_document = html5lib.parse(f, treebuilder="lxml")`
`43`	`43`
	`44`	+When using with ``urllib2`` (Python 2), the charset from HTTP should be
	`45`	`+passed into html5lib as follows:`
	`46`	`+`
	`47`	`+.. code-block:: python`
	`48`	`+`
	`49`	`+  from contextlib import closing`
	`50`	`+  from urllib2 import urlopen`
	`51`	`+  import html5lib`
	`52`	`+`
	`53`	`+  with closing(urlopen("http://example.com/")) as f:`
	`54`	`+      document = html5lib.parse(f, encoding=f.info().getparam("charset"))`
	`55`	`+`
	`56`	+When using with ``urllib.request`` (Python 3), the charset from HTTP
	`57`	`+should be passed into html5lib as follows:`
	`58`	`+`
	`59`	`+.. code-block:: python`
	`60`	`+`
	`61`	`+  from urllib.request import urlopen`
	`62`	`+  import html5lib`
	`63`	`+`
	`64`	`+  with urlopen("http://example.com/") as f:`
	`65`	`+      document = html5lib.parse(f, encoding=f.info().get_content_charset())`
	`66`	`+`
`44`	`67`	`To have more control over the parser, create a parser object explicitly.`
`45`	`68`	`For instance, to make the parser raise exceptions on parse errors, use:`
`46`	`69`

`‎html5lib/__init__.py‎`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -20,4 +20,4 @@`
`20`	`20`
`21`	`21`	`__all__= ["HTMLParser","parse","parseFragment","getTreeBuilder",`
`22`	`22`	`"getTreeWalker","serialize"]`
`23`		`-__version__="1.0b2"`
	`23`	`+__version__="0.999-dev"`

`‎html5lib/tests/test_treewalkers.py‎`

Lines changed: 0 additions & 10 deletions

Original file line number	Diff line number	Diff line change
`@@ -83,16 +83,6 @@ def PullDOMAdapter(node):`
`83`	`83`	`"walker":treewalkers.getTreeWalker("lxml")}`
`84`	`84`
`85`	`85`
`86`		`-# Try whatever etree implementations are available from a list that are`
`87`		`-#"supposed" to work`
`88`		`-try:`
`89`		`-importpxdom`
`90`		`-treeTypes['pxdom']= \`
`91`		`- {"builder":treebuilders.getTreeBuilder("dom",pxdom),`
`92`		`-"walker":treewalkers.getTreeWalker("dom")}`
`93`		`-exceptImportError:`
`94`		`-pass`
`95`		`-`
`96`	`86`	`try:`
`97`	`87`	`fromgenshi.coreimportQName,Attrs`
`98`	`88`	`fromgenshi.coreimportSTART,END,TEXT,COMMENT,DOCTYPE`

`‎html5lib/treewalkers/_base.py‎`

Lines changed: 10 additions & 26 deletions

Original file line number	Diff line number	Diff line change
`@@ -4,6 +4,16 @@`
`4`	`4`	`importgettext`
`5`	`5`	`_=gettext.gettext`
`6`	`6`
	`7`	`+fromxml.domimportNode`
	`8`	`+`
	`9`	`+DOCUMENT=Node.DOCUMENT_NODE`
	`10`	`+DOCTYPE=Node.DOCUMENT_TYPE_NODE`
	`11`	`+TEXT=Node.TEXT_NODE`
	`12`	`+ELEMENT=Node.ELEMENT_NODE`
	`13`	`+COMMENT=Node.COMMENT_NODE`
	`14`	`+ENTITY=Node.ENTITY_NODE`
	`15`	`+UNKNOWN="<#UNKNOWN#>"`
	`16`	`+`
`7`	`17`	`from ..constantsimportvoidElements,spaceCharacters`
`8`	`18`	`spaceCharacters="".join(spaceCharacters)`
`9`	`19`
`@@ -115,32 +125,6 @@ def unknown(self, nodeType):`
`115`	`125`	`returnself.error(_("Unknown node type: ")+nodeType)`
`116`	`126`
`117`	`127`
`118`		`-classRecursiveTreeWalker(TreeWalker):`
`119`		`-defwalkChildren(self,node):`
`120`		`-raiseNotImplementedError`
`121`		`-`
`122`		`-defelement(self,node,namespace,name,attrs,hasChildren):`
`123`		`-ifnameinvoidElements:`
`124`		`-fortokeninself.emptyTag(namespace,name,attrs,hasChildren):`
`125`		`-yieldtoken`
`126`		`-else:`
`127`		`-yieldself.startTag(name,attrs)`
`128`		`-ifhasChildren:`
`129`		`-fortokeninself.walkChildren(node):`
`130`		`-yieldtoken`
`131`		`-yieldself.endTag(name)`
`132`		`-`
`133`		`-fromxml.domimportNode`
`134`		`-`
`135`		`-DOCUMENT=Node.DOCUMENT_NODE`
`136`		`-DOCTYPE=Node.DOCUMENT_TYPE_NODE`
`137`		`-TEXT=Node.TEXT_NODE`
`138`		`-ELEMENT=Node.ELEMENT_NODE`
`139`		`-COMMENT=Node.COMMENT_NODE`
`140`		`-ENTITY=Node.ENTITY_NODE`
`141`		`-UNKNOWN="<#UNKNOWN#>"`
`142`		`-`
`143`		`-`
`144`	`128`	`classNonRecursiveTreeWalker(TreeWalker):`
`145`	`129`	`defgetNodeDetails(self,node):`
`146`	`130`	`raiseNotImplementedError`

`‎setup.py‎`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -29,7 +29,7 @@`
`29`	`29`	`long_description=readme_file.read()+'\n'+changes_file.read()`
`30`	`30`
`31`	`31`	`setup(name='html5lib',`
`32`		`-version='1.0b2',`
	`32`	`+version='0.999-dev',`
`33`	`33`	`url='https://github.com/html5lib/html5lib-python',`
`34`	`34`	`license="MIT License",`
`35`	`35`	`description='HTML parser based on the WHATWG HTML specifcation',`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commitf1d1d0a

File tree

6 files changed

6 files changed

`‎CHANGES.rst‎`

`‎README.rst‎`

`‎html5lib/__init__.py‎`

`‎html5lib/tests/test_treewalkers.py‎`

`‎html5lib/treewalkers/_base.py‎`

`‎setup.py‎`

0 commit comments

Movatterモバイル変換

File tree

6 files changed

6 files changed

‎CHANGES.rst‎

‎README.rst‎

‎html5lib/__init__.py‎

‎html5lib/tests/test_treewalkers.py‎

‎html5lib/treewalkers/_base.py‎

‎setup.py‎

0 commit comments

`‎CHANGES.rst‎`

`‎README.rst‎`

`‎html5lib/__init__.py‎`

`‎html5lib/tests/test_treewalkers.py‎`

`‎html5lib/treewalkers/_base.py‎`

`‎setup.py‎`