PyXML 개론

2002-11-26

python setup.py install

from xml.dom.ext.reader import Sax2

# Sample XML document parsed by the examples that follow.
# The markup is required: the root element is <verse>, its first child is
# a whitespace text node and its second child is the <attribution> element,
# which is what the DOM navigation below relies on.
DOC = """<verse>
  <attribution>Christopher Okibgo</attribution>
  <line>For he was a shrub among the poplars,</line>
  <line>Needing more roots</line>
  <line>More sap to grow to sunlight,</line>
  <line>Thirsting for sunlight</line>
</verse>
"""

# Create an XML reader object
reader = Sax2.Reader()
# Create a 4DOM document node parsed from the XML held in a string
doc_node = reader.fromString(DOC)

# Ordinary DOM operations can now be performed on the document node
verse_element = doc_node.documentElement
# "Pythonic" shortcuts are also available for things such as
# node lists and named node maps.
# The first child of the verse element is a whitespace text node;
# the second child is the attribution element
attribution_element = verse_element.childNodes[1]
# attribution_string becomes "Christopher Okibgo"
attribution_string = attribution_element.firstChild.data

from xml.dom.ext.reader import HtmlLib

# Create an HTML reader object (rebinds the module-level name `reader`)
reader = HtmlLib.Reader()
# Create a 4DOM document parsed from the HTML located at a URL
# (rebinds the module-level name `doc_node`)
doc_node = reader.fromUri("http://www.python.org")

# Fetch the title of that HTML document
title_elem = doc_node.documentElement.getElementsByTagName("TITLE")[0]
# title_string becomes "Python Language Website"
# NOTE(review): this depends on the live page content — confirm before relying on it
title_string = title_elem.firstChild.data

from xml.dom.ext import StripXml, Print
# Strip whitespace where appropriate, in place; the same node is returned
StripXml(doc_node)
# Write the serialized XML node to standard output (stdout)
Print(doc_node)
# Write the serialized XML node to a file. try/finally guarantees the
# handle is closed even if serialization raises part-way through.
f = open("tmp.xml", "w")
try:
    Print(doc_node, stream=f)
finally:
    f.close()

from xml.dom import implementation
from xml.dom import EMPTY_NAMESPACE, XML_NAMESPACE
from xml.dom.ext import Print

# Create a document type node using "message" as the doctype name,
# with an empty system ID and an empty public ID (i.e. no DTD information)
doctype = implementation.createDocumentType("message", None, None)

# Create the document node; this also creates a document element node.
# For that document element, use the empty namespace URI and the
# local name "message"
doc = implementation.createDocument(EMPTY_NAMESPACE, "message", doctype)

# Get hold of the document element
msg_elem = doc.documentElement

# Create an xml:lang attribute on the new element
msg_elem.setAttributeNS(XML_NAMESPACE, "xml:lang", "en")

# Create a text node carrying some content
new_text = doc.createTextNode("You need Python")

# Append the new text node to the document element
msg_elem.appendChild(new_text)

# Print the result
Print(doc)

from xml.ns import XSLT
# The XSLT namespace: http://www.w3.org/1999/XSL/Transform
NS = XSLT.BASE

from xml.xpath import Context, Evaluate
# Create an XPath context for the given DOM node,
# with no other nodes in the context list
# (list size 1, current position 1),
# and with the given prefix/namespace mapping
con = Context.Context(doc, 1, 1, processorNss={"xsl": NS})

# Evaluate the XPath expression and return the result:
# a Python list of nodes
result = Evaluate("//xsl:*", context=con)

from xml.marshal.generic import Marshaller
# Create a generic marshaller instance
marshal = Marshaller()
# Sample Python object to serialize
obj = {1: [2, 3], "a": "b"}
# Dump it to a string
xml_form = marshal.dumps(obj)

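<?xml version="1.0"?>
<marshal>
  <dictionary id="i2">
    <int>1</int>
    <list id="i3"><int>2</int><int>3</int></list>
    <string>a</string>
    <string>b</string>
  </dictionary>
</marshal>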

IT/모바일

PyXML 개론