我是Haskell的初学者。我希望能够在Haskell中解析Project Gutenberg RDF元数据,但我真的不知道从哪里开始。它是RDF XML,所以它基本上是XML,带有一些时髦的命名空间。我看到那里有rdf4h库,但看起来很复杂。对于解析XML,有一堆库,但大多数使用箭头和我不理解的东西,看起来不必要复杂。还有其他库,如xml,但我找不到任何教程,文档似乎只是代码注释。我只是想知道是否有人想过这样的问题,以及是否有一个我没有考虑的解决方案。提前谢谢!
编辑:这是一个例子:
<?xml version="1.0" encoding="utf-8"?>
<rdf:RDF xml:base="http://www.gutenberg.org/"
xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
xmlns:dcterms="http://purl.org/dc/terms/"
xmlns:cc="http://web.resource.org/cc/"
xmlns:dcam="http://purl.org/dc/dcam/"
xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
xmlns:pgterms="http://www.gutenberg.org/2009/pgterms/"
>
<cc:Work rdf:about="">
<rdfs:comment>Archives containing the RDF files for *all* our books can be downloaded at
http://www.gutenberg.org/wiki/Gutenberg:Feeds#The_Complete_Project_Gutenberg_Catalog</rdfs:comment>
<cc:license rdf:resource="https://creativecommons.org/publicdomain/zero/1.0/"/>
</cc:Work>
<pgterms:ebook rdf:about="ebooks/20">
<pgterms:bookshelf>
<rdf:Description rdf:nodeID="N3f8445072d8e4499b2646626f94866e0">
<rdf:value>Poetry</rdf:value>
<dcam:memberOf rdf:resource="2009/pgterms/Bookshelf"/>
</rdf:Description>
</pgterms:bookshelf>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.rdf">
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-16T05:01:13.615047</dcterms:modified>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">12133</dcterms:extent>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:format>
<rdf:Description rdf:nodeID="N735ba077c8424051b6470a92682aaa5e">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/rdf+xml</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">1991-10-01</dcterms:issued>
<dcterms:title>Paradise Lost</dcterms:title>
<dcterms:subject>
<rdf:Description rdf:nodeID="Ne259525c666c4886a996acbdddca0682">
<rdf:value>PR</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCC"/>
</rdf:Description>
</dcterms:subject>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/files/20/20.txt">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">507133</dcterms:extent>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2011-03-02T06:33:54</dcterms:modified>
<dcterms:format>
<rdf:Description rdf:nodeID="Nbd1740a2927845058b0fe43326dcc48b">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/plain; charset=us-ascii</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.epub.images">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:format>
<rdf:Description rdf:nodeID="Nb08f3d2980e64e91a402eb5b205c10bc">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/epub+zip</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">232622</dcterms:extent>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:17.425321</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.kindle.images">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">933970</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="Nff1df57b9552466d96b114f20424b5a2">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/x-mobipocket-ebook</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:21.321235</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:language>
<rdf:Description rdf:nodeID="N91273d0bffc74be393cda307d2b05137">
<rdf:value rdf:datatype="http://purl.org/dc/terms/RFC4646">en</rdf:value>
</rdf:Description>
</dcterms:language>
<dcterms:subject>
<rdf:Description rdf:nodeID="N5e35fb378b37483ca6ef7a08f27cf936">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Eve (Biblical figure) -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<dcterms:license rdf:resource="license"/>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.html.images">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">614618</dcterms:extent>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:16.685338</dcterms:modified>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:format>
<rdf:Description rdf:nodeID="N7567260ec2fd48c0be3d2858e08ac35d">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/html</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.epub.noimages">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:17.695324</dcterms:modified>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">232623</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="Nb640302bc2a84a31b0e154318df817d1">
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/epub+zip</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.kindle.noimages">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">933967</dcterms:extent>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:24.846165</dcterms:modified>
<dcterms:format>
<rdf:Description rdf:nodeID="N1857bba1f5484e3d84846e1a554ec593">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/x-mobipocket-ebook</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:publisher>Project Gutenberg</dcterms:publisher>
<dcterms:rights>Public domain in the USA.</dcterms:rights>
<dcterms:creator>
<pgterms:agent rdf:about="2009/agents/17">
<pgterms:deathdate rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">1674</pgterms:deathdate>
<pgterms:webpage rdf:resource="http://en.wikipedia.org/wiki/John_Milton"/>
<pgterms:name>Milton, John</pgterms:name>
<pgterms:birthdate rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">1608</pgterms:birthdate>
</pgterms:agent>
</dcterms:creator>
<dcterms:type>
<rdf:Description rdf:nodeID="N0f6e6d76b1ff4ea9a2c5c37949efe82b">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/DCMIType"/>
<rdf:value>Text</rdf:value>
</rdf:Description>
</dcterms:type>
<dcterms:subject>
<rdf:Description rdf:nodeID="N202624c4b5994d39a3ab8bf0a2a31d95">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Adam (Biblical figure) -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.html.noimages">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">614618</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="N79f919d14da448e19eb05c444322ddd2">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/html</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:16.955332</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<pgterms:bookshelf>
<rdf:Description rdf:nodeID="Nec598f664c934ed49ba3c0168ef09615">
<rdf:value>Banned Books from Anne Haight's list</rdf:value>
<dcam:memberOf rdf:resource="2009/pgterms/Bookshelf"/>
</rdf:Description>
</pgterms:bookshelf>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.txt.utf-8">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">507105</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="N069b84f8b10844e9a6c713f4c163880b">
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/plain</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
</rdf:Description>
</dcterms:format>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:15.953358</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:subject>
<rdf:Description rdf:nodeID="Nb489692851fa496d96b1a7fdf7a71b21">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Fall of man -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<pgterms:downloads rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">2088</pgterms:downloads>
<dcterms:subject>
<rdf:Description rdf:nodeID="Naa6849a7660b4039baadec8af58f0c58">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Bible. Genesis -- History of Biblical events -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/files/20/20.zip">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">205748</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="N19cf968278bc4922bd87b17209c20d94">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/plain; charset=us-ascii</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2011-03-02T06:34:42</dcterms:modified>
<dcterms:format>
<rdf:Description rdf:nodeID="N94c2881f340a49c18246b69af3abcf12">
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/zip</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
</pgterms:ebook>
<rdf:Description rdf:about="http://en.wikipedia.org/wiki/John_Milton">
<dcterms:description>Wikipedia</dcterms:description>
</rdf:Description>
</rdf:RDF>