【发布时间】:2018-03-15 22:23:07
【问题描述】:
我是 Haskell 初学者。我有来自 Project Gutenberg 的 RDF XML,如下所示:
<?xml version="1.0" encoding="utf-8"?>
<rdf:RDF xml:base="http://www.gutenberg.org/"
xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
xmlns:dcterms="http://purl.org/dc/terms/"
xmlns:cc="http://web.resource.org/cc/"
xmlns:dcam="http://purl.org/dc/dcam/"
xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
xmlns:pgterms="http://www.gutenberg.org/2009/pgterms/"
>
<cc:Work rdf:about="">
<rdfs:comment>Archives containing the RDF files for *all* our books can be downloaded at
http://www.gutenberg.org/wiki/Gutenberg:Feeds#The_Complete_Project_Gutenberg_Catalog</rdfs:comment>
<cc:license rdf:resource="https://creativecommons.org/publicdomain/zero/1.0/"/>
</cc:Work>
<pgterms:ebook rdf:about="ebooks/20">
<pgterms:bookshelf>
<rdf:Description rdf:nodeID="N3f8445072d8e4499b2646626f94866e0">
<rdf:value>Poetry</rdf:value>
<dcam:memberOf rdf:resource="2009/pgterms/Bookshelf"/>
</rdf:Description>
</pgterms:bookshelf>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.rdf">
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-16T05:01:13.615047</dcterms:modified>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">12133</dcterms:extent>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:format>
<rdf:Description rdf:nodeID="N735ba077c8424051b6470a92682aaa5e">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/rdf+xml</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">1991-10-01</dcterms:issued>
<dcterms:title>Paradise Lost</dcterms:title>
<dcterms:subject>
<rdf:Description rdf:nodeID="Ne259525c666c4886a996acbdddca0682">
<rdf:value>PR</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCC"/>
</rdf:Description>
</dcterms:subject>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/files/20/20.txt">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">507133</dcterms:extent>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2011-03-02T06:33:54</dcterms:modified>
<dcterms:format>
<rdf:Description rdf:nodeID="Nbd1740a2927845058b0fe43326dcc48b">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/plain; charset=us-ascii</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.epub.images">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:format>
<rdf:Description rdf:nodeID="Nb08f3d2980e64e91a402eb5b205c10bc">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/epub+zip</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">232622</dcterms:extent>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:17.425321</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.kindle.images">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">933970</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="Nff1df57b9552466d96b114f20424b5a2">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/x-mobipocket-ebook</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:21.321235</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:language>
<rdf:Description rdf:nodeID="N91273d0bffc74be393cda307d2b05137">
<rdf:value rdf:datatype="http://purl.org/dc/terms/RFC4646">en</rdf:value>
</rdf:Description>
</dcterms:language>
<dcterms:subject>
<rdf:Description rdf:nodeID="N5e35fb378b37483ca6ef7a08f27cf936">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Eve (Biblical figure) -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<dcterms:license rdf:resource="license"/>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.html.images">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">614618</dcterms:extent>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:16.685338</dcterms:modified>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:format>
<rdf:Description rdf:nodeID="N7567260ec2fd48c0be3d2858e08ac35d">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/html</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.epub.noimages">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:17.695324</dcterms:modified>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">232623</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="Nb640302bc2a84a31b0e154318df817d1">
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/epub+zip</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.kindle.noimages">
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">933967</dcterms:extent>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:24.846165</dcterms:modified>
<dcterms:format>
<rdf:Description rdf:nodeID="N1857bba1f5484e3d84846e1a554ec593">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/x-mobipocket-ebook</rdf:value>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:publisher>Project Gutenberg</dcterms:publisher>
<dcterms:rights>Public domain in the USA.</dcterms:rights>
<dcterms:creator>
<pgterms:agent rdf:about="2009/agents/17">
<pgterms:deathdate rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">1674</pgterms:deathdate>
<pgterms:webpage rdf:resource="http://en.wikipedia.org/wiki/John_Milton"/>
<pgterms:name>Milton, John</pgterms:name>
<pgterms:birthdate rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">1608</pgterms:birthdate>
</pgterms:agent>
</dcterms:creator>
<dcterms:type>
<rdf:Description rdf:nodeID="N0f6e6d76b1ff4ea9a2c5c37949efe82b">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/DCMIType"/>
<rdf:value>Text</rdf:value>
</rdf:Description>
</dcterms:type>
<dcterms:subject>
<rdf:Description rdf:nodeID="N202624c4b5994d39a3ab8bf0a2a31d95">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Adam (Biblical figure) -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.html.noimages">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">614618</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="N79f919d14da448e19eb05c444322ddd2">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/html</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:16.955332</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<pgterms:bookshelf>
<rdf:Description rdf:nodeID="Nec598f664c934ed49ba3c0168ef09615">
<rdf:value>Banned Books from Anne Haight's list</rdf:value>
<dcam:memberOf rdf:resource="2009/pgterms/Bookshelf"/>
</rdf:Description>
</pgterms:bookshelf>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/ebooks/20.txt.utf-8">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">507105</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="N069b84f8b10844e9a6c713f4c163880b">
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/plain</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
</rdf:Description>
</dcterms:format>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2017-03-01T01:04:15.953358</dcterms:modified>
</pgterms:file>
</dcterms:hasFormat>
<dcterms:subject>
<rdf:Description rdf:nodeID="Nb489692851fa496d96b1a7fdf7a71b21">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Fall of man -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<pgterms:downloads rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">2088</pgterms:downloads>
<dcterms:subject>
<rdf:Description rdf:nodeID="Naa6849a7660b4039baadec8af58f0c58">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/LCSH"/>
<rdf:value>Bible. Genesis -- History of Biblical events -- Poetry</rdf:value>
</rdf:Description>
</dcterms:subject>
<dcterms:hasFormat>
<pgterms:file rdf:about="http://www.gutenberg.org/files/20/20.zip">
<dcterms:extent rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">205748</dcterms:extent>
<dcterms:format>
<rdf:Description rdf:nodeID="N19cf968278bc4922bd87b17209c20d94">
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">text/plain; charset=us-ascii</rdf:value>
</rdf:Description>
</dcterms:format>
<dcterms:isFormatOf rdf:resource="ebooks/20"/>
<dcterms:modified rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2011-03-02T06:34:42</dcterms:modified>
<dcterms:format>
<rdf:Description rdf:nodeID="N94c2881f340a49c18246b69af3abcf12">
<rdf:value rdf:datatype="http://purl.org/dc/terms/IMT">application/zip</rdf:value>
<dcam:memberOf rdf:resource="http://purl.org/dc/terms/IMT"/>
</rdf:Description>
</dcterms:format>
</pgterms:file>
</dcterms:hasFormat>
</pgterms:ebook>
<rdf:Description rdf:about="http://en.wikipedia.org/wiki/John_Milton">
<dcterms:description>Wikipedia</dcterms:description>
</rdf:Description>
</rdf:RDF>
并且我想将这些信息转换成可以查询和操作的常规 Haskell 数据结构。例如,我可能想查询该作品的标题,或获取其所有 Wikipedia URL。
我注意到有an RDF library in Haskell, rdh4h 并且它有一个XML 解析器。但是我无法对文档进行正面或反面,而且似乎任何地方都没有教程。
我想过做的另一件事是将所有这些 RDF/XML 文件导入某种数据库,然后使用 Haskell 以某种方式查询该数据库。但我不确定哪个数据库是合适的,或者这是否可能。
当然,我可以将其视为 XML 数据,而忽略 RDF 方面,但这似乎需要大量工作,而且我必须为我想要的这个 XML 文件中的每一件事编写一些非常长的数据结构出去。
有人对如何使用 Haskell 查询这样的数据有任何想法吗?
【问题讨论】:
-
我太累了,但为什么没有任何东西“让 [..] 工作”?你收到类型错误了吗?
-
调试我尝试编写的内容是没有用的,因为我不知道自己在做什么。真的,我只是在寻找有关如何在 Haskell 中查询 RDF 数据的想法。更新了我的问题,使其更加明确。