使用Raptor RDF Parser Toolkit生成FOAF rdfxml文件

时间:2018-01-22 17:25:34

标签: c++ rdf linked-data foaf redland

我想使用Raptor RDF Parser Toolkit编写一个C / C ++程序来生成以下输出(使用RDF Validator检查):

<?xml version="1.0" encoding="utf-8"?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
          xmlns:foaf="http://xmlns.com/foaf/0.1/">

   <foaf:Person xml:lang="en">
     <foaf:name>Jimmy Wales</foaf:name>
     <foaf:mbox rdf:resource="mailto:jwales@bomis.com"/>
     <foaf:nick>Jimbo</foaf:nick>
     <!-- photo -->
     <foaf:depiction
       rdf:resource="http://upload.wikimedia.org/wikipedia/commons/1/19/Jimbo_Wales_in_France_cropped.jpg" />
   </foaf:Person>

 </rdf:RDF>

数据模型的三元组如下所示:

Number  Subject Predicate   Object
1   genid:A4486 http://www.w3.org/1999/02/22-rdf-syntax-ns#type http://xmlns.com/foaf/0.1/Person
2   genid:A4486 http://xmlns.com/foaf/0.1/name  "Jimmy Wales"@en
3   genid:A4486 http://xmlns.com/foaf/0.1/mbox  mailto:jwales@bomis.com
4   genid:A4486 http://xmlns.com/foaf/0.1/nick  "Jimbo"@en
5   genid:A4486 http://xmlns.com/foaf/0.1/depiction http://upload.wikimedia.org/wikipedia/commons/1/19/Jimbo_Wales_in_France_cropped.jpg

仅供记录,我使用的是Visual Studio 2017 x64。 我想出了以下代码:

#include "raptor2/raptor2.h"

int main(int argc, char* argv[]) {
    FILE* outfile = fopen("myTestfile.rdf", "w");

    raptor_world* world = raptor_new_world();
    rdf_serializer = raptor_new_serializer(world, "rdfxml" /* "turtle" */);
    raptor_serializer_start_to_file_handle(rdf_serializer, nullptr, outfile);

    const unsigned char* prefix = (const unsigned char*)"foaf";
    raptor_uri* uri = raptor_new_uri(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/");
    raptor_serializer_set_namespace(rdf_serializer, uri, prefix);

    {
        raptor_statement* triple = nullptr;
        triple = raptor_new_statement(world);

        triple->subject = raptor_new_term_from_uri_string(world, (const unsigned char*)"genid:A4486");
        triple->predicate = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://www.w3.org/1999/02/22-rdf-syntax-ns#type");
        triple->object = raptor_new_term_from_literal(world, (unsigned char*)"http://xmlns.com/foaf/0.1/Person", nullptr, nullptr);
        raptor_serializer_serialize_statement(rdf_serializer, triple);
        raptor_free_statement(triple);
    }

    {
        raptor_statement* triple = nullptr;
        triple = raptor_new_statement(world);

        triple->subject = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/Person");
        triple->predicate = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/name");
        triple->object = raptor_new_term_from_literal(world, (unsigned char*)"Jimmy Wales", nullptr, nullptr);
        raptor_serializer_serialize_statement(rdf_serializer, triple);
        raptor_free_statement(triple);
    }

    {
        raptor_statement* triple = nullptr;
        triple = raptor_new_statement(world);

        triple->subject = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/Person");
        triple->predicate = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/mbox");
        triple->object = raptor_new_term_from_literal(world, (unsigned char*)"mailto:jwales@bomis.com", nullptr, nullptr);
        raptor_serializer_serialize_statement(rdf_serializer, triple);
        raptor_free_statement(triple);
    }

    raptor_serializer_serialize_end(rdf_serializer);
    raptor_free_serializer(rdf_serializer);
    raptor_free_world(world);

    fclose(outfile);
}

生成的文件如下所示:

<?xml version="1.0" encoding="utf-8"?>
<rdf:RDF xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#">
  <rdf:Description rdf:about="genid:A4486">
    <rdf:type>http://xmlns.com/foaf/0.1/Person</rdf:type>
  </rdf:Description>
  <rdf:Description rdf:about="http://xmlns.com/foaf/0.1/Person">
    <foaf:name>Jimmy Wales</foaf:name>
  </rdf:Description>
  <rdf:Description rdf:about="http://xmlns.com/foaf/0.1/Person">
    <foaf:mbox>mailto:jwales@bomis.com</foaf:mbox>
  </rdf:Description>
</rdf:RDF>

我在这里做错了什么?我想产生如上所示的相同结果。而不是<foaf:Person>标记,而是创建<rdf:Description>标记。

海龟输出(raptor_new_serializer(world, "turtle"))如下所示:

@prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
@prefix foaf: <http://xmlns.com/foaf/0.1/> .

<genid:A4486>
    a "http://xmlns.com/foaf/0.1/Person" .

foaf:Person
    foaf:mbox "mailto:jwales@bomis.com" ;
    foaf:name "Jimmy Wales" .

1 个答案:

答案 0 :(得分:1)

您的代码中存在三个问题。

  1. 您正在混合使用不同类型的RDF terms

    • URI和文字(第20,42行),
    • URI和空白节点(第18,29,40行)。
  2. 要输出typed nodes,您应该使用rdfxml-abbrev序列化(第7行)。

  3. 你混淆了哪些东西是连通的,以及哪种方式(第29,40行):

    • 您需要构建此结构:

      as to be

    • 相反,你正在构建这样的东西:

      as is

  4. 此代码效果很好:

    #include <stdio.h>
    #include <raptor/raptor2.h>
    #include <stdlib.h>
    
    int
    main(int argc, char *argv[])
    {
      raptor_world *world = NULL;
      raptor_serializer* rdf_serializer = NULL;
      unsigned char *uri_string;
      raptor_uri *base_uri;
      raptor_statement* triple;
    
      world = raptor_new_world();
    
      uri_string = raptor_uri_filename_to_uri_string(argv[1]);
      base_uri = raptor_new_uri(world, uri_string);
    
      rdf_serializer = raptor_new_serializer(world, "rdfxml-abbrev");
      raptor_serializer_start_to_file_handle(rdf_serializer, base_uri, stdout);
    
      const unsigned char* foaf_prefix = (const unsigned char*)"foaf";
      raptor_uri* foaf_uri = raptor_new_uri(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/");
      raptor_serializer_set_namespace(rdf_serializer, foaf_uri, foaf_prefix);
    
      const unsigned char* rdf_prefix = (const unsigned char*)"rdf";
      raptor_uri* rdf_uri = raptor_new_uri(world, (const unsigned char*)"http://www.w3.org/1999/02/22-rdf-syntax-ns#");
      raptor_serializer_set_namespace(rdf_serializer, rdf_uri, rdf_prefix);
    
      {
        raptor_statement* triple = NULL; triple = raptor_new_statement(world);
    
        triple->subject = raptor_new_term_from_blank(world, (const unsigned char*)"b1");
        triple->predicate = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/name");
        triple->object = raptor_new_term_from_literal(world, (unsigned char*)"Jimmy Wales", NULL, NULL);
    
        raptor_serializer_serialize_statement(rdf_serializer, triple); raptor_free_statement(triple);
      }
    
      {
        raptor_statement* triple = NULL; triple = raptor_new_statement(world);
    
        triple->subject = raptor_new_term_from_blank(world, (const unsigned char*)"b1");  
        triple->predicate = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://xmlns.com/foaf/0.1/mbox");
        triple->object = raptor_new_term_from_uri_string(world, (unsigned char*)"mailto:jwales@bomis.com");
    
        raptor_serializer_serialize_statement(rdf_serializer, triple); raptor_free_statement(triple);
      }
    
      {
        raptor_statement* triple = NULL; triple = raptor_new_statement(world);
    
        triple->subject = raptor_new_term_from_blank (world, (const unsigned char*)"b1");  
        triple->predicate = raptor_new_term_from_uri_string(world, (const unsigned char*)"http://www.w3.org/1999/02/22-rdf-syntax-ns#type");
        triple->object = raptor_new_term_from_uri_string(world, (unsigned char*)"http://xmlns.com/foaf/0.1/Person");
    
        raptor_serializer_serialize_statement(rdf_serializer, triple); raptor_free_statement(triple);
      }
    
      raptor_serializer_serialize_end(rdf_serializer);
      raptor_free_serializer(rdf_serializer);
      raptor_free_uri(base_uri);
      raptor_free_memory(uri_string);
      raptor_free_world(world);
      return 0;
    }
    

    输出结果为:

    <?xml version="1.0" encoding="utf-8"?>
    <rdf:RDF xmlns:foaf="http://xmlns.com/foaf/0.1/"
       xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#">
      <foaf:Person>
        <foaf:mbox rdf:resource="mailto:jwales@bomis.com"/>
        <foaf:name>Jimmy Wales</foaf:name>
      </foaf:Person>
    </rdf:RDF>