我们如何将XSL转换为XML格式

时间:2019-03-27 06:03:06

标签: java xml csv xslt

我正在尝试将XML文件转换为CSV文件。 (基本上将数据从XML转换为表格格式) 但是我需要将XSL文件用于该特定XML文件以进行CSV转换。 这是一个复杂的XML。我在这里菜鸟。

这是示例XML文件。 我需要提取相关的所有字段,例如 1. MetaversionOID 2. StudyOID 3. LocationOID

<ODM
    xmlns="http://www.cdisc.org/ns/odm/v1.3"
    xmlns:p1="https://www.protocolfirst.com/ns/odm/v1.3.2" CreationDateTime="2019-03-25T06:33:43.806Z" FileOID="9c94b49a-0110-418b-a8e9-adb5d557b106" ODMVersion="1.3.2" FileType="Snapshot" AsOfDateTime="2019-03-25T06:33:43.806Z" SourceSystem="ProtocolFirst EDC">
    <ClinicalData MetaDataVersionOID="1.0" StudyOID="BAML-S16 AGI-IDH1">
        <SubjectData SubjectKey="101-155-16">
            <StudyEventData StudyEventOID="1.01" p1:Name="Screening (Master)" p1:CreationDateTime="2018-11-01T14:45:12.997Z" p1:Branch="1.0" p1:NotDone="N" p1:VisitDate="2018-10-18T04:00:00.000Z">
                <FormData FormOID="demo" p1:Name="Demographics" p1:Started="Y" p1:NotDone="N">
                    <ItemGroupData ItemGroupOID="demo">
                        <ItemData ItemOID="2a48d0b6-de96-4da9-8b90-c9d555ccbc45" p1:FieldName="Date of Birth" p1:EntryType="Transcription" Value="1950-08-24" p1:TimezoneOffset="-04:00">
                            <AuditRecord>
                                <UserRef UserOID="molly.vittorio@osumc.edu"/>
                                <DateTimeStamp>2018-11-05T16:30:42.220Z</DateTimeStamp>
                            </AuditRecord>
                        </ItemData>
                        <ItemData ItemOID="73bce803-1540-479f-8022-1a814f5bfa8e" p1:FieldName="Sex" p1:EntryType="Transcription" Value="M" p1:DisplayValue="Male">
                            <AuditRecord>
                                <UserRef UserOID="molly.vittorio@osumc.edu"/>
                                <DateTimeStamp>2018-11-05T16:30:43.007Z</DateTimeStamp>
                            </AuditRecord>
                        </ItemData>
                        <ItemData ItemOID="bc160779-263c-40ca-97ce-72c8f07f907c" p1:FieldName="Ethnicity" p1:EntryType="Transcription" Value="NOT HISPANIC OR LATINO" p1:DisplayValue="Not Hispanic or Latino">
                            <AuditRecord>
                                <UserRef UserOID="molly.vittorio@osumc.edu"/>
                                <DateTimeStamp>2018-11-05T16:30:46.151Z</DateTimeStamp>
                            </AuditRecord>
                        </ItemData>
                        <ItemData ItemOID="8f064011-8e2b-486b-8b60-c2f744ca5235" p1:FieldName="Race" p1:EntryType="Transcription" Value="CAUCASIAN" p1:DisplayValue="Caucasian">
                            <AuditRecord>
                                <UserRef UserOID="molly.vittorio@osumc.edu"/>
                                <DateTimeStamp>2018-11-05T16:30:45.366Z</DateTimeStamp>
                            </AuditRecord>
                        </ItemData>
                    </ItemGroupData>
                    <AuditRecord EditPoint="Monitoring">
                        <p1:Review DateTimeStamp="2019-03-12T16:59:47.139Z" UserOID="lia.zevallos@syneoshealth.com" Action="query" Comment="Birth recorded in the SD 24 August 1950. Please verify and correct the CRF page, thanks."/>
                        <p1:Review DateTimeStamp="2018-11-05T16:30:51.928Z" UserOID="molly.vittorio@osumc.edu" Action="submitted"/>
                        <p1:Review DateTimeStamp="2018-11-01T14:45:12.997Z" UserOID="molly.vittorio@osumc.edu" Action="open"/>
                    </AuditRecord>
                </FormData>
            </StudyEventData>
        </SubjectData>
    </ClinicalData>
</ODM>

这是我用来将XML转换为CSV格式的代码。

import java.io.File;

import javax.xml.parsers.DocumentBuilder;
import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.parsers.ParserConfigurationException;
import javax.xml.transform.Result;
import javax.xml.transform.Source;
import javax.xml.transform.Transformer;
import javax.xml.transform.TransformerFactory;
import javax.xml.transform.dom.DOMSource;
import javax.xml.transform.stream.StreamResult;
import javax.xml.transform.stream.StreamSource;

import org.w3c.dom.Document;

public class Temp {

    public static void main(String args[]) throws Exception {

        Document document;

        File stylesheet = new File("C:/Users/mmahajan/Desktop/Input/style.xsl");
        File xmlSource = new File("C:/Users/mmahajan/Desktop/Input/subject-beataml-BAML-S8 AST-FLT3-20190325114820225683361888824.xml");

        DocumentBuilderFactory factory = DocumentBuilderFactory.newInstance();
        DocumentBuilder builder;
        try {
            builder = factory.newDocumentBuilder();
            document = builder.parse(xmlSource);
            StreamSource stylesource = new StreamSource(stylesheet);
            Transformer transformer = TransformerFactory.newInstance().newTransformer(stylesource);
            Source source = new DOMSource(document);
            Result outputTarget = new StreamResult(new File("C:/Users/mmahajan/Desktop/Input/x.csv"));
            transformer.transform(source, outputTarget);

        } catch (ParserConfigurationException e) {
            e.printStackTrace();
        }

    }

}

到目前为止,我已经编写了以下XSL文件。

<?xml version="1.0"?>
<xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform" xmlns:fo="http://www.w3.org/1999/XSL/Format" >
<xsl:output method="text" omit-xml-declaration="yes" indent="no"/>
<xsl:template match="/">
Metaversion,StudyOID,SubjectKey,CreationDateTime,VisitDate,NotDone,Branch,Name,StudyEventOID,Name,Started,FormOID,ItemGroupOID,TimezoneOffset,Value,EntryType,FieldName,ItemOID,UserOID,DateTimeStamp
<xsl:for-each select="//AuditRecord">
<xsl:value-of select="concat(//ClinicalData/@MetaDataVersionOID,',',//ClinicalData/@StudyOID,',',//ClinicalData/SubjectData/@SubjectKey,',',//ClinicalData/SubjectData/StudyEventData/@CreationDateTime,',',//ClinicalData/SubjectData/StudyEventData/@CreationDateTime,',',//ClinicalData/SubjectData/StudyEventData/@VisitDate,',',//ClinicalData/SubjectData/StudyEventData/@NotDone,',',//ClinicalData/SubjectData/StudyEventData/@Branch,',',//ClinicalData/SubjectData/StudyEventData/@Name,',',//ClinicalData/SubjectData/StudyEventData/@StudyEventOID,',',//ClinicalData/SubjectData/StudyEventData/FormData/',',//ClinicalData/SubjectData/StudyEventData/FormData/@Started,',',//ClinicalData/SubjectData/StudyEventData/FormData/@FormOID,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/@ItemGroupOID,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/ItemData/@TimezoneOffset,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/ItemData/@Value,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/ItemData/@EntryType,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/ItemData/@FieldName,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/ItemData/@ItemOID,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/ItemData/AuditRecord/UserRef/@UserOID,',',//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/ItemData/AuditRecord/UserRef/@DateTimeStamp,
'&#xA;')"/>
</xsl:for-each>
</xsl:template>
</xsl:stylesheet>

但这是错误的。正确XSL的任何帮助将不胜感激。

  

更新:我已经修改了XML文件和XSL文件,但是仍然无法   为其生成正确的XSL文件。

2 个答案:

答案 0 :(得分:0)

<xsl:template match="/">
<html>
<head>
</head>
<body>
    <xsl:for-each select="/ClinicalData">
        <td><xsl:value-of select="@MetaDataVersionOID"/></td>
        <td><xsl:value-of select="@StudyOID"/></td>
        <td><xsl:value-of select="SubjectData/SiteRef/@LocationOID"/></td>
    </xsl:for-each>
</body>
</html>
</xsl:template>

答案 1 :(得分:-1)

您可以检查它是否会创建csv输出

<xsl:value-of select="concat(@MetaDataVersionOID, ',', @StudyOID, ',', SubjectData/SiteRef/@LocationOID)"/>

您可以在https://xsltfiddle.liberty-development.net/6r5Gh3b

看到变换

XSLT

    <?xml version="1.0" encoding="UTF-8"?>
<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
    xmlns:xs="http://www.w3.org/2001/XMLSchema"
    xmlns:a="http://www.cdisc.org/ns/odm/v1.3"
    xmlns:p1="https://www.protocolfirst.com/ns/odm/v1.3.2"
    xpath-default-namespace="http://www.cdisc.org/ns/odm/v1.3"
    exclude-result-prefixes="xs"
    version="2.0">

    <xsl:template match="/">
        <xsl:for-each select="//AuditRecord">
            <xsl:text>&#xa;</xsl:text>
            <xsl:value-of select="concat(//ClinicalData/@MetaDataVersionOID,','
                ,//ClinicalData/@StudyOID,','
                ,//ClinicalData/SubjectData/@SubjectKey,','
                ,//ClinicalData/SubjectData/StudyEventData/@p1:CreationDateTime,','
                ,//ClinicalData/SubjectData/StudyEventData/@p1:CreationDateTime,','
                ,//ClinicalData/SubjectData/StudyEventData/@p1:VisitDate,','
                ,//ClinicalData/SubjectData/StudyEventData/@p1:NotDone,','
                ,//ClinicalData/SubjectData/StudyEventData/@p1:Branch,','
                ,//ClinicalData/SubjectData/StudyEventData/@p1:Name,','
                ,//ClinicalData/SubjectData/StudyEventData/@StudyEventOID,','
                ,//ClinicalData/SubjectData/StudyEventData/FormData/','
                ,//ClinicalData/SubjectData/StudyEventData/FormData/@p1:Started,','
                ,//ClinicalData/SubjectData/StudyEventData/FormData/@FormOID,','
                ,//ClinicalData/SubjectData/StudyEventData/FormData/ItemGroupData/@ItemGroupOID,','
                ,parent::ItemData/@TimezoneOffset,','
                ,parent::ItemData/@Value,','
                ,parent::ItemData/@p1:EntryType,','
                ,parent::ItemData/@p1:FieldName,','
                ,parent::ItemData/@ItemOID,','
                ,UserRef/@UserOID,','
                ,UserRef/@DateTimeStamp,','
                ,UserOID,','
                ,DateTimeStamp,
                '&#xA;')"/>
        </xsl:for-each>
    </xsl:template>


</xsl:stylesheet>