Search code examples
splitxslt-1.0filesplitting

Split XML file based on a tag using XSLT


I have a need to split an XML file based on a tag inside. Here is the input file will look like. The spli should happen based on Order tag

<?xml version="1.0" encoding="UTF-8" standalone="yes" ?>
<Root>
    <MultiApi>
        <API>
            <Input>
                <Order test="0001" >
                    <OrderLines>
                        <OrderLine test1="123" />
                    </OrderLines>
                </Order>
                <Order test="0002" >
                    <OrderLines>
                        <OrderLine test1="456" />
                    </OrderLines>
                </Order>
                <Order test="0003" >
                    <OrderLines>
                        <OrderLine test1="789" />
                    </OrderLines>
                </Order>
            </Input>
        </API>
    </MultiApi>
    <MultiApi>
        <EOF abc="test" MaxMsgPerFile="1" >
        </EOF>
    </MultiApi>
    </Root>

The output should look like:

<Root>
<MultiApi>
    <API>
        <Input>
            <Order test="0001" >
                <OrderLines>
                    <OrderLine test1="123" />
                </OrderLines>
            </Order>
        </Input>
    </API>
</MultiApi>
<MultiApi>
    <API>
        <Input>
            <Order test="0002" >
                <OrderLines>
                    <OrderLine test1="456" />
                </OrderLines>
            </Order>
        </Input>
    </API>
</MultiApi>
<MultiApi>
    <API>
        <Input>
            <Order test="0003" >
                <OrderLines>
                    <OrderLine test1="789" />
                </OrderLines>
            </Order>
        </Input>
    </API>
</MultiApi>
</Root>

I have tried the below XSL - but was returning null. Any help would be great:

<?xml version="1.0" encoding="UTF-8"?>
<xsl:stylesheet version="1.0" 
xmlns:xsl="http://www.w3.org/1999/XSL/Transform">

   <xsl:output method="xml" version="1.0" encoding="UTF-8" indent="yes"/>

      <xsl:variable name="tag">
      <xsl:value-of select="/*/*/EOF/@MaxMsgPerFile"/>
   </xsl:variable>

<xsl:template match="/Root">
    <xsl:copy>


        <xsl:for-each select="MultiApi[not (EOF)]/API/Input/Order[position() mod $tag = 1]">
            <MultiApi>
                <xsl:copy-of select="| . | following-sibling::Order[position() &lt; $tag]"/>

            </MultiApi>
        </xsl:for-each>
    </xsl:copy>
</xsl:template> 

</xsl:stylesheet>

I may not be doing a good job with "following-sibling". Please review and help!


Solution

  • Only requiring one output file, you can easily achieve this with the following stylesheet. The [not(EOF)] predicate on the MultiApi element is not necessary, because the other element does not contain this structure.

    <?xml version="1.0" encoding="UTF-8"?>
    <xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
        <xsl:output method="xml" version="1.0" encoding="UTF-8" indent="yes"/>
        <xsl:variable name="tag">
            <xsl:value-of select="/*/*/EOF/@MaxMsgPerFile"/>
        </xsl:variable>
    
        <xsl:template match="/Root">
            <xsl:copy>
                <xsl:for-each select="MultiApi/API/Input/Order">
                    <MultiApi>
                        <API>
                            <Input>
                                <xsl:copy-of select="."/>
                            </Input>
                        </API>
                    </MultiApi>
                </xsl:for-each>
            </xsl:copy>
        </xsl:template>
    
    </xsl:stylesheet>
    

    Its output is:

    <?xml version="1.0" encoding="UTF-8"?>
    <Root>
        <MultiApi>
            <API>
                <Input>
                    <Order test="0001">
                        <OrderLines>
                            <OrderLine test1="123"/>
                        </OrderLines>
                    </Order>
                </Input>
            </API>
        </MultiApi>
        <MultiApi>
            <API>
                <Input>
                    <Order test="0002">
                        <OrderLines>
                            <OrderLine test1="456"/>
                        </OrderLines>
                    </Order>
                </Input>
            </API>
        </MultiApi>
        <MultiApi>
            <API>
                <Input>
                    <Order test="0003">
                        <OrderLines>
                            <OrderLine test1="789"/>
                        </OrderLines>
                    </Order>
                </Input>
            </API>
        </MultiApi>
    </Root>