xquery自动换行

时间:2010-09-22 08:18:13

标签: xquery

我需要使用XQuery将长字符串换行为100个字符。换句话说,将一些空格更改为换行符,以便非语法行将短于100个字符。有一个简单的方法吗?

4 个答案:

答案 0 :(得分:9)

我认为你只需要这个XPath 2.0表达式:

replace(concat(normalize-space(text),' '),'(.{0,60}) ','$1
')

使用Dimitre的输入,输出:

Dec. 13 — As always for a presidential inaugural, security
and surveillance were extremely tight in Washington, DC,
last January. But as George W. Bush prepared to take the
oath of office, security planners installed an extra layer
of protection: a prototype software system to detect a
biological attack. The U.S. Department of Defense, together
with regional health and emergency-planning agencies,
distributed a special patient-query sheet to military
clinics, civilian hospitals and even aid stations along the
parade route and at the inaugural balls. Software quickly
analyzed complaints of seven key symptoms — from rashes to
sore throats — for patterns that might indicate the early
stages of a bio-attack. There was a brief scare: the system
noticed a surge in flulike symptoms at military clinics.
Thankfully, tests confirmed it was just that — the flu.

答案 1 :(得分:1)

如果您的行超过100个字符,则需要使用换行符替换前101个字符中的最后一组连续空格。如果前101个字符中没有空格,那么您只想替换行中的第一个空格然后可以递归地对字符串中的其余行应用相同的逻辑

这可以这样做:

declare function local:wrap-line($str)
{
  if (string-length($str) < 100 or not(contains($str," ")))
  then $str
  else 
    let $wrapped := if (contains(substring($str,1,101)," "))
                    then replace($str, "^(.{0,99}[^ ]) +", "$1&#10;")
                    else replace($str, "^(.*?) ", "$1&#10;")
    return concat(substring-before($wrapped, "&#10;"), "&#10;",
                  local:wrap-line(substring-after($wrapped, "&#10;")))
};

declare function local:word-wrap($str)
{
  string-join(
    for $line in tokenize($str,"&#10;")
    return local:wrap-line($line),
    "&#10;")
};

这是有效的,因为(.{0,99}[^ ]) +匹配最长的100个字符系列,这些字符不是以空格结尾,后跟多个空格,而(.*?)匹配以空格结尾的最短字符系列。

代码几乎不是最优的,并且需要针对退化情况进行改进(例如,以几个空格结尾的文本行,但它确实有效。

答案 2 :(得分:1)

我不太了解XQuery在XQuery中表达这个XSLT解决方案,但我认为提供它可能会有所帮助。

请注意,在典型的realworld案例中,单词由多个分隔符分隔。以下解决方案将参数中指定的所有字符视为分隔符,并将每一行拆分为最大长度边界。它是XSLT 1.0或2.0的函数/模板的FXSL库的一部分。

<xsl:stylesheet version="1.0"
xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
xmlns:f="http://fxsl.sf.net/"
xmlns:ext="http://exslt.org/common"
xmlns:str-split2lines-func="f:str-split2lines-func"
exclude-result-prefixes="xsl f ext str-split2lines-func"
>


   <xsl:import href="dvc-str-foldl.xsl"/>

   <str-split2lines-func:str-split2lines-func/>

   <xsl:output indent="yes" omit-xml-declaration="yes"/>

    <xsl:template match="/">
      <xsl:call-template name="str-split-to-lines">
        <xsl:with-param name="pStr" select="/*"/>
        <xsl:with-param name="pLineLength" select="60"/>
        <xsl:with-param name="pDelimiters" select="' &#9;&#10;&#13;'"/>
      </xsl:call-template>
    </xsl:template>

    <xsl:template name="str-split-to-lines">
      <xsl:param name="pStr"/>
      <xsl:param name="pLineLength" select="60"/>
      <xsl:param name="pDelimiters" select="' &#9;&#10;&#13;'"/>

      <xsl:variable name="vsplit2linesFun"
                    select="document('')/*/str-split2lines-func:*[1]"/>

      <xsl:variable name="vrtfParams">
       <delimiters><xsl:value-of select="$pDelimiters"/></delimiters>
       <lineLength><xsl:copy-of select="$pLineLength"/></lineLength>
      </xsl:variable>

      <xsl:variable name="vResult">
          <xsl:call-template name="dvc-str-foldl">
            <xsl:with-param name="pFunc" select="$vsplit2linesFun"/>
            <xsl:with-param name="pStr" select="$pStr"/>
            <xsl:with-param name="pA0" select="ext:node-set($vrtfParams)"/>
          </xsl:call-template>
      </xsl:variable>
      <xsl:for-each select="ext:node-set($vResult)/line">
        <xsl:for-each select="word">
          <xsl:value-of select="concat(., ' ')"/>
        </xsl:for-each>
        <xsl:value-of select="'&#xA;'"/>
      </xsl:for-each>
    </xsl:template>

    <xsl:template match="str-split2lines-func:*" mode="f:FXSL">
      <xsl:param name="arg1" select="/.."/>
      <xsl:param name="arg2"/>

      <xsl:copy-of select="$arg1/*[position() &lt; 3]"/>
      <xsl:copy-of select="$arg1/line[position() != last()]"/>

      <xsl:choose>
        <xsl:when test="contains($arg1/*[1], $arg2)">
          <xsl:if test="string($arg1/word) or string($arg1/line/word)">
             <xsl:call-template name="fillLine">
               <xsl:with-param name="pLine" select="$arg1/line[last()]"/>
               <xsl:with-param name="pWord" select="$arg1/word"/>
               <xsl:with-param name="pLineLength" select="$arg1/*[2]"/>
             </xsl:call-template>
          </xsl:if>
        </xsl:when>
        <xsl:otherwise>
          <xsl:copy-of select="$arg1/line[last()]"/>
          <word><xsl:value-of select="concat($arg1/word, $arg2)"/></word>
        </xsl:otherwise>
      </xsl:choose>
    </xsl:template>

      <!-- Test if the new word fits into the last line -->
    <xsl:template name="fillLine">
      <xsl:param name="pLine" select="/.."/>
      <xsl:param name="pWord" select="/.."/>
      <xsl:param name="pLineLength" />

      <xsl:variable name="vnWordsInLine" select="count($pLine/word)"/>
      <xsl:variable name="vLineLength" 
       select="string-length($pLine) + $vnWordsInLine"/>
      <xsl:choose>
        <xsl:when test="not($vLineLength + string-length($pWord) 
                           > 
                            $pLineLength)">
          <line>
            <xsl:copy-of select="$pLine/*"/>
            <xsl:copy-of select="$pWord"/>
          </line>
        </xsl:when>
        <xsl:otherwise>
          <xsl:copy-of select="$pLine"/>
          <line>
            <xsl:copy-of select="$pWord"/>
          </line>
          <word/>
        </xsl:otherwise>
      </xsl:choose>
    </xsl:template>

</xsl:stylesheet>

对以下XML文档应用此转换

<text>
Dec. 13 — As always for a presidential inaugural, security and surveillance were
extremely tight in Washington, DC, last January. But as George W. Bush prepared to
take the oath of office, security planners installed an extra layer of protection: a
prototype software system to detect a biological attack. The U.S. Department of
Defense, together with regional health and emergency-planning agencies, distributed
a special patient-query sheet to military clinics, civilian hospitals and even aid
stations along the parade route and at the inaugural balls. Software quickly
analyzed complaints of seven key symptoms — from rashes to sore throats — for
patterns that might indicate the early stages of a bio-attack. There was a brief
scare: the system noticed a surge in flulike symptoms at military clinics.
Thankfully, tests confirmed it was just that — the flu.
</text>

生成所需结果(行数不超过60个字符):

Dec. 13 — As always for a presidential inaugural, security 
and surveillance were extremely tight in Washington, DC, 
last January. But as George W. Bush prepared to take the 
oath of office, security planners installed an extra layer 
of protection: a prototype software system to detect a 
biological attack. The U.S. Department of Defense, together 
with regional health and emergency-planning agencies, 
distributed a special patient-query sheet to military 
clinics, civilian hospitals and even aid stations along the 
parade route and at the inaugural balls. Software quickly 
analyzed complaints of seven key symptoms — from rashes to 
sore throats — for patterns that might indicate the early 
stages of a bio-attack. There was a brief scare: the system 
noticed a surge in flulike symptoms at military clinics. 
Thankfully, tests confirmed it was just that — the flu. 

答案 3 :(得分:0)

尝试使用以下XQuery函数:这可以自动换行任何文本。

要传递的参数: 1. $ Text - 文字到自动换行 2. 50 -Word换行长度 “” “ - 自动换行 - 新行字符 4. 0 - 起始位置

declare function xf:wrap-string($str as xs:string,
                                $wrap-col as xs:integer,
                                $break-mark as xs:string,
                                $pos as xs:integer)
    as xs:string {
       if(fn:contains( $str, ' ' )) then 
        let $first-word := fn:substring-before( $str, ' ' )
        let $pos-now := xs:integer($pos + 1 + string-length($first-word))
        return
            if ($pos>0 and $pos-now>=$wrap-col) then
                 concat($break-mark,
                 xf:wrap-string($str,$wrap-col,$break-mark,xs:integer(0)))
            else
                concat($first-word,' ',
                 xf:wrap-string(substring-after( $str, ' ' ),
                               $wrap-col,
                               $break-mark,
                               $pos-now))
       else(
        if ($pos+string-length($str)>$wrap-col) then
            concat($break-mark,$str)
        else ($str)
       )
};

    declare function xf:wrap-test($str as xs:string,
                                    $wrap-col as xs:integer,
                                    $break-mark as xs:string,
                                    $pos as xs:integer)
     as xs:string {
            let $Result := xf:wrap-string($str,$wrap-col,$break-mark,$pos)
            return
            if (fn:contains($Result,'&#10;')) then
                fn:string-join(for $line in tokenize($Result, '&#10;')
                                return
                                if (fn:string-length($line)<50) then
                                    xf:pad-string-to-length(string($line),50)
                                else ($line),
                '')
            else $Result 
     }; 

    xf:wrap-test($Text,50,"&#10;",0)

Parameters to pass: 
1. $Text - Text to word wrap
2. 50 -Word wrap string length
3. "&#10;" - After word wrap - new line character
4. 0 - Starting position