|
Subject: [xsl] Re: Anyone implemented a fuzzy matcher in XPath? From: "Roger L. Cauvin" <roger@xxxxxxxxxx> Date: Wed, 30 Jan 2013 05:15:38 -0600 |
Has anyone implemented a fuzzy matcher (approximate string matcher [1]) in XPath?
<xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform" xmlns:str="http://exslt.org/strings" extension-element-prefixes="str">
<xsl:variable name="lower-case-letters">abcdefghijklmnopqrstuvwxyz</xsl:variable> <xsl:variable name="upper-case-letters">ABCDEFGHIJKLMNOPQRSTUVWXYZ</xsl:variable>
<xsl:template name="compare-strings">
<xsl:param name="string1"/>
<xsl:param name="string2"/> <xsl:variable name="pairs1">
<xsl:call-template name="get-word-letter-pairs">
<xsl:with-param name="string" select="normalize-space(translate($string1, $lower-case-letters, $upper-case-letters))"/>
</xsl:call-template>
</xsl:variable> <xsl:variable name="pairs2">
<xsl:call-template name="get-word-letter-pairs">
<xsl:with-param name="string" select="normalize-space(translate($string2, $lower-case-letters, $upper-case-letters))"/>
</xsl:call-template>
</xsl:variable> <xsl:call-template name="compare-pairs">
<xsl:with-param name="pairs1" select="$pairs1"/>
<xsl:with-param name="pairs2" select="$pairs2"/>
</xsl:call-template> <xsl:template name="compare-pairs">
<xsl:param name="pairs1"/>
<xsl:param name="pairs2"/> <xsl:variable name="num-pairs1" select="string-length($pairs1) div 3"/>
<xsl:variable name="num-pairs2" select="string-length($pairs2) div 3"/>
<xsl:variable name="union" select="$num-pairs1 + $num-pairs2"/> <xsl:variable name="intersection">
<xsl:call-template name="intersect-remaining-pairs">
<xsl:with-param name="pairs1" select="$pairs1"/>
<xsl:with-param name="pairs2" select="$pairs2"/>
</xsl:call-template>
</xsl:variable> <xsl:template name="intersect-remaining-pairs">
<xsl:param name="pairs1"/>
<xsl:param name="pairs2"/>
<xsl:param name="intersection">0</xsl:param> <xsl:variable name="pair" select="substring-before($pairs1, ' ')"/>
<xsl:choose>
<xsl:when test="$pair = ''">
<xsl:value-of select="$intersection"/>
</xsl:when>
<xsl:when test="contains($pairs2, $pair)">
<xsl:call-template name="intersect-remaining-pairs">
<xsl:with-param name="pairs1" select="substring-after($pairs1, ' ')"/>
<xsl:with-param name="pairs2" select="concat(substring-before($pairs2, $pair), substring-after($pairs2, concat($pair, ' ')))"/>
<xsl:with-param name="intersection" select="$intersection + 1"/>
</xsl:call-template>
</xsl:when>
<xsl:otherwise>
<xsl:call-template name="intersect-remaining-pairs">
<xsl:with-param name="pairs1" select="substring-after($pairs1, ' ')"/>
<xsl:with-param name="pairs2" select="$pairs2"/>
<xsl:with-param name="intersection" select="$intersection"/>
</xsl:call-template>
</xsl:otherwise>
</xsl:choose> <xsl:template name="get-word-letter-pairs">
<xsl:param name="string"/>
<xsl:param name="pairs"></xsl:param> <xsl:choose>
<xsl:when test="$string = ''">
<xsl:value-of select="$pairs"/>
</xsl:when>
<xsl:otherwise>
<xsl:variable name="word">
<xsl:choose>
<xsl:when test="contains($string, ' ')">
<xsl:value-of select="substring-before($string, ' ')"/>
</xsl:when>
<xsl:otherwise>
<xsl:value-of select="$string"/>
</xsl:otherwise>
</xsl:choose>
</xsl:variable>
<xsl:variable name="letter-pairs">
<xsl:call-template name="get-letter-pairs">
<xsl:with-param name="word" select="$word"/>
</xsl:call-template>
</xsl:variable>
<xsl:call-template name="get-word-letter-pairs">
<xsl:with-param name="string" select="substring-after($string, ' ')"/>
<xsl:with-param name="pairs" select="concat($pairs, $letter-pairs)"/>
</xsl:call-template>
</xsl:otherwise>
</xsl:choose>
</xsl:template> <xsl:template name="get-letter-pairs">
<xsl:param name="word"/>
<xsl:param name="pairs"></xsl:param> <xsl:choose>
<xsl:when test="string-length($word) < 2">
<xsl:value-of select="$pairs"/>
</xsl:when>
<xsl:otherwise>
<xsl:call-template name="get-letter-pairs">
<xsl:with-param name="word" select="substring($word, 2, string-length($word) - 1)"/>
<xsl:with-param name="pairs" select="concat($pairs, substring($word, 1, 2), ' ')"/>
</xsl:call-template>
</xsl:otherwise>
</xsl:choose>
</xsl:template>-- Roger L. Cauvin "Smart product decisions" Twitter: @rcauvin http://blog.cauvin.org
| Current Thread |
|---|
|
| <- Previous | Index | Next -> |
|---|---|---|
| Re: [xsl] Info on serializer proper, G. Ken Holman | Thread | [xsl] Saxon via Ant - Getting start, Kerry, Richard |
| Re: [xsl] Are there any free, fully, James Fuller | Date | [xsl] Saxon via Ant - Getting start, Kerry, Richard |
| Month |