Skip to content

Commit

Permalink
Add an attribute to the vertical with the decomposed unicode represen…
Browse files Browse the repository at this point in the history
…tation
  • Loading branch information
simar0at committed Jun 21, 2024
1 parent c120958 commit 6e4be3f
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 3 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -78,7 +78,7 @@
</xsl:template>
<xsl:template name="noske-token">
<xsl:value-of
select="concat(string-join((normalize-space(.), @xtoks:id[parent::xtoks:w], tei:sort-attrs(.)), '&#x9;'), '&#xA;')"
select="concat(string-join((normalize-unicode(normalize-space(.), 'NFC'), @xtoks:id[parent::xtoks:w], normalize-unicode(normalize-space(.), 'NFD'), tei:sort-attrs(.)), '&#x9;'), '&#xA;')"
/>
</xsl:template>
<xsl:template match="xtoks:w | xtoks:pc">
Expand Down
7 changes: 5 additions & 2 deletions nosketchengine/shawi
Original file line number Diff line number Diff line change
Expand Up @@ -21,14 +21,17 @@ TAGSETDOC ""
ATTRIBUTE "word" {
TYPE "MD_MD"
}
# MULTIVALUE y
# MULTISEP ","

## column #2
ATTRIBUTE "wid" {
TYPE "MD_MD"
}

## column #3 used for the decomposed version of the word
ATTRIBUTE "decomp" {
TYPE "MD_MD"
}

## column #4
ATTRIBUTE "ana" {
TYPE "MD_MD"
Expand Down

0 comments on commit 6e4be3f

Please sign in to comment.