Module:NormalizationDiacritic: Difference between revisions

// via Wikitext Extension for VSCode
// via Wikitext Extension for VSCode
 
Line 1: Line 1:
-- Module:NormalizationDiacritic
--[[
-- Removes diacritics from text for word matching.
* Name: NormalizationDiacritic
-- Features:
* Author: Mark W. Datysgeld
--  * Supports Latin and Cyrillic scripts
* Description: Diacritic removal for text normalization in word matching, supporting Latin and Cyrillic scripts
--  * Normalizes apostrophe variants (straight ' and typographic ’)
* Notes: Normalizes apostrophe variants; UTF-8 compatible; case-preserving; uses performant gmatch and table.concat pattern for UTF-8 processing; includes caching for performance; avoids string.gsub for better UTF-8 handling
--  * UTF-8 compatible
]]
--  * Case-preserving
--
-- Usage:
--  local DiacriticNormalization = require('Module:NormalizationDiacritic')
--  local normalized = DiacriticNormalization.removeDiacritics("Français")  -- Returns "Francais"


local p = {}
local p = {}