Module:A or an/sandbox

MyWikiBiz, Author Your Legacy — Monday November 25, 2024
< Module:A or an
Revision as of 18:13, 8 July 2021 by Zoran (talk | contribs) (Moved page from wikipedia:en:Module:A or an/sandbox)
(diff) ← Older revision | Latest revision (diff) | Newer revision → (diff)
Jump to navigationJump to search

Documentation for this module may be created at Module:A or an/sandbox/doc

local p = {}
local words = mw.loadData('Module:A or an/words/sandbox')

local lcVChars = 'aeiouà-æè-ïò-öø-üāăąēĕėęěĩīĭįıijōŏőœũūŭůűų'
local ucVvChars = 'AEFHILMNORSXÀ-ÆÈ-ÏÒ-ÖØĀĂĄĒĔĖĘĚĨĪĬĮıIJŌŎŐŒÑĤĦĹĻĽĿŁŃŅŇŊŔŖŘŚŜŞ'

local function findWord(s, t)
	for i, v in ipairs(t) do
		if mw.ustring.find(s, '^' .. v .. '$') then
			return true
		end
	end
end

function p._main(args)
	local s = args[1] and mw.text.trim(args[1])
	local pron = 'a'
	local ret = ''
	
	if s and s ~= '' then
		local origStr = s
		
		s = mw.ustring.gsub(s, '</?[A-Za-z][^>]->', '') -- Remove HTML tags
		s = mw.ustring.gsub(s, '%[%[[^%|]+%|(..-)%]%]', '%1') -- Remove wikilinks
		s = mw.ustring.gsub(mw.ustring.gsub(s, '%[%[', ''), '%]%]', '')
		s = mw.ustring.gsub(s, '^["%$\'%(<%[%{¢-¥₠-₿]+', '') -- Strip some symbols at the beginning
		s = mw.ustring.match(s, '^%.?[0-9%u%l]+') or s -- Extract the first word
		
		if mw.ustring.find(s, '^[0-9]') then -- It begins with a number
			s = mw.ustring.match(s, '^[0-9]+') -- Extract the number
			if findWord(s, words['vNums']) then -- '18' etc.
				pron = 'an'
			end
		elseif mw.ustring.match(s, '^[0-9%u]+$') then -- It looks like an acronym
			if mw.ustring.find(s, '^[' .. ucVvChars .. ']')
				and not findWord(s, words['cvAcronyms']) -- Exclude 'NASA' etc.
				or findWord(s, words['vvAcronyms']) -- 'UNRWA' etc.
			then
				pron = 'an'
			end
		else
			s = mw.ustring.lower(s) -- Uncapitalize
			if mw.ustring.find(s, '^['.. lcVChars .. ']') then -- It begins with a vowel
				if not findWord(s, words['vcWords']) -- Exclude 'euro' etc.
					or findWord(s, words['vvWords']) -- But not 'Euler' etc.
				then
					pron = 'an'
				end
			elseif args.variety and mw.ustring.lower(args.variety) == 'us' -- 'herb' etc.
				and findWord(s, words['cvWordsUS'])
				or findWord(s, words['cvWords']) -- 'hour' etc.
			then
				pron = 'an'
			end
		end
		ret = pron .. ' ' .. origStr
	end
	
	return ret
end

function p.main(frame)
	return p._main(frame:getParent().args)
end

return p