Module:ConvertNumeric: Difference between revisions

(2 intermediate revisions by 2 users not shown)

Line 3:

-- When editing, preview with: [[Module_talk:ConvertNumeric/testcases]]

-- First, edit [[Module:ConvertNumeric/sandbox]], then preview with [[Module_talk:ConvertNumeric/sandbox/testcases]]

require('strict')

local ones_position = {

Line 189:

Line 190:

}

local ~~eng_lt20 = {~~

local engord_tens_end = {

~~['zeroth'] = 0,~~

['twentieth'] = 20,

~~['first'] = 1,~~

['thirtieth'] = 30,

~~['second'] = 2,~~

['fortieth'] = 40,

~~['third'] = 3,~~

['fiftieth'] = 50,

~~['fourth'] = 4,~~

['sixtieth'] = 60,

~~['fifth'] = 5,~~

['seventieth'] = 70,

~~['sixth'] = 6,~~

['eightieth'] = 80,

~~['seventh'] = 7,~~

['ninetieth'] = 90,

~~['eighth'] = 8,~~

~~['ninth'] = 9,~~

~~['tenth'] = 10,~~

~~['eleventh'] = 11,~~

~~['twelfth'] = 12,~~

~~['thirteenth'] = 13,~~

~~['fourteenth'] = 14,~~

~~['fifteenth'] = 15,~~

~~['sixteenth'] = 16,~~

~~['seventeenth'] = 17,~~

~~['eighteenth'] = 18,~~

~~['nineteenth'] = 19,~~

}

~~local eng_tens_end~~ = {

['twentieth'] = 20,

['thirtieth'] = 30,

['fortieth'] = 40,

['fiftieth'] = 50,

['sixtieth'] = 60,

['seventieth'] = 70,

['eightieth'] = 80,

['ninetieth'] = 90,

}

local eng_tens_cont = {

['twenty'] = 20,

['thirty'] = 30,

['forty'] = 40,

['fifty'] = 50,

['sixty'] = 60,

['seventy'] = 70,

['eighty'] = 80,

['ninety'] = 90,

}

-- Converts a given valid roman numeral (and some invalid roman numerals) to a number. Returns -1, errorstring on error

-- Converts a given valid roman numeral (and some invalid roman numerals) to a number. Returns { -1, errorstring } on error.

local function roman_to_numeral(roman)

if type(roman) ~= "string" then return -1, "roman numeral not a string" end

Line 259:

Line 239:

end

-- Converts a given integer between 0 and 100 to English text (e.g. 47 -> forty-seven)

-- Converts a given integer between 0 and 100 to English text (e.g. 47 -> forty-seven).

local function numeral_to_english_less_100(num, ordinal, plural, zero)

local terminal_ones, terminal_tens

Line 290:

Line 270:

end

-- Converts a given integer (in string form) between 0 and 1000 to English text (e.g. 47 -> forty-seven)

-- Converts a given integer (in string form) between 0 and 1000 to English text (e.g. 47 -> forty-seven).

local function numeral_to_english_less_1000(num, use_and, ordinal, plural, zero)

num = tonumber(num)

Line 302:

Line 282:

end

-- Converts an English-text ~~ordinal between~~ 'zeroth' ~~and~~ 'ninety-ninth' to a number [0–99], else -1

-- Converts an ordinal in English text from 'zeroth' to 'ninety-ninth' inclusive to a number [0–99], else -1.

local function english_to_ordinal(english)

local eng = string.lower(english or '')

local ~~eng_lt20~~ = ~~eng_lt20~~

local engord_lt20 = {} -- ones_position_ord{} keys & values swapped

local ~~eng_tens_end~~ = ~~eng_tens_end~~

for k, v in pairs( ones_position_ord ) do

local ~~eng_tens_cont~~ = ~~eng_tens_cont~~

engord_lt20[v] = k

end

if engord_lt20[eng] then

return engord_lt20[eng] -- e.g. first -> 1

elseif engord_tens_end[eng] then

return engord_tens_end[eng] -- e.g. ninetieth -> 90

else

local tens, ones = string.match(eng, '^([a-z]+)[%s%-]+([a-z]+)$')

if tens and ones then

local tens_cont = eng_tens_cont[tens]

local ones_end = engord_lt20[ones]

if tens_cont and ones_end then

return tens_cont + ones_end -- e.g. ninety-ninth -> 99

end

return -1 -- Failed

end

-- Converts a number in English text from 'zero' to 'ninety-nine' inclusive to a number [0–99], else -1.

local function english_to_numeral(english)

local eng = string.lower(english or '')

local eng_lt20 = { ['single'] = 1 } -- ones_position{} keys & values swapped

for k, v in pairs( ones_position ) do

eng_lt20[v] = k

end

if eng_lt20[eng] then

return eng_lt20[eng] --e.g. ~~first~~ -> 1

return eng_lt20[eng] -- e.g. one -> 1

elseif ~~eng_tens_end~~[eng] then

elseif eng_tens_cont[eng] then

return ~~eng_tens_end~~[eng] --e.g. ~~ninetieth~~ -> 90

return eng_tens_cont[eng] -- e.g. ninety -> 90

else

local tens, ones = string.match(eng, '^([a-z]+)%-([a-z]+)$')

local tens, ones = string.match(eng, '^([a-z]+)[%s%-]+([a-z]+)$')

if tens and ones then

local tens_cont = eng_tens_cont[tens]

local ones_end = eng_lt20[ones]

if tens_cont and ones_end then

return tens_cont + ones_end --e.g. ninety-~~ninth~~ -> 99

return tens_cont + ones_end -- e.g. ninety-nine -> 99

end

return -1 --~~failed~~

return -1 -- Failed

end

Line 380:

Line 387:

end

-- Rounds a number to the nearest two-word number (round = up, down, or "on" for round to nearest)

-- Rounds a number to the nearest two-word number (round = up, down, or "on" for round to nearest).

-- Numbers with two digits before the decimal will be rounded to an integer as specified by round.

-- Larger numbers will be rounded to a number with only one nonzero digit in front and all other digits zero.

Line 515:

Line 522:

-- capitalize (boolean): whether to capitalize the result (e.g. 'One' instead of 'one')

-- use_and (boolean): whether to use the word 'and' between tens/ones place and higher places

-- hyphenate (boolean): whether to hyphenate all words in the result, useful ~~for use~~ as an adjective

-- hyphenate (boolean): whether to hyphenate all words in the result, useful as an adjective

-- ordinal (boolean): whether to produce an ordinal (e.g. 'first' instead of 'one')

-- plural (boolean): whether to pluralize the resulting number

Line 620:

Line 627:

local function _numeral_to_english2(args)

local num = args.num

local num = tostring(args.num)

~~if (not tonumber(num)) then~~

num = num:gsub("^%s*(.-)%s*$", "%1") -- Trim whitespace

num = num:gsub(",", "") -- Remove commas

num = num:gsub("^<span[^<>]*></span>", "") -- Generated by Template:age

if num ~= '' then -- a fraction may have an empty whole number

if not num:find("^%-?%d*%.?%d*%-?[Ee]?[+%-]?%d*$") then

-- Input not in a valid format, try to eval it as an expr to see

-- Input not in a valid format, try to ~~pass~~ it ~~through #~~expr to see

-- if that produces a number (e.g. "3 + 5" will become "8").

local noerr, result = pcall(mw.ext.ParserFunctions.expr, num)

~~num~~ = mw.~~getCurrentFrame():preprocess('{{#expr: '~~ .. num ~~.. '}}'~~)

if noerr then

num = result

end

-- ~~Pass args from frame to~~ helper function

-- Call helper function passing args

return _numeral_to_english(

num,

Line 656:

Line 664:

roman_to_numeral = roman_to_numeral,

spell_number = _numeral_to_english,

spell_number2 = _numeral_to_english2,

english_to_ordinal = english_to_ordinal,

english_to_numeral = english_to_numeral,

}

Line 666:

Line 675:

function p._english_to_ordinal(frame) -- callable via {{#invoke:ConvertNumeric|_english_to_ordinal|First}}

return english_to_ordinal(frame.args[1])

end

function p._english_to_numeral(frame) -- callable via {{#invoke:ConvertNumeric|_english_to_numeral|One}}

return english_to_numeral(frame.args[1])

end

function p.numeral_to_english(frame)

local args = frame.args

~~local num = args[1]~~

-- Tail call to helper function passing args from frame

~~num = num:gsub("^%s*(.~~-~~)%s*$", "%1")~~ -~~- Trim whitespace~~

return _numeral_to_english2{

~~num = num:gsub(",", "") -- Remove commas~~

['num'] = args[1],

num = ~~num:gsub("^<span~~[~~^<>~~]*></span>", ~~"") -- Generated by Template:age~~

['numerator'] = args['numerator'],

~~if num ~=~~ '' ~~then -- a fraction may have an empty whole number~~

['denominator'] = args['denominator'],

~~if not num:find("^%-?%d*%.?%d*%-?[Ee~~]?[~~+%-]?%d*$") then~~

['capitalize'] = args['case'] == 'U' or args['case'] == 'u',

~~-- Input not in a valid format, try to pass it through #expr to see~~

['use_and'] = args['sp'] ~= 'us',

~~-- if that produces a number (e.g. "3 + 5" will become "8").~~

['hyphenate'] = args['adj'] == 'on',

~~num = frame:preprocess(~~'~~{{#expr:~~ ' ~~.. num .. '}}')~~

['ordinal'] = args['ord'] == 'on',

~~end~~

['plural'] = args['pl'] == 'on',

~~end~~

['links'] = args['lk'],

['negative_word'] = args['negative'],

~~-- Pass args from frame to helper function~~

['round'] = args['round'],

~~return _numeral_to_english(~~

['zero'] = args['zero'],

~~num~~,

['use_one'] = args['one'] == 'one' -- experiment: using '|one=one' makes fraction 2+1/2 give "two and one-half" instead of "two and a half"

~~args~~['~~numerator~~'],

}

args['denominator'],

args['case'] == 'U' or args['case'] == 'u',

args['sp'] ~= 'us',

args['adj'] == 'on',

args['ord'] == 'on',

args['pl'] == 'on',

args['lk'],

args['negative'],

args['round'],

args['zero'],

args['one'] == 'one' -- experiment: using '|one=one' makes fraction 2+1/2 give "two and one-half" instead of "two and a half"

~~) or ''~~

end

Line 707:

Line 708:

if div >= 1 then return decToHexDigit(div)..dig[mod+1] else return dig[mod+1] end

end -- I think this is supposed to be done with a tail call but first I want something that works at all

---- finds all the decimal numbers in the input text and hexes each of them

function p.decToHex(frame)

@@ Line 3: / Line 3: @@
 -- When editing, preview with: [[Module_talk:ConvertNumeric/testcases]]
 -- First, edit [[Module:ConvertNumeric/sandbox]], then preview with [[Module_talk:ConvertNumeric/sandbox/testcases]]
+require('strict')
 local ones_position = {
@@ Line 189: / Line 190: @@
 }
-local eng_lt20 = {
+local engord_tens_end  = {
-	['zeroth']      =  0,
+	['twentieth']	= 20,
-	['first']       =  1,
+	['thirtieth']	= 30,
-	['second']      =  2,
+	['fortieth']	= 40,
-	['third']       =  3,
+	['fiftieth']	= 50,
-	['fourth']      =  4,
+	['sixtieth']	= 60,
-	['fifth']       =  5,
+	['seventieth']	= 70,
-	['sixth']       =  6,
+	['eightieth']	= 80,
-	['seventh']     =  7,
+	['ninetieth']	= 90,
-	['eighth']      =  8,
-	['ninth']       =  9,
-	['tenth']       = 10,
-	['eleventh']    = 11,
-	['twelfth']     = 12,
-	['thirteenth']  = 13,
-	['fourteenth']  = 14,
-	['fifteenth']   = 15,
-	['sixteenth']   = 16,
-	['seventeenth'] = 17,
-	['eighteenth']  = 18,
-	['nineteenth']  = 19,
-}
-local eng_tens_end  = {
-	['twentieth']  = 20,
-	['thirtieth']  = 30,
-	['fortieth']   = 40,
-	['fiftieth']   = 50,
-	['sixtieth']   = 60,
-	['seventieth'] = 70,
-	['eightieth']  = 80,
-	['ninetieth']  = 90,
 }
 local eng_tens_cont = {
-	['twenty']  = 20,
+	['twenty']	= 20,
-	['thirty']  = 30,
+	['thirty']	= 30,
-	['forty']   = 40,
+	['forty']	= 40,
-	['fifty']   = 50,
+	['fifty']	= 50,
-	['sixty']   = 60,
+	['sixty']	= 60,
-	['seventy'] = 70,
+	['seventy']	= 70,
-	['eighty']  = 80,
+	['eighty']	= 80,
-	['ninety']  = 90,
+	['ninety']	= 90,
 }
--- Converts a given valid roman numeral (and some invalid roman numerals) to a number. Returns -1, errorstring on error
+-- Converts a given valid roman numeral (and some invalid roman numerals) to a number. Returns { -1, errorstring } on error.
 local function roman_to_numeral(roman)
 	if type(roman) ~= "string" then return -1, "roman numeral not a string" end
@@ Line 259: / Line 239: @@
 end
--- Converts a given integer between 0 and 100 to English text (e.g. 47 -> forty-seven)
+-- Converts a given integer between 0 and 100 to English text (e.g. 47 -> forty-seven).
 local function numeral_to_english_less_100(num, ordinal, plural, zero)
 	local terminal_ones, terminal_tens
@@ Line 290: / Line 270: @@
 end
--- Converts a given integer (in string form) between 0 and 1000 to English text (e.g. 47 -> forty-seven)
+-- Converts a given integer (in string form) between 0 and 1000 to English text (e.g. 47 -> forty-seven).
 local function numeral_to_english_less_1000(num, use_and, ordinal, plural, zero)
 	num = tonumber(num)
@@ Line 302: / Line 282: @@
 end
--- Converts an English-text ordinal between 'zeroth' and 'ninety-ninth' to a number [0–99], else -1
+-- Converts an ordinal in English text from 'zeroth' to 'ninety-ninth' inclusive to a number [0–99], else -1.
 local function english_to_ordinal(english)
 	local eng = string.lower(english or '')
-	local eng_lt20 = eng_lt20
+	local engord_lt20 = {} -- ones_position_ord{} keys & values swapped
-	local eng_tens_end = eng_tens_end
+	for k, v in pairs( ones_position_ord ) do
-	local eng_tens_cont = eng_tens_cont
+		engord_lt20[v] = k
+	end
+	if engord_lt20[eng] then
+		return engord_lt20[eng] -- e.g. first -> 1
+	elseif engord_tens_end[eng] then
+		return engord_tens_end[eng] -- e.g. ninetieth -> 90
+	else
+		local tens, ones = string.match(eng, '^([a-z]+)[%s%-]+([a-z]+)$')
+		if tens and ones then
+			local tens_cont = eng_tens_cont[tens]
+			local ones_end  = engord_lt20[ones]
+			if tens_cont and ones_end then
+				return tens_cont + ones_end -- e.g. ninety-ninth -> 99
+			end
+		end
+	end
+	return -1 -- Failed
+end
+-- Converts a number in English text from 'zero' to 'ninety-nine' inclusive to a number [0–99], else -1.
+local function english_to_numeral(english)
+	local eng = string.lower(english or '')
+	local eng_lt20 = { ['single'] = 1 } -- ones_position{} keys & values swapped
+	for k, v in pairs( ones_position ) do
+		eng_lt20[v] = k
+	end
 	if eng_lt20[eng] then
-		return eng_lt20[eng] --e.g. first -> 1
+		return eng_lt20[eng] -- e.g. one -> 1
-	elseif eng_tens_end[eng] then
+	elseif eng_tens_cont[eng] then
-		return eng_tens_end[eng] --e.g. ninetieth -> 90
+		return eng_tens_cont[eng] -- e.g. ninety -> 90
 	else
-		local tens, ones = string.match(eng, '^([a-z]+)%-([a-z]+)$')
+		local tens, ones = string.match(eng, '^([a-z]+)[%s%-]+([a-z]+)$')
 		if tens and ones then
 			local tens_cont = eng_tens_cont[tens]
 			local ones_end  = eng_lt20[ones]
 			if tens_cont and ones_end then
-				return tens_cont + ones_end --e.g. ninety-ninth -> 99
+				return tens_cont + ones_end -- e.g. ninety-nine -> 99
 			end
 		end
 	end
-	return -1 --failed
+	return -1 -- Failed
 end
@@ Line 380: / Line 387: @@
 end
--- Rounds a number to the nearest two-word number (round = up, down, or "on" for round to nearest)
+-- Rounds a number to the nearest two-word number (round = up, down, or "on" for round to nearest).
 -- Numbers with two digits before the decimal will be rounded to an integer as specified by round.
 -- Larger numbers will be rounded to a number with only one nonzero digit in front and all other digits zero.
@@ Line 515: / Line 522: @@
 -- capitalize (boolean): whether to capitalize the result (e.g. 'One' instead of 'one')
 -- use_and (boolean): whether to use the word 'and' between tens/ones place and higher places
--- hyphenate (boolean): whether to hyphenate all words in the result, useful for use as an adjective
+-- hyphenate (boolean): whether to hyphenate all words in the result, useful as an adjective
 -- ordinal (boolean): whether to produce an ordinal (e.g. 'first' instead of 'one')
 -- plural (boolean): whether to pluralize the resulting number
@@ Line 620: / Line 627: @@
 local function _numeral_to_english2(args)
-	local num = args.num
+	local num = tostring(args.num)
-	if (not tonumber(num)) then
+	num = num:gsub("^%s*(.-)%s*$", "%1")   -- Trim whitespace
-		num = num:gsub("^%s*(.-)%s*$", "%1")   -- Trim whitespace
+	num = num:gsub(",", "")   -- Remove commas
-		num = num:gsub(",", "")   -- Remove commas
+	num = num:gsub("^<span[^<>]*></span>", "") -- Generated by Template:age
-		num = num:gsub("^<span[^<>]*></span>", "") -- Generated by Template:age
+	if num ~= '' then  -- a fraction may have an empty whole number
-		if num ~= '' then  -- a fraction may have an empty whole number
+		if not num:find("^%-?%d*%.?%d*%-?[Ee]?[+%-]?%d*$") then
-			if not num:find("^%-?%d*%.?%d*%-?[Ee]?[+%-]?%d*$") then
+			-- Input not in a valid format, try to eval it as an expr to see
-				-- Input not in a valid format, try to pass it through #expr to see
+			-- if that produces a number (e.g. "3 + 5" will become "8").
-				-- if that produces a number (e.g. "3 + 5" will become "8").
+			local noerr, result = pcall(mw.ext.ParserFunctions.expr, num)
-				num = mw.getCurrentFrame():preprocess('{{#expr: ' .. num .. '}}')
+			if noerr then
+				num = result
 			end
 		end
 	end
-	-- Pass args from frame to helper function
+	-- Call helper function passing args
 	return _numeral_to_english(
 		num,
@@ Line 656: / Line 664: @@
 	roman_to_numeral = roman_to_numeral,
 	spell_number = _numeral_to_english,
 	spell_number2 = _numeral_to_english2,
 	english_to_ordinal = english_to_ordinal,
+	english_to_numeral = english_to_numeral,
 }
@@ Line 666: / Line 675: @@
 function p._english_to_ordinal(frame) -- callable via {{#invoke:ConvertNumeric|_english_to_ordinal|First}}
 	return english_to_ordinal(frame.args[1])
+end
+function p._english_to_numeral(frame) -- callable via {{#invoke:ConvertNumeric|_english_to_numeral|One}}
+	return english_to_numeral(frame.args[1])
 end
 function p.numeral_to_english(frame)
 	local args = frame.args
-	local num = args[1]
+	-- Tail call to helper function passing args from frame
-	num = num:gsub("^%s*(.-)%s*$", "%1")   -- Trim whitespace
+	return _numeral_to_english2{
-	num = num:gsub(",", "")   -- Remove commas
+		['num'] = args[1],
-	num = num:gsub("^<span[^<>]*></span>", "") -- Generated by Template:age
+		['numerator'] = args['numerator'],
-	if num ~= '' then  -- a fraction may have an empty whole number
+		['denominator'] = args['denominator'],
-		if not num:find("^%-?%d*%.?%d*%-?[Ee]?[+%-]?%d*$") then
+		['capitalize'] = args['case'] == 'U' or args['case'] == 'u',
-			-- Input not in a valid format, try to pass it through #expr to see
+		['use_and'] = args['sp'] ~= 'us',
-			-- if that produces a number (e.g. "3 + 5" will become "8").
+		['hyphenate'] = args['adj'] == 'on',
-			num = frame:preprocess('{{#expr: ' .. num .. '}}')
+		['ordinal'] = args['ord'] == 'on',
-		end
+		['plural'] = args['pl'] == 'on',
-	end
+		['links'] = args['lk'],
+		['negative_word'] = args['negative'],
-	-- Pass args from frame to helper function
+		['round'] = args['round'],
-	return _numeral_to_english(
+		['zero'] = args['zero'],
-		num,
+		['use_one'] = args['one'] == 'one'  -- experiment: using '|one=one' makes fraction 2+1/2 give "two and one-half" instead of "two and a half"
-		args['numerator'],
+	}
-		args['denominator'],
-		args['case'] == 'U' or args['case'] == 'u',
-		args['sp'] ~= 'us',
-		args['adj'] == 'on',
-		args['ord'] == 'on',
-		args['pl'] == 'on',
-		args['lk'],
-		args['negative'],
-		args['round'],
-		args['zero'],
-		args['one'] == 'one'  -- experiment: using '|one=one' makes fraction 2+1/2 give "two and one-half" instead of "two and a half"
-	) or ''
 end
@@ Line 707: / Line 708: @@
 	if div >= 1 then return decToHexDigit(div)..dig[mod+1] else return dig[mod+1] end
 end -- I think this is supposed to be done with a tail call but first I want something that works at all
 ---- finds all the decimal numbers in the input text and hexes each of them
 function p.decToHex(frame)