<?xml version="1.0"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="en">
	<id>https://test.st34an.tech/index.php?action=history&amp;feed=atom&amp;title=Module%3AHeadword%2Fdata</id>
	<title>Module:Headword/data - Revision history</title>
	<link rel="self" type="application/atom+xml" href="https://test.st34an.tech/index.php?action=history&amp;feed=atom&amp;title=Module%3AHeadword%2Fdata"/>
	<link rel="alternate" type="text/html" href="https://test.st34an.tech/index.php?title=Module:Headword/data&amp;action=history"/>
	<updated>2026-04-10T22:41:18Z</updated>
	<subtitle>Revision history for this page on the wiki</subtitle>
	<generator>MediaWiki 1.45.3</generator>
	<entry>
		<id>https://test.st34an.tech/index.php?title=Module:Headword/data&amp;diff=275&amp;oldid=prev</id>
		<title>Jsrs701: 1 revision imported</title>
		<link rel="alternate" type="text/html" href="https://test.st34an.tech/index.php?title=Module:Headword/data&amp;diff=275&amp;oldid=prev"/>
		<updated>2026-04-10T07:29:34Z</updated>

		<summary type="html">&lt;p&gt;1 revision imported&lt;/p&gt;
&lt;table style=&quot;background-color: #fff; color: #202122;&quot; data-mw=&quot;interface&quot;&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;tr class=&quot;diff-title&quot; lang=&quot;en&quot;&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;← Older revision&lt;/td&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;Revision as of 07:29, 10 April 2026&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;4&quot; class=&quot;diff-notice&quot; lang=&quot;en&quot;&gt;&lt;div class=&quot;mw-diff-empty&quot;&gt;(No difference)&lt;/div&gt;
&lt;/td&gt;&lt;/tr&gt;
&lt;!-- diff cache key mediawikidb:diff:1.41:old-274:rev-275 --&gt;
&lt;/table&gt;</summary>
		<author><name>Jsrs701</name></author>
	</entry>
	<entry>
		<id>https://test.st34an.tech/index.php?title=Module:Headword/data&amp;diff=274&amp;oldid=prev</id>
		<title>bob&gt;Djpwikiadmin at 02:30, 7 September 2023</title>
		<link rel="alternate" type="text/html" href="https://test.st34an.tech/index.php?title=Module:Headword/data&amp;diff=274&amp;oldid=prev"/>
		<updated>2023-09-07T02:30:28Z</updated>

		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;p&gt;&lt;b&gt;New page&lt;/b&gt;&lt;/p&gt;&lt;div&gt;local u = mw.ustring.char&lt;br /&gt;
local rsubn = mw.ustring.gsub&lt;br /&gt;
&lt;br /&gt;
-- Version of rsubn() that discards all but the first return value.&lt;br /&gt;
local function rsub(term, foo, bar)&lt;br /&gt;
	return (rsubn(term, foo, bar))&lt;br /&gt;
end&lt;br /&gt;
&lt;br /&gt;
local function track(track_id)&lt;br /&gt;
	local tracking_page = &amp;quot;headword/&amp;quot; .. track_id&lt;br /&gt;
	local m_debug_track = require(&amp;quot;Module:debug/track&amp;quot;)&lt;br /&gt;
	m_debug_track(tracking_page)&lt;br /&gt;
	return true&lt;br /&gt;
end&lt;br /&gt;
&lt;br /&gt;
local frame = mw.getCurrentFrame()&lt;br /&gt;
local title = mw.title.getCurrentTitle()&lt;br /&gt;
&lt;br /&gt;
local data = {}&lt;br /&gt;
&lt;br /&gt;
------ 1. Lists that will be converted into sets. ------&lt;br /&gt;
&lt;br /&gt;
data.invariable = {&lt;br /&gt;
	&amp;quot;cmavo&amp;quot;,&lt;br /&gt;
	&amp;quot;cmene&amp;quot;,&lt;br /&gt;
	&amp;quot;fu&amp;#039;ivla&amp;quot;,&lt;br /&gt;
	&amp;quot;gismu&amp;quot;,&lt;br /&gt;
	&amp;quot;Han tu&amp;quot;,&lt;br /&gt;
	&amp;quot;hanja&amp;quot;,&lt;br /&gt;
	&amp;quot;hanzi&amp;quot;,&lt;br /&gt;
	&amp;quot;jyutping&amp;quot;,&lt;br /&gt;
	&amp;quot;kanji&amp;quot;,&lt;br /&gt;
	&amp;quot;lujvo&amp;quot;,&lt;br /&gt;
	&amp;quot;phrasebook&amp;quot;,&lt;br /&gt;
	&amp;quot;pinyin&amp;quot;,&lt;br /&gt;
	&amp;quot;rafsi&amp;quot;,&lt;br /&gt;
	&amp;quot;romaji&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
data.lemmas = {&lt;br /&gt;
	&amp;quot;abbreviations&amp;quot;,&lt;br /&gt;
	&amp;quot;acronyms&amp;quot;,&lt;br /&gt;
	&amp;quot;adjectives&amp;quot;,&lt;br /&gt;
	&amp;quot;adnominals&amp;quot;,&lt;br /&gt;
	&amp;quot;adpositions&amp;quot;,&lt;br /&gt;
	&amp;quot;adverbs&amp;quot;,&lt;br /&gt;
	&amp;quot;affixes&amp;quot;,&lt;br /&gt;
	&amp;quot;ambipositions&amp;quot;,&lt;br /&gt;
	&amp;quot;articles&amp;quot;,&lt;br /&gt;
	&amp;quot;circumfixes&amp;quot;,&lt;br /&gt;
	&amp;quot;circumpositions&amp;quot;,&lt;br /&gt;
	&amp;quot;classifiers&amp;quot;,&lt;br /&gt;
	&amp;quot;cmavo&amp;quot;,&lt;br /&gt;
	&amp;quot;cmavo clusters&amp;quot;,&lt;br /&gt;
	&amp;quot;cmene&amp;quot;,&lt;br /&gt;
	&amp;quot;combining forms&amp;quot;,&lt;br /&gt;
	&amp;quot;conjunctions&amp;quot;,&lt;br /&gt;
	&amp;quot;counters&amp;quot;,&lt;br /&gt;
	&amp;quot;determiners&amp;quot;,&lt;br /&gt;
	&amp;quot;diacritical marks&amp;quot;,&lt;br /&gt;
	&amp;quot;equative adjectives&amp;quot;,&lt;br /&gt;
	&amp;quot;fu&amp;#039;ivla&amp;quot;,&lt;br /&gt;
	&amp;quot;gismu&amp;quot;,&lt;br /&gt;
	&amp;quot;Han characters&amp;quot;,&lt;br /&gt;
	&amp;quot;Han tu&amp;quot;,&lt;br /&gt;
	&amp;quot;hanja&amp;quot;,&lt;br /&gt;
	&amp;quot;hanzi&amp;quot;,&lt;br /&gt;
	&amp;quot;ideophones&amp;quot;,&lt;br /&gt;
	&amp;quot;idioms&amp;quot;,&lt;br /&gt;
	&amp;quot;infixes&amp;quot;,&lt;br /&gt;
	&amp;quot;initialisms&amp;quot;,&lt;br /&gt;
	&amp;quot;interfixes&amp;quot;,&lt;br /&gt;
	&amp;quot;interjections&amp;quot;,&lt;br /&gt;
	&amp;quot;kanji&amp;quot;,&lt;br /&gt;
	&amp;quot;letters&amp;quot;,&lt;br /&gt;
	&amp;quot;ligatures&amp;quot;,&lt;br /&gt;
	&amp;quot;logograms&amp;quot;,&lt;br /&gt;
	&amp;quot;lujvo&amp;quot;,&lt;br /&gt;
	&amp;quot;morphemes&amp;quot;,&lt;br /&gt;
	&amp;quot;non-constituents&amp;quot;,&lt;br /&gt;
	&amp;quot;nouns&amp;quot;,&lt;br /&gt;
	&amp;quot;numbers&amp;quot;,&lt;br /&gt;
	&amp;quot;numeral symbols&amp;quot;,&lt;br /&gt;
	&amp;quot;numerals&amp;quot;,&lt;br /&gt;
	&amp;quot;particles&amp;quot;,&lt;br /&gt;
	&amp;quot;phrases&amp;quot;,&lt;br /&gt;
	&amp;quot;postpositions&amp;quot;,&lt;br /&gt;
	&amp;quot;postpositional phrases&amp;quot;,&lt;br /&gt;
	&amp;quot;predicatives&amp;quot;,&lt;br /&gt;
	&amp;quot;prefixes&amp;quot;,&lt;br /&gt;
	&amp;quot;prepositional phrases&amp;quot;,&lt;br /&gt;
	&amp;quot;prepositions&amp;quot;,&lt;br /&gt;
	&amp;quot;preverbs&amp;quot;,&lt;br /&gt;
	&amp;quot;pronominal adverbs&amp;quot;,&lt;br /&gt;
	&amp;quot;pronouns&amp;quot;,&lt;br /&gt;
	&amp;quot;proper nouns&amp;quot;,&lt;br /&gt;
	&amp;quot;proverbs&amp;quot;,&lt;br /&gt;
	&amp;quot;punctuation marks&amp;quot;,&lt;br /&gt;
	&amp;quot;relatives&amp;quot;,&lt;br /&gt;
	&amp;quot;roots&amp;quot;,&lt;br /&gt;
	&amp;quot;stems&amp;quot;,&lt;br /&gt;
	&amp;quot;suffixes&amp;quot;,&lt;br /&gt;
	&amp;quot;syllables&amp;quot;,&lt;br /&gt;
	&amp;quot;symbols&amp;quot;,&lt;br /&gt;
	&amp;quot;verbs&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
data.nonlemmas = {&lt;br /&gt;
	&amp;quot;active participle forms&amp;quot;,&lt;br /&gt;
	&amp;quot;active participles&amp;quot;,&lt;br /&gt;
	&amp;quot;adjectival participles&amp;quot;,&lt;br /&gt;
    &amp;quot;adjective case forms&amp;quot;,&lt;br /&gt;
	&amp;quot;adjective forms&amp;quot;,&lt;br /&gt;
	&amp;quot;adjective feminine forms&amp;quot;,&lt;br /&gt;
	&amp;quot;adjective plural forms&amp;quot;,&lt;br /&gt;
	&amp;quot;adverb forms&amp;quot;,&lt;br /&gt;
	&amp;quot;adverbial participles&amp;quot;,&lt;br /&gt;
	&amp;quot;agent participles&amp;quot;,&lt;br /&gt;
	&amp;quot;article forms&amp;quot;,&lt;br /&gt;
	&amp;quot;circumfix forms&amp;quot;,&lt;br /&gt;
	&amp;quot;combined forms&amp;quot;,&lt;br /&gt;
	&amp;quot;comparative adjective forms&amp;quot;,&lt;br /&gt;
	&amp;quot;comparative adjectives&amp;quot;,&lt;br /&gt;
	&amp;quot;comparative adverb forms&amp;quot;,&lt;br /&gt;
	&amp;quot;comparative adverbs&amp;quot;,&lt;br /&gt;
	&amp;quot;conjunction forms&amp;quot;,&lt;br /&gt;
	&amp;quot;contractions&amp;quot;,&lt;br /&gt;
	&amp;quot;converbs&amp;quot;,&lt;br /&gt;
	&amp;quot;determiner comparative forms&amp;quot;,&lt;br /&gt;
	&amp;quot;determiner forms&amp;quot;,&lt;br /&gt;
	&amp;quot;determiner superlative forms&amp;quot;,&lt;br /&gt;
	&amp;quot;diminutive nouns&amp;quot;,&lt;br /&gt;
	&amp;quot;equative adjective forms&amp;quot;,&lt;br /&gt;
	&amp;quot;equative adjectives&amp;quot;,&lt;br /&gt;
	&amp;quot;future participles&amp;quot;,&lt;br /&gt;
	&amp;quot;gerunds&amp;quot;,&lt;br /&gt;
	&amp;quot;infinitive forms&amp;quot;,&lt;br /&gt;
	&amp;quot;infinitives&amp;quot;,&lt;br /&gt;
	&amp;quot;interjection forms&amp;quot;,&lt;br /&gt;
	&amp;quot;jyutping&amp;quot;,&lt;br /&gt;
	&amp;quot;kanji readings&amp;quot;,&lt;br /&gt;
	&amp;quot;misspellings&amp;quot;,&lt;br /&gt;
	&amp;quot;negative participles&amp;quot;,&lt;br /&gt;
	&amp;quot;nominal participles&amp;quot;,&lt;br /&gt;
	&amp;quot;noun case forms&amp;quot;,&lt;br /&gt;
	&amp;quot;noun dual forms&amp;quot;,&lt;br /&gt;
	&amp;quot;noun forms&amp;quot;,&lt;br /&gt;
	&amp;quot;noun paucal forms&amp;quot;,&lt;br /&gt;
	&amp;quot;noun plural forms&amp;quot;,&lt;br /&gt;
	&amp;quot;noun possessive forms&amp;quot;,&lt;br /&gt;
	&amp;quot;noun singulative forms&amp;quot;,&lt;br /&gt;
	&amp;quot;numeral forms&amp;quot;,&lt;br /&gt;
	&amp;quot;participles&amp;quot;,&lt;br /&gt;
	&amp;quot;participle forms&amp;quot;,&lt;br /&gt;
	&amp;quot;particle forms&amp;quot;,&lt;br /&gt;
	&amp;quot;passive participles&amp;quot;,&lt;br /&gt;
	&amp;quot;past active participles&amp;quot;,&lt;br /&gt;
	&amp;quot;past participles&amp;quot;,&lt;br /&gt;
	&amp;quot;past participle forms&amp;quot;,&lt;br /&gt;
	&amp;quot;past passive participles&amp;quot;,&lt;br /&gt;
	&amp;quot;perfect active participles&amp;quot;,&lt;br /&gt;
	&amp;quot;perfect participles&amp;quot;,&lt;br /&gt;
	&amp;quot;perfect passive participles&amp;quot;,&lt;br /&gt;
	&amp;quot;pinyin&amp;quot;,&lt;br /&gt;
	&amp;quot;plurals&amp;quot;,&lt;br /&gt;
	&amp;quot;postposition forms&amp;quot;,&lt;br /&gt;
	&amp;quot;prefix forms&amp;quot;,&lt;br /&gt;
	&amp;quot;preposition contractions&amp;quot;,&lt;br /&gt;
	&amp;quot;preposition forms&amp;quot;,&lt;br /&gt;
	&amp;quot;prepositional pronouns&amp;quot;,&lt;br /&gt;
	&amp;quot;present active participles&amp;quot;,&lt;br /&gt;
	&amp;quot;present participles&amp;quot;,&lt;br /&gt;
	&amp;quot;present passive participles&amp;quot;,&lt;br /&gt;
	&amp;quot;pronoun forms&amp;quot;,&lt;br /&gt;
	&amp;quot;pronoun possessive forms&amp;quot;,&lt;br /&gt;
	&amp;quot;proper noun forms&amp;quot;,&lt;br /&gt;
	&amp;quot;proper noun plural forms&amp;quot;,&lt;br /&gt;
	&amp;quot;rafsi&amp;quot;,&lt;br /&gt;
	&amp;quot;romanizations&amp;quot;,&lt;br /&gt;
	&amp;quot;root forms&amp;quot;,&lt;br /&gt;
	&amp;quot;singulatives&amp;quot;,&lt;br /&gt;
	&amp;quot;suffix forms&amp;quot;,&lt;br /&gt;
	&amp;quot;superlative adjective forms&amp;quot;,&lt;br /&gt;
	&amp;quot;superlative adjectives&amp;quot;,&lt;br /&gt;
	&amp;quot;superlative adverb forms&amp;quot;,&lt;br /&gt;
	&amp;quot;superlative adverbs&amp;quot;,&lt;br /&gt;
	&amp;quot;verb forms&amp;quot;,&lt;br /&gt;
	&amp;quot;verbal nouns&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- These languages will not have links to separate parts of the headword.&lt;br /&gt;
data.no_multiword_links = {&lt;br /&gt;
	&amp;quot;zh&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- These languages will not have &amp;quot;LANG multiword terms&amp;quot; categories added.&lt;br /&gt;
data.no_multiword_cat = {&lt;br /&gt;
	-------- Languages without spaces between words (sometimes spaces between phrases) --------&lt;br /&gt;
	&amp;quot;blt&amp;quot;, -- Tai Dam&lt;br /&gt;
	&amp;quot;ja&amp;quot;, -- Japanese&lt;br /&gt;
	&amp;quot;khb&amp;quot;, -- Lü&lt;br /&gt;
	&amp;quot;km&amp;quot;, -- Khmer&lt;br /&gt;
	&amp;quot;lo&amp;quot;, -- Lao&lt;br /&gt;
	&amp;quot;mnw&amp;quot;, -- Mon&lt;br /&gt;
	&amp;quot;my&amp;quot;, -- Burmese&lt;br /&gt;
	&amp;quot;nan&amp;quot;, -- Min Nan (some words in Latin script; hyphens between syllables)&lt;br /&gt;
	&amp;quot;nod&amp;quot;, -- Northern Thai&lt;br /&gt;
	&amp;quot;ojp&amp;quot;, -- Old Japanese&lt;br /&gt;
	&amp;quot;shn&amp;quot;, -- Shan&lt;br /&gt;
	&amp;quot;sou&amp;quot;, -- Southern Thai&lt;br /&gt;
	&amp;quot;tdd&amp;quot;, -- Tai Nüa&lt;br /&gt;
	&amp;quot;th&amp;quot;, -- Thai&lt;br /&gt;
	&amp;quot;tts&amp;quot;, -- Isan&lt;br /&gt;
	&amp;quot;twh&amp;quot;, -- Tai Dón&lt;br /&gt;
	&amp;quot;txg&amp;quot;, -- Tangut&lt;br /&gt;
	&amp;quot;zh&amp;quot;, -- Chinese (all varieties with Chinese characters)&lt;br /&gt;
	&amp;quot;zkt&amp;quot;, -- Khitan&lt;br /&gt;
&lt;br /&gt;
	-------- Languages with spaces between syllables --------&lt;br /&gt;
	&amp;quot;ahk&amp;quot;, -- Akha&lt;br /&gt;
	&amp;quot;aou&amp;quot;, -- A&amp;#039;ou&lt;br /&gt;
	&amp;quot;atb&amp;quot;, -- Zaiwa&lt;br /&gt;
	&amp;quot;byk&amp;quot;, -- Biao&lt;br /&gt;
	&amp;quot;cdy&amp;quot;, -- Chadong&lt;br /&gt;
	--&amp;quot;duu&amp;quot;, -- Drung; not sure&lt;br /&gt;
	--&amp;quot;hmx-pro&amp;quot;, -- Proto-Hmong-Mien&lt;br /&gt;
	--&amp;quot;hnj&amp;quot;, -- Green Hmong; not sure&lt;br /&gt;
	&amp;quot;huq&amp;quot;, -- Tsat&lt;br /&gt;
	&amp;quot;ium&amp;quot;, -- Iu Mien&lt;br /&gt;
	--&amp;quot;lis&amp;quot;, -- Lisu; not sure&lt;br /&gt;
	&amp;quot;mtq&amp;quot;, -- Muong&lt;br /&gt;
	--&amp;quot;mww&amp;quot;, -- White Hmong; not sure&lt;br /&gt;
	&amp;quot;onb&amp;quot;, -- Lingao&lt;br /&gt;
	--&amp;quot;sit-gkh&amp;quot;, -- Gokhy; not sure&lt;br /&gt;
	--&amp;quot;swi&amp;quot;, -- Sui; not sure&lt;br /&gt;
	&amp;quot;tbq-lol-pro&amp;quot;, -- Proto-Loloish&lt;br /&gt;
	&amp;quot;tdh&amp;quot;, -- Thulung&lt;br /&gt;
	&amp;quot;ukk&amp;quot;, -- Muak Sa-aak&lt;br /&gt;
	&amp;quot;vi&amp;quot;, -- Vietnamese&lt;br /&gt;
	&amp;quot;yig&amp;quot;, -- Wusa Nasu&lt;br /&gt;
	&amp;quot;zng&amp;quot;, -- Mang&lt;br /&gt;
&lt;br /&gt;
	-------- Languages with ~ with surrounding spaces used to separate variants --------&lt;br /&gt;
	&amp;quot;mkh-ban-pro&amp;quot;, -- Proto-Bahnaric&lt;br /&gt;
	&amp;quot;sit-pro&amp;quot;, -- Proto-Sino-Tibetan; listed above&lt;br /&gt;
&lt;br /&gt;
	-------- Other weirdnesses --------&lt;br /&gt;
	&amp;quot;mul&amp;quot;, -- Translingual; gestures, Morse code, etc.&lt;br /&gt;
	&amp;quot;aot&amp;quot;, -- Atong (India); bullet is a letter&lt;br /&gt;
&lt;br /&gt;
	-------- All sign languages	--------&lt;br /&gt;
	&amp;quot;ads&amp;quot;,&lt;br /&gt;
	&amp;quot;aed&amp;quot;,&lt;br /&gt;
	&amp;quot;aen&amp;quot;,&lt;br /&gt;
	&amp;quot;afg&amp;quot;,&lt;br /&gt;
	&amp;quot;ase&amp;quot;,&lt;br /&gt;
	&amp;quot;asf&amp;quot;,&lt;br /&gt;
	&amp;quot;asp&amp;quot;,&lt;br /&gt;
	&amp;quot;asq&amp;quot;,&lt;br /&gt;
	&amp;quot;asw&amp;quot;,&lt;br /&gt;
	&amp;quot;bfi&amp;quot;,&lt;br /&gt;
	&amp;quot;bfk&amp;quot;,&lt;br /&gt;
	&amp;quot;bog&amp;quot;,&lt;br /&gt;
	&amp;quot;bqn&amp;quot;,&lt;br /&gt;
	&amp;quot;bqy&amp;quot;,&lt;br /&gt;
	&amp;quot;bvl&amp;quot;,&lt;br /&gt;
	&amp;quot;bzs&amp;quot;,&lt;br /&gt;
	&amp;quot;cds&amp;quot;,&lt;br /&gt;
	&amp;quot;csc&amp;quot;,&lt;br /&gt;
	&amp;quot;csd&amp;quot;,&lt;br /&gt;
	&amp;quot;cse&amp;quot;,&lt;br /&gt;
	&amp;quot;csf&amp;quot;,&lt;br /&gt;
	&amp;quot;csg&amp;quot;,&lt;br /&gt;
	&amp;quot;csl&amp;quot;,&lt;br /&gt;
	&amp;quot;csn&amp;quot;,&lt;br /&gt;
	&amp;quot;csq&amp;quot;,&lt;br /&gt;
	&amp;quot;csr&amp;quot;,&lt;br /&gt;
	&amp;quot;doq&amp;quot;,&lt;br /&gt;
	&amp;quot;dse&amp;quot;,&lt;br /&gt;
	&amp;quot;dsl&amp;quot;,&lt;br /&gt;
	&amp;quot;ecs&amp;quot;,&lt;br /&gt;
	&amp;quot;esl&amp;quot;,&lt;br /&gt;
	&amp;quot;esn&amp;quot;,&lt;br /&gt;
	&amp;quot;eso&amp;quot;,&lt;br /&gt;
	&amp;quot;eth&amp;quot;,&lt;br /&gt;
	&amp;quot;fcs&amp;quot;,&lt;br /&gt;
	&amp;quot;fse&amp;quot;,&lt;br /&gt;
	&amp;quot;fsl&amp;quot;,&lt;br /&gt;
	&amp;quot;fss&amp;quot;,&lt;br /&gt;
	&amp;quot;gds&amp;quot;,&lt;br /&gt;
	&amp;quot;gse&amp;quot;,&lt;br /&gt;
	&amp;quot;gsg&amp;quot;,&lt;br /&gt;
	&amp;quot;gsm&amp;quot;,&lt;br /&gt;
	&amp;quot;gss&amp;quot;,&lt;br /&gt;
	&amp;quot;gus&amp;quot;,&lt;br /&gt;
	&amp;quot;hab&amp;quot;,&lt;br /&gt;
	&amp;quot;haf&amp;quot;,&lt;br /&gt;
	&amp;quot;hds&amp;quot;,&lt;br /&gt;
	&amp;quot;hks&amp;quot;,&lt;br /&gt;
	&amp;quot;hos&amp;quot;,&lt;br /&gt;
	&amp;quot;hps&amp;quot;,&lt;br /&gt;
	&amp;quot;hsh&amp;quot;,&lt;br /&gt;
	&amp;quot;hsl&amp;quot;,&lt;br /&gt;
	&amp;quot;icl&amp;quot;,&lt;br /&gt;
	&amp;quot;iks&amp;quot;,&lt;br /&gt;
	&amp;quot;ils&amp;quot;,&lt;br /&gt;
	&amp;quot;inl&amp;quot;,&lt;br /&gt;
	&amp;quot;ins&amp;quot;,&lt;br /&gt;
	&amp;quot;ise&amp;quot;,&lt;br /&gt;
	&amp;quot;isg&amp;quot;,&lt;br /&gt;
	&amp;quot;isr&amp;quot;,&lt;br /&gt;
	&amp;quot;jcs&amp;quot;,&lt;br /&gt;
	&amp;quot;jhs&amp;quot;,&lt;br /&gt;
	&amp;quot;jls&amp;quot;,&lt;br /&gt;
	&amp;quot;jos&amp;quot;,&lt;br /&gt;
	&amp;quot;jsl&amp;quot;,&lt;br /&gt;
	&amp;quot;jus&amp;quot;,&lt;br /&gt;
	&amp;quot;kgi&amp;quot;,&lt;br /&gt;
	&amp;quot;kvk&amp;quot;,&lt;br /&gt;
	&amp;quot;lbs&amp;quot;,&lt;br /&gt;
	&amp;quot;lls&amp;quot;,&lt;br /&gt;
	&amp;quot;lsl&amp;quot;,&lt;br /&gt;
	&amp;quot;lso&amp;quot;,&lt;br /&gt;
	&amp;quot;lsp&amp;quot;,&lt;br /&gt;
	&amp;quot;lst&amp;quot;,&lt;br /&gt;
	&amp;quot;lsy&amp;quot;,&lt;br /&gt;
	&amp;quot;lws&amp;quot;,&lt;br /&gt;
	&amp;quot;mdl&amp;quot;,&lt;br /&gt;
	&amp;quot;mfs&amp;quot;,&lt;br /&gt;
	&amp;quot;mre&amp;quot;,&lt;br /&gt;
	&amp;quot;msd&amp;quot;,&lt;br /&gt;
	&amp;quot;msr&amp;quot;,&lt;br /&gt;
	&amp;quot;mzc&amp;quot;,&lt;br /&gt;
	&amp;quot;mzg&amp;quot;,&lt;br /&gt;
	&amp;quot;mzy&amp;quot;,&lt;br /&gt;
	&amp;quot;nbs&amp;quot;,&lt;br /&gt;
	&amp;quot;ncs&amp;quot;,&lt;br /&gt;
	&amp;quot;nsi&amp;quot;,&lt;br /&gt;
	&amp;quot;nsl&amp;quot;,&lt;br /&gt;
	&amp;quot;nsp&amp;quot;,&lt;br /&gt;
	&amp;quot;nsr&amp;quot;,&lt;br /&gt;
	&amp;quot;nzs&amp;quot;,&lt;br /&gt;
	&amp;quot;okl&amp;quot;,&lt;br /&gt;
	&amp;quot;pgz&amp;quot;,&lt;br /&gt;
	&amp;quot;pks&amp;quot;,&lt;br /&gt;
	&amp;quot;prl&amp;quot;,&lt;br /&gt;
	&amp;quot;prz&amp;quot;,&lt;br /&gt;
	&amp;quot;psc&amp;quot;,&lt;br /&gt;
	&amp;quot;psd&amp;quot;,&lt;br /&gt;
	&amp;quot;psg&amp;quot;,&lt;br /&gt;
	&amp;quot;psl&amp;quot;,&lt;br /&gt;
	&amp;quot;pso&amp;quot;,&lt;br /&gt;
	&amp;quot;psp&amp;quot;,&lt;br /&gt;
	&amp;quot;psr&amp;quot;,&lt;br /&gt;
	&amp;quot;pys&amp;quot;,&lt;br /&gt;
	&amp;quot;rms&amp;quot;,&lt;br /&gt;
	&amp;quot;rsl&amp;quot;,&lt;br /&gt;
	&amp;quot;rsm&amp;quot;,&lt;br /&gt;
	&amp;quot;sdl&amp;quot;,&lt;br /&gt;
	&amp;quot;sfb&amp;quot;,&lt;br /&gt;
	&amp;quot;sfs&amp;quot;,&lt;br /&gt;
	&amp;quot;sgg&amp;quot;,&lt;br /&gt;
	&amp;quot;sgx&amp;quot;,&lt;br /&gt;
	&amp;quot;slf&amp;quot;,&lt;br /&gt;
	&amp;quot;sls&amp;quot;,&lt;br /&gt;
	&amp;quot;sqk&amp;quot;,&lt;br /&gt;
	&amp;quot;sqs&amp;quot;,&lt;br /&gt;
	&amp;quot;ssp&amp;quot;,&lt;br /&gt;
	&amp;quot;ssr&amp;quot;,&lt;br /&gt;
	&amp;quot;svk&amp;quot;,&lt;br /&gt;
	&amp;quot;swl&amp;quot;,&lt;br /&gt;
	&amp;quot;syy&amp;quot;,&lt;br /&gt;
	&amp;quot;tse&amp;quot;,&lt;br /&gt;
	&amp;quot;tsm&amp;quot;,&lt;br /&gt;
	&amp;quot;tsq&amp;quot;,&lt;br /&gt;
	&amp;quot;tss&amp;quot;,&lt;br /&gt;
	&amp;quot;tsy&amp;quot;,&lt;br /&gt;
	&amp;quot;tza&amp;quot;,&lt;br /&gt;
	&amp;quot;ugn&amp;quot;,&lt;br /&gt;
	&amp;quot;ugy&amp;quot;,&lt;br /&gt;
	&amp;quot;ukl&amp;quot;,&lt;br /&gt;
	&amp;quot;uks&amp;quot;,&lt;br /&gt;
	&amp;quot;vgt&amp;quot;,&lt;br /&gt;
	&amp;quot;vsi&amp;quot;,&lt;br /&gt;
	&amp;quot;vsl&amp;quot;,&lt;br /&gt;
	&amp;quot;vsv&amp;quot;,&lt;br /&gt;
	&amp;quot;xki&amp;quot;,&lt;br /&gt;
	&amp;quot;xml&amp;quot;,&lt;br /&gt;
	&amp;quot;xms&amp;quot;,&lt;br /&gt;
	&amp;quot;ygs&amp;quot;,&lt;br /&gt;
	&amp;quot;ysl&amp;quot;,&lt;br /&gt;
	&amp;quot;zib&amp;quot;,&lt;br /&gt;
	&amp;quot;zsl&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- In these languages, the hyphen is not considered a word separator for the &amp;quot;multiword terms&amp;quot; category.&lt;br /&gt;
data.hyphen_not_multiword_sep = {&lt;br /&gt;
	&amp;quot;akk&amp;quot;, -- Akkadian; hyphens between syllables&lt;br /&gt;
	&amp;quot;akl&amp;quot;, -- Aklanon; hyphens for mid-word glottal stops&lt;br /&gt;
	&amp;quot;ber-pro&amp;quot;, -- Proto-Berber; morphemes separated by hyphens&lt;br /&gt;
	&amp;quot;ceb&amp;quot;, -- Cebuano; hyphens for mid-word glottal stops&lt;br /&gt;
	&amp;quot;cnk&amp;quot;, -- Khumi Chin; hyphens used in single words&lt;br /&gt;
	&amp;quot;cpi&amp;quot;, -- Chinese Pidgin English; Chinese-derived words with hyphens between syllables&lt;br /&gt;
	&amp;quot;de&amp;quot;, -- too many false positives&lt;br /&gt;
	&amp;quot;esx-esk-pro&amp;quot;, -- hyphen used to separate morphemes&lt;br /&gt;
	&amp;quot;fi&amp;quot;, -- Finnish; hyphen used to separate components in compound words if the final and initial vowels match, respectively&lt;br /&gt;
	&amp;quot;hil&amp;quot;, -- Hiligaynon; hyphens for mid-word glottal stops&lt;br /&gt;
	&amp;quot;ilo&amp;quot;, -- Ilocano; hyphens for mid-word glottal stops&lt;br /&gt;
	&amp;quot;lcp&amp;quot;, -- Western Lawa; dash as syllable joiner&lt;br /&gt;
	&amp;quot;lwl&amp;quot;, -- Eastern Lawa; dash as syllable joiner&lt;br /&gt;
	&amp;quot;mfa&amp;quot;, -- Pattani Malay in Thai script; dash as syllable joiner&lt;br /&gt;
	&amp;quot;mkh-vie-pro&amp;quot;, -- Proto-Vietic; morphemes separated by hyphens&lt;br /&gt;
	&amp;quot;msb&amp;quot;, -- Masbatenyo; too many false positives&lt;br /&gt;
	&amp;quot;tl&amp;quot;, -- Tagalog; too many false positives&lt;br /&gt;
	&amp;quot;war&amp;quot;, -- Waray-Waray; too many false positives&lt;br /&gt;
	&amp;quot;yo&amp;quot;, -- Yoruba; hyphens used to show lengthened nasal vowels&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- These languages will not have &amp;quot;LANG masculine nouns&amp;quot; and similar categories added.&lt;br /&gt;
data.no_gender_cat = {&lt;br /&gt;
	-- Languages without gender but which use the gender field for other purposes&lt;br /&gt;
	&amp;quot;ja&amp;quot;,&lt;br /&gt;
	&amp;quot;th&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
data.notranslit = {&lt;br /&gt;
	&amp;quot;ams&amp;quot;,&lt;br /&gt;
	&amp;quot;az&amp;quot;,&lt;br /&gt;
	&amp;quot;bbc&amp;quot;,&lt;br /&gt;
	&amp;quot;bug&amp;quot;,&lt;br /&gt;
	&amp;quot;cia&amp;quot;,&lt;br /&gt;
	&amp;quot;cjm&amp;quot;,&lt;br /&gt;
	&amp;quot;cmn&amp;quot;,&lt;br /&gt;
	&amp;quot;cpi&amp;quot;,&lt;br /&gt;
	&amp;quot;hak&amp;quot;,&lt;br /&gt;
	&amp;quot;ja&amp;quot;,&lt;br /&gt;
	&amp;quot;kzg&amp;quot;,&lt;br /&gt;
	&amp;quot;lad&amp;quot;,&lt;br /&gt;
	&amp;quot;lzh&amp;quot;,&lt;br /&gt;
	&amp;quot;ms&amp;quot;,&lt;br /&gt;
	&amp;quot;mul&amp;quot;,&lt;br /&gt;
	&amp;quot;mvi&amp;quot;,&lt;br /&gt;
	&amp;quot;nan&amp;quot;,&lt;br /&gt;
	&amp;quot;oj&amp;quot;,&lt;br /&gt;
	&amp;quot;okn&amp;quot;,&lt;br /&gt;
	&amp;quot;ro&amp;quot;,&lt;br /&gt;
	&amp;quot;ryn&amp;quot;,&lt;br /&gt;
	&amp;quot;rys&amp;quot;,&lt;br /&gt;
	&amp;quot;ryu&amp;quot;,&lt;br /&gt;
	&amp;quot;sh&amp;quot;,&lt;br /&gt;
	&amp;quot;tgt&amp;quot;,&lt;br /&gt;
	&amp;quot;th&amp;quot;,&lt;br /&gt;
	&amp;quot;tkn&amp;quot;,&lt;br /&gt;
	&amp;quot;tly&amp;quot;,&lt;br /&gt;
	&amp;quot;txg&amp;quot;,&lt;br /&gt;
	&amp;quot;und&amp;quot;,&lt;br /&gt;
	&amp;quot;vi&amp;quot;,&lt;br /&gt;
	&amp;quot;xug&amp;quot;,&lt;br /&gt;
	&amp;quot;yoi&amp;quot;,&lt;br /&gt;
	&amp;quot;yox&amp;quot;,&lt;br /&gt;
	&amp;quot;yue&amp;quot;,&lt;br /&gt;
	&amp;quot;za&amp;quot;,&lt;br /&gt;
	&amp;quot;zh&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- Script codes for which a script-tagged display title will be added.&lt;br /&gt;
data.toBeTagged = {&lt;br /&gt;
	&amp;quot;Ahom&amp;quot;,&lt;br /&gt;
	&amp;quot;Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;fa-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;glk-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;kk-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;ks-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;ku-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;mzn-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;ms-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;ota-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;pa-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;ps-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;sd-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;tt-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;ug-Arab&amp;quot;,&lt;br /&gt;
		&amp;quot;ur-Arab&amp;quot;,&lt;br /&gt;
	&amp;quot;Armi&amp;quot;,&lt;br /&gt;
	&amp;quot;Armn&amp;quot;,&lt;br /&gt;
	&amp;quot;Avst&amp;quot;,&lt;br /&gt;
	&amp;quot;Bali&amp;quot;,&lt;br /&gt;
	&amp;quot;Bamu&amp;quot;,&lt;br /&gt;
	&amp;quot;Batk&amp;quot;,&lt;br /&gt;
	&amp;quot;Beng&amp;quot;,&lt;br /&gt;
		&amp;quot;as-Beng&amp;quot;,&lt;br /&gt;
	&amp;quot;Bopo&amp;quot;,&lt;br /&gt;
	&amp;quot;Brah&amp;quot;,&lt;br /&gt;
	&amp;quot;Brai&amp;quot;,&lt;br /&gt;
	&amp;quot;Bugi&amp;quot;,&lt;br /&gt;
	&amp;quot;Buhd&amp;quot;,&lt;br /&gt;
	&amp;quot;Cakm&amp;quot;,&lt;br /&gt;
	&amp;quot;Cans&amp;quot;,&lt;br /&gt;
	&amp;quot;Cari&amp;quot;,&lt;br /&gt;
	&amp;quot;Cham&amp;quot;,&lt;br /&gt;
	&amp;quot;Cher&amp;quot;,&lt;br /&gt;
	&amp;quot;Copt&amp;quot;,&lt;br /&gt;
	&amp;quot;Cprt&amp;quot;,&lt;br /&gt;
	&amp;quot;Cyrl&amp;quot;,&lt;br /&gt;
	&amp;quot;Cyrs&amp;quot;,&lt;br /&gt;
	&amp;quot;Deva&amp;quot;,&lt;br /&gt;
	&amp;quot;Dsrt&amp;quot;,&lt;br /&gt;
	&amp;quot;Egyd&amp;quot;,&lt;br /&gt;
	&amp;quot;Egyp&amp;quot;,&lt;br /&gt;
	&amp;quot;Ethi&amp;quot;,&lt;br /&gt;
	&amp;quot;Geok&amp;quot;,&lt;br /&gt;
	&amp;quot;Geor&amp;quot;,&lt;br /&gt;
	&amp;quot;Glag&amp;quot;,&lt;br /&gt;
	&amp;quot;Goth&amp;quot;,&lt;br /&gt;
	&amp;quot;Grek&amp;quot;,&lt;br /&gt;
		&amp;quot;Polyt&amp;quot;,&lt;br /&gt;
		&amp;quot;polytonic&amp;quot;,&lt;br /&gt;
	&amp;quot;Gujr&amp;quot;,&lt;br /&gt;
	&amp;quot;Guru&amp;quot;,&lt;br /&gt;
	&amp;quot;Hang&amp;quot;,&lt;br /&gt;
	&amp;quot;Hani&amp;quot;,&lt;br /&gt;
	&amp;quot;Hano&amp;quot;,&lt;br /&gt;
	&amp;quot;Hebr&amp;quot;,&lt;br /&gt;
	&amp;quot;Hira&amp;quot;,&lt;br /&gt;
	&amp;quot;Hluw&amp;quot;,&lt;br /&gt;
	&amp;quot;Ital&amp;quot;,&lt;br /&gt;
	&amp;quot;Java&amp;quot;,&lt;br /&gt;
	&amp;quot;Kali&amp;quot;,&lt;br /&gt;
	&amp;quot;Kana&amp;quot;,&lt;br /&gt;
	&amp;quot;Khar&amp;quot;,&lt;br /&gt;
	&amp;quot;Khmr&amp;quot;,&lt;br /&gt;
	&amp;quot;Knda&amp;quot;,&lt;br /&gt;
	&amp;quot;Kthi&amp;quot;,&lt;br /&gt;
	&amp;quot;Lana&amp;quot;,&lt;br /&gt;
	&amp;quot;Laoo&amp;quot;,&lt;br /&gt;
	&amp;quot;Latn&amp;quot;,&lt;br /&gt;
		&amp;quot;Latf&amp;quot;,&lt;br /&gt;
		&amp;quot;Latg&amp;quot;,&lt;br /&gt;
		&amp;quot;Latnx&amp;quot;,&lt;br /&gt;
		&amp;quot;Latinx&amp;quot;,&lt;br /&gt;
		&amp;quot;nv-Latn&amp;quot;,&lt;br /&gt;
		&amp;quot;pjt-Latn&amp;quot;,&lt;br /&gt;
	&amp;quot;Lepc&amp;quot;,&lt;br /&gt;
	&amp;quot;Limb&amp;quot;,&lt;br /&gt;
	&amp;quot;Linb&amp;quot;,&lt;br /&gt;
	&amp;quot;Lisu&amp;quot;,&lt;br /&gt;
	&amp;quot;Lyci&amp;quot;,&lt;br /&gt;
	&amp;quot;Lydi&amp;quot;,&lt;br /&gt;
	&amp;quot;Mand&amp;quot;,&lt;br /&gt;
	&amp;quot;Mani&amp;quot;,&lt;br /&gt;
	&amp;quot;Merc&amp;quot;,&lt;br /&gt;
	&amp;quot;Mero&amp;quot;,&lt;br /&gt;
	&amp;quot;Mlym&amp;quot;,&lt;br /&gt;
	&amp;quot;Mong&amp;quot;,&lt;br /&gt;
		&amp;quot;mnc-Mong&amp;quot;,&lt;br /&gt;
		&amp;quot;sjo-Mong&amp;quot;,&lt;br /&gt;
		&amp;quot;xwo-Mong&amp;quot;,&lt;br /&gt;
	&amp;quot;Mtei&amp;quot;,&lt;br /&gt;
	&amp;quot;Mymr&amp;quot;,&lt;br /&gt;
	&amp;quot;Narb&amp;quot;,&lt;br /&gt;
	&amp;quot;Nkoo&amp;quot;,&lt;br /&gt;
	&amp;quot;Ogam&amp;quot;,&lt;br /&gt;
	&amp;quot;Olck&amp;quot;,&lt;br /&gt;
	&amp;quot;Orkh&amp;quot;,&lt;br /&gt;
	&amp;quot;Orya&amp;quot;,&lt;br /&gt;
	&amp;quot;Osma&amp;quot;,&lt;br /&gt;
	&amp;quot;Palm&amp;quot;,&lt;br /&gt;
	&amp;quot;Phag&amp;quot;,&lt;br /&gt;
	&amp;quot;Phli&amp;quot;,&lt;br /&gt;
	&amp;quot;Phlv&amp;quot;,&lt;br /&gt;
	&amp;quot;Phnx&amp;quot;,&lt;br /&gt;
	&amp;quot;Plrd&amp;quot;,&lt;br /&gt;
	&amp;quot;Prti&amp;quot;,&lt;br /&gt;
	&amp;quot;Rjng&amp;quot;,&lt;br /&gt;
	&amp;quot;Runr&amp;quot;,&lt;br /&gt;
	&amp;quot;Samr&amp;quot;,&lt;br /&gt;
	&amp;quot;Sarb&amp;quot;,&lt;br /&gt;
	&amp;quot;Saur&amp;quot;,&lt;br /&gt;
	&amp;quot;Sgnw&amp;quot;,&lt;br /&gt;
	&amp;quot;Shaw&amp;quot;,&lt;br /&gt;
	&amp;quot;Shrd&amp;quot;,&lt;br /&gt;
	&amp;quot;Sinh&amp;quot;,&lt;br /&gt;
	&amp;quot;Sora&amp;quot;,&lt;br /&gt;
	&amp;quot;Sund&amp;quot;,&lt;br /&gt;
	&amp;quot;Sylo&amp;quot;,&lt;br /&gt;
	&amp;quot;Syrc&amp;quot;,&lt;br /&gt;
	&amp;quot;Tagb&amp;quot;,&lt;br /&gt;
	&amp;quot;Tale&amp;quot;,&lt;br /&gt;
	&amp;quot;Talu&amp;quot;,&lt;br /&gt;
	&amp;quot;Taml&amp;quot;,&lt;br /&gt;
	&amp;quot;Tang&amp;quot;,&lt;br /&gt;
	&amp;quot;Tavt&amp;quot;,&lt;br /&gt;
	&amp;quot;Telu&amp;quot;,&lt;br /&gt;
	&amp;quot;Tfng&amp;quot;,&lt;br /&gt;
	&amp;quot;Tglg&amp;quot;,&lt;br /&gt;
	&amp;quot;Thaa&amp;quot;,&lt;br /&gt;
	&amp;quot;Thai&amp;quot;,&lt;br /&gt;
	&amp;quot;Tibt&amp;quot;,&lt;br /&gt;
		&amp;quot;xzh-Tibt&amp;quot;,&lt;br /&gt;
	&amp;quot;Ugar&amp;quot;,&lt;br /&gt;
	&amp;quot;Vaii&amp;quot;,&lt;br /&gt;
	&amp;quot;Xpeo&amp;quot;,&lt;br /&gt;
	&amp;quot;Xsux&amp;quot;,&lt;br /&gt;
	&amp;quot;Yiii&amp;quot;,&lt;br /&gt;
	&amp;quot;Zmth&amp;quot;,&lt;br /&gt;
	&amp;quot;Zsym&amp;quot;,&lt;br /&gt;
&lt;br /&gt;
	&amp;quot;Ipach&amp;quot;,&lt;br /&gt;
	&amp;quot;IPAchar&amp;quot;,&lt;br /&gt;
	&amp;quot;Music&amp;quot;,&lt;br /&gt;
	&amp;quot;musical&amp;quot;,&lt;br /&gt;
	&amp;quot;Rumin&amp;quot;,&lt;br /&gt;
	&amp;quot;Ruminumerals&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- Parts of speech which will not be categorised in categories like &amp;quot;English terms spelled with É&amp;quot; if&lt;br /&gt;
-- the term is the character in question (e.g. the letter entry for English [[é]]). This contrasts with&lt;br /&gt;
-- entries like the French adjective [[m̂]], which is a one-letter word spelled with the letter.&lt;br /&gt;
data.pos_not_spelled_with_self = {&lt;br /&gt;
	&amp;quot;diacritical marks&amp;quot;,&lt;br /&gt;
	&amp;quot;Han characters&amp;quot;,&lt;br /&gt;
	&amp;quot;Han tu&amp;quot;,&lt;br /&gt;
	&amp;quot;hanja&amp;quot;,&lt;br /&gt;
	&amp;quot;hanzi&amp;quot;,&lt;br /&gt;
	&amp;quot;kanji&amp;quot;,&lt;br /&gt;
	&amp;quot;letters&amp;quot;,&lt;br /&gt;
	&amp;quot;ligatures&amp;quot;,&lt;br /&gt;
	&amp;quot;logograms&amp;quot;,&lt;br /&gt;
	&amp;quot;numeral symbols&amp;quot;,&lt;br /&gt;
	&amp;quot;numerals&amp;quot;,&lt;br /&gt;
	&amp;quot;symbols&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- Convert lists into sets.&lt;br /&gt;
for key, list in pairs(data) do&lt;br /&gt;
	data[key] = {}&lt;br /&gt;
	for _, item in ipairs(list) do&lt;br /&gt;
		data[key][item] = true&lt;br /&gt;
	end&lt;br /&gt;
end&lt;br /&gt;
&lt;br /&gt;
------ 2. Lists that will not be converted into sets. ------&lt;br /&gt;
&lt;br /&gt;
-- Short aliases accepted for parts of speech (param 2=), each mapped to its canonical name. The canonical name is&lt;br /&gt;
-- singular (not pluralized) so that [[Module:form of]] (p=/POS= param) and [[Module:links]] (pos= param) can use&lt;br /&gt;
-- this same table. Entries are listed alphabetically by alias.&lt;br /&gt;
data.pos_aliases = {&lt;br /&gt;
	a = &amp;quot;adjective&amp;quot;,&lt;br /&gt;
	adj = &amp;quot;adjective&amp;quot;,&lt;br /&gt;
	adv = &amp;quot;adverb&amp;quot;,&lt;br /&gt;
	art = &amp;quot;article&amp;quot;,&lt;br /&gt;
	cnum = &amp;quot;cardinal numeral&amp;quot;,&lt;br /&gt;
	conj = &amp;quot;conjunction&amp;quot;,&lt;br /&gt;
	conv = &amp;quot;converb&amp;quot;,&lt;br /&gt;
	det = &amp;quot;determiner&amp;quot;,&lt;br /&gt;
	int = &amp;quot;interjection&amp;quot;,&lt;br /&gt;
	intj = &amp;quot;interjection&amp;quot;,&lt;br /&gt;
	n = &amp;quot;noun&amp;quot;,&lt;br /&gt;
	num = &amp;quot;numeral&amp;quot;,&lt;br /&gt;
	onum = &amp;quot;ordinal numeral&amp;quot;,&lt;br /&gt;
	part = &amp;quot;participle&amp;quot;,&lt;br /&gt;
	pcl = &amp;quot;particle&amp;quot;,&lt;br /&gt;
	phr = &amp;quot;phrase&amp;quot;,&lt;br /&gt;
	pn = &amp;quot;proper noun&amp;quot;,&lt;br /&gt;
	postp = &amp;quot;postposition&amp;quot;,&lt;br /&gt;
	pre = &amp;quot;preposition&amp;quot;,&lt;br /&gt;
	prep = &amp;quot;preposition&amp;quot;,&lt;br /&gt;
	pro = &amp;quot;pronoun&amp;quot;,&lt;br /&gt;
	pron = &amp;quot;pronoun&amp;quot;,&lt;br /&gt;
	proper = &amp;quot;proper noun&amp;quot;,&lt;br /&gt;
	v = &amp;quot;verb&amp;quot;,&lt;br /&gt;
	vb = &amp;quot;verb&amp;quot;,&lt;br /&gt;
	vi = &amp;quot;intransitive verb&amp;quot;,&lt;br /&gt;
	vt = &amp;quot;transitive verb&amp;quot;,&lt;br /&gt;
	vti = &amp;quot;transitive and intransitive verb&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- Plural parts of speech that receive gender/number categories such as &amp;quot;German masculine nouns&amp;quot; or&lt;br /&gt;
-- &amp;quot;Russian imperfective verbs&amp;quot; when the headword has the appropriate gender/number.&lt;br /&gt;
-- NOTE(review): the value is presumably the part of speech used in the category name (proper nouns map to nouns) - confirm against the caller.&lt;br /&gt;
data.pos_for_gender_number_cat = {&lt;br /&gt;
	nouns = &amp;quot;nouns&amp;quot;,&lt;br /&gt;
	[&amp;quot;proper nouns&amp;quot;] = &amp;quot;nouns&amp;quot;,&lt;br /&gt;
	suffixes = &amp;quot;suffixes&amp;quot;,&lt;br /&gt;
	-- Verbs are listed because impf and pf are valid &amp;quot;genders&amp;quot;.&lt;br /&gt;
	verbs = &amp;quot;verbs&amp;quot;,&lt;br /&gt;
}&lt;br /&gt;
&lt;br /&gt;
-- Combining character data used when categorising unusual characters. These resolve into two patterns, used to find single combining characters (i.e. character + diacritic(s)) or double combining characters (i.e. character + diacritic(s) + character).&lt;br /&gt;
-- Each entry is either {codepoint} for one character or {first, last} for an inclusive range of code points.&lt;br /&gt;
-- The loop that follows this table passes every number through u() and joins each pair with a hyphen, so the&lt;br /&gt;
-- entries end up as pieces of a pattern character class. Gaps between neighbouring ranges are deliberate&lt;br /&gt;
-- exclusions; some of them are called out by the comments inside the table.&lt;br /&gt;
local comb_chars = {&lt;br /&gt;
	-- Combining characters that attach to a single base character.&lt;br /&gt;
	single = {&lt;br /&gt;
		{0x0300, 0x034E},&lt;br /&gt;
		-- Exclude combining grapheme joiner.&lt;br /&gt;
		{0x0350, 0x035B},&lt;br /&gt;
		{0x0363, 0x036F},&lt;br /&gt;
		{0x0483, 0x0489},&lt;br /&gt;
		{0x0591, 0x05BD},&lt;br /&gt;
		{0x05BF},&lt;br /&gt;
		{0x05C1, 0x05C2},&lt;br /&gt;
		{0x05C4, 0x05C5},&lt;br /&gt;
		{0x05C7},&lt;br /&gt;
		{0x0610, 0x061A},&lt;br /&gt;
		{0x064B, 0x065F},&lt;br /&gt;
		{0x0670},&lt;br /&gt;
		{0x06D6, 0x06DC},&lt;br /&gt;
		{0x06DF, 0x06E4},&lt;br /&gt;
		{0x06E7, 0x06E8},&lt;br /&gt;
		{0x06EA, 0x06ED},&lt;br /&gt;
		{0x0711},&lt;br /&gt;
		{0x0730, 0x074A},&lt;br /&gt;
		{0x07A6, 0x07B0},&lt;br /&gt;
		{0x07EB, 0x07F3},&lt;br /&gt;
		{0x07FD},&lt;br /&gt;
		{0x0816, 0x0819},&lt;br /&gt;
		{0x081B, 0x0823},&lt;br /&gt;
		{0x0825, 0x0827},&lt;br /&gt;
		{0x0829, 0x082D},&lt;br /&gt;
		{0x0859, 0x085B},&lt;br /&gt;
		{0x0898, 0x089F},&lt;br /&gt;
		{0x08CA, 0x08E1},&lt;br /&gt;
		{0x08E3, 0x0903},&lt;br /&gt;
		{0x093A, 0x093C},&lt;br /&gt;
		{0x093E, 0x094F},&lt;br /&gt;
		{0x0951, 0x0957},&lt;br /&gt;
		{0x0962, 0x0963},&lt;br /&gt;
		{0x0981, 0x0983},&lt;br /&gt;
		{0x09BC},&lt;br /&gt;
		{0x09BE, 0x09C4},&lt;br /&gt;
		{0x09C7, 0x09C8},&lt;br /&gt;
		{0x09CB, 0x09CD},&lt;br /&gt;
		{0x09D7},&lt;br /&gt;
		{0x09E2, 0x09E3},&lt;br /&gt;
		{0x09FE},&lt;br /&gt;
		{0x0A01, 0x0A03},&lt;br /&gt;
		{0x0A3C},&lt;br /&gt;
		{0x0A3E, 0x0A42},&lt;br /&gt;
		{0x0A47, 0x0A48},&lt;br /&gt;
		{0x0A4B, 0x0A4D},&lt;br /&gt;
		{0x0A51},&lt;br /&gt;
		{0x0A70, 0x0A71},&lt;br /&gt;
		{0x0A75},&lt;br /&gt;
		{0x0A81, 0x0A83},&lt;br /&gt;
		{0x0ABC},&lt;br /&gt;
		{0x0ABE, 0x0AC5},&lt;br /&gt;
		{0x0AC7, 0x0AC9},&lt;br /&gt;
		{0x0ACB, 0x0ACD},&lt;br /&gt;
		{0x0AE2, 0x0AE3},&lt;br /&gt;
		{0x0AFA, 0x0AFF},&lt;br /&gt;
		{0x0B01, 0x0B03},&lt;br /&gt;
		{0x0B3C},&lt;br /&gt;
		{0x0B3E, 0x0B44},&lt;br /&gt;
		{0x0B47, 0x0B48},&lt;br /&gt;
		{0x0B4B, 0x0B4D},&lt;br /&gt;
		{0x0B55, 0x0B57},&lt;br /&gt;
		{0x0B62, 0x0B63},&lt;br /&gt;
		{0x0B82},&lt;br /&gt;
		{0x0BBE, 0x0BC2},&lt;br /&gt;
		{0x0BC6, 0x0BC8},&lt;br /&gt;
		{0x0BCA, 0x0BCD},&lt;br /&gt;
		{0x0BD7},&lt;br /&gt;
		{0x0C00, 0x0C04},&lt;br /&gt;
		{0x0C3C},&lt;br /&gt;
		{0x0C3E, 0x0C44},&lt;br /&gt;
		{0x0C46, 0x0C48},&lt;br /&gt;
		{0x0C4A, 0x0C4D},&lt;br /&gt;
		{0x0C55, 0x0C56},&lt;br /&gt;
		{0x0C62, 0x0C63},&lt;br /&gt;
		{0x0C81, 0x0C83},&lt;br /&gt;
		{0x0CBC},&lt;br /&gt;
		{0x0CBE, 0x0CC4},&lt;br /&gt;
		{0x0CC6, 0x0CC8},&lt;br /&gt;
		{0x0CCA, 0x0CCD},&lt;br /&gt;
		{0x0CD5, 0x0CD6},&lt;br /&gt;
		{0x0CE2, 0x0CE3},&lt;br /&gt;
		{0x0CF3},&lt;br /&gt;
		{0x0D00, 0x0D03},&lt;br /&gt;
		{0x0D3B, 0x0D3C},&lt;br /&gt;
		{0x0D3E, 0x0D44},&lt;br /&gt;
		{0x0D46, 0x0D48},&lt;br /&gt;
		{0x0D4A, 0x0D4D},&lt;br /&gt;
		{0x0D57},&lt;br /&gt;
		{0x0D62, 0x0D63},&lt;br /&gt;
		{0x0D81, 0x0D83},&lt;br /&gt;
		{0x0DCA},&lt;br /&gt;
		{0x0DCF, 0x0DD4},&lt;br /&gt;
		{0x0DD6},&lt;br /&gt;
		{0x0DD8, 0x0DDF},&lt;br /&gt;
		{0x0DF2, 0x0DF3},&lt;br /&gt;
		{0x0E31},&lt;br /&gt;
		{0x0E34, 0x0E3A},&lt;br /&gt;
		{0x0E47, 0x0E4E},&lt;br /&gt;
		{0x0EB1},&lt;br /&gt;
		{0x0EB4, 0x0EBC},&lt;br /&gt;
		{0x0EC8, 0x0ECE},&lt;br /&gt;
		{0x0F18, 0x0F19},&lt;br /&gt;
		{0x0F35},&lt;br /&gt;
		{0x0F37},&lt;br /&gt;
		{0x0F39},&lt;br /&gt;
		{0x0F3E, 0x0F3F},&lt;br /&gt;
		{0x0F71, 0x0F84},&lt;br /&gt;
		{0x0F86, 0x0F87},&lt;br /&gt;
		{0x0F8D, 0x0F97},&lt;br /&gt;
		{0x0F99, 0x0FBC},&lt;br /&gt;
		{0x0FC6},&lt;br /&gt;
		{0x102B, 0x103E},&lt;br /&gt;
		{0x1056, 0x1059},&lt;br /&gt;
		{0x105E, 0x1060},&lt;br /&gt;
		{0x1062, 0x1064},&lt;br /&gt;
		{0x1067, 0x106D},&lt;br /&gt;
		{0x1071, 0x1074},&lt;br /&gt;
		{0x1082, 0x108D},&lt;br /&gt;
		{0x108F},&lt;br /&gt;
		{0x109A, 0x109D},&lt;br /&gt;
		{0x135D, 0x135F},&lt;br /&gt;
		{0x1712, 0x1715},&lt;br /&gt;
		{0x1732, 0x1734},&lt;br /&gt;
		{0x1752, 0x1753},&lt;br /&gt;
		{0x1772, 0x1773},&lt;br /&gt;
		{0x17B4, 0x17D3},&lt;br /&gt;
		{0x17DD},&lt;br /&gt;
		-- Exclude Mongolian variation selectors.&lt;br /&gt;
		{0x1885, 0x1886},&lt;br /&gt;
		{0x18A9},&lt;br /&gt;
		{0x1920, 0x192B},&lt;br /&gt;
		{0x1930, 0x193B},&lt;br /&gt;
		{0x1A17, 0x1A1B},&lt;br /&gt;
		{0x1A55, 0x1A5E},&lt;br /&gt;
		{0x1A60, 0x1A7C},&lt;br /&gt;
		{0x1A7F},&lt;br /&gt;
		{0x1AB0, 0x1ACE},&lt;br /&gt;
		{0x1B00, 0x1B04},&lt;br /&gt;
		{0x1B34, 0x1B44},&lt;br /&gt;
		{0x1B6B, 0x1B73},&lt;br /&gt;
		{0x1B80, 0x1B82},&lt;br /&gt;
		{0x1BA1, 0x1BAD},&lt;br /&gt;
		{0x1BE6, 0x1BF3},&lt;br /&gt;
		{0x1C24, 0x1C37},&lt;br /&gt;
		{0x1CD0, 0x1CD2},&lt;br /&gt;
		{0x1CD4, 0x1CE8},&lt;br /&gt;
		{0x1CED},&lt;br /&gt;
		{0x1CF4},&lt;br /&gt;
		{0x1CF7, 0x1CF9},&lt;br /&gt;
		{0x1DC0, 0x1DCC},&lt;br /&gt;
		{0x1DCE, 0x1DFB},&lt;br /&gt;
		{0x1DFD, 0x1DFF},&lt;br /&gt;
		{0x20D0, 0x20F0},&lt;br /&gt;
		{0x2CEF, 0x2CF1},&lt;br /&gt;
		{0x2D7F},&lt;br /&gt;
		{0x2DE0, 0x2DFF},&lt;br /&gt;
		{0x302A, 0x302F},&lt;br /&gt;
		{0x3099, 0x309A},&lt;br /&gt;
		{0xA66F, 0xA672},&lt;br /&gt;
		{0xA674, 0xA67D},&lt;br /&gt;
		{0xA69E, 0xA69F},&lt;br /&gt;
		{0xA6F0, 0xA6F1},&lt;br /&gt;
		{0xA802},&lt;br /&gt;
		{0xA806},&lt;br /&gt;
		{0xA80B},&lt;br /&gt;
		{0xA823, 0xA827},&lt;br /&gt;
		{0xA82C},&lt;br /&gt;
		{0xA880, 0xA881},&lt;br /&gt;
		{0xA8B4, 0xA8C5},&lt;br /&gt;
		{0xA8E0, 0xA8F1},&lt;br /&gt;
		{0xA8FF},&lt;br /&gt;
		{0xA926, 0xA92D},&lt;br /&gt;
		{0xA947, 0xA953},&lt;br /&gt;
		{0xA980, 0xA983},&lt;br /&gt;
		{0xA9B3, 0xA9C0},&lt;br /&gt;
		{0xA9E5},&lt;br /&gt;
		{0xAA29, 0xAA36},&lt;br /&gt;
		{0xAA43},&lt;br /&gt;
		{0xAA4C, 0xAA4D},&lt;br /&gt;
		{0xAA7B, 0xAA7D},&lt;br /&gt;
		{0xAAB0},&lt;br /&gt;
		{0xAAB2, 0xAAB4},&lt;br /&gt;
		{0xAAB7, 0xAAB8},&lt;br /&gt;
		{0xAABE, 0xAABF},&lt;br /&gt;
		{0xAAC1},&lt;br /&gt;
		{0xAAEB, 0xAAEF},&lt;br /&gt;
		{0xAAF5, 0xAAF6},&lt;br /&gt;
		{0xABE3, 0xABEA},&lt;br /&gt;
		{0xABEC, 0xABED},&lt;br /&gt;
		{0xFB1E},&lt;br /&gt;
		{0xFE20, 0xFE2F},&lt;br /&gt;
		{0x101FD},&lt;br /&gt;
		{0x102E0},&lt;br /&gt;
		{0x10376, 0x1037A},&lt;br /&gt;
		{0x10A01, 0x10A03},&lt;br /&gt;
		{0x10A05, 0x10A06},&lt;br /&gt;
		{0x10A0C, 0x10A0F},&lt;br /&gt;
		{0x10A38, 0x10A3A},&lt;br /&gt;
		{0x10A3F},&lt;br /&gt;
		{0x10AE5, 0x10AE6},&lt;br /&gt;
		{0x10D24, 0x10D27},&lt;br /&gt;
		{0x10EAB, 0x10EAC},&lt;br /&gt;
		{0x10EFD, 0x10EFF},&lt;br /&gt;
		{0x10F46, 0x10F50},&lt;br /&gt;
		{0x10F82, 0x10F85},&lt;br /&gt;
		{0x11000, 0x11002},&lt;br /&gt;
		{0x11038, 0x11046},&lt;br /&gt;
		{0x11070},&lt;br /&gt;
		{0x11073, 0x11074},&lt;br /&gt;
		{0x1107F, 0x11082},&lt;br /&gt;
		{0x110B0, 0x110BA},&lt;br /&gt;
		{0x110C2},&lt;br /&gt;
		{0x11100, 0x11102},&lt;br /&gt;
		{0x11127, 0x11134},&lt;br /&gt;
		{0x11145, 0x11146},&lt;br /&gt;
		{0x11173},&lt;br /&gt;
		{0x11180, 0x11182},&lt;br /&gt;
		{0x111B3, 0x111C0},&lt;br /&gt;
		{0x111C9, 0x111CC},&lt;br /&gt;
		{0x111CE, 0x111CF},&lt;br /&gt;
		{0x1122C, 0x11237},&lt;br /&gt;
		{0x1123E},&lt;br /&gt;
		{0x11241},&lt;br /&gt;
		{0x112DF, 0x112EA},&lt;br /&gt;
		{0x11300, 0x11303},&lt;br /&gt;
		{0x1133B, 0x1133C},&lt;br /&gt;
		{0x1133E, 0x11344},&lt;br /&gt;
		{0x11347, 0x11348},&lt;br /&gt;
		{0x1134B, 0x1134D},&lt;br /&gt;
		{0x11357},&lt;br /&gt;
		{0x11362, 0x11363},&lt;br /&gt;
		{0x11366, 0x1136C},&lt;br /&gt;
		{0x11370, 0x11374},&lt;br /&gt;
		{0x11435, 0x11446},&lt;br /&gt;
		{0x1145E},&lt;br /&gt;
		{0x114B0, 0x114C3},&lt;br /&gt;
		{0x115AF, 0x115B5},&lt;br /&gt;
		{0x115B8, 0x115C0},&lt;br /&gt;
		{0x115DC, 0x115DD},&lt;br /&gt;
		{0x11630, 0x11640},&lt;br /&gt;
		{0x116AB, 0x116B7},&lt;br /&gt;
		{0x1171D, 0x1172B},&lt;br /&gt;
		{0x1182C, 0x1183A},&lt;br /&gt;
		{0x11930, 0x11935},&lt;br /&gt;
		{0x11937, 0x11938},&lt;br /&gt;
		{0x1193B, 0x1193E},&lt;br /&gt;
		{0x11940},&lt;br /&gt;
		{0x11942, 0x11943},&lt;br /&gt;
		{0x119D1, 0x119D7},&lt;br /&gt;
		{0x119DA, 0x119E0},&lt;br /&gt;
		{0x119E4},&lt;br /&gt;
		{0x11A01, 0x11A0A},&lt;br /&gt;
		{0x11A33, 0x11A39},&lt;br /&gt;
		{0x11A3B, 0x11A3E},&lt;br /&gt;
		{0x11A47},&lt;br /&gt;
		{0x11A51, 0x11A5B},&lt;br /&gt;
		{0x11A8A, 0x11A99},&lt;br /&gt;
		{0x11C2F, 0x11C36},&lt;br /&gt;
		{0x11C38, 0x11C3F},&lt;br /&gt;
		{0x11C92, 0x11CA7},&lt;br /&gt;
		{0x11CA9, 0x11CB6},&lt;br /&gt;
		{0x11D31, 0x11D36},&lt;br /&gt;
		{0x11D3A},&lt;br /&gt;
		{0x11D3C, 0x11D3D},&lt;br /&gt;
		{0x11D3F, 0x11D45},&lt;br /&gt;
		{0x11D47},&lt;br /&gt;
		{0x11D8A, 0x11D8E},&lt;br /&gt;
		{0x11D90, 0x11D91},&lt;br /&gt;
		{0x11D93, 0x11D97},&lt;br /&gt;
		{0x11EF3, 0x11EF6},&lt;br /&gt;
		{0x11F00, 0x11F01},&lt;br /&gt;
		{0x11F03},&lt;br /&gt;
		{0x11F34, 0x11F3A},&lt;br /&gt;
		{0x11F3E, 0x11F42},&lt;br /&gt;
		{0x13440},&lt;br /&gt;
		{0x13447, 0x13455},&lt;br /&gt;
		{0x16AF0, 0x16AF4},&lt;br /&gt;
		{0x16B30, 0x16B36},&lt;br /&gt;
		{0x16F4F},&lt;br /&gt;
		{0x16F51, 0x16F87},&lt;br /&gt;
		{0x16F8F, 0x16F92},&lt;br /&gt;
		-- Exclude Khitan Small Script filler.&lt;br /&gt;
		{0x16FF0, 0x16FF1},&lt;br /&gt;
		{0x1BC9D, 0x1BC9E},&lt;br /&gt;
		{0x1CF00, 0x1CF2D},&lt;br /&gt;
		{0x1CF30, 0x1CF46},&lt;br /&gt;
		{0x1D165, 0x1D169},&lt;br /&gt;
		{0x1D16D, 0x1D172},&lt;br /&gt;
		{0x1D17B, 0x1D182},&lt;br /&gt;
		{0x1D185, 0x1D18B},&lt;br /&gt;
		{0x1D1AA, 0x1D1AD},&lt;br /&gt;
		{0x1D242, 0x1D244},&lt;br /&gt;
		{0x1DA00, 0x1DA36},&lt;br /&gt;
		{0x1DA3B, 0x1DA6C},&lt;br /&gt;
		{0x1DA75},&lt;br /&gt;
		{0x1DA84},&lt;br /&gt;
		{0x1DA9B, 0x1DA9F},&lt;br /&gt;
		{0x1DAA1, 0x1DAAF},&lt;br /&gt;
		{0x1E000, 0x1E006},&lt;br /&gt;
		{0x1E008, 0x1E018},&lt;br /&gt;
		{0x1E01B, 0x1E021},&lt;br /&gt;
		{0x1E023, 0x1E024},&lt;br /&gt;
		{0x1E026, 0x1E02A},&lt;br /&gt;
		{0x1E08F},&lt;br /&gt;
		{0x1E130, 0x1E136},&lt;br /&gt;
		{0x1E2AE},&lt;br /&gt;
		{0x1E2EC, 0x1E2EF},&lt;br /&gt;
		{0x1E4EC, 0x1E4EF},&lt;br /&gt;
		{0x1E8D0, 0x1E8D6},&lt;br /&gt;
		{0x1E944, 0x1E94A}&lt;br /&gt;
	},&lt;br /&gt;
	-- Combining characters that span two base characters (character + diacritic(s) + character).&lt;br /&gt;
	double = {&lt;br /&gt;
		{0x035C, 0x0362},&lt;br /&gt;
		{0x1DCD},&lt;br /&gt;
		{0x1DFC}&lt;br /&gt;
	},&lt;br /&gt;
	vs = { -- variation selectors; separated out so that we don&amp;#039;t get categories for them&lt;br /&gt;
		{0xFE00, 0xFE0F},&lt;br /&gt;
		{0xE0100, 0xE01EF}&lt;br /&gt;
	}&lt;br /&gt;
}&lt;br /&gt;
-- Flatten each group of code point ranges into one string that can be placed inside a pattern character class.&lt;br /&gt;
for group, ranges in pairs(comb_chars) do&lt;br /&gt;
	local pieces = {}&lt;br /&gt;
	for idx, bounds in ipairs(ranges) do&lt;br /&gt;
		local chars = {}&lt;br /&gt;
		for pos, codepoint in ipairs(bounds) do&lt;br /&gt;
			chars[pos] = u(codepoint)&lt;br /&gt;
		end&lt;br /&gt;
		-- A lone character is kept as it is; a pair is joined with a hyphen to form a range.&lt;br /&gt;
		pieces[idx] = table.concat(chars, &amp;quot;-&amp;quot;)&lt;br /&gt;
	end&lt;br /&gt;
	comb_chars[group] = table.concat(pieces)&lt;br /&gt;
end&lt;br /&gt;
-- Replace the raw groups with the finished patterns.&lt;br /&gt;
do&lt;br /&gt;
	local single, double, vs = comb_chars.single, comb_chars.double, comb_chars.vs&lt;br /&gt;
	local single_vs = single .. vs&lt;br /&gt;
	local both = single .. double .. vs&lt;br /&gt;
	-- Matches one character that is not a combining character of any kind.&lt;br /&gt;
	local base = &amp;quot;[^&amp;quot; .. both .. &amp;quot;]&amp;quot;&lt;br /&gt;
	comb_chars = {&lt;br /&gt;
		-- Base character followed by single combining characters or variation selectors, up to the next non-combining position.&lt;br /&gt;
		combined_single = base .. &amp;quot;[&amp;quot; .. single_vs .. &amp;quot;]+%f[^&amp;quot; .. both .. &amp;quot;]&amp;quot;,&lt;br /&gt;
		-- Base character, optional single combining characters, at least one double combining character, then the second character with its own combining characters.&lt;br /&gt;
		combined_double = base .. &amp;quot;[&amp;quot; .. single_vs .. &amp;quot;]*[&amp;quot; .. double .. &amp;quot;]+[&amp;quot; .. both .. &amp;quot;]*.[&amp;quot; .. single_vs .. &amp;quot;]*&amp;quot;,&lt;br /&gt;
		diacritics_single = &amp;quot;[&amp;quot; .. single .. &amp;quot;]&amp;quot;,&lt;br /&gt;
		diacritics_double = &amp;quot;[&amp;quot; .. double .. &amp;quot;]&amp;quot;&lt;br /&gt;
	}&lt;br /&gt;
end&lt;br /&gt;
&lt;br /&gt;
-- Get the tables of unsupported characters and unsupported titles from [[Module:links/data]] and invert them. For the&lt;br /&gt;
-- titles this means the keys are pagenames and the values are canonical titles.&lt;br /&gt;
local unsupported_characters, unsupported_titles&lt;br /&gt;
do&lt;br /&gt;
	-- Returns a new table in which every value of source has become a key that maps to its original key.&lt;br /&gt;
	local function invert(source)&lt;br /&gt;
		local inverted = {}&lt;br /&gt;
		for original_key, original_value in pairs(source) do&lt;br /&gt;
			inverted[original_value] = original_key&lt;br /&gt;
		end&lt;br /&gt;
		return inverted&lt;br /&gt;
	end&lt;br /&gt;
	local links_data = require(&amp;quot;Module:links/data&amp;quot;)&lt;br /&gt;
	unsupported_characters = invert(links_data.unsupported_characters)&lt;br /&gt;
	unsupported_titles = invert(links_data.unsupported_titles)&lt;br /&gt;
end&lt;br /&gt;
data.unsupported_titles = unsupported_titles&lt;br /&gt;
&lt;br /&gt;
------ 3. Page-wide processing (so that it only needs to be done once per page). ------&lt;br /&gt;
&lt;br /&gt;
--Get the pagename.&lt;br /&gt;
-- If the subpage text starts with &amp;quot;Unsupported titles/&amp;quot;, the callback flags the page in data.unsupported_title and&lt;br /&gt;
-- replaces the whole text: with the entry from unsupported_titles if there is one, otherwise with the remainder&lt;br /&gt;
-- after substituting each backtick-delimited escape through unsupported_characters. The parentheses around the&lt;br /&gt;
-- inner gsub drop its second return value (the substitution count).&lt;br /&gt;
local pagename = title.subpageText&lt;br /&gt;
	:gsub(&amp;quot;^Unsupported titles/(.*)&amp;quot;, function(m)&lt;br /&gt;
		data.unsupported_title = true&lt;br /&gt;
		return unsupported_titles[m] or (m:gsub(&amp;quot;`.-`&amp;quot;, unsupported_characters))&lt;br /&gt;
	end)&lt;br /&gt;
-- Save pagename, as local variable will be destructively modified.&lt;br /&gt;
data.pagename = pagename&lt;br /&gt;
-- Decompose the pagename in Unicode normalization form D.&lt;br /&gt;
data.decompose_pagename = mw.ustring.toNFD(pagename)&lt;br /&gt;
-- Explode the current page name into a character table, taking decomposed combining characters into account.&lt;br /&gt;
-- explode_pagename is a set (unit of text -&amp;gt; true), so a repeated unit is stored once, while pagename_len counts&lt;br /&gt;
-- every unit that is consumed, repeats included.&lt;br /&gt;
local explode_pagename = {}&lt;br /&gt;
local pagename_len = 0&lt;br /&gt;
-- Substitution callback: records the matched text as one unit and returns an empty string, which removes the&lt;br /&gt;
-- match from the pagename so that a later pass cannot count it again.&lt;br /&gt;
local function explode(char)&lt;br /&gt;
	explode_pagename[char] = true&lt;br /&gt;
	pagename_len = pagename_len + 1&lt;br /&gt;
	return &amp;quot;&amp;quot;&lt;br /&gt;
end&lt;br /&gt;
-- The order of the three passes matters: double combining sequences are consumed first, then single combining&lt;br /&gt;
-- sequences, and finally whatever is left, one UTF-8 encoded character (lead byte plus continuation bytes) at a time.&lt;br /&gt;
-- NOTE(review): rsub is defined outside this section; presumably a Unicode-aware gsub - confirm.&lt;br /&gt;
pagename = rsub(pagename, comb_chars.combined_double, explode)&lt;br /&gt;
pagename = rsub(pagename, comb_chars.combined_single, explode)&lt;br /&gt;
	:gsub(&amp;quot;[%z\1-\127\194-\244][\128-\191]*&amp;quot;, explode)&lt;br /&gt;
&lt;br /&gt;
-- Export the finished patterns, the set of units and the unit count.&lt;br /&gt;
data.comb_chars = comb_chars&lt;br /&gt;
data.explode_pagename = explode_pagename&lt;br /&gt;
data.pagename_len = pagename_len&lt;br /&gt;
&lt;br /&gt;
-- Generate DEFAULTSORT: encode the saved pagename with mw.text.encode, turn it into a sort key using the language&lt;br /&gt;
-- object for code mul, and hand the result to the DEFAULTSORT parser function.&lt;br /&gt;
data.encoded_pagename = mw.text.encode(data.pagename)&lt;br /&gt;
do&lt;br /&gt;
	local mul = require(&amp;quot;Module:languages&amp;quot;).getByCode(&amp;quot;mul&amp;quot;)&lt;br /&gt;
	data.pagename_defaultsort = mul:makeSortKey(data.encoded_pagename)&lt;br /&gt;
end&lt;br /&gt;
frame:callParserFunction(&amp;quot;DEFAULTSORT&amp;quot;, data.pagename_defaultsort)&lt;br /&gt;
&lt;br /&gt;
------ 4. Parse page for maintenance categories. ------&lt;br /&gt;
-- Raw wikitext of the page. getContent() returns nil when there is no page to read (for example a page that does&lt;br /&gt;
-- not exist yet), which would make every content: call below raise an error. Fall back to an empty string, so&lt;br /&gt;
-- that the scans simply find nothing and the tables exported below are still set.&lt;br /&gt;
local content = title:getContent() or &amp;quot;&amp;quot;&lt;br /&gt;
-- Raw wikitext use of {{DEFAULTSORT:}} and aliases.&lt;br /&gt;
local defaultsort = {&lt;br /&gt;
	[&amp;quot;DEFAULTSORT&amp;quot;] = true,&lt;br /&gt;
	[&amp;quot;DEFAULTSORTKEY&amp;quot;] = true,&lt;br /&gt;
	[&amp;quot;DEFAULTCATEGORYSORT&amp;quot;] = true&lt;br /&gt;
}&lt;br /&gt;
-- The pattern captures any magic word that starts with DEFAULT; only the names listed above count. One hit is&lt;br /&gt;
-- enough, so the loop stops at the first one.&lt;br /&gt;
for magic_word in content:gmatch(&amp;quot;{{%s*(DEFAULT.-):.-}}&amp;quot;) do&lt;br /&gt;
	if defaultsort[magic_word] then&lt;br /&gt;
		data.pagename_defaultsort_conflict = frame:expandTemplate{&lt;br /&gt;
			title = &amp;quot;tracking category&amp;quot;,&lt;br /&gt;
			args = {&amp;quot;Pages with DEFAULTSORT conflicts&amp;quot;}&lt;br /&gt;
		}&lt;br /&gt;
		break&lt;br /&gt;
	end&lt;br /&gt;
end&lt;br /&gt;
-- Raw wikitext use of {{DISPLAYTITLE:}}.&lt;br /&gt;
if content:find(&amp;quot;{{%s*DISPLAYTITLE:.-}}&amp;quot;) then&lt;br /&gt;
	data.pagename_displaytitle_conflict = frame:expandTemplate{&lt;br /&gt;
		title = &amp;quot;tracking category&amp;quot;,&lt;br /&gt;
		args = {&amp;quot;Pages with DISPLAYTITLE conflicts&amp;quot;}&lt;br /&gt;
	}&lt;br /&gt;
end&lt;br /&gt;
-- Raw wikitext use of a topic or langname category.&lt;br /&gt;
local wikitext_topic_cat = {}&lt;br /&gt;
local wikitext_langname_cat = {}&lt;br /&gt;
-- Link prefixes (compared in upper case) that mark a link as a category.&lt;br /&gt;
local prefixes = {&lt;br /&gt;
	[&amp;quot;CAT&amp;quot;] = true,&lt;br /&gt;
	[&amp;quot;CATEGORY&amp;quot;] = true&lt;br /&gt;
}&lt;br /&gt;
-- Walk over every [[prefix:target]] link, ignoring spaces and underscores around the prefix, colon and target.&lt;br /&gt;
for prefix, cat in content:gmatch(&amp;quot;%[%[[ _]*(%a-)[ _]*:[ _]*(.-)[ _]*%]%]&amp;quot;) do&lt;br /&gt;
	if prefixes[prefix:upper()] then&lt;br /&gt;
		-- A category name that starts with a code and a colon is a topic category; remember the code.&lt;br /&gt;
		local code = cat:match(&amp;quot;^([%w%-.]+):&amp;quot;)&lt;br /&gt;
		if code then&lt;br /&gt;
			wikitext_topic_cat[code] = true&lt;br /&gt;
		else&lt;br /&gt;
			-- Drop the sort key after the pipe and collapse runs of spaces and underscores into one space.&lt;br /&gt;
			cat = cat:gsub(&amp;quot;|.*&amp;quot;, &amp;quot;&amp;quot;)&lt;br /&gt;
				:gsub(&amp;quot;[ _]+&amp;quot;, &amp;quot; &amp;quot;)&lt;br /&gt;
			-- Record every prefix of the category name that ends at the end of a word (first word, first two&lt;br /&gt;
			-- words, and so on up to the whole name). The frontier set contains %z so that the end of the&lt;br /&gt;
			-- string counts as a word end as well.&lt;br /&gt;
			local n = cat:find(&amp;quot;.%f[%z _]&amp;quot;)&lt;br /&gt;
			while n do&lt;br /&gt;
				local name = cat:sub(1, n)&lt;br /&gt;
				wikitext_langname_cat[name] = true&lt;br /&gt;
				n = cat:find(&amp;quot;.%f[%z _]&amp;quot;, n + 1)&lt;br /&gt;
			end&lt;br /&gt;
		end&lt;br /&gt;
	end&lt;br /&gt;
end&lt;br /&gt;
data.wikitext_topic_cat = wikitext_topic_cat&lt;br /&gt;
data.wikitext_langname_cat = wikitext_langname_cat&lt;br /&gt;
-- Manual &amp;quot;terms spelled with&amp;quot; categories.&lt;br /&gt;
-- NOTE(review): track is defined outside this section; presumably it records a tracking entry - confirm.&lt;br /&gt;
if content:find(&amp;quot;terms spelled with&amp;quot;) then&lt;br /&gt;
	track(&amp;quot;terms-spelled-with&amp;quot;)&lt;br /&gt;
end&lt;br /&gt;
&lt;br /&gt;
return data&lt;/div&gt;</summary>
		<author><name>bob&gt;Djpwikiadmin</name></author>
	</entry>
</feed>