Module:User:Suzukaze-c/zh/data/info

From Wiktionary, the free dictionary
Jump to navigation Jump to search

This is a private module sandbox of Suzukaze-c, for their own experimentation. Items in this module may be added and removed at Suzukaze-c's discretion; do not rely on this module's stability.


-- TODO: rename to "zh/data/varieties"?

local export = {}

-- Per-variety metadata, keyed by a short variety code ("m", "c-t", "mn", ...).
--
-- Fields present on every record (all strings; "" means "not set"):
--   name   / name_w     name of the lect and the page it links to
--   var    / var_w      name of the variety and the page it links to
--   region / region_w   name of the locality and the page it links to
--   rom    / rom_w      name of the main romanisation and the page it links to
--   iso                 language code
--
-- Records that enumerate romanisation schemes additionally carry
-- ("mc", "oc", "cl" and "cl-vn" have none of these):
--   roms_order      sequence of scheme codes
--   rom_default     a single scheme code
--   rom_secondary   sequence of scheme codes (may be empty)
--   rom_disabled    table keyed by scheme code (may be empty)
--   roms            scheme code -> display name
--   roms_w          scheme code -> link; most values are page titles, but a
--                   few are ready-made wikitext (see "c-t" and "mn-t")
--   roms_names_wp   same table as roms_w (legacy key, filled in by the loop
--                   that follows the literal)
--   roms_names_qualifiers   optional; scheme code -> qualifier text
--
-- NOTE(review): how consumers interpret rom_default / rom_secondary /
-- rom_disabled is not visible in this module.
export.data = {
	["m"] = {
		["name"] = "Mandarin",
		["name_w"] = "w:Mandarin Chinese",
		["var"] = "Standard Chinese", -- most of the time
		["var_w"] = "w:Standard Chinese",
		["region"] = "", -- not Beijing?
		["region_w"] = "",
		["rom"] = "Pinyin",
		["rom_w"] = "w:Pinyin",
		["iso"] = "cmn",

		["roms_order"] = { "PY", "ZY", "WG", "GR", "IPA" },
		["rom_default"] = "PY",
		["rom_secondary"] = { "ZY" },
		["rom_disabled"] = { },
		["roms"] = {
			["PY"] = "Pinyin",
			["ZY"] = "Zhuyin",
			["WG"] = "Wade-Giles",
			["GR"] = "Gwoyeu Romatzyh",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["PY"] = "w:Pinyin",
			["ZY"] = "w:Zhuyin",
			["WG"] = "w:Wade-Giles",
			["GR"] = "w:Gwoyeu Romatzyh",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["m-s"] = {
		["name"] = "Mandarin",
		["name_w"] = "w:Mandarin Chinese",
		["var"] = "Sichuanese",
		["var_w"] = "w:Sichuanese dialect",
		["region"] = "Chengdu",
		["region_w"] = "w:Chengdu",
		["rom"] = "Sichuanese Pinyin",
		["rom_w"] = "w:Sichuanese Pinyin",
		["iso"] = "cmn",

		["roms_order"] = { "PY", "SWZ", "IPA" },
		["rom_default"] = "PY",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["PY"] = "Sichuanese Pinyin",
			["SWZ"] = "Xin Wenz",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["PY"] = "w:Sichuanese Pinyin",
			["SWZ"] = "w:zh:四川话拉丁化新文字",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["dg"] = {
		["name"] = "Mandarin",
		["name_w"] = "w:Mandarin Chinese",
		["var"] = "Dungan",
		["var_w"] = "w:Dungan language",
		["region"] = "Standard Gansu",
		["region_w"] = "w:Gansu",
		["rom"] = "Dungan Cyrillic alphabet",
		["rom_w"] = "w:Dungan language#Writing system",
		["iso"] = "dng",

		["roms_order"] = { "CYRL", "IPA" },
		["rom_default"] = "CYRL",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["CYRL"] = "Cyrillic",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["CYRL"] = "w:Dungan language#Writing system",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["c"] = {
		["name"] = "Cantonese",
		["name_w"] = "w:Cantonese",
		["var"] = "Standard Cantonese",
		["var_w"] = "w:Standard Cantonese", -- redirects to [[w:Cantonese]]
		["region"] = "", -- GZ/HK?
		["region_w"] = "",
		["rom"] = "Jyutping",
		["rom_w"] = "w:Jyutping",
		["iso"] = "yue",

		["roms_order"] = { "JP", "YALE", "CPY", "GD", "IPA" },
		["rom_default"] = "JP",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["JP"] = "Jyutping",
			["YALE"] = "Yale",
			["CPY"] = "Cantonese Pinyin",
			["GD"] = "Guangdong Romanization",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["JP"] = "w:Jyutping",
			["YALE"] = "w:Yale romanization of Cantonese",
			["CPY"] = "w:Cantonese Pinyin",
			["GD"] = "w:Guangdong Romanization#Cantonese",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["c-t"] = {
		["name"] = "Cantonese",
		["name_w"] = "w:Cantonese",
		["var"] = "Taishanese",
		["var_w"] = "w:Taishanese",
		["region"] = "Taicheng",
		["region_w"] = "w:Taicheng Subdistrict",
		["rom"] = "Wiktionary",
		["rom_w"] = "Wiktionary:About Chinese/Cantonese/Taishanese",
		["iso"] = "yue",

		["roms_order"] = { "WT", "IPA", "SLI", "GCH", "DLI" },
		["rom_default"] = "IPA",
		["rom_secondary"] = { },
		-- Unlike rom_secondary, this is keyed by scheme code rather than a list.
		["rom_disabled"] = {
			["SLI"] = 1,
			["GCH"] = 1,
			["DLI"] = 1,
		},
		["roms"] = {
			["WT"] = "Wiktionary",
			["IPA"] = "IPA",
			["SLI"] = "Stephen Li",
			["GCH"] = "Gene Chin",
			["DLI"] = "Defense Language Institute",
		},
		-- SLI and GCH hold complete external-link wikitext, not page titles;
		-- DLI has no link.
		["roms_w"] = {
			["WT"] = "Wiktionary:About Chinese/Cantonese/Taishanese",
			["IPA"] = "w:International Phonetic Alphabet",
			["SLI"] = "[http://www.stephen-li.com/TaishaneseVocabulary/Taishanese.html Stephen Li]",
			["GCH"] = "[https://sites.fitnyc.edu/users/gene_chin/hoisanva/index.htm Gene M Chin]",
			["DLI"] = "",
		},
	},
	["g"] = {
		["name"] = "Gan",
		["name_w"] = "w:Gan Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Nanchang",
		["region_w"] = "w:Nanchang dialect",
		["rom"] = "Wiktionary",
		["rom_w"] = "Wiktionary:About Chinese/Gan",
		["iso"] = "gan",

		["roms_order"] = { "WT", "IPA" },
		["rom_default"] = "IPA",
		["rom_secondary"] = { "WT" },
		["rom_disabled"] = { },
		["roms"] = {
			["WT"] = "Wiktionary",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["WT"] = "Wiktionary:About Chinese/Gan",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["h-s"] = {
		["name"] = "Hakka",
		["name_w"] = "w:Hakka Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Sixian",
		["region_w"] = "w:Sixian dialect",
		["rom"] = "",
		["rom_w"] = "",
		["iso"] = "hak",

		["roms_order"] = { "PFS", "HRS", "HFPY", "IPA" },
		["rom_default"] = "PFS",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["PFS"] = "Pha̍k-fa-sṳ",
			["HRS"] = "Hakka Romanization System",
			["HFPY"] = "Hagfa Pinyim",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["PFS"] = "w:Pha̍k-fa-sṳ",
			["HRS"] = "w:zh:客家語拼音方案",
			["HFPY"] = "w:Hagfa Pinyim",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["h-m"] = {
		["name"] = "Hakka",
		["name_w"] = "w:Hakka Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Meixian",
		["region_w"] = "w:Meixian dialect",
		["rom"] = "",
		["rom_w"] = "",
		["iso"] = "hak",

		["roms_order"] = { "GD", "IPA" },
		["rom_default"] = "GD",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["GD"] = "Guangdong Romanization",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["GD"] = "w:Guangdong Romanization#Hakka",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["j"] = {
		["name"] = "Jin",
		["name_w"] = "w:Jin Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Taiyuan",
		["region_w"] = "w:zh:太原話",
		["rom"] = "Wiktionary",
		["rom_w"] = "Wiktionary:About Chinese/Jin",
		["iso"] = "cjy",

		["roms_order"] = { "WT", "IPA", "IPA-nosandhi" },
		["rom_default"] = "IPA",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["WT"] = "Wiktionary",
			["IPA"] = "IPA",
			["IPA-nosandhi"] = "IPA",
		},
		["roms_w"] = {
			["WT"] = "Wiktionary:About Chinese/Jin",
			["IPA"] = "w:International Phonetic Alphabet",
			["IPA-nosandhi"] = "w:International Phonetic Alphabet",
		},
		["roms_names_qualifiers"] = {
			["IPA"] = "old-style",
			["IPA-nosandhi"] = "old-style, no sandhi",
		},
	},
	["mb"] = {
		["name"] = "Min Bei",
		["name_w"] = "w:Northern Min",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Jian'ou",
		["region_w"] = "w:Jian'ou dialect",
		["rom"] = "Kienning Colloquial Romanized",
		["rom_w"] = "w:Kienning Colloquial Romanized",
		["iso"] = "mnp",

		["roms_order"] = { "KCR", "IPA" },
		["rom_default"] = "KCR",
		["rom_secondary"] = { "IPA" },
		["rom_disabled"] = { },
		["roms"] = {
			["KCR"] = "Kienning Colloquial Romanized",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["KCR"] = "w:Kienning Colloquial Romanized",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["md"] = {
		["name"] = "Min Dong",
		["name_w"] = "w:Eastern Min",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Fuzhou",
		["region_w"] = "w:Fuzhou dialect",
		["rom"] = "Bàng-uâ-cê",
		["rom_w"] = "w:Bàng-uâ-cê",
		["iso"] = "cdo",

		["roms_order"] = { "BUC", "IPA" },
		["rom_default"] = "BUC",
		["rom_secondary"] = { "IPA" },
		["rom_disabled"] = { },
		["roms"] = {
			["BUC"] = "Bàng-uâ-cê",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["BUC"] = "w:Bàng-uâ-cê",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["mn"] = {
		["name"] = "Min Nan",
		["name_w"] = "w:Southern Min",
		["var"] = "Hokkien",
		["var_w"] = "w:Hokkien",
		["region"] = "", -- various
		["region_w"] = "",
		["rom"] = "Pe̍h-ōe-jī",
		["rom_w"] = "w:Pe̍h-ōe-jī",
		["iso"] = "nan",

		["roms_order"] = { "POJ", "TL", "PSDB", "IPA" },
		["rom_default"] = "POJ",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["POJ"] = "Pe̍h-ōe-jī",
			["TL"] = "Tâi-lô",
			["PSDB"] = "Phofsit Daibuun",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["POJ"] = "w:Pe̍h-ōe-jī",
			["TL"] = "w:Tâi-lô",
			["PSDB"] = "w:Phofsit Daibuun",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["mn-t"] = {
		["name"] = "Min Nan",
		["name_w"] = "w:Southern Min",
		["var"] = "Teochew",
		["var_w"] = "w:Teochew dialect",
		["region"] = "", -- various
		["region_w"] = "",
		["rom"] = "Peng'im",
		["rom_w"] = "w:Peng'im",
		["iso"] = "nan",

		["roms_order"] = { "GD", "POJ", "IPA" },
		["rom_default"] = "GD",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["GD"] = "Guangdong Romanization",
			["POJ"] = "Pe̍h-ōe-jī-like",
			["IPA"] = "IPA",
		},
		-- POJ holds complete wikitext (a piped link plus suffix), not a page title.
		["roms_w"] = {
			["GD"] = "w:Guangdong Romanization#Teochew",
			["POJ"] = "[[w:Pe̍h-ōe-jī|Pe̍h-ōe-jī]]-like",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["w-sh"] = {
		["name"] = "Wu",
		["name_w"] = "w:Wu Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Shanghai",
		["region_w"] = "w:Shanghainese",
		["rom"] = "Wiktionary",
		["rom_w"] = "Wiktionary:About Chinese/Wu",
		["iso"] = "wuu",

		["roms_order"] = { "WT", "IPA" },
		["rom_default"] = "IPA",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["WT"] = "Wiktionary",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			["WT"] = "Wiktionary:About Chinese/Wu",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["w-wz"] = {
		["name"] = "Wu",
		["name_w"] = "w:Wu Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Wenzhou",
		["region_w"] = "w:Wenzhounese",
		["rom"] = "Wiktionary",
		["rom_w"] = "Wiktionary:About Chinese/Wenzhou",
		["iso"] = "wuu",

		["roms_order"] = { "WT", "IPA" },
		["rom_default"] = "IPA",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["WT"] = "Wiktionary",
			["IPA"] = "IPA",
		},
		["roms_w"] = {
			-- NOTE(review): rom_w above points at ".../Wenzhou" while this
			-- points at ".../Wu"; confirm which page is intended.
			["WT"] = "Wiktionary:About Chinese/Wu",
			["IPA"] = "w:International Phonetic Alphabet",
		},
	},
	["x"] = {
		["name"] = "Xiang",
		["name_w"] = "w:Xiang Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "Changsha",
		["region_w"] = "w:Changsha dialect",
		["rom"] = "Wiktionary",
		["rom_w"] = "Wiktionary:About Chinese/Xiang",
		["iso"] = "hsn",

		["roms_order"] = { "WT", "IPA", "IPA-新派" },
		["rom_default"] = "IPA",
		["rom_secondary"] = { },
		["rom_disabled"] = { },
		["roms"] = {
			["WT"] = "Wiktionary",
			["IPA"] = "IPA",
			["IPA-新派"] = "IPA",
		},
		["roms_w"] = {
			-- Previously pointed at the Jin page (copy-paste from "j");
			-- now matches this record's rom_w.
			["WT"] = "Wiktionary:About Chinese/Xiang",
			["IPA"] = "w:International Phonetic Alphabet",
			["IPA-新派"] = "w:International Phonetic Alphabet",
		},
		["roms_names_qualifiers"] = {
			["IPA"] = "old-style",
			["IPA-新派"] = "new-style",
		},
	},

	["mc"] = {
		["name"] = "Middle Chinese",
		["name_w"] = "w:Middle Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "",
		["region_w"] = "",
		["rom"] = "",
		["rom_w"] = "",
		["iso"] = "ltc",
	},
	["oc"] = {
		["name"] = "Old Chinese",
		["name_w"] = "w:Old Chinese",
		["var"] = "",
		["var_w"] = "",
		["region"] = "",
		["region_w"] = "",
		["rom"] = "",
		["rom_w"] = "",
		["iso"] = "och",
	},

	["cl"] = {
		["name"] = "Classical Chinese",
		["name_w"] = "w:Classical Chinese",
		["var"] = "Classical Chinese",
		["var_w"] = "w:Classical Chinese",
		["region"] = "",
		["region_w"] = "",
		["rom"] = "Pinyin",
		["rom_w"] = "w:Pinyin",
		["iso"] = "cmn", -- for zh-usex purposes; canonical is "lzh"
	},
	["cl-vn"] = {
		["name"] = "Classical Chinese",
		["name_w"] = "w:Classical Chinese",
		["var"] = "Classical Chinese",
		["var_w"] = "w:Classical Chinese",
		["region"] = "",
		["region_w"] = "",
		["rom"] = "Sino-Vietnamese",
		["rom_w"] = "w:Sino-Vietnamese vocabulary",
		["iso"] = "vi",
	},
}

-- The per-scheme link table used to be spelled "roms_w" in some records and
-- "roms_names_wp" in others, so a reader of either key got nil for part of
-- the data. The literal above now uses "roms_w" throughout; expose the same
-- table under the legacy key so readers of either spelling keep working.
for _, variety in pairs(export.data) do
	if variety["roms_w"] ~= nil then
		variety["roms_names_wp"] = variety["roms_w"]
	end
end

-- Hand the module table back to whoever loaded this chunk; the records live in export.data.
return export

--[[
proposals
  - splitting "oc" into "oc-zs":Zhengzhang and "oc-bs":Baxter-Sagart
      - simplify zh-pron input (esp. since they don't seem to feature the same set of characters)
  - moving "Wiktionary:About Chinese/*" pages to the "Appendix:" namespace
      - moving the Baxter-Sagart notation notes out of zh-pron
]]