Module:languages/data/exceptional: Difference between revisions
No edit summary |
No edit summary |
||
| (48 intermediate revisions by 6 users not shown) | |||
| Line 13: | Line 13: | ||
local m = {} | local m = {} | ||
m["lhaz"] = { | |||
"Lhazareen", | |||
nil, | |||
"plai", | |||
"Latn", | |||
ancestors = "pls-pro", | |||
type = "conlang" | |||
} | |||
m["meer"] = { | |||
"Meereenese Valyrian", | |||
nil, | |||
"conlang-fam", | |||
"Latn", | |||
ancestors = "qhv", | |||
type = "conlang" | |||
} | |||
m["asta"] = { | |||
"Astapori Valyrian", | |||
nil, | |||
"conlang-fam", | |||
"Latn", | |||
ancestors = "qhv", | |||
type = "conlang" | |||
} | |||
m["ghis"] = { | |||
"Ghiscari", | |||
nil, | |||
"conlang-fam", | |||
"Latn", | |||
type = "conlang" | |||
} | |||
m["assh"] = { | |||
"Asshai'i", | |||
nil, | |||
"conlang-fam", | |||
"Latn", | |||
type = "conlang" | |||
} | |||
m["estu"] = { | |||
"Esturian", | |||
nil, | |||
"cel-his", | |||
"Latn", | |||
entry_name = { | |||
from = {"‧"}, | |||
to = {""}, | |||
}, | |||
sort_key = { | |||
remove_diacritics = c.hook, | |||
}, | |||
ancestors = "cel-pro", | |||
type = "conlang", | |||
} | |||
m["naur"] = { | |||
"Naurese", | |||
nil, | |||
"roa-ocr", | |||
"Latn", | |||
entry_name = { | |||
from = {"‧"}, | |||
to = {""}, | |||
}, | |||
sort_key = { | |||
remove_diacritics = c.hook, | |||
}, | |||
ancestors = "la", | |||
type = "conlang", | |||
} | |||
m["envu"] = { | |||
"Enventian", | |||
nil, | |||
"gmw", | |||
"Latn", | |||
entry_name = { | |||
from = {"‧"}, | |||
to = {""}, | |||
}, | |||
sort_key = { | |||
remove_diacritics = c.hook, | |||
}, | |||
ancestors = "ole-envu, pro-gmw", | |||
type = "conlang", | |||
main_category = "word" | |||
} | |||
m["ole-envu"] = { | |||
"Old Enventian", | |||
nil, | |||
"gmw", | |||
"Latn", | |||
entry_name = { | |||
from = {"‧"}, | |||
to = {""}, | |||
}, | |||
sort_key = { | |||
remove_diacritics = c.hook, | |||
}, | |||
ancestors = "pro-gmw", | |||
type = "conlang", | |||
} | |||
m["lyti-mid"] = { | m["lyti-mid"] = { | ||
| Line 35: | Line 142: | ||
"Afrihili", | "Afrihili", | ||
384707, | 384707, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 74: | Line 181: | ||
"Proto-Alopian", | "Proto-Alopian", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
sort_key = { | sort_key = { | ||
| Line 111: | Line 218: | ||
"Bolak", | "Bolak", | ||
2909283, | 2909283, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 118: | Line 225: | ||
"Black Speech", | "Black Speech", | ||
686210, | 686210, | ||
" | "conlang-fam", | ||
"Latn, Teng", | "Latn, Teng", | ||
} | } | ||
| Line 125: | Line 232: | ||
"Communicationssprache", | "Communicationssprache", | ||
35227, | 35227, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 139: | Line 239: | ||
"Eloi", | "Eloi", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 146: | Line 246: | ||
"Goa'uld", | "Goa'uld", | ||
19823, | 19823, | ||
" | "conlang-fam", | ||
"Latn, Egyp, Mero", | "Latn, Egyp, Mero", | ||
} | } | ||
| Line 153: | Line 253: | ||
"Lapine", | "Lapine", | ||
6488195, | 6488195, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 160: | Line 260: | ||
"Mandalorian", | "Mandalorian", | ||
54289, | 54289, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 167: | Line 267: | ||
"Mundolinco", | "Mundolinco", | ||
851355, | 851355, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 174: | Line 274: | ||
"Na'vi", | "Na'vi", | ||
316939, | 316939, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 181: | Line 281: | ||
"Noxilo", | "Noxilo", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 191: | Line 291: | ||
"ǂA Ṇṵĩ", | "ǂA Ṇṵĩ", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
sort_key = { | sort_key = { | ||
| Line 232: | Line 332: | ||
"Unas", | "Unas", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 244: | Line 344: | ||
ancestors = "mish-pro, ine-pro", | ancestors = "mish-pro, ine-pro", | ||
type = "reconstructed,conlang", | type = "reconstructed,conlang", | ||
} | |||
m["aoka"] = { | |||
"Ah Oka", | |||
nil, | |||
"sntl", | |||
"Latn", | |||
ancestors="sntl-pro, hauh", | |||
type = "conlang" | |||
} | } | ||
| Line 249: | Line 358: | ||
"Kotava", | "Kotava", | ||
1377116, | 1377116, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 256: | Line 365: | ||
"Proto-Axwan", | "Proto-Axwan", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "reconstructed,conlang", | type = "reconstructed,conlang", | ||
| Line 282: | Line 391: | ||
"Bemé", | "Bemé", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang" | type = "conlang" | ||
| Line 318: | Line 427: | ||
"Gwaxol", | "Gwaxol", | ||
nil, | nil, | ||
"wasc", | "wasc-fam", | ||
"Latn", | "Latn", | ||
ancestors = "wasc, nent-pro", | ancestors = "wasc, nent-pro", | ||
| Line 330: | Line 439: | ||
to = {"¹", "²", "³", "⁴", "⁵", "⁶"}, | to = {"¹", "²", "³", "⁴", "⁵", "⁶"}, | ||
} | } | ||
} | |||
m["hauh"] = { | |||
"Hau-Hau", | |||
nil, | |||
"sntl", | |||
"Latn", | |||
ancestors="sntl-pro", | |||
type = "conlang" | |||
} | } | ||
| Line 344: | Line 462: | ||
"Hazulacanol", | "Hazulacanol", | ||
nil, | nil, | ||
"wasc", | "wasc-fam", | ||
"Latn", | "Latn", | ||
ancestors = "wasc", | ancestors = "wasc", | ||
type = "conlang", | type = "conlang", | ||
} | } | ||
m["xodc"] = { | m["xodc"] = { | ||
"Xodec", | "Xodec", | ||
nil, | nil, | ||
"wasc", | "wasc-fam", | ||
"Latn", | "Latn", | ||
ancestors = "hzlc", | ancestors = "hzlc", | ||
| Line 364: | Line 481: | ||
"North Xodec", | "North Xodec", | ||
nil, | nil, | ||
"wasc", | "wasc-fam", | ||
"Latn", | "Latn", | ||
ancestors = "xodc, hzlc", | ancestors = "xodc, hzlc", | ||
| Line 381: | Line 498: | ||
"Kilīmos-sāîl", | "Kilīmos-sāîl", | ||
nil, | nil, | ||
"wasc", | "wasc-fam", | ||
"Latn", | "Latn", | ||
ancestors = "wasc", | ancestors = "wasc", | ||
| Line 390: | Line 507: | ||
"Knrawi", | "Knrawi", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn, Wacg", | ||
type = "conlang", | type = "conlang", | ||
} | } | ||
| Line 407: | Line 524: | ||
"Central Isles Creole", | "Central Isles Creole", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "knra, qsc", | ancestors = "knra, qsc", | ||
| Line 416: | Line 533: | ||
"Maahaat", | "Maahaat", | ||
nil, | nil, | ||
"slaq", | "slaq-fam", | ||
"Latn", | "Latn", | ||
ancestors = "slaq-pro", | ancestors = "slaq-pro", | ||
| Line 425: | Line 542: | ||
"Maazha", | "Maazha", | ||
nil, | nil, | ||
"slaq", | "slaq-fam", | ||
"Latn", | "Latn", | ||
ancestors = "slaq-pro", | ancestors = "slaq-pro", | ||
| Line 442: | Line 559: | ||
"Naedzur", | "Naedzur", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "naedz-old", | ancestors = "naedz-old", | ||
| Line 451: | Line 568: | ||
"Old Naedzur", | "Old Naedzur", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 459: | Line 576: | ||
"Nentammmi", | "Nentammmi", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "reconstructed,conlang", | type = "reconstructed,conlang", | ||
| Line 476: | Line 593: | ||
"Misa Okan", | "Misa Okan", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 484: | Line 601: | ||
"Po Po", | "Po Po", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 501: | Line 618: | ||
"Sokya", | "Sokya", | ||
nil, | nil, | ||
"wasc", | "wasc-fam", | ||
"Latn", | "Latn", | ||
ancestors = "qsc", | ancestors = "qsc", | ||
| Line 510: | Line 627: | ||
"Rokadong", | "Rokadong", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Roka", | "Roka", | ||
ancestors = "annen", | ancestors = "annen", | ||
| Line 519: | Line 636: | ||
"Ankistran substrate", | "Ankistran substrate", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 527: | Line 644: | ||
"Kairitelan", | "Kairitelan", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "annen", | ancestors = "annen", | ||
| Line 536: | Line 653: | ||
"Liðakuin", | "Liðakuin", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "anldk-old", | ancestors = "anldk-old", | ||
| Line 545: | Line 662: | ||
"Debazi", | "Debazi", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "anmnk", | ancestors = "anmnk", | ||
| Line 554: | Line 671: | ||
"Old Liðakuin", | "Old Liðakuin", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "anwgs", | ancestors = "anwgs", | ||
| Line 563: | Line 680: | ||
"Classical Munkai", | "Classical Munkai", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "anpmk", | ancestors = "anpmk", | ||
| Line 572: | Line 689: | ||
"Proto-Munkai", | "Proto-Munkai", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "anplm", | ancestors = "anplm", | ||
| Line 581: | Line 698: | ||
"Proto-Leyen-Mangellian", | "Proto-Leyen-Mangellian", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 589: | Line 706: | ||
"Proto-Nenta", | "Proto-Nenta", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 597: | Line 714: | ||
"Proto-West-Gomensayan", | "Proto-West-Gomensayan", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 605: | Line 722: | ||
"Hatzonian", | "Hatzonian", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "ankar", | ancestors = "ankar", | ||
| Line 614: | Line 731: | ||
"Common Kardonian", | "Common Kardonian", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "ankar", | ancestors = "ankar", | ||
| Line 623: | Line 740: | ||
"Speodan", | "Speodan", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "ankar", | ancestors = "ankar", | ||
| Line 632: | Line 749: | ||
"Calubian", | "Calubian", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "ankar", | ancestors = "ankar", | ||
| Line 641: | Line 758: | ||
"Dyamantian", | "Dyamantian", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "ankar", | ancestors = "ankar", | ||
| Line 650: | Line 767: | ||
"Middle Kardonian", | "Middle Kardonian", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 725: | Line 842: | ||
type = "conlang", | type = "conlang", | ||
} | } | ||
m["thus"] = { | |||
"Thustani", | |||
nil, | |||
"qfa-iso", | |||
"Latn", | |||
ancestors = "thus-old", | |||
type = "conlang" | |||
} | |||
m["thus-old"] = { | |||
"Old Thustani", | |||
nil, | |||
"qfa-iso", | |||
"Latn", | |||
type = "conlang" | |||
} | |||
m["elva"] = { | m["elva"] = { | ||
"Elvarri", | "Elvarri", | ||
"lxel, lxel-nor", | |||
" | "conlang-fam", | ||
"Latn", | |||
ancestors = "lxel-pro,lxel-nor-pro,elva-ear", | |||
type="conlang" | |||
} | |||
m["elva-ear"] = { | |||
"Early Elvarri", | |||
"lxel, lxel-nor", | |||
"conlang-fam", | |||
"Latn", | |||
ancestors = "lxel-pro,lxel-nor-pro", | |||
type="conlang" | |||
} | |||
m["sadl"] = { | |||
"Sadling", | |||
"lxel, lxel-sou", | |||
"conlang-fam", | |||
"Latn", | "Latn", | ||
ancestors = "lxel-pro, lxel-sou-pro", | |||
type="conlang" | type="conlang" | ||
} | } | ||
| Line 740: | Line 894: | ||
"Latn, Runr", | "Latn, Runr", | ||
ancestors = "gem-pro", | ancestors = "gem-pro", | ||
type = "conlang", | |||
} | |||
m["cacr"] = { | |||
"Cabot Creole", | |||
nil, | |||
"iro-nor, iro", | |||
"Latn", | |||
sort_key = { | |||
from = {"%-"}, | |||
to = {""}, | |||
}, | |||
display_text = { | |||
from = {"^(.+):"}, -- colon, except if beginning with it | |||
to = {"%1꞉"}, --modifier letter colon | |||
}, | |||
ancestors = "iro-pro, iro-nor-pro", | |||
type = "conlang", | type = "conlang", | ||
} | } | ||
| Line 768: | Line 939: | ||
ancestors = "vdnc-pro", | ancestors = "vdnc-pro", | ||
type = "conlang", | type = "conlang", | ||
} | |||
m["gnym"] = { | |||
"Ganymedian", | |||
nil, | |||
"conlang-fam", | |||
"Latn", | |||
type = "conlang" | |||
} | } | ||
| Line 792: | Line 971: | ||
"Jokelang 2", | "Jokelang 2", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 829: | Line 1,008: | ||
"Kílta", | "Kílta", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
sort_key = { | sort_key = { | ||
| Line 845: | Line 1,024: | ||
} | } | ||
m[" | m["lxel-pro"] = { | ||
" | "Proto-Luxelvic", | ||
nil, | nil, | ||
" | "lxel", | ||
"Latn", | "Latn", | ||
type = "conlang", | sort_key = { | ||
} | from = {"[-*·]"}, | ||
to = {""}, | |||
remove_diacritics = c.macron .. c.breve, | |||
}, | |||
type = "reconstructed,conlang", | |||
} | |||
m["lxel-nor-pro"] = { | |||
"Proto–North Luxelvic", | |||
nil, | |||
"lxel-nor,lxel", | |||
"Latn", | |||
sort_key = { | |||
from = {"[-*·]"}, | |||
to = {""}, | |||
remove_diacritics = c.macron .. c.breve, | |||
}, | |||
ancestors="lxel-pro", | |||
type = "reconstructed,conlang", | |||
} | |||
m["lxel-sou-pro"] = { | |||
"Proto–South Luxelvic", | |||
nil, | |||
"lxel-sou,lxel", | |||
"Latn", | |||
sort_key = { | |||
from = {"[-*·]"}, | |||
to = {""}, | |||
remove_diacritics = c.macron .. c.breve, | |||
}, | |||
ancestors="lxel-pro", | |||
type = "reconstructed,conlang", | |||
} | |||
m["sasr"] = { | |||
"Ancient Sassrian", | |||
nil, | |||
"sasr", | |||
"Latn", | |||
type = "conlang", | |||
} | |||
m["lyti"] = { | m["lyti"] = { | ||
"Oltic", | "Oltic", | ||
| Line 928: | Line 1,147: | ||
"Nawuhu", | "Nawuhu", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 945: | Line 1,164: | ||
"Pine", | "Pine", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Teul, Tugv", | "Teul, Tugv", | ||
entry_name = { | entry_name = { | ||
from = {"‧"}, | from = {"‧$", "‧"}, | ||
to = {""}, | to = {"-", ""}, | ||
}, | }, | ||
sort_key = { | sort_key = { | ||
remove_diacritics = c.hook, | remove_diacritics = c.hook, | ||
from = {"%-"}, | |||
to = {""}, | |||
}, | }, | ||
type = "conlang", | type = "conlang", | ||
| Line 963: | Line 1,184: | ||
"Old Ponish", | "Old Ponish", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "gmw-pro", | ancestors = "gmw-pro", | ||
| Line 972: | Line 1,193: | ||
"Ponish", | "Ponish", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
ancestors = "old-pnsh", | ancestors = "old-pnsh", | ||
| Line 981: | Line 1,202: | ||
"Sekhulla", | "Sekhulla", | ||
nil, | nil, | ||
"wasc", | "wasc-fam", | ||
"Latn", | "Latn", | ||
ancestors = "wasc", | ancestors = "wasc", | ||
| Line 1,024: | Line 1,245: | ||
"Proto-Slaq", | "Proto-Slaq", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "reconstructed,conlang", | type = "reconstructed,conlang", | ||
| Line 1,050: | Line 1,271: | ||
"Toki Pona", | "Toki Pona", | ||
36846, | 36846, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 1,058: | Line 1,279: | ||
"Uchee", | "Uchee", | ||
nil, | nil, | ||
"slaq", | "slaq-fam", | ||
"Latn", | "Latn", | ||
ancestors = "slaq-pro", | ancestors = "slaq-pro", | ||
| Line 1,075: | Line 1,296: | ||
"Urka", | "Urka", | ||
nil, | nil, | ||
"slaq", | "slaq-fam", | ||
"Latn", | "Latn", | ||
ancestors = "slaq-pro", | ancestors = "slaq-pro", | ||
| Line 1,096: | Line 1,317: | ||
"Wascotl", | "Wascotl", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "reconstructed,conlang", | type = "reconstructed,conlang", | ||
| Line 1,104: | Line 1,325: | ||
"Wedge", | "Wedge", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type="conlang", | type="conlang", | ||
| Line 1,112: | Line 1,333: | ||
"Chiingimec", | "Chiingimec", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Cyrl", | "Cyrl", | ||
translit = "xchc-translit", | translit = "xchc-translit", | ||
| Line 1,221: | Line 1,442: | ||
"Proto-Plains", | "Proto-Plains", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "reconstructed,conlang" | type = "reconstructed,conlang" | ||
| Line 1,265: | Line 1,486: | ||
"Qut", | "Qut", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "conlang", | type = "conlang", | ||
| Line 1,476: | Line 1,697: | ||
ancestors = "vhus, phus, non, gem-pro", | ancestors = "vhus, phus, non, gem-pro", | ||
type = "conlang", | type = "conlang", | ||
} | |||
m["sdno"] = { | |||
"Sudrey Norse", | |||
nil, | |||
"gem", | |||
"Latn", | |||
ancestors = "non, gem-pro", | |||
type = "conlang", | |||
sort_key = {remove_diacritics = c.grave .. c.acute}, | |||
standard_chars = "AaÀàBbCcDdEeÈèFfGgHhIiÌìLlMmNnOoÒòPpRrSsTtUuÙùVv" .. c.punc, | |||
} | } | ||
| Line 1,482: | Line 1,714: | ||
nil, | nil, | ||
"gem", | "gem", | ||
" | "Latn", | ||
ancestors = "non, gem-pro", | ancestors = "sdno, non, gem-pro", | ||
type = "conlang", | type = "conlang", | ||
sort_key = {remove_diacritics = c.grave .. c.acute}, | |||
standard_chars = "AaÀàBbCcDdEeÈèFfGgHhIiÌìLlMmNnOoÒòPpRrSsTtUuÙùVvZz" .. c.punc, | |||
} | } | ||
m["opch"] = { | |||
"Opach", | |||
nil, | |||
"ine", | |||
"Latn", | |||
ancestors = "mpch, epch, opch-pro, ine-pro", | |||
type = "conlang", | |||
} | |||
| Line 2,106: | Line 2,346: | ||
"nic-grs", | "nic-grs", | ||
"Latn", | "Latn", | ||
strip_diacritics = {remove_diacritics = c.grave .. c.acute .. c.circ .. c.tilde .. c.macron}, | |||
} | } | ||
m["alv-bgu"] = { | m["alv-bgu"] = { | ||
" | "Bainouk Gubeeher", | ||
17002646, | 17002646, | ||
"alv-bny", | "alv-bny", | ||
| Line 2,287: | Line 2,527: | ||
"Adûni", | "Adûni", | ||
1232159, | 1232159, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,295: | Line 2,535: | ||
"Belter Creole", | "Belter Creole", | ||
108055510, | 108055510, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,308: | Line 2,548: | ||
"Bolak", | "Bolak", | ||
2909283, | 2909283, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,316: | Line 2,556: | ||
"Black Speech", | "Black Speech", | ||
686210, | 686210, | ||
" | "conlang-fam", | ||
"Latn, Teng", | "Latn, Teng", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,324: | Line 2,564: | ||
"Communicationssprache", | "Communicationssprache", | ||
35227, | 35227, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,332: | Line 2,572: | ||
"Dothraki", | "Dothraki", | ||
2914733, | 2914733, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,340: | Line 2,580: | ||
"Eloi", | "Eloi", | ||
nil, | nil, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,348: | Line 2,588: | ||
"Goa'uld", | "Goa'uld", | ||
19823, | 19823, | ||
" | "conlang-fam", | ||
"Latn, Egyp, Mero", | "Latn, Egyp, Mero", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,356: | Line 2,596: | ||
"Lapine", | "Lapine", | ||
6488195, | 6488195, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,364: | Line 2,604: | ||
"Mandalorian", | "Mandalorian", | ||
54289, | 54289, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,372: | Line 2,612: | ||
"Mundolinco", | "Mundolinco", | ||
851355, | 851355, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,380: | Line 2,620: | ||
"Naʼvi", | "Naʼvi", | ||
316939, | 316939, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 2,485: | Line 2,717: | ||
"Little Swanport", | "Little Swanport", | ||
6652138, | 6652138, | ||
"qfa-unc", | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 2,889: | Line 3,121: | ||
"bnt-ngu", | "bnt-ngu", | ||
"Latn", | "Latn", | ||
strip_diacritics = {remove_diacritics = c.grave .. c.acute}, | |||
} | } | ||
| Line 2,899: | Line 3,131: | ||
type = "reconstructed", | type = "reconstructed", | ||
sort_key = "bnt-pro-sortkey", | sort_key = "bnt-pro-sortkey", | ||
} | |||
m["bnt-sab-pro"] = { | |||
"Proto-Sabaki", | |||
nil, -- Q2209395 is the code for the Sabaki family | |||
"bnt-sab", | |||
"Latn", | |||
type = "reconstructed", | |||
} | } | ||
| Line 3,060: | Line 3,300: | ||
"Latn", | "Latn", | ||
type = "reconstructed", | type = "reconstructed", | ||
strip_diacritics = { | |||
from = {"q̣", "p̣", "ʓ", "ċ"}, | from = {"q̣", "p̣", "ʓ", "ċ"}, | ||
to = {"q̇", "ṗ", "ʒ", "c̣"} | to = {"q̇", "ṗ", "ʒ", "c̣"} | ||
| Line 3,072: | Line 3,312: | ||
"Latn", | "Latn", | ||
type = "reconstructed", | type = "reconstructed", | ||
strip_diacritics = { | |||
from = {"q̣", "p̣", "ʓ", "ċ"}, | from = {"q̣", "p̣", "ʓ", "ċ"}, | ||
to = {"q̇", "ṗ", "ʒ", "c̣"} | to = {"q̇", "ṗ", "ʒ", "c̣"} | ||
| Line 3,115: | Line 3,355: | ||
"cel-bry", | "cel-bry", | ||
"Latn, Polyt", | "Latn, Polyt", | ||
sort_key = { | sort_key = { | ||
Latn = "cel-bry-pro-sortkey", | Latn = "cel-bry-pro-sortkey", | ||
}, | }, | ||
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,135: | Line 3,366: | ||
"cel", | "cel", | ||
"Latn, Polyt, Ital", | "Latn, Polyt, Ital", | ||
strip_diacritics = { | |||
Latn = {remove_diacritics = c.macron .. c.breve .. c.diaer}, | Latn = {remove_diacritics = c.macron .. c.breve .. c.diaer}, | ||
}, | }, | ||
sort_key = { | sort_key = { | ||
Latn = "cel-bry-pro-sortkey", | Latn = "cel-bry-pro-sortkey", | ||
}, | }, | ||
-- Ital translit in [[Module:scripts/data]] | |||
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,345: | Line 3,569: | ||
"Mlym, Knda", | "Mlym, Knda", | ||
ancestors = "ml, tcy", | ancestors = "ml, tcy", | ||
translit | -- Knda translit in [[Module:scripts/data]] | ||
-- Mlym translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,364: | Line 3,586: | ||
"dra-kan", | "dra-kan", | ||
"Knda", | "Knda", | ||
-- Knda translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,380: | Line 3,602: | ||
"dra-kan", | "dra-kan", | ||
"Knda", | "Knda", | ||
-- Knda translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,424: | Line 3,646: | ||
m["egx-dem"] = { | m["egx-dem"] = { | ||
"Demotic", | "Demotic Egyptian", | ||
36765, | 36765, | ||
"egx", | "egx", | ||
"Latn, Egyd, Polyt", | "Latn, Egyd, Polyt", | ||
sort_key = { | sort_key = { | ||
Latn = { | Latn = { | ||
| Line 3,443: | Line 3,656: | ||
to = {p[1], p[2], p[3], p[4], p[5], p[6], p[7], p[8], p[9], p[10], p[11], p[12], p[13], p[15], p[16], p[16], p[17], p[14], p[19], p[18], p[20], p[21], p[22], p[23], p[24], p[23], p[25], p[26], p[26]} | to = {p[1], p[2], p[3], p[4], p[5], p[6], p[7], p[8], p[9], p[10], p[11], p[12], p[13], p[15], p[16], p[16], p[17], p[14], p[19], p[18], p[20], p[21], p[22], p[23], p[24], p[23], p[25], p[26], p[26]} | ||
}, | }, | ||
}, | }, | ||
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,603: | Line 3,816: | ||
"gmq-eas", | "gmq-eas", | ||
"Latn, Runr", | "Latn, Runr", | ||
strip_diacritics = {remove_diacritics = c.macron}, | |||
} | } | ||
| Line 3,619: | Line 3,832: | ||
"gmq-eas", | "gmq-eas", | ||
"Latn, Runr", | "Latn, Runr", | ||
strip_diacritics = {remove_diacritics = c.macron}, | |||
} | } | ||
| Line 3,743: | Line 3,956: | ||
m["gn-cls"] = { | m["gn-cls"] = { | ||
"Classical | "Classical Guarani", | ||
17478065, | 17478065, | ||
" | "gn", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 3,759: | Line 3,971: | ||
Grek = "el-translit", | Grek = "el-translit", | ||
}, | }, | ||
-- Grek display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,779: | Line 3,983: | ||
Grek = "el-translit", | Grek = "el-translit", | ||
}, | }, | ||
-- Grek display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,801: | Line 3,997: | ||
}, | }, | ||
override_translit = true, | override_translit = true, | ||
strip_diacritics = { | |||
Cyrl = {remove_diacritics = c.acute}, | Cyrl = {remove_diacritics = c.acute}, | ||
}, | }, | ||
-- Grek display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,824: | Line 4,014: | ||
remove_diacritics = c.grave .. c.acute .. c.macron .. c.breve .. c.caron | remove_diacritics = c.grave .. c.acute .. c.macron .. c.breve .. c.caron | ||
}}, | }}, | ||
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
-- NOTE: formerly no translit specified for Polyt; presumably an accidental omission; if not, set Polyt = false in | |||
-- the translit section | |||
} | } | ||
m["hmn-pro"] = { | m["hmn-pro"] = { | ||
"Proto- | "Proto-Hmongic", | ||
116773210, | 116773210, | ||
"hmn", | "hmn", | ||
| Line 3,835: | Line 4,028: | ||
m["hmx-mie-pro"] = { | m["hmx-mie-pro"] = { | ||
"Proto- | "Proto-Mienic", | ||
116773229, | 116773229, | ||
"hmx-mie", | "hmx-mie", | ||
| Line 3,890: | Line 4,083: | ||
translit = { | translit = { | ||
Deva = "sa-translit", | Deva = "sa-translit", | ||
Shrd | -- Shrd translit in [[Module:scripts/data]] | ||
Sidd | -- Sidd translit in [[Module:scripts/data]] | ||
}, | }, | ||
} | } | ||
| Line 3,902: | Line 4,095: | ||
ancestors = "sa", | ancestors = "sa", | ||
translit = { | translit = { | ||
Brah | -- Brah translit in [[Module:scripts/data]] | ||
Khar = "Khar-translit", | Khar = "Khar-translit", | ||
}, | }, | ||
} | |||
m["inc-dng-pro"] = { | |||
"Proto-Dangari", | |||
nil, | |||
"inc-dng", | |||
"Latn", | |||
type = "reconstructed", | |||
} | } | ||
| Line 3,912: | Line 4,113: | ||
"inc-bas", | "inc-bas", | ||
"Brah, Sidd", | "Brah, Sidd", | ||
-- Brah, Sidd translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 3,982: | Line 4,180: | ||
"inc-hie", | "inc-hie", | ||
"Deva, Kthi, ur-Arab", | "Deva, Kthi, ur-Arab", | ||
strip_diacritics = { | |||
from = {"هٔ", "ۂ"}, -- character "ۂ" code U+06C2 to "ه" and "هٔ" | from = {"هٔ", "ۂ"}, -- character "ۂ" code U+06C2 to "ه" and "هٔ" (U+0647 + U+0654) to "ه" | ||
to = {"ہ", "ہ"}, | to = {"ہ", "ہ"}, | ||
remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna .. c.superalef | remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna .. c.superalef | ||
| Line 4,014: | Line 4,212: | ||
"inc-hiw", | "inc-hiw", | ||
"Deva, ur-Arab", | "Deva, ur-Arab", | ||
strip_diacritics = { | |||
from = {"هٔ", "ۂ"}, -- character "ۂ" code U+06C2 to "ه" and "هٔ" | from = {"هٔ", "ۂ"}, -- character "ۂ" code U+06C2 to "ه" and "هٔ" (U+0647 + U+0654) to "ه" | ||
to = {"ہ", "ہ"}, | to = {"ہ", "ہ"}, | ||
remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna .. c.superalef | remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna .. c.superalef | ||
| Line 4,041: | Line 4,239: | ||
["pa-Arab"] = "pa-Arab-translit", | ["pa-Arab"] = "pa-Arab-translit", | ||
}, | }, | ||
strip_diacritics = {remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun}, | |||
} | } | ||
| Line 4,084: | Line 4,282: | ||
"ine", | "ine", | ||
"Polyt", | "Polyt", | ||
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 4,115: | Line 4,310: | ||
"xme", | "xme", | ||
"Polyt, Latn", | "Polyt, Latn", | ||
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | |||
} | |||
m["xme-mid"] = { | m["xme-mid"] = { | ||
"Middle Median", | "Middle Median", | ||
| Line 4,142: | Line 4,326: | ||
"fa-Arab, Latn, Hebr", | "fa-Arab, Latn, Hebr", | ||
ancestors = "xme-mid", | ancestors = "xme-mid", | ||
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 4,352: | Line 4,537: | ||
"itc-sbl", | "itc-sbl", | ||
"Ital, Polyt, Latn", | "Ital, Polyt, Latn", | ||
-- Ital translit in [[Module:scripts/data]] (NOTE: formerly not present, probably an accidental omission) | |||
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 4,374: | Line 4,549: | ||
translit = s["jpx-translit"], | translit = s["jpx-translit"], | ||
display_text = s["jpx-displaytext"], | display_text = s["jpx-displaytext"], | ||
strip_diacritics = s["jpx-stripdiacritics"], | |||
sort_key = s["jpx-sortkey"], | sort_key = s["jpx-sortkey"], | ||
} | } | ||
| Line 4,463: | Line 4,638: | ||
ancestors = "okm", | ancestors = "okm", | ||
translit = "okm-translit", | translit = "okm-translit", | ||
-- Kore strip_diacritics in [[Module:scripts/data]] | |||
} | } | ||
| Line 4,515: | Line 4,690: | ||
"Idiom Neutral", | "Idiom Neutral", | ||
35847, | 35847, | ||
" | "conlang-fam", | ||
"Latn", | "Latn", | ||
type = "appendix-constructed", | type = "appendix-constructed", | ||
| Line 4,568: | Line 4,743: | ||
nil, | nil, | ||
"Phnx", | "Phnx", | ||
-- Phnx translit in [[Module:scripts/data]] (NOTE: not present before, presumably an accidental omission) | |||
} | } | ||
| Line 5,198: | Line 5,374: | ||
} | } | ||
m[" | m["ngf-bin-pro"] = { | ||
" | "Proto-Binanderean", | ||
137881672, | |||
" | "ngf-bin", | ||
"Latn", | "Latn", | ||
type = "reconstructed", | |||
} | } | ||
| Line 5,344: | Line 5,508: | ||
"Latn", | "Latn", | ||
type = "reconstructed", | type = "reconstructed", | ||
} | |||
-- Entry keyed "njo-jgl", present only in the new revision: name "Chungli Ao",
-- numeric ID 55607615 (presumably a Wikidata item number -- confirm),
-- family code "sit-aao", script "Latn".
m["njo-jgl"] = { | |||
"Chungli Ao", | |||
55607615, | |||
"sit-aao", | |||
"Latn", | |||
} | } | ||
| Line 5,411: | Line 5,582: | ||
m["omq-sjq"] = { | m["omq-sjq"] = { | ||
"San Juan Quiahije Chatino", | "San Juan Quiahije Chatino", | ||
138330751, | |||
"omq-cha", | "omq-cha", | ||
"Latn", | "Latn", | ||
| Line 5,431: | Line 5,602: | ||
m["omq-tri-pro"] = { | m["omq-tri-pro"] = { | ||
"Proto- | "Proto-Triqui", | ||
116773817, | 116773817, | ||
"omq-tri", | "omq-tri", | ||
| Line 5,494: | Line 5,665: | ||
} | } | ||
-- Entry keyed "paa-kmn" in the new revision: name "Kómnzo", numeric ID
-- 18344310 (presumably a Wikidata item number -- confirm), family code
-- "paa-wko", script "Latn".
-- NOTE(review): both the key and the family code differ from the old revision,
-- whose values are truncated ("paa-") in this diff rendering.
m["paa- | m["paa-kmn"] = { | ||
"Kómnzo", | "Kómnzo", | ||
18344310, | 18344310, | ||
"paa- | "paa-wko", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 5,504: | Line 5,675: | ||
"Kuwani", | "Kuwani", | ||
6449056, | 6449056, | ||
" | "qfa-unc", -- poorly attested, possibly the same as or related to Kalabra | ||
"Latn", | "Latn", | ||
} | |||
-- Entry keyed "paa-lei", present only in the new revision: name "Leitre",
-- numeric ID 85776228 (presumably a Wikidata item number -- confirm),
-- family code "paa-isk".
-- NOTE(review): unlike the neighbouring entries, no script code (e.g. "Latn")
-- is listed as a fourth positional field -- confirm the omission is intended.
m["paa-lei"] = { | |||
"Leitre", | |||
85776228, | |||
"paa-isk", | |||
} | } | ||
| Line 5,519: | Line 5,696: | ||
"Nungon", | "Nungon", | ||
128807788, | 128807788, | ||
" | "ngf-ynu", | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 5,905: | Line 6,082: | ||
3094838, | 3094838, | ||
"roa-git", | "roa-git", | ||
ancestors = "pms-old", | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 5,913: | Line 6,091: | ||
"roa-git", | "roa-git", | ||
"Latn", | "Latn", | ||
ancestors = "pms-old", | |||
} | } | ||
| Line 5,957: | Line 6,136: | ||
"roa-gap", | "roa-gap", | ||
"Latn", | "Latn", | ||
strip_diacritics = {remove_diacritics = c.grave .. c.acute .. c.circ}, | |||
} | } | ||
| Line 6,008: | Line 6,187: | ||
"Baenan", | "Baenan", | ||
3401998, | 3401998, | ||
"qfa-unc", -- extinct, poorly attested; only known through 9 words | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,015: | Line 6,194: | ||
"Bagua", | "Bagua", | ||
5390321, | 5390321, | ||
"qfa-unc", -- extinct, poorly attested; possibly Cariban | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,037: | Line 6,216: | ||
"Cacán", | "Cacán", | ||
945482, | 945482, | ||
"qfa-unc", -- extinct, poorly attested; no consensus on classification | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,074: | Line 6,253: | ||
"Chirino", | "Chirino", | ||
5390321, | 5390321, | ||
"qfa-unc", -- extinct, only four words known; possibly related to Candoshi-Shapra (cbu) | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,117: | Line 6,296: | ||
"Comechingon", | "Comechingon", | ||
6644203, | 6644203, | ||
"qfa-unc", -- extinct, poorly attested; no consensus on classification | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,124: | Line 6,303: | ||
"Chono", | "Chono", | ||
5104704, | 5104704, | ||
"qfa-unc", -- extinct, poorly attested; no consensus on classification, possibly spurious | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,131: | Line 6,310: | ||
"Cañari", | "Cañari", | ||
5055572, | 5055572, | ||
"qfa-unc", -- extinct, poorly attested; possibly Chimuan or Barbacoan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,152: | Line 6,331: | ||
"Copallén", | "Copallén", | ||
5390321, | 5390321, | ||
"qfa-unc", -- extinct, only four words attested; possibly Cholonan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,166: | Line 6,345: | ||
"Catuquinaru", | "Catuquinaru", | ||
16858455, | 16858455, | ||
"qfa-unc", -- extinct, poorly attested; vocabulary does not resemble other languages | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,173: | Line 6,352: | ||
"Culli", | "Culli", | ||
2879660, | 2879660, | ||
"qfa-unc", -- extinct, poorly attested; often considered an isolate | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,180: | Line 6,359: | ||
"Cueva", | "Cueva", | ||
5192644, | 5192644, | ||
"qfa-unc", -- extinct, poorly attested; possibly Chocoan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,187: | Line 6,366: | ||
"Esmeralda", | "Esmeralda", | ||
3058083, | 3058083, | ||
"qfa-unc", -- extinct, poorly attested; possibly related to Yaruro | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,201: | Line 6,380: | ||
"Gamela", | "Gamela", | ||
5403661, | 5403661, | ||
"qfa-unc", -- extinct, poorly attested; possibly an isolate | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,215: | Line 6,394: | ||
"Guamo", | "Guamo", | ||
5613495, | 5613495, | ||
"qfa-unc", -- extinct; "Kaufman (1990) finds a connection with the Chapacuran languages convincing." [Wikipedia] Considered an isolate by Campbell (2024). | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,265: | Line 6,444: | ||
"Katembri", | "Katembri", | ||
6375925, | 6375925, | ||
"qfa-unc", -- extinct, poorly attested; "Kaufman (1990) has linked it with the nearly extinct Taruma, although this has not been accepted by other scholars." [Wikipedia] | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,272: | Line 6,451: | ||
"Malalí", | "Malalí", | ||
6741212, | 6741212, | ||
"sai-mje", -- considered the most divergent Maxakalían language (a subdivision of Macro-Jê), for which we have no entry | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,279: | Line 6,458: | ||
"Maratino", | "Maratino", | ||
6755055, | 6755055, | ||
"qfa-unc", -- extinct, poorly attested; possibly Uto-Aztecan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,286: | Line 6,465: | ||
"Matanawi", | "Matanawi", | ||
6786047, | 6786047, | ||
"qfa-unc", -- extinct; either an isolate or distantly related to the Muran languages; Campbell (2024) lists it as an isolate, Glottolog gives it as unclassified | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,293: | Line 6,472: | ||
"Mocana", | "Mocana", | ||
3402048, | 3402048, | ||
"qfa-unc", -- extinct, poorly attested; given as part of the Malibu languages (geographic grouping; not a clade) | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,314: | Line 6,493: | ||
"Malibu", | "Malibu", | ||
3402048, | 3402048, | ||
"qfa-unc", -- extinct, poorly attested; given as part of the Malibu languages (geographic grouping; not a clade) | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,328: | Line 6,507: | ||
"Mucuchí", | "Mucuchí", | ||
6931290, | 6931290, | ||
nil, | nil, -- generally considered Timotean, for which we have no entry | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,342: | Line 6,521: | ||
"Muzo", | "Muzo", | ||
6644203, | 6644203, | ||
"qfa-unc", -- extinct language of Colombia, poorly attested; may be Pijao (Cariban) | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,349: | Line 6,528: | ||
"Maynas", | "Maynas", | ||
16919393, | 16919393, | ||
"sai-cah", -- per Campbell (2024); formerly considered unclassified | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,356: | Line 6,535: | ||
"Natú", | "Natú", | ||
9006749, | 9006749, | ||
"qfa-unc", -- extinct, poorly attested; "only Greenberg dares to classify [it]".[Wikipedia, quoting Moseley, Christopher; Asher, R. E.; Tait, Mary (1994), Atlas of the world's languages] | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,385: | Line 6,564: | ||
"Palta", | "Palta", | ||
3042978, | 3042978, | ||
"qfa-unc", -- extinct, unclassified; possibly Chicham | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,399: | Line 6,578: | ||
"Paratió", | "Paratió", | ||
16890038, | 16890038, | ||
"qfa-unc", -- extinct, poorly attested; possibly Xukuruan | |||
"Latn", | |||
} | |||
-- Entry keyed "sai-peb", present only in the new revision: name "Peba",
-- numeric ID 3373890 (presumably a Wikidata item number -- confirm),
-- family code "sai-pey", script "Latn".
m["sai-peb"] = { | |||
"Peba", | |||
3373890, | |||
"sai-pey", | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,406: | Line 6,592: | ||
"Panzaleo", | "Panzaleo", | ||
3123275, | 3123275, | ||
"qfa-unc", -- extinct, unclassified; possibly Paezan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,413: | Line 6,599: | ||
"Puruhá", | "Puruhá", | ||
3410994, | 3410994, | ||
"qfa-unc", -- extinct, poorly attested; possibly in a family with Cañari | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,420: | Line 6,606: | ||
"Patagón", | "Patagón", | ||
128807870, | 128807870, | ||
"sai-tar", -- extinct, only known from 4 words, which suggest Cariban lineage (Campbell 2024) | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,448: | Line 6,634: | ||
"Quimbaya", | "Quimbaya", | ||
7272043, | 7272043, | ||
"qfa-unc", -- extinct, might not exist; few known words | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,462: | Line 6,648: | ||
"Rabona", | "Rabona", | ||
6644203, | 6644203, | ||
"qfa-unc", -- extinct, poorly attested, mostly plant names; possibly Candoshi-Shapra | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,469: | Line 6,655: | ||
"Ramanos", | "Ramanos", | ||
16902824, | 16902824, | ||
"qfa-unc", -- extinct, poorly attested, possibly an isolate; per Glottolog: "the minuscule wordlist ... shows no convincing resemblances to surrounding languages" | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,476: | Line 6,662: | ||
"Sácata", | "Sácata", | ||
5390321, | 5390321, | ||
"qfa-unc", -- extinct, only 3 words known; possibly Candoshí or Arawakan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,483: | Line 6,669: | ||
"Sanaviron", | "Sanaviron", | ||
16895999, | 16895999, | ||
"qfa-unc", -- extinct, unclassified; no consensus on classification | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,497: | Line 6,683: | ||
"Sechura", | "Sechura", | ||
7442912, | 7442912, | ||
"qfa-unc", -- extinct, poorly attested; possibly Catacaoan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,504: | Line 6,690: | ||
"Sinúfana", | "Sinúfana", | ||
7525275, | 7525275, | ||
"qfa-unc", -- moribund, poorly attested; possibly Chocoan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,519: | Line 6,705: | ||
"Tabancale", | "Tabancale", | ||
5390321, | 5390321, | ||
"qfa-unc", -- extinct, only 5 words known; no obvious connections, might be an isolate | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,526: | Line 6,712: | ||
"Tallán", | "Tallán", | ||
16910468, | 16910468, | ||
"qfa-unc", -- extinct, poorly attested; might be Catacaoan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,548: | Line 6,734: | ||
"Teushen", | "Teushen", | ||
3519243, | 3519243, | ||
"qfa-unc", -- probably extinct by the 1950's; possibly Chonan | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,555: | Line 6,741: | ||
"Timote", | "Timote", | ||
7806995, | 7806995, | ||
nil, | nil, -- possibly in a small Timotean family | ||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,569: | Line 6,755: | ||
"Tarairiú", | "Tarairiú", | ||
7685313, | 7685313, | ||
"qfa-unc", -- extinct, too poorly attested to classify | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,576: | Line 6,762: | ||
"Waitaká", | "Waitaká", | ||
16918610, | 16918610, | ||
"qfa-unc", -- extinct, possibly Purian | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,605: | Line 6,791: | ||
"Xocó", | "Xocó", | ||
12953620, | 12953620, | ||
"qfa-unc", -- extinct and poorly attested; not clear if one or three languages | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,640: | Line 6,826: | ||
"Yurumanguí", | "Yurumanguí", | ||
1281291, | 1281291, | ||
"qfa-unc", -- extinct, too poorly attested to classify | |||
"Latn", | "Latn", | ||
} | } | ||
| Line 6,721: | Line 6,907: | ||
"sem-can", | "sem-can", | ||
"Phnx", | "Phnx", | ||
-- Phnx translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,744: | Line 6,930: | ||
"sem-cen", | "sem-cen", | ||
"Narb", | "Narb", | ||
-- Narb translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,752: | Line 6,938: | ||
"sem-cen", | "sem-cen", | ||
"Narb", | "Narb", | ||
-- Narb translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,760: | Line 6,946: | ||
"sem-cen", | "sem-cen", | ||
"Narb", | "Narb", | ||
-- Narb translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,768: | Line 6,954: | ||
"sem-cen", | "sem-cen", | ||
"Narb", | "Narb", | ||
-- Narb translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,791: | Line 6,977: | ||
"sem-cen", | "sem-cen", | ||
"Narb", | "Narb", | ||
translit = " | -- Narb translit in [[Module:scripts/data]] | ||
} | |||
-- Entry keyed "sem-sam", present only in the new revision: name "Samalian",
-- numeric ID 85847147 (presumably a Wikidata item number -- confirm),
-- family code "sem-nwe", script "Phnx".
-- No translit field is set here; the in-entry comment points to
-- Module:scripts/data for the Phnx transliteration.
m["sem-sam"] = { | |||
"Samalian", | |||
85847147, | |||
"sem-nwe", | |||
"Phnx", | |||
-- Phnx translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,799: | Line 6,993: | ||
"sem-osa", | "sem-osa", | ||
"Sarb", | "Sarb", | ||
-- Sarb translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,807: | Line 7,001: | ||
"sem-cen", | "sem-cen", | ||
"Narb", | "Narb", | ||
-- Narb translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,815: | Line 7,009: | ||
"sem-cen", | "sem-cen", | ||
"Narb", | "Narb", | ||
-- Narb translit in [[Module:scripts/data]] | |||
} | } | ||
| Line 6,870: | Line 7,064: | ||
"sit-tan", | "sit-tan", | ||
"Latn, Tibt", | "Latn, Tibt", | ||
override_translit = true, | override_translit = true, | ||
display_text | -- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]] | ||
} | } | ||
| Line 7,070: | Line 7,261: | ||
"Latn", | "Latn", | ||
type = "reconstructed", | type = "reconstructed", | ||
strip_diacritics = { | |||
remove_diacritics = c.grave .. c.acute .. c.tilde .. c.macron .. c.dgrave .. c.invbreve, | remove_diacritics = c.grave .. c.acute .. c.tilde .. c.macron .. c.dgrave .. c.invbreve, | ||
remove_exceptions = {'ś'}, | remove_exceptions = {'ś'}, | ||
| Line 7,130: | Line 7,321: | ||
"Latn", | "Latn", | ||
type = "reconstructed", | type = "reconstructed", | ||
} | } | ||
| Line 7,263: | Line 7,445: | ||
"trk-ssb", | "trk-ssb", | ||
"Latn, Cyrl, Mong", | "Latn, Cyrl, Mong", | ||
-- Mong translit, display_text and strip_diacritics in [[Module:scripts/data]] | |||
} | } | ||
| Line 7,274: | Line 7,454: | ||
"trk-ogz", | "trk-ogz", | ||
"ota-Arab", | "ota-Arab", | ||
strip_diacritics = {["ota-Arab"] = "ar-stripdiacritics"}, | |||
} | } | ||
| Line 7,282: | Line 7,462: | ||
"trk-ogz", | "trk-ogz", | ||
"ota-Arab", | "ota-Arab", | ||
strip_diacritics = {["ota-Arab"] = "ar-stripdiacritics"}, | |||
ancestors = "trk-eog", | ancestors = "trk-eog", | ||
} | } | ||
| Line 7,292: | Line 7,472: | ||
"Latn", | "Latn", | ||
type = "reconstructed", | type = "reconstructed", | ||
standard_chars = { | |||
Latn = " ()-abdegiklmnoprstuxyzïöüāčēīĺŋōŕšūǖȫẹ" .. c.macron, | Latn = " ()-abdegiklmnoprstuxyzïöüāčēīĺŋōŕšūǖȫẹ" .. c.macron, | ||
} | } | ||
| Line 7,325: | Line 7,505: | ||
"tut", | "tut", | ||
"Latn", | "Latn", | ||
type = "reconstructed" | type = "reconstructed" | ||
} | } | ||
| Line 7,384: | Line 7,564: | ||
"Old Komi", | "Old Komi", | ||
86679962, | 86679962, | ||
" | "kv", | ||
"Perm, Cyrs", | "Perm, Cyrs", | ||
translit = "urj-koo-translit", | translit = "urj-koo-translit", | ||
sort_key | -- Cyrs strip_diacritics, sort_key in [[Module:scripts/data]]; previously, Cyrs strip_diacritics not present | ||
} | } | ||
| Line 7,401: | Line 7,581: | ||
"Komi-Yazva", | "Komi-Yazva", | ||
2365210, | 2365210, | ||
" | "kv", | ||
"Cyrl", | "Cyrl", | ||
translit = "kv-translit", | translit = "kv-translit", | ||
override_translit = true, | override_translit = true, | ||
strip_diacritics = {remove_diacritics = c.acute}, | |||
} | } | ||
| Line 7,475: | Line 7,655: | ||
m["yok-gsy"] = { | m["yok-gsy"] = { | ||
"Gashowu", | "Gashowu Yokuts", | ||
3098708, | 3098708, | ||
"yok", | "yok", | ||
| Line 7,496: | Line 7,676: | ||
m["yok-ply"] = { | m["yok-ply"] = { | ||
"Palewyami", | "Palewyami Yokuts", | ||
2387391, | 2387391, | ||
"yok", | "yok", | ||
| Line 7,522: | Line 7,702: | ||
"Latn", | "Latn", | ||
type = "reconstructed", | type = "reconstructed", | ||
} | |||
-- Entry keyed "yrk-for", present only in the new revision: name
-- "Forest Nenets", numeric ID 1295107 (presumably a Wikidata item number --
-- confirm), family code "yrk", script "Cyrl".
-- translit is the string "yrk-for-translit" (presumably the name of a
-- transliteration module -- confirm against the consumer of this table).
-- strip_diacritics.remove_diacritics concatenates c.grave, c.acute, c.macron,
-- c.breve and c.dotabove; `c` is defined outside this view.
m["yrk-for"] = { | |||
"Forest Nenets", | |||
1295107, | |||
"yrk", | |||
"Cyrl", | |||
translit = "yrk-for-translit", | |||
strip_diacritics = {remove_diacritics = c.grave .. c.acute .. c.macron .. c.breve .. c.dotabove}, | |||
} | |||
-- Entry keyed "yrk-tun", present only in the new revision: name
-- "Tundra Nenets", numeric ID 36452 (presumably a Wikidata item number --
-- confirm), family code "yrk", script "Cyrl".
-- strip_diacritics holds two nine-element lists, `from` and `to`; each marked
-- vowel in `from` lines up by index with an unmarked letter in `to`
-- (presumably applied as pairwise replacements by the consumer -- confirm).
-- translit is the string "yrk-tun-translit" (presumably a module name).
m["yrk-tun"] = { | |||
"Tundra Nenets", | |||
36452, | |||
"yrk", | |||
"Cyrl", | |||
strip_diacritics = { | |||
from = {"ӑ", "а̄", "э̇", "ӣ", "ы̄", "ӯ", "ю̄", "я̆", "я̄"}, | |||
to = {"а", "а", "э", "и", "ы", "у", "ю", "я", "я"}, | |||
}, | |||
translit = "yrk-tun-translit", | |||
} | } | ||
| Line 7,567: | Line 7,768: | ||
"Cyrs, Glag", | "Cyrs, Glag", | ||
translit = {Cyrs = "Cyrs-translit", Glag = "Glag-translit"}, | translit = {Cyrs = "Cyrs-translit", Glag = "Glag-translit"}, | ||
-- Cyrs strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 7,581: | Line 7,781: | ||
Arab = "zle-ort-Arab-translit", | Arab = "zle-ort-Arab-translit", | ||
}, | }, | ||
strip_diacritics = { | |||
remove_diacritics = | Cyrs = { | ||
remove_diacritics = m_langdata.chars_substitutions["Cyrs_remove_diacritics"], | |||
Arab = "ar- | remove_exceptions = {"Ї", "ї"}, | ||
}, | |||
Arab = "ar-stripdiacritics", | |||
}, | }, | ||
sort_key | -- Cyrs sort_key in [[Module:scripts/data]] | ||
} | } | ||
| Line 7,599: | Line 7,801: | ||
Glag = "Glag-translit" | Glag = "Glag-translit" | ||
}, | }, | ||
-- Cyrs strip_diacritics, sort_key in [[Module:scripts/data]] | |||
} | } | ||
| Line 7,619: | Line 7,816: | ||
"zlw-lch", | "zlw-lch", | ||
"Latn", | "Latn", | ||
strip_diacritics = {remove_diacritics = c.ringabove}, | |||
} | } | ||
| Line 7,634: | Line 7,831: | ||
"zlw-pom", | "zlw-pom", | ||
"Latn", | "Latn", | ||
strip_diacritics = {remove_diacritics = c.macron .. c.breve}, | |||
} | } | ||
-- Module result: pass the assembled table `m`, together with the tag
-- "language", to finalizeData from Module:languages and return whatever it
-- returns. What finalizeData does to the table is not visible from here.
return require("Module:languages").finalizeData(m, "language") | return require("Module:languages").finalizeData(m, "language") | ||