Update the spelling converter to deal with the ambiguity of the "ooy" / "wey" issue. Books published in Peshawar write ځاے, etc.

This commit is contained in:
lingdocs 2022-04-18 19:12:54 +05:00
parent 14465065b9
commit 6bc8e391c2
3 changed files with 28 additions and 16 deletions

View File

@ -8,7 +8,7 @@
version="1.1" version="1.1"
id="svg5" id="svg5"
inkscape:version="1.1.1 (c3084ef, 2021-09-22)" inkscape:version="1.1.1 (c3084ef, 2021-09-22)"
sodipodi:docname="sentence-structure.svg" sodipodi:docname="vp-structure.svg"
xmlns:inkscape="http://www.inkscape.org/namespaces/inkscape" xmlns:inkscape="http://www.inkscape.org/namespaces/inkscape"
xmlns:sodipodi="http://sodipodi.sourceforge.net/DTD/sodipodi-0.dtd" xmlns:sodipodi="http://sodipodi.sourceforge.net/DTD/sodipodi-0.dtd"
xmlns="http://www.w3.org/2000/svg" xmlns="http://www.w3.org/2000/svg"
@ -30,9 +30,9 @@
fit-margin-bottom="10" fit-margin-bottom="10"
units="px" units="px"
width="708.26672px" width="708.26672px"
inkscape:zoom="0.51029737" inkscape:zoom="0.35279519"
inkscape:cx="455.6167" inkscape:cx="633.51204"
inkscape:cy="436.02028" inkscape:cy="-296.20585"
inkscape:window-width="1440" inkscape:window-width="1440"
inkscape:window-height="847" inkscape:window-height="847"
inkscape:window-x="0" inkscape:window-x="0"
@ -199,8 +199,8 @@
x="16.162476" x="16.162476"
y="11.622981" /> y="11.622981" />
<path <path
style="fill:none;stroke:#000000;stroke-width:0.868766;stroke-linecap:butt;stroke-linejoin:miter;stroke-miterlimit:4;stroke-dasharray:none;stroke-opacity:1" style="fill:none;stroke:#000000;stroke-width:0.892521;stroke-linecap:butt;stroke-linejoin:miter;stroke-miterlimit:4;stroke-dasharray:none;stroke-opacity:1"
d="M 100.74353,24.58879 V 145.4719" d="M 100.74353,24.58879 V 152.17302"
id="path75" /> id="path75" />
<g <g
aria-label="intransitive" aria-label="intransitive"
@ -460,8 +460,7 @@
id="path79166" /> id="path79166" />
</g> </g>
<g <g
aria-label="infl. 1st + 2nd aria-label="infl. 1st + 2nd pronoun"
pronoun"
transform="matrix(0.26458333,0,0,0.26458333,38.760473,-57.593256)" transform="matrix(0.26458333,0,0,0.26458333,38.760473,-57.593256)"
id="text31446" id="text31446"
style="font-size:18.6667px;line-height:1.25;white-space:pre;shape-inside:url(#rect31448)"> style="font-size:18.6667px;line-height:1.25;white-space:pre;shape-inside:url(#rect31448)">
@ -765,8 +764,7 @@ pronoun"
id="path79296" /> id="path79296" />
</g> </g>
<g <g
aria-label="controls the verb aria-label="controls the verb can be left out"
can be left out"
transform="matrix(0.26458333,0,0,0.26458333,-8.6327206,30.587097)" transform="matrix(0.26458333,0,0,0.26458333,-8.6327206,30.587097)"
id="text72313-6" id="text72313-6"
style="font-size:18.6667px;line-height:1.25;white-space:pre;shape-inside:url(#rect72315-4)"> style="font-size:18.6667px;line-height:1.25;white-space:pre;shape-inside:url(#rect72315-4)">

Before

Width:  |  Height:  |  Size: 98 KiB

After

Width:  |  Height:  |  Size: 98 KiB

View File

@ -15,8 +15,15 @@ const pairsWPakistaniUndotted = [
["سړی", "سړے"], ["سړی", "سړے"],
["موسیٰ", "موسیٰ"], ["موسیٰ", "موسیٰ"],
["فرمايي", "فرمائی"], ["فرمايي", "فرمائی"],
["چای", "چائ"], ["چای", "چاے"],
["زوی", "زوئ"], [
"وی",
"وے",
],
[
"زوی",
"زوے",
],
["ښويېدل", "ښوئېدل"], ["ښويېدل", "ښوئېدل"],
["ويي", "وئی"], ["ويي", "وئی"],
["دوستي", "دوستی"], ["دوستي", "دوستی"],
@ -31,8 +38,15 @@ const pairsWPakistaniDotted = [
["سړی", "سړے"], ["سړی", "سړے"],
["موسیٰ", "موسیٰ"], ["موسیٰ", "موسیٰ"],
["فرمايي", "فرمائي"], ["فرمايي", "فرمائي"],
["چای", "چائ"], ["چای", "چاے"],
["زوی", "زوئ"], [
"وی",
"وے",
],
[
"زوی",
"زوے",
],
["ښويېدل", "ښوئېدل"], ["ښويېدل", "ښوئېدل"],
["ويي", "وئي"], ["ويي", "وئي"],
["دوستي", "دوستي"], ["دوستي", "دوستي"],

View File

@ -19,8 +19,8 @@ export function convertSpelling(input: string, spelling: T.Spelling): string {
if (spelling === "Afghan") { if (spelling === "Afghan") {
return input; return input;
} }
return input.replace(/ای(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, "ائ") return input.replace(/ای(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, "اے")
.replace(/وی(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, ئ") .replace(/وی(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, ے")
.replace(/ی(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, "ے") .replace(/ی(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, "ے")
.replace(/ي(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, (spelling === "Pakistani ی") .replace(/ي(?![\u0621-\u065f\u0670-\u06d3\u06d5])/g, (spelling === "Pakistani ی")
? "ی" ? "ی"