From 595c2cf96c6eb87f082de03a0fd21810d44f7d93 Mon Sep 17 00:00:00 2001
From: Steven Baltakatei Sandoval
Date: Fri, 26 Jan 2024 00:47:17 +0000
Subject: [PATCH 1/1] feat(unitproc/bkt-replace_apos) Handle more replacement cases
MIME-Version: 1.0
Content-Type: text/plain; charset=utf8
Content-Transfer-Encoding: 8bit

- possessive `bossʼs` and `bossʼ` (the latter when followed by a
  space, a comma, a literal period, or end of line)
- contraction `ʼd` after any alphanumeric character
- general name, e.g. `Trinʼeba` (apostrophe between two letters)
---
 unitproc/bkt-replace_apos | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/unitproc/bkt-replace_apos b/unitproc/bkt-replace_apos
index 15714a7..1e0cfd3 100644
--- a/unitproc/bkt-replace_apos
+++ b/unitproc/bkt-replace_apos
@@ -7,7 +7,7 @@ function replace_apos() {
     # Input: stdin
     # arg1 file path
     # Output: stdout
-    # Version: 1.1.2 (BK-2020-03)
+    # Version: 1.2.0 (BK-2020-03)
     # Depends: GNU sed 4.8
 
     # Check input
@@ -64,7 +64,7 @@ function replace_apos() {
         -e "s/(she|She|SHE)'(d|D|ll|LL|s|S)/\1ʼ\2/g" \
         -e "s/(shan|Shan|SHAN)'(t|T)/\1ʼ\2/g" \
         -e "s/'(s|S)\b/ʼ\1/g" \
-        -e "s/(s|S)'( |$)/\1ʼ\2/g" \
+        -e "s/(s|S)'( |,|\.|$)/\1ʼ\2/g" \
         -e "s/(oughtn|Oughtn|OUGHTN)'(t|T)'(ve|VE)/\1ʼ\2ʼ\3/g" \
         -e "s/(oughtn|Oughtn|OUGHTN)'(t|T)/\1ʼ\2/g" \
         -e "s/(o|O)'(clock|CLOCK)/\1ʼ\2/g" \
@@ -90,6 +90,7 @@ function replace_apos() {
         -e "s/(hadn|Hadn|HADN)'(t|T)/\1ʼ\2/g" \
         -e "s/'(em\b)/ʼ\1/g" \
         -e "s/(d|D)'(ya|YA|you|YOU)/\1ʼ\2/g" \
+        -e "s/([[:alnum:]])'(d|D)/\1ʼ\2/g" \
         -e "s/(don|Don|DON)'(t|T)/\1ʼ\2/g" \
         -e "s/(doesn|Doesn|DOESN)'(t|T)/\1ʼ\2/g" \
         -e "s/(didn|Didn|DIDN)'(t|T)/\1ʼ\2/g" \
@@ -104,6 +105,7 @@ function replace_apos() {
         -e "s/(aren|Aren|AREN)'(t|T)/\1ʼ\2/g" \
         -e "s/(ate|Ate|ATE)'(nt|NT)/\1ʼ\2/g" \
         -e "s/(ain|Ain|AIN)'(t|T)/\1ʼ\2/g" \
+        -e "s/([[:alpha:]])'([[:alpha:]])/\1ʼ\2/g" \
         "$input"
 }; # replace ' with ʼ
 
-- 
2.30.2