%% This OTP simply places word-start and word-end markers.
% Width of each input character, in bytes.
input:
1;
% Width of each output character, in bytes. The marker codes emitted by the
% expressions below (254 and 255) fit in a single one-byte character.
output:
1;
% Named character classes; the expressions refer to them as {NAME}.
aliases:
% Code 32, the ASCII space. Not referenced by the expressions shown in this file.
SPACE = 32
;
W_SPACE = (0-32) % white space: every code from 0 through 32 (control codes and space)
;
% Codes treated as word characters: A-Z (65-90), a-z (97-122), plus 94 ('^').
% NOTE(review): 94 is the caret, not a letter; presumably it belongs to the
% input transliteration scheme -- confirm it is intentional.
LATIN_ALPHABET = (65-90|94|97-122)
;
% Complement of LATIN_ALPHABET (same ranges, negated with ^).
% Every code in W_SPACE (0-32) is also a member of this class.
NON_LATIN = ^(65-90|94|97-122)
;
% Rewrite rules of the form   pattern => output <= pushback ;
% \n stands for the n-th character matched by the pattern; the pushback part
% is returned to the input so that it is scanned again by the next match.
% Code 255 is emitted right after the last character of a word and code 254
% right before the first character of a word.
expressions:
% Word character followed by white space: emit the character plus the end
% marker, and re-scan the white space so it can take part in the next match.
{LATIN_ALPHABET}{W_SPACE} => \1 255 % word ending
<= \2
;
% Word character followed by any non-word character: same treatment.
% W_SPACE is contained in NON_LATIN, so this pattern also covers the case above.
{LATIN_ALPHABET}{NON_LATIN} => \1 255
<= \2
;
% Word character at the very end of the input: close the final word.
% Nothing follows it, so there is no pushback.
{LATIN_ALPHABET} end: => \1 255
;
% White space followed by a word character: emit the white space plus the
% start marker, and re-scan the word character (it may also end the word).
{W_SPACE}{LATIN_ALPHABET} => \1 254 % word beginning
<= \2
;
% Non-word character followed by a word character: same treatment.
% As above, this pattern also covers the white-space case.
{NON_LATIN}{LATIN_ALPHABET} => \1 254
<= \2
;
% Word character at the very beginning of the input: emit only the start
% marker and push the character itself back for re-scanning.
% NOTE(review): this relies on beg: not matching again on the pushed-back
% character; otherwise the rule would fire repeatedly -- confirm against the
% OTP engine's handling of beg: after a pushback.
beg: {LATIN_ALPHABET} => 254
<= \1
;