pkgsrc/mk/tools/msgfmt-msgid_plural.awk
joerg 5f72a77f4a Refactor msgfmt.sh script to conditionally strip the msgid_plural for
old NetBSD versions and to strip msgctx if requested by the package.
This allows to replace the use of msgfmtstrip in various packages by
setting MSGFMT_STRIP_MSGCTX.
2009-03-20 16:13:02 +00:00

262 lines
7.1 KiB
Awk

# $NetBSD: msgfmt-msgid_plural.awk,v 1.1 2009/03/20 16:13:02 joerg Exp $
#
# Strip msgid_plural which is not understood by msgfmt before 0.10.36.
#
#
# strip_bad_ctrl_sequences(string)
# If we see \c, where c is anything but a legal character as
# defined by msgfmt-0.10.35, then replace the backslash with a
# '?'. Yes, this is a hack, but it works around a bug in the
# way that older msgfmt mis-identifies some "control" sequences.
#
function strip_bad_ctrl_sequences(string, left, right) {
left = ""
right = string
while (match(right, /\\/) > 0) {
if (substr(right, RSTART + 1, 1) ~ /[bfnrtxX0-7"\\]/) {
left = left substr(right, 1, RSTART + 1)
right = substr(right, RSTART + 2)
} else {
left = left substr(right, 1, RSTART - 1) "?"
right = substr(right, RSTART + 1)
}
}
return left right
}
BEGIN {
EMPTY = "^$"
SPACE = "[ ]*"
KEYWORD_SEP = "([ ]+|[ ]*\"|$)"
OBSOLETE = "#~ "
OBSOLETE_RE = "^(#~[ ]+)?[ ]*"
OBSOLETE_RE_MATCH = "^#~[ ]+"
MSG_CONTINUATION_RE = OBSOLETE_RE "\""
result = getline
if (result < 1) exit result
s = 0
p = 0
obsolete = ""
while (result == 1) {
# Buffer any "msgid" statements into the singular array.
# Strip all trailing empty strings that have no effect on
# the output.
#
MSGID_RE = OBSOLETE_RE "msgid"
if ($0 ~ MSGID_RE KEYWORD_SEP) {
obsolete = ""
if ($0 ~ OBSOLETE_RE_MATCH) obsolete = OBSOLETE
sub(MSGID_RE SPACE, "");
s = 0
if ($0 ~ EMPTY) $0 = "\"\""
$0 = strip_bad_ctrl_sequences($0)
singular[s++] = $0
while (result = getline) {
if ($0 ~ OBSOLETE_RE "$") continue
if ($0 !~ MSG_CONTINUATION_RE) break
sub(OBSOLETE_RE , "")
$0 = strip_bad_ctrl_sequences($0)
singular[s++] = $0
}
if (result < 0) break
while ((s > 1) && (singular[s-1] ~ /^""$/)) s--
continue
}
# Buffer any "msgid_plural" statements into the plural
# array. Strip all trailing empty strings that have no
# effect on the output.
#
MSGID_PLURAL_RE = OBSOLETE_RE "msgid_plural"
if ($0 ~ MSGID_PLURAL_RE KEYWORD_SEP) {
obsolete = ""
if ($0 ~ OBSOLETE_RE_MATCH) obsolete = OBSOLETE
sub(MSGID_PLURAL_RE SPACE, "");
p = 0
if ($0 ~ EMPTY) $0 = "\"\""
$0 = strip_bad_ctrl_sequences($0)
plural[p++] = $0
while (result = getline) {
if ($0 ~ OBSOLETE_RE "$") continue
if ($0 !~ MSG_CONTINUATION_RE) break
sub(OBSOLETE_RE, "")
$0 = strip_bad_ctrl_sequences($0)
plural[p++] = $0
}
if (result < 0) break
while ((p > 1) && (plural[p-1] ~ /^""$/)) p--
continue
}
# If we see "msgstr", then we are outputting the
# translation of a singular form of a message, so dump
# the contents of the singular array and output the
# "msgstr" translation. Strip all trailing empty strings
# that have no effect on the output, and handle "\n"
# pickiness between msgid and msgstr.
#
MSGSTR_RE = OBSOLETE_RE "msgstr"
if ($0 ~ MSGSTR_RE KEYWORD_SEP) {
if (s > 0) {
print obsolete "msgid " singular[0]
for (i = 1; i < s; i++)
print obsolete singular[i]
}
if ($0 ~ OBSOLETE_RE_MATCH) obsolete = OBSOLETE
sub(MSGSTR_RE SPACE, "")
t = 0
if ($0 ~ EMPTY) $0 = "\"\""
$0 = strip_bad_ctrl_sequences($0)
translation[t++] = $0
while (result = getline) {
if ($0 !~ MSG_CONTINUATION_RE) break
sub(OBSOLETE_RE, "")
$0 = strip_bad_ctrl_sequences($0)
translation[t++] = $0
}
if (result < 0) break
while ((t > 1) && (translation[t-1] ~ /^""$/)) t--
if ((singular[s-1] ~ /\\n"$/) &&
(translation[t-1] !~ /\\n"$/)) {
if (translation[t-1] !~ /""/)
sub("\"$", "\\n\"", translation[t-1])
}
if (t > 0) {
print obsolete "msgstr " translation[0]
for (i = 1; i < t; i++)
print obsolete translation[i]
}
continue
}
# If we see "msgstr[0]", then we are outputting the
# translation of a singular form of a message, so dump
# the contents of the singular array and output the
# "msgstr[0]" translation. Strip all trailing empty
# strings that have no effect on the output, and handle
# "\n" pickiness between msgid and msgstr.
#
MSGSTR0_RE = OBSOLETE_RE "msgstr[[]0[]]"
if ($0 ~ MSGSTR0_RE KEYWORD_SEP) {
if (s > 0) {
print obsolete "msgid " singular[0]
for (i = 1; i < s; i++)
print obsolete singular[i]
}
if ($0 ~ OBSOLETE_RE_MATCH) obsolete = OBSOLETE
sub(MSGSTR0_RE SPACE, "");
t = 0
if ($0 ~ EMPTY) $0 = "\"\""
$0 = strip_bad_ctrl_sequences($0)
translation[t++] = $0
while (result = getline) {
if ($0 !~ MSG_CONTINUATION_RE) break
sub(OBSOLETE_RE, "")
$0 = strip_bad_ctrl_sequences($0)
translation[t++] = $0
}
if (result < 0) break
while ((t > 1) && (translation[t-1] ~ /^""$/)) t--
if ((singular[s-1] ~ /\\n"$/) &&
(translation[t-1] !~ /\\n"$/)) {
if (translation[t-1] !~ /""/)
sub("\"$", "\\n\"", translation[t-1])
}
if (t > 0) {
print obsolete "msgstr " translation[0]
for (i = 1; i < t; i++)
print obsolete translation[i]
}
continue
}
# If we see "msgstr[1]", then we are outputting the
# translation of a plural form of a message, so dump
# the contents of the plural array and output the
# "msgstr[1]" translation. Strip all trailing empty
# strings that have no effect on the output, and handle
# "\n" pickiness between msgid and msgstr.
#
MSGSTR1_RE = OBSOLETE_RE "msgstr[[]1[]]"
if ($0 ~ MSGSTR1_RE KEYWORD_SEP) {
#
# Check if the singular and plural arrays are equal.
# If they are, then we do not need to output an
# additional plural translation at all since the
# "singular" form is already correct.
#
equal = 0
if (s == p) {
equal = 1;
for (i = 0; i < s; i++) {
if (singular[i] != plural[i]) {
equal = 0; break
}
}
}
if (equal == 1) {
while (result = getline) {
if ($0 !~ MSG_CONTINUATION_RE) break
}
if (result < 0) break
s = 0; p = 0
continue
}
if (p > 0) {
print obsolete "msgid " plural[0]
for (i = 1; i < p; i++)
print obsolete plural[i]
}
if ($0 ~ OBSOLETE_RE_MATCH) obsolete = OBSOLETE
sub(MSGSTR1_RE SPACE, "");
t = 0
if ($0 ~ EMPTY) $0 = "\"\""
$0 = strip_bad_ctrl_sequences($0)
translation[t++] = $0
while (result = getline) {
if ($0 !~ MSG_CONTINUATION_RE) break
sub(OBSOLETE_RE, "")
$0 = strip_bad_ctrl_sequences($0)
translation[t++] = $0
}
if (result < 0) break
while ((t > 1) && (translation[t-1] ~ /^""$/)) t--
if ((plural[p-1] ~ /\\n"$/) &&
(translation[t-1] !~ /\\n"$/)) {
if (translation[t-1] !~ /""/)
sub("\"$", "\\n\"", translation[t-1])
}
if (t > 0) {
print obsolete "msgstr " translation[0]
for (i = 1; i < t; i++)
print obsolete translation[i]
}
continue
}
# We drop all other "msgstr[N]" translations since the
# old format only supported a single translation per
# plural form.
#
MSGSTRN_RE = OBSOLETE_RE "msgstr[[][0-9]+[]]"
if ($0 ~ MSGSTRN_RE KEYWORD_SEP) {
while (result = getline) {
if ($0 !~ MSG_CONTINUATION_RE) break
print $0
}
if (result < 0) break
continue
}
# Pass everything else verbatim.
print $0
result = getline
if (result < 0) break
}
}