mirror of
https://git.tukaani.org/xz.git
synced 2024-04-04 12:36:23 +02:00
6a4a4a7d26
Also replace one use of expr with printf.
The rationale for LC_ALL=C was already mentioned in
69d1b3fc29
that fixed a security
issue. However, unrelated uses weren't changed in that commit yet.
POSIX says that with sed and such tools one should use LC_ALL=C
to ensure predictable behavior when strings contain byte sequences
that aren't valid multibyte characters in the current locale. See
under "Application usage" in here:
https://pubs.opengroup.org/onlinepubs/9699919799/utilities/sed.html
With GNU sed invalid multibyte strings would work without this;
it's documented in its Texinfo manual. Some other implementations
aren't so forgiving.
244 lines
7 KiB
Text
244 lines
7 KiB
Text
#!@POSIX_SHELL@
|
|
|
|
# xzgrep -- a wrapper around a grep program that decompresses files as needed
|
|
# Adapted from a version sent by Charles Levert <charles@comm.polymtl.ca>
|
|
|
|
# Copyright (C) 1998, 2001, 2002, 2006, 2007 Free Software Foundation
|
|
# Copyright (C) 1993 Jean-loup Gailly
|
|
|
|
# Modified for XZ Utils by Andrew Dudman and Lasse Collin.
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation; either version 2 of the License, or
|
|
# (at your option) any later version.
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
|
|
@enable_path_for_scripts@
|
|
#SET_PATH - This line is a placeholder to ease patching this script.
|
|
|
|
# Instead of unsetting XZ_OPT, just make sure that xz will use file format
|
|
# autodetection. This way memory usage limit and thread limit can be
|
|
# specified via XZ_OPT. With gzip, bzip2, and lzop it's OK to just unset the
|
|
# environment variables.
|
|
xz='@xz@ --format=auto'
|
|
unset GZIP BZIP BZIP2 LZOP
|
|
|
|
case ${0##*/} in
|
|
*egrep*) prog=xzegrep; grep=${GREP:-grep -E};;
|
|
*fgrep*) prog=xzfgrep; grep=${GREP:-grep -F};;
|
|
*) prog=xzgrep; grep=${GREP:-grep};;
|
|
esac
|
|
|
|
version="$prog (@PACKAGE_NAME@) @VERSION@"
|
|
|
|
usage="Usage: ${0##*/} [OPTION]... [-e] PATTERN [FILE]...
|
|
Look for instances of PATTERN in the input FILEs, using their
|
|
uncompressed contents if they are compressed.
|
|
|
|
OPTIONs are the same as for '$grep'.
|
|
|
|
Report bugs to <@PACKAGE_BUGREPORT@>."
|
|
|
|
# sed script to escape all ' for the shell, and then (to handle trailing
|
|
# newlines correctly) turn trailing X on last line into '.
|
|
escape='
|
|
s/'\''/'\''\\'\'''\''/g
|
|
$s/X$/'\''/
|
|
'
|
|
operands=
|
|
have_pat=0
|
|
files_with_matches=0
|
|
files_without_matches=0
|
|
no_filename=0
|
|
with_filename=0
|
|
|
|
while test $# -ne 0; do
|
|
option=$1
|
|
shift
|
|
optarg=
|
|
|
|
case $option in
|
|
(-[0123456789abcdEFGhHiIKlLnoPqrRsTuUvVwxyzZ]*[!0123456789]*)
|
|
# Something like -Fiv was specified, that is, $option contains more
|
|
# than one option of which the first option (in this example -F)
|
|
# doesn't take an argument. Split the first option into a standalone
|
|
# argument and continue parsing the rest of the options (in this example,
|
|
# replace -Fiv with -iv in the argument list and set option=-F).
|
|
#
|
|
# If there are digits [0-9] they are treated as if they were a single
|
|
# option character because this syntax is an alias for -C for GNU grep.
|
|
# For example, "grep -25F" is equivalent to "grep -C25 -F". If only
|
|
# digits are specified like "grep -25" we don't get here because the
|
|
# above pattern in the case-statement doesn't match such strings.
|
|
arg2=-\'$(LC_ALL=C expr "X${option}X" : 'X-.[0-9]*\(.*\)' |
|
|
LC_ALL=C sed "$escape")
|
|
eval "set -- $arg2 "'${1+"$@"}'
|
|
option=$(LC_ALL=C expr "X$option" : 'X\(-.[0-9]*\)');;
|
|
(--binary-*=* | --[lm]a*=* | --reg*=*)
|
|
# These options require an argument and an argument has been provided
|
|
# with the --foo=argument syntax. All is good.
|
|
;;
|
|
(-[ABCDefmX] | --binary-* | --file | --[lm]a* | --reg*)
|
|
# These options require an argument which should now be in $1.
|
|
# If it isn't, display an error and exit.
|
|
case ${1?"$option option requires an argument"} in
|
|
(*\'*)
|
|
optarg=" '"$(printf '%sX\n' "$1" | LC_ALL=C sed "$escape");;
|
|
(*)
|
|
optarg=" '$1'";;
|
|
esac
|
|
shift;;
|
|
(--)
|
|
break;;
|
|
(-?*)
|
|
;;
|
|
(*)
|
|
case $option in
|
|
(*\'*)
|
|
operands="$operands '"$(printf '%sX\n' "$option" |
|
|
LC_ALL=C sed "$escape");;
|
|
(*)
|
|
operands="$operands '$option'";;
|
|
esac
|
|
${POSIXLY_CORRECT+break}
|
|
continue;;
|
|
esac
|
|
|
|
case $option in
|
|
(-[drRzZ] | --di* | --exc* | --inc* | --rec* | --nu*)
|
|
printf >&2 '%s: %s: Option not supported\n' "$0" "$option"
|
|
exit 2;;
|
|
(-[ef]* | --file | --file=* | --reg*)
|
|
have_pat=1;;
|
|
(--h | --he | --hel | --help)
|
|
echo "$usage" || exit 2
|
|
exit;;
|
|
(-H | --wi | --wit | --with | --with- | --with-f | --with-fi \
|
|
| --with-fil | --with-file | --with-filen | --with-filena | --with-filenam \
|
|
| --with-filename)
|
|
with_filename=1
|
|
continue;;
|
|
(-l | --files-with-*)
|
|
files_with_matches=1
|
|
continue;;
|
|
(-L | --files-witho*)
|
|
files_without_matches=1
|
|
continue;;
|
|
(-h | --no-f*)
|
|
no_filename=1;;
|
|
(-V | --v | --ve | --ver | --vers | --versi | --versio | --version)
|
|
echo "$version" || exit 2
|
|
exit;;
|
|
esac
|
|
|
|
case $option in
|
|
(*\'?*)
|
|
option=\'$(printf '%sX\n' "$option" | LC_ALL=C sed "$escape");;
|
|
(*)
|
|
option="'$option'";;
|
|
esac
|
|
|
|
grep="$grep $option$optarg"
|
|
done
|
|
|
|
if test $files_with_matches -eq 1 || test $files_without_matches -eq 1; then
|
|
grep="$grep -q"
|
|
fi
|
|
|
|
eval "set -- $operands "'${1+"$@"}'
|
|
|
|
if test $have_pat -eq 0; then
|
|
case ${1?"Missing pattern; try \`${0##*/} --help' for help"} in
|
|
(*\'*)
|
|
grep="$grep -- '"$(printf '%sX\n' "$1" | LC_ALL=C sed "$escape");;
|
|
(*)
|
|
grep="$grep -- '$1'";;
|
|
esac
|
|
shift
|
|
fi
|
|
|
|
if test $# -eq 0; then
|
|
set -- -
|
|
fi
|
|
|
|
exec 3>&1
|
|
|
|
# res=1 means that no file matched yet
|
|
res=1
|
|
|
|
for i; do
|
|
case $i in
|
|
*[-.][zZ] | *_z | *[-.]gz | *.t[ag]z) uncompress="gzip -cdf";;
|
|
*[-.]bz2 | *[-.]tbz | *.tbz2) uncompress="bzip2 -cdf";;
|
|
*[-.]lzo | *[-.]tzo) uncompress="lzop -cdf";;
|
|
*[-.]zst | *[-.]tzst) uncompress="zstd -cdfq";; # zstd needs -q.
|
|
*) uncompress="$xz -cdf";;
|
|
esac
|
|
# Fail if xz or grep (or sed) fails.
|
|
xz_status=$(
|
|
exec 5>&1
|
|
($uncompress -- "$i" 5>&-; echo $? >&5) 3>&- |
|
|
if test $files_with_matches -eq 1; then
|
|
eval "$grep" && { printf '%s\n' "$i" || exit 2; }
|
|
elif test $files_without_matches -eq 1; then
|
|
eval "$grep" || {
|
|
r=$?
|
|
if test $r -eq 1; then
|
|
printf '%s\n' "$i" || r=2
|
|
fi
|
|
exit $r
|
|
}
|
|
elif test $with_filename -eq 0 &&
|
|
{ test $# -eq 1 || test $no_filename -eq 1; }; then
|
|
eval "$grep"
|
|
else
|
|
# Append a colon so that the last character will never be a newline
|
|
# which would otherwise get lost in shell command substitution.
|
|
i="$i:"
|
|
|
|
# Escape & \ | and newlines only if such characters are present
|
|
# (speed optimization).
|
|
case $i in
|
|
(*'
|
|
'* | *'&'* | *'\'* | *'|'*)
|
|
i=$(printf '%s\n' "$i" | LC_ALL=C sed 's/[&\|]/\\&/g; $!s/$/\\/');;
|
|
esac
|
|
|
|
# $i already ends with a colon so don't add it here.
|
|
sed_script="s|^|$i|"
|
|
|
|
# Fail if grep or sed fails.
|
|
r=$(
|
|
exec 4>&1
|
|
(eval "$grep" 4>&-; echo $? >&4) 3>&- |
|
|
LC_ALL=C sed "$sed_script" >&3 4>&-
|
|
) || r=2
|
|
exit $r
|
|
fi >&3 5>&-
|
|
)
|
|
r=$?
|
|
|
|
# fail occurred previously, nothing worse can happen
|
|
test $res -gt 1 && continue
|
|
|
|
if test "$xz_status" -eq 0; then
|
|
:
|
|
elif test "$xz_status" -ge 128 \
|
|
&& test "$(kill -l "$xz_status" 2> /dev/null)" = "PIPE"; then
|
|
:
|
|
else
|
|
r=2
|
|
fi
|
|
|
|
# still no match
|
|
test $r -eq 1 && continue
|
|
|
|
# 0 == match, >=2 == fail
|
|
res=$r
|
|
done
|
|
exit $res
|