2003-09-18 01:58:19 +08:00
|
|
|
<sect1 id="postlfs-config-compressdoc" xreflabel="compressdoc">
|
|
|
|
<?dbhtml filename="compressdoc.html" dir="postlfs"?>
|
|
|
|
<title>Compressing man and info pages</title>
|
|
|
|
|
2003-09-22 00:44:58 +08:00
|
|
|
<para>Man and info reader programs can transparently process gzip'ed or
|
|
|
|
bzip2'ed pages, a feature you can use to free some disk space while keeping
|
2003-09-18 01:58:19 +08:00
|
|
|
your documentation available. However, things are not that simple: man
|
|
|
|
directories tend to contain links - hard and symbolic - which defeat simple
|
2003-09-22 00:44:58 +08:00
|
|
|
ideas like recursively calling <command>gzip</command> on them. A better way
|
|
|
|
to go is to use the script below.
|
2003-09-18 01:58:19 +08:00
|
|
|
</para>
|
|
|
|
|
2003-09-21 04:03:47 +08:00
|
|
|
<screen><userinput><command>cat &gt; /usr/bin/compressdoc &lt;&lt; "EOF"</command>
|
2003-09-18 01:58:19 +08:00
|
|
|
|
|
|
|
#!/bin/bash
# bash is requested explicitly: the script relies on bash behaviour, in
# particular on "a -nt b" being true when a exists and b does not.

changefileext()
{
  # Print the given file name with its old extension replaced by a new one.
  # The directory part is kept exactly as the caller gave it: a relative
  # name stays relative, nothing is turned into an absolute path.
  # parameters : 1 - file name
  #              2 - old extension (stripped only if the name ends with it)
  #              3 - new extension (may be empty)

  # Every expansion is quoted so that a name containing blanks or glob
  # characters reaches dirname and basename as one argument. printf is
  # used instead of echo so the name is printed verbatim.
  printf '%s/%s%s\n' "$(dirname "$1")" "$(basename "$1" "$2")" "$3"
}
|
|
|
|
|
|
|
|
# check that the command line is right, if not print a relevant message.
# The first argument must be a non-empty name of an existing directory and
# the second must be gz or bz2. The expansions are quoted: unquoted, an
# empty first argument disappears from the test and changes its meaning,
# which let an empty directory name pass this check.

if [ -z "$1" ] || [ ! -d "$1" ] || [ "$2" != "gz" -a "$2" != "bz2" ]
then
  echo "Usage : $0 /path/to/doc/dir gz/bz2"
  echo "e.g. $0 /usr/info gz to compress info pages in gzip format"
  echo "or $0 /usr/X11R6/man bz2 to compact X man pages using bzip2."
  exit 1
fi
|
|
|
|
|
|
|
|
# set up a few variables.
# The target format given as second argument decides which extension is
# the "old" one and which programs are used to expand and to compress.

NEWEXT=".$2"                # NEWEXT = extension of newly compressed files

# "=" is the standard string comparison of test; "==" is only a bash
# extension of it.
if [ "$NEWEXT" = ".bz2" ]
then
  OLDEXT=".gz"              # OLDEXT = extensions of files to recompress
  DECOMPRESS="gunzip -f"    # DECOMPRESS = command to decompress a file
  COMPRESS="bzip2 -f9"      # COMPRESS = command to compress a file
else
  OLDEXT=".bz2"
  DECOMPRESS="bunzip2 -f"
  COMPRESS="gzip -f9"
fi
|
|
|
|
|
|
|
|
# process all files not in the target format under the provided root directory.
# I use cd instead of giving $1 as an argument to find because this causes
# problems with symbolic links, e.g. /usr/man -> /usr/share/man.
# The argument is quoted so that a path containing blanks stays one word,
# and the script stops if the directory cannot be entered: everything after
# this point renames and deletes files relative to the current directory.

cd "$1" || exit 1
|
|
|
|
|
|
|
|
# Walk every entry below the current directory whose name does not already
# end with the target extension. The list is built once, before anything
# is modified. It is split on whitespace, so file names containing blanks
# are not supported by this loop.
for f in `find . \! -name "*$NEWEXT"`
do
  # the following test is needed because we have to update links ahead of
  # ourselves, so $f is sometimes a nonexistent file or a link to one.

  if [ -f "$f" -o -L "$f" ]
  then
    FILE=$f                                               # the file being processed
    BASEFILE=$(basename "$FILE")                          # its basename (see HLINKS)
    INODE=$(find "$FILE" -printf %i)                      # its inode number (see HLINKS)
    NEWFILE=$(changefileext "$FILE" "$OLDEXT" "$NEWEXT")  # new file name

    # HLINKS is the list of all hard links to the current file.
    # The pattern is quoted so that the shell passes it to find unchanged
    # instead of expanding it against the current directory.

    HLINKS=$(find . \! -name "$BASEFILE" -inum "$INODE")

    if [ -L "$FILE" ]
    then
      # the current file is a symbolic link, so we change
      # its name and the name of its target.

      TARGET=$(readlink "$FILE")
      rm -f "$FILE"
      ln -sf "$(changefileext "$TARGET" "$OLDEXT" "$NEWEXT")" "$NEWFILE"
    elif [ -f "$FILE" ]
    then
      # the current file is a regular file.

      # TEMPFILE is the name without the old extension; it equals FILE
      # when FILE is not an old-compressed file.
      TEMPFILE=$(changefileext "$FILE" "$OLDEXT")

      # if there are several versions of a page (at worst, there can be
      # one uncompressed, one old-compressed and one new-compressed), then
      # we have to make sure that only the most recent file is kept, because
      # it most likely means the user installed several versions of a package.

      # first, if we are dealing with an old-compressed file,
      # expand it if it is more recent than the uncompressed
      # file *and* the new-compressed file, else delete it.
      # (works even if TEMPFILE and/or NEWFILE do not exist: this relies on
      # -nt being true when the right-hand file is missing, as in bash)

      if [ "$FILE" != "$TEMPFILE" ]
      then
        if [ "$FILE" -nt "$TEMPFILE" -a "$FILE" -nt "$NEWFILE" ]
        then
          # left unquoted on purpose: the variable holds a command and its option
          $DECOMPRESS "$FILE"
        else
          rm -f "$FILE"
        fi
        FILE=$TEMPFILE
      fi

      # now we are dealing with an uncompressed file that may
      # exist or not (because of the above). If it is newer
      # than both the new-compressed and the old-compressed
      # files then it is compressed, else it is deleted.

      if [ -f "$FILE" ]
      then
        if [ "$FILE" -nt "$NEWFILE" -a "$FILE" -nt "$FILE$OLDEXT" ]
        then
          # left unquoted on purpose: the variable holds a command and its option
          $COMPRESS "$FILE"
        else
          rm -f "$FILE"
        fi
      fi
    fi

    # update the hard links to the current files,
    # as the new inode number is now known.

    for g in $HLINKS
    do
      rm -f "$g"
      ln -f "$NEWFILE" "$(changefileext "$g" "$OLDEXT" "$NEWEXT")"
    done
  fi
done
|
|
|
|
|
|
|
|
<command>EOF
|
2003-09-23 21:35:57 +08:00
|
|
|
chmod 755 /usr/bin/compressdoc</command></userinput></screen>
|
2003-09-18 01:58:19 +08:00
|
|
|
|
|
|
|
<para>Now, as root, you can issue a
|
2003-09-22 00:44:58 +08:00
|
|
|
<command>/usr/bin/compressdoc /usr/man bz2</command>
|
2003-09-18 01:58:19 +08:00
|
|
|
to compress your system man pages. Similarly, you can run it on the
|
|
|
|
<filename class="directory">/usr/info</filename> directory. Don't forget
|
|
|
|
<filename class="directory">/usr/X11R6/man</filename> if you install the
|
|
|
|
<application>X</application> Window System. A few other programs, like
|
|
|
|
<application>XEmacs</application>, also install their documentation in
|
|
|
|
nonstandard places.</para>
|
|
|
|
|
2003-09-21 04:03:47 +08:00
|
|
|
<para>Generally, package installation systems do not compress man/info pages,
|
|
|
|
which means you will need to run the script again if you want to keep the size
|
|
|
|
of your documentation as small as possible. Also, note that running the script
|
|
|
|
after upgrading a package is safe: when you have several versions of a page
|
|
|
|
(for example, one compressed and one uncompressed), the most recent one is kept
|
|
|
|
and the others deleted.</para>
|
2003-09-18 01:58:19 +08:00
|
|
|
|
|
|
|
</sect1>
|
|
|
|
|