#!/usr/bin/ksh # # CDDL HEADER START # # The contents of this file are subject to the terms of the # Common Development and Distribution License (the "License"). # You may not use this file except in compliance with the License. # # You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE # or http://www.opensolaris.org/os/licensing. # See the License for the specific language governing permissions # and limitations under the License. # # When distributing Covered Code, include this CDDL HEADER in each # file and include the License file at usr/src/OPENSOLARIS.LICENSE. # If applicable, add the following below this CDDL HEADER, with the # fields enclosed by brackets "[]" replaced with your own identifying # information: Portions Copyright [yyyy] [name of copyright owner] # # CDDL HEADER END # # Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T # All Rights Reserved # # Copyright 2009 Sun Microsystems, Inc. All rights reserved. # Use is subject to license terms. PATH=/usr/bin USAGE="usage: dircmp [-d] [-s] [-wn] dir1 dir2" TEMPDIR=`mktemp -d /var/tmp/dir.XXXXXX` if [ -z "$TEMPDIR" ]; then exit 1; fi trap "rm -f -r $TEMPDIR;exit" 0 1 2 3 15 typeset -i exitstat=0 typeset -i sizediff typeset -i cmpdiff typeset -i Sflag=0 typeset -i Dflag=0 typeset -i fsize1 typeset -i fsize2 typeset -l LFBOUND=2147483648 width=72 # # function to generate consistent "diff" output whether or not files are intact # function dodiffs { type=`LC_MESSAGES=C file $D1/"$a"` case "$type" in *text) ;; *script) ;; *empty*) echo $D1/`basename "$a"` is an empty file | pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g continue ;; *cannot*) echo $D1/`basename "$a"` does not exist | pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g continue ;; *) echo $D1/`basename "$a"` is an object file | pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g continue ;; esac type=`LC_MESSAGES=C file $D2/"$a"` case "$type" in *text) ;; *script) ;; *empty*) echo $D2/`basename "$a"` is an empty file | pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g continue ;; *cannot*) echo $D2/`basename "$a"` does not exist | pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g continue ;; *) echo $D2/`basename "$a"` is an object file | pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g continue ;; esac # # If either is a "large file" use bdiff (LF aware), # else use diff. # if (( fsize1 < LFBOUND && fsize2 < LFBOUND )) then cmd="diff" else cmd="bdiff" fi ($cmd "$D1"/"$a" "$D2"/"$a"; echo $? > $TEMPDIR/dc$$status) | \ pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g if [[ `cat $TEMPDIR/dc$$status` != 0 ]] then exitstat=$diffstat fi } # # dircmp entry point # while getopts dsw: i do case $i in d) Dflag=1;; s) Sflag=1;; w) width=`expr $OPTARG + 0 2>/dev/null` if [ $? = 2 ] then echo "dircmp: numeric argument required" exit 2 fi ;; \?) echo $USAGE exit 2;; esac done shift `expr $OPTIND - 1` # D0=`pwd` D1=$1 D2=$2 if [ $# -lt 2 ] then echo $USAGE exit 1 elif [ ! -d "$D1" ] then echo $D1 not a directory ! exit 2 elif [ ! -d "$D2" ] then echo $D2 not a directory ! exit 2 fi # # find all dirs/files in both directory hierarchies. Use "comm" to identify # which are common to both hierarchies as well as unique to each. # At this point, print those that are unique. # cd "$D1" find . -print | sort > $TEMPDIR/dc$$a cd "$D0" cd "$D2" find . -print | sort > $TEMPDIR/dc$$b comm $TEMPDIR/dc$$a $TEMPDIR/dc$$b | sed -n \ -e "/^ /w $TEMPDIR/dc$$c" \ -e "/^ [^ ]/w $TEMPDIR/dc$$d" \ -e "/^[^ ]/w $TEMPDIR/dc$$e" rm -f $TEMPDIR/dc$$a $TEMPDIR/dc$$b pr -w${width} -h "$D1 only and $D2 only" -m $TEMPDIR/dc$$e $TEMPDIR/dc$$d rm -f $TEMPDIR/dc$$e $TEMPDIR/dc$$d # # Generate long ls listings for those dirs/files common to both hierarchies. # Use -lgn to avoid problem when user or group names are too long, causing # expected field separator to be missing # Avoid other potential problems by piping through sed: # - Remove: Spaces in size field for block & character special files # '71, 0' becomes '710' # - For file name, do not print '-> some_file' # '/tmp/foo -> FOO' becomes '/tmp/foo' # The following sed is to read filenames with special characters sed -e 's/..//' -e 's/\([^-a-zA-Z0-9/_.]\)/\\\1/g' < $TEMPDIR/dc$$c > $TEMPDIR/dc$$f cat $TEMPDIR/dc$$f | xargs ls -lLgnd | \ sed -e '/^[bc]/ s/, *//' -e '/^l/ s/ -> .*//' > $TEMPDIR/dc$$i 2>/dev/null cd "$D0" cd "$D1" cat $TEMPDIR/dc$$f | xargs ls -lLgnd | \ sed -e '/^[bc]/ s/, *//' -e '/^l/ s/ -> .*//' > $TEMPDIR/dc$$h 2>/dev/null cd "$D0" > $TEMPDIR/dc$$g # # Process the results of the 'ls -lLgnd' to obtain file size info # and identify a large file's existence. # while read -u3 tmp tmp tmp fsize1 tmp tmp tmp a && read -u4 tmp tmp tmp fsize2 tmp tmp tmp b; do # # A window of opportunity exists where the ls -lLgnd above # could produce different # results if any of the files were removed since the find command. # If the pair of reads above results in different values (file names) for 'a' # and 'b', then get the file pointers in sync before continuing, and display # "different" message as customary. # if [[ "$a" != "$b" ]]; then while [[ "$a" < "$b" ]]; do if (( Sflag != 1 )) then echo "different $a" dodiffs fi read -u3 tmp tmp tmp fsize1 tmp tmp tmp a done while [[ "$a" > "$b" ]]; do if (( Sflag != 1 )) then echo "different $b" dodiffs fi read -u4 tmp tmp tmp fsize2 tmp tmp tmp b done fi cmpdiff=0 sizediff=0 if [ -d "$D1"/"$a" ] then if (( Sflag != 1 )) then echo "directory $a" fi elif [ -f "$D1"/"$a" ] then # # If the file sizes are different, then we can skip the run # of "cmp" which is only used to determine 'same' or 'different'. # If the file sizes are the same, we still need to run "cmp" # if (( fsize1 != fsize2 )) then sizediff=1 else cmp -s "$D1"/"$a" "$D2"/"$a" cmpdiff=$? fi if (( sizediff == 0 && cmpdiff == 0 )) then if (( Sflag != 1 )) then echo "same $a" fi else echo "different $a" if (( Dflag == 1 )) then dodiffs fi fi elif (( Sflag != 1 )) then echo "special $a" fi done 3<$TEMPDIR/dc$$h 4<$TEMPDIR/dc$$i | pr -r -h "Comparison of $D1 $D2" if (( Dflag == 1 )) then cat $TEMPDIR/dc$$g fi exit $exitstat