#!/usr/bin/ksh
#
# CDDL HEADER START
#
# The contents of this file are subject to the terms of the
# Common Development and Distribution License (the "License").
# You may not use this file except in compliance with the License.
#
# You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
# or http://www.opensolaris.org/os/licensing.
# See the License for the specific language governing permissions
# and limitations under the License.
#
# When distributing Covered Code, include this CDDL HEADER in each
# file and include the License file at usr/src/OPENSOLARIS.LICENSE.
# If applicable, add the following below this CDDL HEADER, with the
# fields enclosed by brackets "[]" replaced with your own identifying
# information: Portions Copyright [yyyy] [name of copyright owner]
#
# CDDL HEADER END
#
#	Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T
#	  All Rights Reserved

#
#	Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
#	Use is subject to license terms.
PATH=/usr/bin
USAGE="usage: dircmp [-d] [-s] [-wn] dir1 dir2"

TEMPDIR=`mktemp -d /var/tmp/dir.XXXXXX`
if [ -z "$TEMPDIR" ]; then exit 1; fi 

trap "rm -f -r $TEMPDIR;exit" 0 1 2 3 15
typeset -i exitstat=0
typeset -i sizediff
typeset -i cmpdiff
typeset -i Sflag=0
typeset -i Dflag=0
typeset -i fsize1
typeset -i fsize2
typeset -l LFBOUND=2147483648
width=72

#
# function to generate consistent "diff" output whether or not files are intact
#
function dodiffs {

	type=`LC_MESSAGES=C file $D1/"$a"`
	case "$type" in
		*text)  ;;
		*script) ;;
		*empty*) echo $D1/`basename "$a"` is an empty file |
			  pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g
			continue
        	;;
        	*cannot*) echo $D1/`basename "$a"` does not exist |
			  pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g
			continue
        	;;
        	*)	echo $D1/`basename "$a"` is an object file |
		   	  pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g
			continue
        	;;
	esac
	type=`LC_MESSAGES=C file $D2/"$a"`
	case "$type" in
        	*text)  ;;
        	*script) ;;
        	*empty*) echo $D2/`basename "$a"` is an empty file |
			  pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g
			continue
        	;;
        	*cannot*) echo $D2/`basename "$a"` does not exist |
			  pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g
			continue
        	;;
        	*)	echo $D2/`basename "$a"` is an object file |
			  pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g
			continue
        	;;
	esac
	#   
	# If either is a "large file" use bdiff (LF aware),
	# else use diff.
	#
	if (( fsize1 < LFBOUND && fsize2 < LFBOUND ))
	then cmd="diff"
	else cmd="bdiff"
	fi
	($cmd "$D1"/"$a" "$D2"/"$a"; echo $? > $TEMPDIR/dc$$status) | \
	    pr -h "diff of $a in $D1 and $D2" >> $TEMPDIR/dc$$g
	if [[ `cat $TEMPDIR/dc$$status` != 0 ]]
	then exitstat=$diffstat
	fi
}
#
# dircmp entry point
#
while getopts dsw: i
do
	case $i in
	d)	Dflag=1;; 
	s)	Sflag=1;; 
	w)	width=`expr $OPTARG + 0 2>/dev/null`
		if [ $? = 2 ]
		then echo "dircmp: numeric argument required"
			exit 2
		fi
		;;
	\?)	echo $USAGE
		exit 2;;
	esac
done
shift `expr $OPTIND - 1`
#
D0=`pwd`
D1=$1
D2=$2
if [ $# -lt 2 ]
then echo $USAGE
     exit 1
elif [ ! -d "$D1" ]
then echo $D1 not a directory !
     exit 2
elif [ ! -d "$D2" ]
then echo $D2 not a directory !
     exit 2
fi
#
# find all dirs/files in both directory hierarchies. Use "comm" to identify
# which are common to both hierarchies as well as unique to each.
# At this point, print those that are unique.
#
cd "$D1"
find . -print | sort > $TEMPDIR/dc$$a
cd "$D0"
cd "$D2"
find . -print | sort > $TEMPDIR/dc$$b
comm $TEMPDIR/dc$$a $TEMPDIR/dc$$b | sed -n \
	-e "/^		/w $TEMPDIR/dc$$c" \
	-e "/^	[^	]/w $TEMPDIR/dc$$d" \
	-e "/^[^	]/w $TEMPDIR/dc$$e"
rm -f $TEMPDIR/dc$$a $TEMPDIR/dc$$b
pr -w${width} -h "$D1 only and $D2 only" -m $TEMPDIR/dc$$e $TEMPDIR/dc$$d
rm -f $TEMPDIR/dc$$e $TEMPDIR/dc$$d
#
# Generate long ls listings for those dirs/files common to both hierarchies.
# Use -lgn to avoid problem when user or group names are too long, causing
# expected field separator to be missing
# Avoid other potential problems by piping through sed:
#  - Remove: Spaces in size field for block & character special files
#      '71, 0' becomes '710'
#  - For file name, do not print '-> some_file'
#      '/tmp/foo -> FOO' becomes '/tmp/foo'

# The following sed is to read filenames with special characters
sed -e 's/..//'  -e  's/\([^-a-zA-Z0-9/_.]\)/\\\1/g' < $TEMPDIR/dc$$c > $TEMPDIR/dc$$f


cat $TEMPDIR/dc$$f | xargs ls -lLgnd | \
  sed -e '/^[bc]/ s/, *//' -e '/^l/ s/ -> .*//' > $TEMPDIR/dc$$i 2>/dev/null
cd "$D0"
cd "$D1"


cat $TEMPDIR/dc$$f | xargs ls -lLgnd | \
sed -e '/^[bc]/ s/, *//' -e '/^l/ s/ -> .*//' > $TEMPDIR/dc$$h 2>/dev/null
cd "$D0"
> $TEMPDIR/dc$$g
#
# Process the results of the 'ls -lLgnd' to obtain file size info
# and identify a large file's existence.
#
while read -u3 tmp tmp tmp fsize1 tmp tmp tmp a &&
      read -u4 tmp tmp tmp fsize2 tmp tmp tmp b; do
	#
	# A window of opportunity exists where the ls -lLgnd above
	# could produce different
	# results if any of the files were removed since the find command.
	# If the pair of reads above results in different values (file names) for 'a'
	# and 'b', then get the file pointers in sync before continuing, and display
	# "different" message as customary.
	#
	if [[ "$a" != "$b" ]]; then
	while [[ "$a" < "$b" ]]; do
		if (( Sflag != 1 ))
		then echo "different	$a"
		dodiffs
		fi
		read -u3 tmp tmp tmp fsize1 tmp tmp tmp a
	done
	while [[ "$a" > "$b" ]]; do
		if (( Sflag != 1 ))
		then echo "different	$b"
		dodiffs
		fi
		read -u4 tmp tmp tmp fsize2 tmp tmp tmp b
	done
	fi
	cmpdiff=0
	sizediff=0
	if [ -d "$D1"/"$a" ]
	then if (( Sflag != 1 ))
	     then echo "directory	$a"
	     fi
	elif [ -f "$D1"/"$a" ]
	then 
	     #
	     # If the file sizes are different, then we can skip the run
	     # of "cmp" which is only used to determine 'same' or 'different'.
	     # If the file sizes are the same, we still need to run "cmp"
	     #
	     if (( fsize1 != fsize2 ))
	     then
		sizediff=1
	     else
		cmp -s "$D1"/"$a" "$D2"/"$a"
		cmpdiff=$?
	     fi
	     if (( sizediff == 0 && cmpdiff == 0 ))
	     then if (( Sflag != 1 ))
		  then echo "same     	$a"
		  fi
	     else echo "different	$a"
		  if (( Dflag == 1 ))
		  then
			dodiffs
		  fi
	     fi
	elif (( Sflag != 1 ))
	then echo "special  	$a"
	fi
done 3<$TEMPDIR/dc$$h 4<$TEMPDIR/dc$$i | pr -r -h "Comparison of $D1 $D2"
if (( Dflag == 1 ))
then cat $TEMPDIR/dc$$g
fi
exit $exitstat