#!/bin/sh

# NAME:
#	meta2deps.sh - extract useful info from .meta files
#
# SYNOPSIS:
#	meta2deps.sh SB="SB" "meta" ...
#
# DESCRIPTION:
#	This script looks at each "meta" file and extracts the
#	information needed to deduce build and src dependencies.
#
#	To do this, we extract the 'CWD' record as well as all the
#	syscall traces which describe 'R'ead, 'C'hdir and 'E'xec
#	syscalls.
#
#	The typical meta file looks like::
#.nf
#
#	# Meta data file "path"
#	CMD "command-line"
#	CWD "cwd"
#	TARGET "target"
#	-- command output --
#	-- filemon acquired metadata --
#	# buildmon version 2
#	V 2
#	E "pid" "path"
#	R "pid" "path"
#	C "pid" "cwd"
#	R "pid" "path"
#	X "pid" "status"
#.fi
#
#	The fact that all the syscall entry lines start with a single
#	character makes these files quite easy to process using sed(1).
#
#	To simplify the logic the 'CWD' line is made to look like a
#	normal 'C'hdir entry, and "cwd" is remembered so that it can
#	be prefixed to any "path" which is not absolute.
#
#	If the "path" being read ends in '.srcrel' it is the content
#	of (actually the first line of) that file that we are
#	interested in.
#
#	Any "path" which lies outside of the sandbox "SB" is generally
#	not of interest and is ignored.
#
#	The output is a set of absolute paths with "SB" like:
#.nf
#
#	$SB/obj-i386/bsd/include
#	$SB/obj-i386/bsd/lib/csu/i386
#	$SB/obj-i386/bsd/lib/libc
#	$SB/src/bsd/include
#	$SB/src/bsd/sys/i386/include
#	$SB/src/bsd/sys/sys
#	$SB/src/pan-release/rtsock
#	$SB/src/pfe-shared/include/jnx
#.fi
#
#	Which can then be further processed by 'gendirdeps.mk'
#
#	If we are passed 'DPDEPS='"dpdeps", then for each src file
#	outside of "CURDIR" we read, we output a line like:
#.nf
#
#	DPDEPS_$path += $RELDIR
#.fi
#
#	with "$path" getting turned into reldir's, so that we can end
#	up with a list of all the directories which depend on each src
#	file in another directory.  This can allow for efficient yet
#	complete testing of changes.


# RCSid:
#	$FreeBSD$
#	$Id: meta2deps.sh,v 1.14 2020/10/02 03:11:17 sjg Exp $

# Copyright (c) 2010-2013, Juniper Networks, Inc.
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# 1. Redistributions of source code must retain the above copyright
#    notice, this list of conditions and the following disclaimer.
# 2. Redistributions in binary form must reproduce the above copyright
#    notice, this list of conditions and the following disclaimer in the
#    documentation and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

# meta2src meta ...
#	Print the sorted, unique "path" of every 'R' record whose path
#	ends in .c, .h, .y or .l.
meta2src() {
    cat /dev/null "$@" |
    sed -n '/^R .*\.[chyl]$/s,^..[0-9]* ,,p' |
    sort -u
}

# meta2dirs meta ...
#	Print the sorted, unique directory part of every 'R' record
#	whose path contains a '/' and whose last component has an
#	extension starting with a lower-case letter or digit.
meta2dirs() {
    cat /dev/null "$@" |
    sed -n '/^R .*\/.*\.[a-z0-9][^\/]*$/s,^..[0-9]* \(.*\)/[^/]*$,\1,p' |
    sort -u
}

# add_list ['|'] [-s suffix] name item ...
#	Append each "item" (with "suffix" appended, if given) to the
#	list held in the variable "name", skipping items already there.
#	Items are separated by a space, or by '|' when that is given.
#	The '|' and -s options must come BEFORE "name".
#	Clobbers the globals: sep suffix name list top.
add_list() {
    sep=' '
    suffix=
    while :
    do
        case "$1" in
        "|") sep="$1"; shift;;
        -s) suffix="$2"; shift 2;;
        *) break;;
        esac
    done
    name=$1
    shift
    eval list="\$$name"
    for top in "$@"
    do
        # wrap in separators so we only match whole items
        case "$sep$list$sep" in
        *"$sep$top$suffix$sep"*) continue;;
        esac
        list="${list:+$list$sep}$top$suffix"
    done
    eval "$name=\"$list\""
}

# Filter stdin, dropping lines which match the extended regular
# expression in $EXCLUDES.
_excludes_f() {
    # grep -E rather than egrep, which is obsolescent
    grep -E -v -e "$EXCLUDES"
}

# Report a fatal error on stderr and exit.
error() {
    echo "ERROR: $*" >&2
    exit 1
}

# meta2deps [VAR=value] [options] meta ...
#	Process the meta files as described at the top of this file.
#
#	VAR=value	exported into the environment (eg. SB=, DPDEPS=)
#	-a arch		set MACHINE_ARCH
#	-m machine	set MACHINE
#	-C dir		set CURDIR
#	-H target	set HOST_TARGET
#	-S dirs		add to SRCTOPS
#	-O dirs		add to OBJROOTS
#	-X patterns	add to EXCLUDES (joined with '|' for grep -E)
#	-R reldir	set RELDIR
#	-T spec		set TARGET_SPEC
#
#	A "meta" argument of the form @file names a file which lists
#	the meta files to read.
#
#	Exits with status 1 if a meta file has no filemon data.
meta2deps() {
    DPDEPS=
    SRCTOPS=$SRCTOP
    OBJROOTS=
    EXCLUDES=
    while :
    do
        case "$1" in
        *=*) eval export "$1"; shift;;
        -a) MACHINE_ARCH=$2; shift 2;;
        -m) MACHINE=$2; shift 2;;
        -C) CURDIR=$2; shift 2;;
        -H) HOST_TARGET=$2; shift 2;;
        -S) add_list SRCTOPS $2; shift 2;;
        -O) add_list OBJROOTS $2; shift 2;;
        # the '|' must precede the name or it is treated as an item
        -X) add_list '|' EXCLUDES $2; shift 2;;
        -R) RELDIR=$2; shift 2;;
        -T) TARGET_SPEC=$2; shift 2;;
        *) break;;
        esac
    done

    _ht= _o=
    case "$MACHINE" in
    host) _ht=$HOST_TARGET;;
    esac

    # strip any trailing machine/target component from each objroot
    for o in $OBJROOTS
    do
        # NOTE(review): the subject below always contains $MACHINE,
        # so the second arm always matches and the last arm looks
        # unreachable - confirm intent before changing.
        case "$MACHINE,/$o/" in
        host,*$HOST_TARGET*) ;;
        *$MACHINE*|*${TARGET_SPEC:-$MACHINE}*) ;;
        *) add_list _o $o; continue;;
        esac
        for x in $_ht $TARGET_SPEC $MACHINE
        do
            case "$o" in
            "") continue;;
            */$x/) add_list _o ${o%$x/}; o=;;
            */$x) add_list _o ${o%$x}; o=;;
            *$x/) add_list _o ${o%$x/}; o=;;
            *$x) add_list _o ${o%$x}; o=;;
            esac
        done
    done
    OBJROOTS="$_o"

    # default OBJTOP from the first objroot
    case "$OBJTOP" in
    "")
        for o in $OBJROOTS
        do
            OBJTOP=$o${TARGET_SPEC:-$MACHINE}
            break
        done
        ;;
    esac
    # these are used (unquoted) as case patterns below
    src_re=
    obj_re=
    add_list '|' -s '/*' src_re $SRCTOPS
    add_list '|' -s '*' obj_re $OBJROOTS

    [ -z "$RELDIR" ] && unset DPDEPS
    tf=/tmp/m2d$$-$USER
    rm -f $tf.*
    trap 'rm -f $tf.*; trap 0' 0

    > $tf.dirdep
    > $tf.qual
    > $tf.srcdep
    > $tf.srcrel
    > $tf.dpdeps

    seenit=
    seensrc=
    lpid=
    case "$EXCLUDES" in
    "") _excludes=cat;;
    *) _excludes=_excludes_f;;
    esac
    # handle @list files
    case "$@" in
    *@[!.]*)
        for f in "$@"
        do
            case "$f" in
            *.meta) cat $f;;
            @*) xargs cat < ${f#@};;
            *) cat $f;;
            esac
        done
        ;;
    *) cat /dev/null "$@";;
    esac 2> /dev/null |
    sed -e 's,^CWD,C C,;/^[CREFLMV] /!d' -e "s,',,g" |
    $_excludes | ( version=no
    # NOTE(review): fields read from the meta files are passed to
    # eval below; meta files are assumed to be trusted build output.
    while read op pid path junk
    do
        # no-op; makes the record visible when tracing with -x
        : op=$op pid=$pid path=$path
        # we track cwd and ldir (of interest) per pid
        # CWD is bmake's cwd
        case "$lpid,$pid" in
        ,C) CWD=$path cwd=$path ldir=$path
            if [ -z "$SB" ]; then
                SB=$(echo $CWD | sed 's,/obj.*,,')
            fi
            SRCTOP=${SRCTOP:-$SB/src}
            # version is "no" until we see a CWD record, and 0
            # from then until a 'V' record is seen; so 0 here
            # means the previous CWD was followed by no records.
            case "$version" in
            no) ;;          # ignore
            0) error "no filemon data";;
            *) ;;
            esac
            version=0
            continue
            ;;
        $pid,$pid) ;;
        *)
            # pid changed: save state of the last one, load the new
            case "$lpid" in
            "") ;;
            *) eval ldir_$lpid=$ldir;;
            esac
            eval ldir=\${ldir_$pid:-$CWD} cwd=\${cwd_$pid:-$CWD}
            lpid=$pid
            ;;
        esac

        case "$op,$path" in
        V,*) version=$path; continue;;
        W,*srcrel|*.dirdep) continue;;
        C,*)
            case "$path" in
            /*) cwd=$path;;
            *) cwd=$(cd $cwd/$path 2> /dev/null && /bin/pwd);;
            esac
            # watch out for temp dirs that no longer exist
            test -d ${cwd:-/dev/null/no/such} || cwd=$CWD
            eval cwd_$pid=$cwd
            continue
            ;;
        F,*) # $path is new pid
            eval cwd_$path=$cwd ldir_$path=$ldir
            continue
            ;;
        *)  dir=${path%/*}
            case "$path" in
            $src_re|$obj_re) ;;
            /*/stage/*) ;;
            /*) continue;;
            *)  # relative: try the last dir of interest, then cwd
                for path in $ldir/$path $cwd/$path
                do
                    test -e $path && break
                done
                dir=${path%/*}
                ;;
            esac
            ;;
        esac
        # avoid repeating ourselves...
        case "$DPDEPS,$seensrc," in
        ,*)
            case ",$seenit," in
            *,$dir,*) continue;;
            esac
            ;;
        *,$path,*) continue;;
        esac
        # canonicalize if needed
        case "/$dir/" in
        */../*|*/./*)
            rdir=$dir
            dir=$(cd $dir 2> /dev/null && /bin/pwd)
            seen="$rdir,$dir"
            ;;
        *)  seen=$dir;;
        esac
        case "$dir" in
        ${CURDIR:-.}|"") continue;;
        $src_re)
            # avoid repeating ourselves...
            case "$DPDEPS,$seensrc," in
            ,*)
                case ",$seenit," in
                *,$dir,*) continue;;
                esac
                ;;
            esac
            ;;
        *)
            case ",$seenit," in
            *,$dir,*) continue;;
            esac
            ;;
        esac
        if [ -d $path ]; then
            case "$path" in
            */..) ldir=${dir%/*};;
            *) ldir=$path;;
            esac
            continue
        fi
        [ -f $path ] || continue
        case "$dir" in
        $CWD) continue;;    # ignore
        $src_re)
            seenit="$seenit,$seen"
            echo $dir >> $tf.srcdep
            case "$DPDEPS,$RELDIR,$seensrc," in
            ,*) ;;
            *)  seensrc="$seensrc,$path"
                echo "DPDEPS_$dir/${path##*/} += $RELDIR" >> $tf.dpdeps
                ;;
            esac
            continue
            ;;
        esac
        # if there is a .dirdep we cannot skip
        # just because we've seen the dir before.
        if [ -s $path.dirdep ]; then
            # this file contains:
            # '# ${RELDIR}.<machine>'
            echo $path.dirdep >> $tf.qual
            continue
        elif [ -s $dir.dirdep ]; then
            echo $dir.dirdep >> $tf.qual
            seenit="$seenit,$seen"
            continue
        fi
        seenit="$seenit,$seen"
        case "$dir" in
        $obj_re)
            echo $dir;;
        esac
    done > $tf.dirdep
    case "$version" in
    0) error "no filemon data";;
    esac ) || exit 1
    _nl=echo
    for f in $tf.dirdep $tf.qual $tf.srcdep
    do
        [ -s $f ] || continue
        case $f in
        *qual) # a list of .dirdep files
            # we can prefix everything with $OBJTOP to
            # tell gendirdeps.mk that these are
            # DIRDEP entries, since they are already
            # qualified with .<machine> as needed.
            # We strip .$MACHINE though
            xargs cat < $f | sort -u |
            sed "s,^# ,,;s,^,$OBJTOP/,;s,\.${TARGET_SPEC:-$MACHINE}\$,,;s,\.$MACHINE\$,,"
            ;;
        *)  sort -u $f;;
        esac
        _nl=:
    done
    if [ -s $tf.dpdeps ]; then
        case "$DPDEPS" in
        */*) ;;
        *) echo > $DPDEPS;;         # the echo is needed!
        esac
        sort -u $tf.dpdeps |
        sed "s,${SRCTOP}/,,;s,${SB_BACKING_SB:-$SB}/src/,," >> $DPDEPS
    fi
    # ensure we produce _something_ else egrep -v gets upset
    $_nl
}

# run the function which matches the name we were invoked as
case /$0 in
*/meta2dep*) meta2deps "$@";;
*/meta2dirs*) meta2dirs "$@";;
*/meta2src*) meta2src "$@";;
esac