1#!/bin/sh
2#
3# SPDX-License-Identifier: BSD-2-Clause
4#
5# Copyright (c) September 1995-2022 Wolfram Schneider <wosch@FreeBSD.org>
6# All rights reserved.
7#
8# Redistribution and use in source and binary forms, with or without
9# modification, are permitted provided that the following conditions
10# are met:
11# 1. Redistributions of source code must retain the above copyright
12#    notice, this list of conditions and the following disclaimer.
13# 2. Redistributions in binary form must reproduce the above copyright
14#    notice, this list of conditions and the following disclaimer in the
15#    documentation and/or other materials provided with the distribution.
16#
17# THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20# ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23# OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26# OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27# SUCH DAMAGE.
28#
29# mklocatedb - build locate database
30# 
31# usage: mklocatedb [-presort] < filelist > database
32#
33
# Stop on the first error; with pipefail a pipeline counts as failed when
# any of its stages fails, not only the last one.
set -e
set -o pipefail

# The directory containing locate subprograms
: "${LIBEXECDIR:=/usr/libexec}"; export LIBEXECDIR
# The directory for the temporary files created below; also handed to
# sort via -T in sort_opt
: "${TMPDIR:=/var/tmp}"; export TMPDIR

# Look for the helper programs in $LIBEXECDIR first.
PATH=$LIBEXECDIR:/bin:/usr/bin:$PATH; export PATH

# utilities to build the locate database; each one can be overridden
# from the environment
: "${bigram:=locate.bigram}"
: "${code:=locate.code}"
: "${locate:=locate}"
: "${sort:=sort}"

# Options for sorting the raw file list.  The string is expanded unquoted
# where it is used, so $TMPDIR must not contain whitespace.
sort_opt="-u -T $TMPDIR -S 20%"

# Names of the temporary files.  They start out empty so that cleanup()
# can run safely before (or between) the mktemp calls.
bigrams=
filelist=

# Remove whatever temporary files have been created so far.
cleanup() {
    for tmpfile in "$bigrams" "$filelist"; do
        if [ -n "$tmpfile" ]; then
            rm -f -- "$tmpfile"
        fi
    done
}

# Install the handlers before creating the files, so nothing is leaked if
# the second mktemp fails.  The signal handler only calls exit, which in
# turn runs the EXIT handler: the script stops instead of carrying on
# without its temporary files.  Signal names are used because numbers
# differ between systems (TRAP and BUS are 5 and 10 on FreeBSD).
trap cleanup EXIT
trap 'exit 1' HUP INT QUIT TRAP BUS TERM

bigrams=$(mktemp -t mklocatedb.bigrams)
filelist=$(mktemp -t mklocatedb.filelist)
56
# Print the most frequent bigrams as one unbroken string.
#
# stdin:  the output of $bigram; lines are expected to look like
#         "<count> <two characters>"
# stdout: the last two characters of every line that has that form and
#         is among the first 128 lines after a descending numeric sort
top_bigrams() {
    $sort -nr |
      awk 'NR <= 128 && /^[ \t]*[1-9][0-9]*[ \t]+..$/ { printf("%s", substr($0, length($0)-1, 2)) }'
}

# The temporary file names are quoted everywhere so that a $TMPDIR with
# whitespace or glob characters cannot split them.  The tool variables
# ($code, $locate, $bigram, $sort) and $sort_opt stay unquoted as in the
# original invocation style.
if [ "${1-}" = "-presort" ]; then
    # Input already sorted
    shift

    # Locate database bootstrapping
    # 1. first build a temp database without bigram compression
    # 2. create the bigram from the temp database
    # 3. create the real locate database with bigram compression.
    #
    # This scheme avoids large temporary files in /tmp
    #
    # Note that in this branch $filelist holds the temp database (it is
    # read back with "$locate -d"), not a plain list of path names.

    $code "$bigrams" > "$filelist"
    $locate -d "$filelist" / | $bigram | top_bigrams > "$bigrams"
    $locate -d "$filelist" / | $code "$bigrams"
else
    # Sort the file list from stdin into a temporary file, compute the
    # bigram table from it, then encode the sorted list to stdout.
    $sort $sort_opt > "$filelist"
    $bigram < "$filelist" | top_bigrams > "$bigrams"
    $code "$bigrams" < "$filelist"
fi
78
79#EOF
80