111 lines
2.9 KiB
Bash
111 lines
2.9 KiB
Bash
|
#!/bin/sh
|
||
|
# Generate test data repository using the given parameters.
|
||
|
# When omitted, we create "gen-many-files-d-w-f.git".
|
||
|
#
|
||
|
# Usage: [-r repo] [-d depth] [-w width] [-f files]
|
||
|
#
|
||
|
# -r repo: path to the new repo to be generated
|
||
|
# -d depth: the depth of sub-directories
|
||
|
# -w width: the number of sub-directories at each level
|
||
|
# -f files: the number of files created in each directory
|
||
|
#
|
||
|
# Note that all files will have the same SHA-1 and each
|
||
|
# directory at a level will have the same SHA-1, so we
|
||
|
# will potentially have a large index, but not a large
|
||
|
# ODB.
|
||
|
#
|
||
|
# Ballast will be created under "ballast/".
|
||
|
|
||
|
EMPTY_BLOB=e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
|
||
|
|
||
|
set -e
|
||
|
|
||
|
# (5, 10, 9) will create 999,999 ballast files.
|
||
|
# (4, 10, 9) will create 99,999 ballast files.
|
||
|
depth=5
|
||
|
width=10
|
||
|
files=9
|
||
|
|
||
|
while test "$#" -ne 0
|
||
|
do
|
||
|
case "$1" in
|
||
|
-r)
|
||
|
shift;
|
||
|
test "$#" -ne 0 || { echo 'error: -r requires an argument' >&2; exit 1; }
|
||
|
repo=$1;
|
||
|
shift ;;
|
||
|
-d)
|
||
|
shift;
|
||
|
test "$#" -ne 0 || { echo 'error: -d requires an argument' >&2; exit 1; }
|
||
|
depth=$1;
|
||
|
shift ;;
|
||
|
-w)
|
||
|
shift;
|
||
|
test "$#" -ne 0 || { echo 'error: -w requires an argument' >&2; exit 1; }
|
||
|
width=$1;
|
||
|
shift ;;
|
||
|
-f)
|
||
|
shift;
|
||
|
test "$#" -ne 0 || { echo 'error: -f requires an argument' >&2; exit 1; }
|
||
|
files=$1;
|
||
|
shift ;;
|
||
|
*)
|
||
|
echo "error: unknown option '$1'" >&2; exit 1 ;;
|
||
|
esac
|
||
|
done
|
||
|
|
||
|
# Inflate the index with thousands of empty files.
|
||
|
# usage: dir depth width files
|
||
|
fill_index() {
|
||
|
awk -v arg_dir=$1 -v arg_depth=$2 -v arg_width=$3 -v arg_files=$4 '
|
||
|
function make_paths(dir, depth, width, files, f, w) {
|
||
|
for (f = 1; f <= files; f++) {
|
||
|
print dir "/file" f
|
||
|
}
|
||
|
if (depth > 0) {
|
||
|
for (w = 1; w <= width; w++) {
|
||
|
make_paths(dir "/dir" w, depth - 1, width, files)
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
END { make_paths(arg_dir, arg_depth, arg_width, arg_files) }
|
||
|
' </dev/null |
|
||
|
sed "s/^/100644 $EMPTY_BLOB /" |
|
||
|
git update-index --index-info
|
||
|
return 0
|
||
|
}
|
||
|
|
||
|
[ -z "$repo" ] && repo=gen-many-files-$depth.$width.$files.git
|
||
|
|
||
|
mkdir $repo
|
||
|
cd $repo
|
||
|
git init .
|
||
|
|
||
|
# Create an initial commit just to define master.
|
||
|
touch many-files.empty
|
||
|
echo "$depth $width $files" >many-files.params
|
||
|
git add many-files.*
|
||
|
git commit -q -m params
|
||
|
|
||
|
# Create ballast for p0006 based upon the given params and
|
||
|
# inflate the index with thousands of empty files and commit.
|
||
|
git checkout -b p0006-ballast
|
||
|
fill_index "ballast" $depth $width $files
|
||
|
git commit -q -m "ballast"
|
||
|
|
||
|
nr_files=$(git ls-files | wc -l)
|
||
|
|
||
|
# Modify 1 file and commit.
|
||
|
echo "$depth $width $files" >>many-files.params
|
||
|
git add many-files.params
|
||
|
git commit -q -m "ballast plus 1"
|
||
|
|
||
|
# Checkout master to put repo in canonical state (because
|
||
|
# the perf test may need to clone and enable sparse-checkout
|
||
|
# before attempting to checkout a commit with the ballast
|
||
|
# (because it may contain 100K directories and 1M files)).
|
||
|
git checkout master
|
||
|
|
||
|
echo "Repository "$repo" ($depth, $width, $files) created. Ballast $nr_files."
|
||
|
exit 0
|