aboutsummaryrefslogtreecommitdiff
path: root/exp/exp.sh
blob: 8a7af40cbeab86cedda52a9b29933b40f4f06556 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
#!/bin/bash

# This script expects the following variables to be exported:
# - DNA_BACKUP: the path to dna-backup binary
# - REPO_PATH: the path of the repo the experiment is based on
# - MAX_VERSION: the max number for versions for the experiment
# - COMMITS: the name of the file that contains the lists of versions
# - DNA_4K: the path fo the dna-backup dir with 4K chunksize
# - DNA_8K: the path fo the dna-backup dir with 8K chunksize
# - DIFFS: the path of the git diff dir

log() {
	echo -e "\033[90m$(date +%T.%3N)\033[0m" $*
}

GITC="git -C $REPO_PATH"
OUT=/tmp/dna-backup-exp-out

# "empty tree" commit
prev="4b825dc642cb6eb9a060e54bf8d69288fbee4904"
last=$(tail --lines=1 $COMMITS | cut -f1)

i=0
cat $COMMITS | while read line
do
	# Get hash
	hash=$(echo "$line" | cut -f1)

	# Check out repo
	log "check out $hash"
	$GITC checkout $hash 2> $OUT \
	|| (log "error checking out"; cat $OUT; exit 1)

	# Create git diff for this version
	log "create git diff for this version"
	diff=$(printf "%s/%05d.diff.gz" $DIFFS $i)
	$GITC diff --minimal --binary --unified=0 -l0 $prev \
	| gzip \
	> $diff

	# Create 4k dna backup for this version
	log "create 4k dna backup for this version"
	$DNA_BACKUP commit -v 2 -c 4096 $REPO_PATH $DNA_4K

	# Create 8k dna backup for this version
	log "create 8k dna backup for this version"
	$DNA_BACKUP commit -v 2 $REPO_PATH $DNA_8K

	if [[ $(( $i % 4 )) == 0 ]]
	then
		# Check restore from git diffs
		log "restore from git diffs"
		TEMP=$(mktemp -d)
		for n in $(seq 0 $i)
		do
			diff=$(printf "%s/%05d.diff.gz" $DIFFS $n)
			cat $diff \
			| gzip --decompress \
			| git -C $TEMP apply --binary --unidiff-zero --whitespace=nowarn -
		done
		cp $REPO_PATH/.git $TEMP/
		log "check restore from diffs"
		diff --brief --recursive $REPO_PATH $TEMP \
		|| log "git patchs restore do not match source"
		rm -rf $TEMP

		# Check restore from 4k dna backup
		log "restore from 4k dna backup"
		TEMP=$(mktemp -d)
		$DNA_BACKUP restore -v 2 -c 4096 $DNA_4K $TEMP
		log "check restore from backup"
		diff --brief --recursive $REPO_PATH $TEMP \
		|| log "dna backup restore do not match source"
		rm -rf $TEMP

		# Check restore from 8k dna backup
		log "restore from 8k dna backup"
		TEMP=$(mktemp -d)
		$DNA_BACKUP restore -v 2 $DNA_8K $TEMP
		log "check restore from backup"
		diff --brief --recursive $REPO_PATH $TEMP \
		|| log "dna backup restore do not match source"
		rm -rf $TEMP
	fi

	prev=$hash
	let i++
	if [[ $i == $MAX_VERSION ]]
	then
		break
	fi
done

# cleanup
log "clean up $REPO_PATH"
$GITC checkout $last 2> $OUT \
|| (log "error checking out back to latest commit"; cat $OUT; exit 2)