blob: 52e8995ba32ff4c4669c3618977d8ea820c4cf22 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
|
#!/bin/bash
# Copyright © 2013-2014 Luke Shumaker <lukeshu@sbcglobal.net>
# This work is free. You can redistribute it and/or modify it under the
# terms of the Do What The Fuck You Want To Public License, Version 2,
# as published by Sam Hocevar. See the COPYING file for more details.
sep='<no-filename-ever-contains-this>'
safe_types_regexp=('^(inode|text|image|video|audio)/')
safe_types_string=('application/pdf' 'application/postscript' 'application/xml' 'application/ogg' 'message/rfc822')
safe_files_regexp=('/\.(git|hg|svn)/' '/[^/]*\.git/' '/po/[^/]*.gmo$')
safe_files_string=()
# don't care about files less than 3 bytes.
min_size=3
normalize_filename() {
local cwd="`pwd`"
readlink -m -- "$1"|sed "s|^$cwd/|./|"
}
matches_string() {
local needle=$1
shift
for straw in "$@"; do
if [[ "$needle" = "$straw" ]]; then
return 0
fi
done
return 1
}
matches_regexp() {
local needle=$1
shift
for straw in "$@"; do
if [[ "$needle" =~ $straw ]]; then
return 0
fi
done
return 1
}
print-human() {
libremessages warning "The source directory %s contains binary files:" "$PWD"
sed 's/./ -> &/'
}
print-machine() {
cat
}
main() {
local format=human
# Parse arguments
for arg in "$@"; do
case "$arg" in
-m) format=machine;;
*) safe_files_string+=("$(normalize_filename "$arg")");;
esac
done
# Init
local unsafe_files="$(mktemp)"
cleanup() { rm -f -- "$unsafe_files"; }
trap cleanup EXIT
# Heavy lifting
find . -type f -printf '%s %h/%f\n' | # find all files
while read -r size file; do # filter out files smaller than $min_size
[[ $size -lt $min_size ]] || printf '%s\n' "$file"
done |
xargs -d'\n' file --mime-type -r -F "$sep" | # identify the filetypes
sed -r "s@(.*)${sep}\s*(.*)@\2:\1@" | # reformat the output to be easier to parse
while IFS=: read -r type file; do
file="$(normalize_filename "$file")"
if \
matches_string "$file" "${safe_files_string[@]}" || \
matches_string "$type" "${safe_types_string[@]}" || \
matches_regexp "$file" "${safe_files_regexp[@]}" || \
matches_regexp "$type" "${safe_types_regexp[@]}" ; then
: # do nothing
else
printf "%s\n" "$file"
fi
done > "$unsafe_files"
if [[ "$(stat -c '%s' -- "$unsafe_files")" -gt 0 ]]; then
<"$unsafe_files" sort | print-$format
exit 1
fi
}
main "$@"
|