-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathzeek_log_transport.sh
executable file
·264 lines (224 loc) · 10.9 KB
/
zeek_log_transport.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
#!/bin/bash
#Version 0.4.1
#This sends any bro/zeek logs less than three days old to the rita/aihunter server.
#Any logs that already exist on the target system are not retransferred.
#Before using this, run these on the rita/aihunter server (use zeek in place of bro if necessary):
#sudo adduser dataimport
#sudo passwd dataimport
#sudo mkdir -p /opt/bro/remotelogs/ /home/dataimport/.ssh/
#add the dataimport user's ssh public key to /home/dataimport/.ssh/authorized_keys in the rita/aihunter server
#sudo chown -R dataimport /opt/bro/remotelogs/ /home/dataimport/.ssh/
#sudo chmod go-rwx -R /home/dataimport/.ssh/
#cron does _NOT_ include /sbin in the path, so attempts to locate the "ip" binary fail unless it is added here.
PATH="/sbin:/usr/sbin:${PATH}"
export PATH
#Account on the rita/aihunter server that is used whenever the destination does not name a user itself.
default_user_on_aihunter="dataimport"
can_ssh () {
    #Test that we can reach the target system over ssh.
    #Arguments: $1 - ssh target (host or user@host); every argument, $1 included, is handed to ssh unchanged.
    #Returns:   0 when $1 is 127.0.0.1 or when the remote side echoes back our random token, 1 otherwise.
    #Calls fail (which exits the script) when no target is supplied.
    #All working variables are local so nothing leaks into the caller's namespace.
    local success_code=1
    local token ssh_out

    if [ "$1" = "127.0.0.1" ]; then
        #The loopback address is accepted without an ssh round trip.
        success_code=0
    elif [ -n "$1" ]; then
        token="$RANDOM.$RANDOM"
        if [ "$2" = "-o" ] && [ "$3" = 'PasswordAuthentication=no' ]; then
            status "Attempting to verify that we can ssh to $1"
        else
            status "Attempting to verify that we can ssh to $* - you may need to provide a password to access this system."
        fi
        #Ask the remote side to echo the token; only an exact match counts as a working login.
        ssh_out=$(ssh "$@" '/bin/echo '"$token")
        if [ "$token" = "$ssh_out" ]; then
            success_code=0
        fi
    else
        fail "Please supply an ssh target as a command line parameter to can_ssh"
    fi

    return "$success_code"
}
fail () {
    #Report a fatal error on stderr and terminate the script with exit status 1.
    #Arguments: the words of the message; they are joined with single spaces (default IFS) and followed by " , exiting.".
    #printf is used rather than echo so that a message starting with -n or -e is printed literally instead of being taken as an echo option.
    printf '%s , exiting.\n' "$*" >&2
    exit 1
}
status () {
    #Write a progress line to stdout: the arguments joined by spaces, prefixed with "==== ".
    printf '%s\n' "==== $*"
}
usage () {
    #Print the command line help on stderr and leave the script.
    #The exit status is whatever cat returned, which is 0 when the text was written successfully.
    cat 1>&2 <<USAGE_TEXT
Usage: $0 [--all] [--dest where_to_ssh] [--localdir /local/top/dir/] [--remotedir /remote/top/dir/] [--rsyncparams '--aparam --anotherparam']
Options:
--all Sync all Zeek log types instead of the default subset.
--dest SSH destination target (e.g hostname, IP, user@hostname, user@ip)
--localdir Location of Zeek logs on local system. (default: searches common locations)
--remotedir Location of Zeek logs on remote system. (default: /opt/zeek/remotelogs/<sensorname>/)
--rsyncparams Allows specifying parameters for rsync. Enclose in a pair of single quotes.
Suggestions:
--bwlimit=NNN Limit bandwidth used to NNN kilobytes/sec
-v Verbose; list out the files being transferred
-q Turn off any messages that are not errors
-n Dry run, do not actually transfer files
USAGE_TEXT
    exit "$?"
}
require_util () {
    #Check that every utility named in the arguments can be found by the shell.
    #Returns 0 (true) when all of them are available and 1 (false) at the first one that is missing,
    #after naming it on stderr. An empty argument ends the check early, as if the list stopped there.
    local wanted
    for wanted in "$@"; do
        [ -n "$wanted" ] || break
        if type -path "$wanted" >/dev/null 2>&1; then
            continue
        fi
        echo "Missing utility ${wanted}. Please install it." >&2
        return 1    #False, app is not available.
    done
    return 0    #True, everything asked for is there.
} #End of require_util
#Check that we have basic tools to continue.
#cat, flock and timeout are listed as well: the script calls all three (cat for the usage text and key transfer,
#flock and timeout to launch rsync), so a missing one is reported here instead of surfacing later as a bare "command not found".
require_util awk cat cut date egrep find flock grep hostname ip nice rsync sed ssh sort timeout tr || fail "Missing a required utility"

#ionice is not strictly required; if it exists we'll use it to give all other processes on the system first access to the disk, effectively eliminating the chance that we cause dropped packets from disk contention.
#nice_me is a command prefix and is expanded unquoted in front of rsync.
if type -path ionice >/dev/null 2>&1; then
    nice_me=' ionice -c 3 nice -n 19 '
else
    nice_me=' nice -n 19 '
fi
#Default log types to send
log_type_regex='(conn|dns|http|ssl|x509|known_certs|capture_loss|notice|stats)'

reject_arguments () {
    #Report a command line problem on stderr, show the usage text, and exit with status 1.
    #Arguments: the words of the explanation.
    #usage finishes with its own exit, so it runs in a subshell; that leaves the exit status for us to choose.
    printf 'Error: %s\n' "$*" >&2
    ( usage )
    exit 1
}

#Parse command line flags.
#--all, -h and --help stand alone; every other flag takes the next word as its value.
#An unknown flag, a flag without a value, or a --localdir path that does not exist is explained on stderr
#and ends the script with status 1, so a mistyped cron entry no longer looks like a successful run.
#As before, parsing stops at the first empty argument.
while [ -n "$1" ]; do
    case "$1" in
    --all)
        log_type_regex='.'    #dot matches all log types
        ;;
    --localdir)
        [ -e "$2" ] || reject_arguments "--localdir needs an existing path (got '$2')"
        local_tld="$2"
        shift
        ;;
    --remotedir)
        [ -n "$2" ] || reject_arguments "--remotedir needs a value"
        remote_top_dir="$2"
        shift
        ;;
    --dest)
        [ -n "$2" ] || reject_arguments "--dest needs a value"
        case "$2" in
        *@*)
            #User has supplied an "@" symbol in target system, do not add $default_user_on_aihunter
            aih_location="${2}"
            ;;
        *)
            #No "@" symbol in target system, force username to $default_user_on_aihunter
            aih_location="${default_user_on_aihunter}@${2}"
            ;;
        esac
        shift
        ;;
    --rsyncparams)
        [ -n "$2" ] || reject_arguments "--rsyncparams needs a value"
        rsyncparams="$2"
        shift
        ;;
    -h|--help)
        usage
        ;;
    *)
        reject_arguments "unrecognized option '$1'"
        ;;
    esac
    shift
done
#Run rsync quietly unless the caller asked for something else with --rsyncparams.
if [ -z "$rsyncparams" ]; then
    rsyncparams=" -q "
fi

#Where should we send the bro/zeek logs?
#Without a destination on the command line, the host is taken from the DatabaseLocation entry of
#/etc/rita/agent.yaml (commented-out lines are ignored) and the default user is put in front of it.
if [ -z "$aih_location" ]; then
    if [ -s /etc/rita/agent.yaml ]; then
        aih_host=$(grep '^[^#]*DatabaseLocation' /etc/rita/agent.yaml 2>/dev/null | sed -e 's/^.*DatabaseLocation:*\W*//')
        #Stop here when the file has no usable entry; otherwise we would go on to ssh to "user@" with no host.
        if [ -z "$aih_host" ]; then
            fail "Destination not set on the command line and no DatabaseLocation entry found in /etc/rita/agent.yaml"
        fi
        aih_location="${default_user_on_aihunter}@${aih_host}"
    else
        fail "Destination not set on the command line and no /etc/rita/agent.yaml file to autodetect destination."
    fi
fi
#Find a unique name for this bro/zeek node.
#The ID cannot contain any of: / \ . " * < > : | ? $ - nor a space or a null character. Commas are avoided too, just in case.
#Mongo allows at most 64 characters in a database name and "-YYYY-MM-DD" still has to fit, so the ID is cut to 52 characters below.
my_id=''
if [ -s /etc/rita/agent.yaml ]; then
    #Manually setting the hostname to use in agent.yaml is preferred...
    my_id=$(grep '^[^#]*Name' /etc/rita/agent.yaml 2>/dev/null | sed -e 's/^.*Name:*\W*//')
fi
if [ -n "$my_id" ]; then
    #Keep only the characters that are safe in an ID, then trim to length.
    my_id=$(printf '%s\n' "$my_id" | tr -dc 'a-zA-Z0-9_^+=' | cut -c -52)
else
    #...but if no name is forced, we use the short hostname, then "__", then the last word on the first line of "ip route get 8.8.8.8".
    #That word is intended to be the primary IPv4 address (the one used for the default route) of the system.
    #NOTE(review): iproute2 versions that end the line with "uid N" would make the last word N rather than the address - confirm on the sensors.
    #Changing the extraction changes the ID, and with it the default remote directory, so it is left as it is here.
    #The tr commands strip off spaces or odd characters (this includes the dots of an address).
    my_id="$(hostname -s | tr -dc 'a-zA-Z0-9_^+=')__$(ip route get 8.8.8.8 | awk '{print $NF;exit}' | tr -dc 'a-zA-Z0-9_^+=')"
    my_id=$(echo "$my_id" | cut -c -52)
fi
#Use the dedicated dataimport key for the non-interactive logins when one is present.
extra_ssh_params=' '
if [ -s "$HOME/.ssh/id_rsa_dataimport" ]; then
    extra_ssh_params=" -i $HOME/.ssh/id_rsa_dataimport "
fi

#Make sure we can ssh to the aihunter system first.
#$extra_ssh_params is left unquoted on purpose so that it splits into separate ssh arguments.
if ! can_ssh "$aih_location" "-o" 'PasswordAuthentication=no' $extra_ssh_params ; then
    if [ -s "$HOME/.ssh/id_rsa" ] && [ -s "$HOME/.ssh/id_rsa.pub" ]; then
        #A complete RSA keypair exists but is not accepted yet: append our public keys on the remote side.
        status "Transferring the RSA key to $aih_location - please provide the password when prompted"
        #The brace list must stay outside the quotes; inside them bash does not expand it and cat would find no file at all.
        #Public keys that do not exist are skipped silently (stderr is discarded).
        cat "$HOME"/.ssh/{id_dsa.pub,id_ecdsa.pub,id_rsa.pub,id_rsa_dataimport.pub} 2>/dev/null \
         | ssh "$aih_location" 'mkdir -p .ssh ; cat >>.ssh/authorized_keys ; chmod go-rwx ./ .ssh/ .ssh/authorized_keys'
    elif [ -s "$HOME/.ssh/id_rsa" ] || [ -s "$HOME/.ssh/id_rsa.pub" ]; then
        #Only half of the keypair is present; do not overwrite it, let the user sort it out.
        fail "Unable to ssh to $aih_location, and one of the keys exist.  Please transfer the public key to $aih_location, make sure you can ssh from here, and rerun this script"
    elif ! type -path ssh-keygen >/dev/null 2>&1; then
        #Run the lookup as a command; wrapped in [ ] it is not a valid test and this branch could never be taken.
        fail "Unable to ssh to $aih_location, and we do not have a key generator.  Please create a keypair, transfer the public key to $aih_location, make sure you can ssh from here, and rerun this script"
    else
        #Create ssh key if it doesn't exist, and push to aihunter server or ask user to do so.
        status "Creating a new RSA key with no passphrase"
        ssh-keygen -b 2048 -t rsa -N '' -f "$HOME/.ssh/id_rsa"
        status "Transferring the RSA key to $aih_location - please provide the password when prompted"
        cat "$HOME"/.ssh/{id_dsa.pub,id_ecdsa.pub,id_rsa.pub} 2>/dev/null \
         | ssh "$aih_location" 'mkdir -p .ssh ; cat >>.ssh/authorized_keys ; chmod go-rwx ./ .ssh/ .ssh/authorized_keys'
    fi

    #The key should be in place now; a second failure is fatal.
    if ! can_ssh "$aih_location" "-o" 'PasswordAuthentication=no' $extra_ssh_params ; then
        fail "Unable to ssh to $aih_location using something other than a password"
    fi
fi
#What local directory holds the bro/zeek logs?
#When none was given on the command line, take the first of these locations that exists.
#Zeek paths are checked before Bro paths; within each group the order is:
#custom, as installed by Rita, Zeek/Bro default, Blue vector, Security onion.
#Every entry already ends in a "/".
if [ -z "$local_tld" ]; then
    for candidate_dir in \
        /storage/zeek/logs/ \
        /opt/zeek/logs/ \
        /usr/local/zeek/logs/ \
        /var/lib/docker/volumes/var_log_zeek/_data/ \
        /nsm/zeek/logs/ \
        /storage/bro/logs/ \
        /opt/bro/logs/ \
        /usr/local/bro/logs/ \
        /var/lib/docker/volumes/var_log_bro/_data/ \
        /nsm/bro/logs/
    do
        if [ -d "$candidate_dir" ]; then
            local_tld="$candidate_dir"
            break
        fi
    done
    unset candidate_dir
    if [ -z "$local_tld" ]; then
        fail 'Unable to locate top level directory for bro/zeek logs, please rerun script, specifying the top level path to bro/zeek logs with --localdir .'
    fi
fi

#The IDS is called "bro" when that word appears anywhere in the local path, "zeek" otherwise.
case "$local_tld" in
*bro*)
    ids_name='bro'
    ;;
*)
    ids_name='zeek'
    ;;
esac

#Unless a remote directory was requested, each sensor gets its own directory named after its ID.
: "${remote_top_dir:=/opt/$ids_name/remotelogs/$my_id/}"
#Date stamps (YYYY-MM-DD) for today and the three days before it; a remote directory is prepared for each of them.
today=$(date '+%Y-%m-%d')
yesterday=$(date '+%Y-%m-%d' --date=yesterday)
twoda=$(date '+%Y-%m-%d' --date='2 days ago')
threeda=$(date '+%Y-%m-%d' --date='3 days ago')

status "Sending logs to rita/aihunter server $aih_location , My name: $my_id , local dir: $local_tld , remote dir: $remote_top_dir"

status "Preparing remote directories"
#$extra_ssh_params is left unquoted on purpose so that it splits into separate ssh arguments.
ssh $extra_ssh_params "$aih_location" "mkdir -p ${remote_top_dir}/$today/ ${remote_top_dir}/$yesterday/ ${remote_top_dir}/$twoda/ ${remote_top_dir}/$threeda/ ${remote_top_dir}/current/"

cd "$local_tld" || fail "Unable to change to $local_tld"

#Candidates are the .gz files modified within the last three days whose path matches the selected log types.
#Anything with a path component that starts with a dot is left out.
#grep -E replaces egrep, which newer GNU grep releases flag as obsolescent on stderr.
send_candidates=$(find . -type f -mtime -3 -iname '*.gz' | grep -E "$log_type_regex" | grep -v '/\.' | sort -u)

if [ -z "$send_candidates" ]; then
    echo
    #The directory is passed as an argument, not pasted into the format string, so a "%" in the path is harmless.
    printf 'WARNING: No logs found, if your log directory is not %s please use the flag: --localdir [bro_zeek_log_directory]\n' "$local_tld"
    #Nothing to send: rsync with a lone remote argument would only list the remote directory, so it is not started.
else
    status "Transferring files to $aih_location"
    #flock -n refuses to start a second transfer to the same destination while one still holds the lock file.
    #timeout stops rsync after 7080 seconds and follows up with KILL 60 seconds later if it is still alive.
    #$nice_me, $rsyncparams and $send_candidates are expanded unquoted on purpose: each holds several words.
    flock -xn "$HOME/rsync_log_transport.${aih_location//@/_}.lck" timeout --kill-after=60 7080 $nice_me rsync $rsyncparams -avR -e "ssh $extra_ssh_params" $send_candidates "$aih_location:${remote_top_dir}/" --delay-updates --chmod=Do+rx,Fo+r
    retval=$?
    case "$retval" in
    0)
        status "Rsync finished transferring without error."
        ;;
    1)
        #NOTE(review): 1 is flock's "lock is busy" status, but rsync uses 1 for usage errors as well; the two cannot be told apart here.
        status "Unable to obtain lock and run a new copy of rsync as the previous rsync appears to still be running."
        ;;
    124|129|137)
        #124 is timeout's own "timed out" status; 137 (128+9) is reported when the follow-up KILL was needed.
        status "Rsync was forcibly terminated as it was running too long."
        ;;
    *)
        #Any other failure used to pass without a word.
        status "Rsync exited with error code $retval."
        ;;
    esac
fi
#Note: after we added a user option to set the destination dir, we remove the --temp-dir option as this dir may not be on the same mount point as the destination dir.
#rsync will put temporary files in a .~tmp~ directory under each destination subdir.
#Originally: --temp-dir="/opt/bro/tmp/$my_id/"