This repository has been archived by the owner on Feb 25, 2020. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 64
/
start-shard.sh
executable file
·691 lines (587 loc) · 22.8 KB
/
start-shard.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
##
## ____ ____ _____ ____ ___ ____
## | _ \ | _ \ | ____| / ___| / _/ / ___| Precog (R)
## | |_) | | |_) | | _| | | | | /| | | _ Advanced Analytics Engine for NoSQL Data
## | __/ | _ < | |___ | |___ |/ _| | | |_| | Copyright (C) 2010 - 2013 SlamData, Inc.
## |_| |_| \_\ |_____| \____| /__/ \____| All Rights Reserved.
##
## This program is free software: you can redistribute it and/or modify it under the terms of the
## GNU Affero General Public License as published by the Free Software Foundation, either version
## 3 of the License, or (at your option) any later version.
##
## This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
## without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
## the GNU Affero General Public License for more details.
##
## You should have received a copy of the GNU Affero General Public License along with this
## program. If not, see <http://www.gnu.org/licenses/>.
##
##
#!/bin/bash
# Upper bound on the number of one-second polls wait_until_port_open performs
MAX_PORT_OPEN_TRIES=60

# Parse opts to determine settings.
# The leading ':' in the optstring puts getopts in silent mode: an unknown
# option is reported as '?', an option missing its argument as ':'.
while getopts ":a:d:lbZYR" opt; do
    case $opt in
        a)
            echo "Forcing rebuild of assemblies: $OPTARG" >&2
            REBUILD="$OPTARG"
            ;;
        d)
            # Resolve to an absolute path. Abort if the directory is unusable:
            # otherwise WORKDIR would silently become the current directory and
            # later cleanup steps would run there.
            WORKDIR=$(cd -- "$OPTARG" && pwd) || {
                echo "Cannot use work directory: $OPTARG" >&2
                exit 1
            }
            ;;
        l)
            DONTCLEAN=1
            ;;
        b)
            BUILDMISSING=1
            ;;
        Z)
            # First pass of the consistency check: start from a fresh data dir
            TESTQUIT=1
            rm -rf stress-data && mkdir stress-data
            WORKDIR=$(cd stress-data && pwd) || {
                echo "Cannot create stress-data work directory" >&2
                exit 1
            }
            ;;
        R)
            # Second pass: reuse the data dir left behind by -Z
            TESTRESUME=1
            WORKDIR=$(cd stress-data && pwd) || {
                echo "Cannot find stress-data work directory (run -Z first)" >&2
                exit 1
            }
            ;;
        Y)
            # Run both passes, show only the ';;;' progress lines, and exit
            # with the status of the two-pass run rather than grep's.
            ( "$0" -Z && "$0" -R ) 2>&1 | grep ';;;'
            exit "${PIPESTATUS[0]}"
            ;;
        :)
            echo "Option -$OPTARG requires an argument" >&2
            exit 1
            ;;
        \?)
            echo "Usage: $(basename "$0") [-l] [-d <work directory>]"
            echo " -l: If a temp workdir is used, don't clean up afterward"
            echo " -d: Use the provided workdir"
            echo " -a abc,...: Unconditionally build assemblies for abc, ..."
            echo " -b: Build missing artifacts prior to run (depends on sbt in path)"
            echo " -Y: Run ingest consistency check"
            echo " -Z: (private to -Y) first pass to be interrupted"
            echo " -R: (private to -Y) second pass to complete"
            exit 1
            ;;
    esac
done

[ -n "$TESTQUIT" ] && echo ";;; starting service for test-quit"
[ -n "$TESTRESUME" ] && echo ";;; starting service for test-resume"
# Taken from http://blog.publicobject.com/2006/06/canonical-path-of-file-in-bash.html
#
# Print the absolute, symlink-resolved path of $1's parent directory joined
# with $1's basename. A trailing "/." (produced when $1 is "." or ends in
# "/.") is dropped; "/." sequences elsewhere in the path, such as hidden
# directories, are left intact.
# Arguments: $1 - path to canonicalize (its parent directory must exist)
# Outputs:   the canonical path on stdout
# Returns:   non-zero, printing nothing, when the parent directory cannot be
#            entered
function path-canonical-simple() {
    local dst="${1}"
    local parent
    # Resolve inside a command substitution so the caller's cwd is untouched
    parent=$(cd -P -- "$(dirname -- "${dst}")" &> /dev/null && pwd -P) || return
    local full="${parent}/$(basename -- "${dst}")"
    echo "${full%/.}"
}
# Print a randomly chosen TCP port in 20000..52767 that has no listener
# according to port_is_open.
# Arguments: $1 - label of the service the port is for (failure message only)
# Outputs:   the port number on stdout
# Exits:     with status 1 after 100 unsuccessful attempts. When called via
#            $(...), only the substitution subshell exits, so callers must
#            check the substitution's status themselves.
function random_port() {
    local attempt candidate
    # Try up to 100 candidates, pausing a second between tries, then give up
    for ((attempt = 1; attempt <= 100; attempt++)); do
        candidate=$((20000 + RANDOM))
        if ! port_is_open "$candidate"; then
            echo "$candidate"
            return 0
        fi
        sleep 1
    done
    echo "Failed to locate unused port for $1!" >&2
    exit 1
}
# Succeed when `netstat -an` reports a LISTEN socket on port $1.
# The port must be preceded by '.' or ':' (address separators differ between
# netstat flavours) and followed by whitespace, so 181 does not match 2181.
# Arguments: $1 - port number
# Returns:   0 if a listener is found, non-zero otherwise
function port_is_open() {
    netstat -an | grep -E -q "[.:]$1[[:space:]]+.*LISTEN"
}
# Block until port $1 has a listener, polling port_is_open once per second
# for at most MAX_PORT_OPEN_TRIES attempts.
# Arguments: $1 - port number
# Returns:   0 as soon as the port is open
# Exits:     with status 1 (message on stderr) when every attempt fails
function wait_until_port_open () {
    local attempt
    for attempt in $(seq 1 $MAX_PORT_OPEN_TRIES); do
        port_is_open $1 && return 0
        sleep 1
    done
    printf '%s\n' "Time out waiting for open port: $1" >&2
    exit 1
}
# Directory containing this script; assemblies and config templates are
# located relative to it.
BASEDIR=$(path-canonical-simple "$(dirname -- "$0")")

# Assembly jar names embed the output of `git describe`. Stop here if it
# fails: an empty version would only surface later as misleadingly named
# "missing" artifacts.
VERSION=$(git describe) || {
    echo "Unable to determine version via 'git describe'" >&2
    exit 1
}

INGEST_ASSEMBLY="$BASEDIR"/ingest/target/ingest-assembly-$VERSION.jar
AUTH_ASSEMBLY="$BASEDIR"/auth/target/auth-assembly-$VERSION.jar
ACCOUNTS_ASSEMBLY="$BASEDIR"/accounts/target/accounts-assembly-$VERSION.jar
JOBS_ASSEMBLY="$BASEDIR"/dvergr/target/dvergr-assembly-$VERSION.jar
SHARD_ASSEMBLY="$BASEDIR"/bifrost/target/bifrost-assembly-$VERSION.jar
RATATOSKR_ASSEMBLY="$BASEDIR"/ratatoskr/target/ratatoskr-assembly-$VERSION.jar

#GC_OPTS="-XX:+UseConcMarkSweepGC -XX:+CMSIncrementalMode -XX:-CMSIncrementalPacing -XX:CMSIncrementalDutyCycle=100"
GC_OPTS=""

# JAVA is expanded unquoted at its call sites so that GC_OPTS splits into
# separate arguments.
JAVA="java $GC_OPTS"

SHARD_OPTS=""
# pre-flight checks to make sure we have everything we need, and to make sure there aren't any conflicting daemons running
MISSING_ARTIFACTS=""
for ASM in "$INGEST_ASSEMBLY" "$SHARD_ASSEMBLY" "$RATATOSKR_ASSEMBLY" "$AUTH_ASSEMBLY" "$ACCOUNTS_ASSEMBLY" "$JOBS_ASSEMBLY"; do
NEED_REBUILD=""
BUILDTARGETBASE=$(basename "$ASM")
NAME="${BUILDTARGETBASE%%-*}"
BUILDTARGET="$NAME/assembly"
FORCED_REBUILD=`echo "$REBUILD" | awk -v name="$NAME" -v RS='[,\n]' '$0==name{printf(1)}'`
if [ -n "$FORCED_REBUILD" ]; then
NEED_REBUILD="yes"
else
if [ ! -f "$ASM" ]; then
if [ -n "$BUILDMISSING" ]; then
NEED_REBUILD="yes"
else
MISSING_ARTIFACTS="$MISSING_ARTIFACTS $ASM"
fi
fi
fi
if [ -n "$NEED_REBUILD" ]; then
sbt "$BUILDTARGET" || {
echo "Failed to build $BUILDTARGET!" >&2
exit 1
}
fi
done
# Abort with a list of the absent jars when any required assembly is missing.
# MISSING_ARTIFACTS is a space-separated string, so it is deliberately
# expanded unquoted in the loop below.
if [ -n "$MISSING_ARTIFACTS" ]; then
    echo "Up-to-date ingest, bifrost, auth, accounts, dvergr and ratatoskr assemblies are required before running. Please build and re-run, or run with the -b flag." >&2
    for ASM in $MISSING_ARTIFACTS; do
        echo " missing $(basename "$ASM")" >&2
    done
    exit 1
fi
# Make sure we have the tools we need on OSX
#
# Picks the MongoDB 2.2.0 download URL that matches the host platform.
# NOTE(review): bash only expands aliases in non-interactive shells when
# `shopt -s expand_aliases` is set, which is not visible here, so the tar
# alias may have no effect on later tar invocations -- confirm.
case "$(uname)" in
    Darwin)
        echo "Running on OSX"
        alias tar="/usr/bin/gnutar"
        MONGOURL="http://fastdl.mongodb.org/osx/mongodb-osx-x86_64-2.2.0.tgz"
        ;;
    *)
        MONGOURL="http://fastdl.mongodb.org/linux/mongodb-linux-x86_64-2.2.0.tgz"
        ;;
esac
# Succeed when at least one of the given paths is a regular file.
# Arguments: any number of paths (typically the expansion of a glob)
# Returns:   0 on the first regular file found, 1 when there is none
function exists {
    local candidate
    for candidate; do
        [ -f "$candidate" ] && return 0
    done
    return 1
}
# Check for prereqs first
#
# The ZooKeeper, Kafka and Mongo archives are cached in $ARTIFACTDIR. Each one
# is downloaded with wget only when no file with the matching name prefix is
# already present; a failed download aborts the script with status 3.
ARTIFACTDIR="$BASEDIR/standaloneArtifacts"

echo "Using artifacts in $ARTIFACTDIR"

[ -d "$ARTIFACTDIR" ] || mkdir "$ARTIFACTDIR"

(exists "$ARTIFACTDIR"/zookeeper* && echo " ZooKeeper exists") || {
    echo "Downloading current ZooKeeper artifact"
    pushd "$ARTIFACTDIR" > /dev/null
    wget -nd -q http://ops.reportgrid.com.s3.amazonaws.com/zookeeper/zookeeper-3.4.3.tar.gz || {
        echo "Failed to download zookeeper" >&2
        exit 3
    }
    popd > /dev/null
}

(exists "$ARTIFACTDIR"/kafka* && echo " Kafka exists") || {
    echo "Downloading current Kafka artifact"
    pushd "$ARTIFACTDIR" > /dev/null
    wget -nd -q http://s3.amazonaws.com/ops.reportgrid.com/kafka/kafka-0.7.5.zip || {
        echo "Failed to download kafka" >&2
        exit 3
    }
    popd > /dev/null
}

(exists "$ARTIFACTDIR"/mongo* && echo " Mongo exists") || {
    echo "Downloading current Mongo artifact"
    pushd "$ARTIFACTDIR" > /dev/null
    wget -nd -q "$MONGOURL" || {
        echo "Failed to download mongo" >&2
        exit 3
    }
    popd > /dev/null
}
# JRebel agent options: populated only when the path in REBEL_HOME exists,
# empty otherwise. Any inherited REBEL_OPTS value is discarded first.
unset REBEL_OPTS
REBEL_OPTS=''
if [ -e "$REBEL_HOME" ]; then
    REBEL_OPTS="-noverify -javaagent:$REBEL_HOME/jrebel.jar -Dplatform.root=$(dirname $0)"
fi
# Choose the work directory: keep one that was already selected by an option,
# otherwise create a fresh temporary directory.
if [ -n "$WORKDIR" ]; then
    # Do *not* allow cleanup of provided directories
    DONTCLEAN=1
elif ! WORKDIR=$(mktemp -d -t standaloneShard.XXXXXX 2>&1); then
    # stderr was folded into the substitution, so WORKDIR carries mktemp's
    # error text at this point
    echo "Couldn't create temp workdir! ($WORKDIR)" >&2
    exit 1
fi
# Set up dirs for all components
#
# Refuse to continue with an empty WORKDIR: the paths below would otherwise
# resolve to /zookeeper, /kafka, ... and the rm -rf would target them.
: "${WORKDIR:?WORKDIR must be set before component directories are created}"

ZKBASE="$WORKDIR"/zookeeper
ZKDATA="$WORKDIR"/zookeeper-data
KFBASE="$WORKDIR"/kafka
KFGLOBALDATA="$WORKDIR"/kafka-global
KFLOCALDATA="$WORKDIR"/kafka-local
MONGOBASE="$WORKDIR"/mongo
MONGODATA="$WORKDIR"/mongodata

# The ZooKeeper and Kafka install trees are recreated on every run; the data
# directories are kept.
rm -rf -- "$ZKBASE" "$KFBASE"
mkdir -p -- "$ZKBASE" "$KFBASE" "$ZKDATA" "$MONGOBASE" "$MONGODATA" "$WORKDIR"/{configs,configs/templates,logs,bifrost-data/data,bifrost-data/archive,bifrost-data/scratch,bifrost-data/ingest_failures}

echo "Running standalone bifrost under $WORKDIR"
# Set shutdown hook
#
# Stops every service this script started, in the order ingest, bifrost,
# accounts, jobs, auth, mongo, kafka (global then local), zookeeper, and then
# removes WORKDIR unless DONTCLEAN is set. Services whose PID variable is empty
# or whose process is gone are skipped. Installed below as the EXIT trap and
# also called directly by the test passes.
# Globals read: INGESTPID SHARDPID ACCOUNTSPID JOBSPID AUTHPID MONGOPID
#               KFGLOBALPID KFLOCALPID ZKBASE WORKDIR DONTCLEAN
function on_exit() {
    echo "========== Shutting down system =========="

    # True when $1 is non-empty and names a process we may signal
    function is_running() {
        [ ! -z "$1" ] && kill -0 "$1" &> /dev/null
    }

    local entry label pid
    for entry in "ingest:$INGESTPID" "bifrost:$SHARDPID" "accounts:$ACCOUNTSPID" \
                 "jobs:$JOBSPID" "auth:$AUTHPID" "mongo:$MONGOPID"; do
        label=${entry%%:*}
        pid=${entry#*:}
        if is_running "$pid"; then
            echo "Stopping $label..."
            kill "$pid"
            wait "$pid"
        fi
    done

    if is_running "$KFGLOBALPID"; then
        echo "Stopping kafka..."
        # Kafka is somewhat of a pain, since the Java process daemonizes from within the startup script. That means that killing the script detaches
        # the Java process, leaving it running. Instead, we kill all child processes
        for pid in $(ps -o pid,ppid | awk -v PID="$KFGLOBALPID" '$2==PID{print $1}'); do
            kill "$pid"
        done
        wait "$KFGLOBALPID"
    fi

    if is_running "$KFLOCALPID"; then
        for pid in $(ps -o pid,ppid | awk -v PID="$KFLOCALPID" '$2==PID{print $1}'); do
            kill "$pid"
        done
        wait "$KFLOCALPID"
    fi

    echo "Stopping zookeeper..."
    # Run from the ZooKeeper bin directory, and only if we actually got there
    ( cd "$ZKBASE/bin" && ./zkServer.sh stop )

    if [ -z "$DONTCLEAN" ]; then
        echo "Cleaning up temp work dir"
        rm -rf "$WORKDIR"
    fi

    echo "Shutdown complete"
}

trap on_exit EXIT
# Get zookeeper up and running first
#
# Unpacks the cached ZooKeeper archive into $ZKBASE (skipping docs, sources
# and contrib trees), appends a minimal config, and starts the server.
pushd "$ZKBASE" > /dev/null || {
    echo "Cannot enter $ZKBASE" >&2
    exit 3
}
tar --strip-components=1 --exclude='docs*' --exclude='src*' --exclude='dist-maven*' --exclude='contrib*' --exclude='recipes*' -xvzf "$ARTIFACTDIR"/zookeeper* > /dev/null 2>&1 || {
    echo "Failed to unpack zookeeper" >&2
    exit 3
}
popd > /dev/null

# Copy in a simple config
# random_port exits only its own subshell on failure, so check the status here
ZOOKEEPER_PORT=$(random_port "Zookeeper") || exit 1
{
    echo "# the directory where the snapshot is stored."
    echo "dataDir=$ZKDATA"
    echo "# the port at which the clients will connect"
    echo "clientPort=$ZOOKEEPER_PORT"
} >> "$ZKBASE/conf/zoo.cfg"

# Set up logging for zookeeper
cat > "$ZKBASE/bin/log4j.properties" <<EOF
log4j.rootLogger=INFO, file
log4j.appender.file=org.apache.log4j.RollingFileAppender
log4j.appender.file.File=$WORKDIR/logs/zookeeper.log
log4j.appender.file.MaxFileSize=1MB
log4j.appender.file.MaxBackupIndex=1
log4j.appender.file.layout=org.apache.log4j.PatternLayout
log4j.appender.file.layout.ConversionPattern=%d{ABSOLUTE} %5p %c{1}:%L - %m%n
EOF

# Start it up!
echo "Starting zookeeper on port $ZOOKEEPER_PORT"
cd "$ZKBASE/bin" || {
    echo "Cannot enter $ZKBASE/bin" >&2
    exit 3
}
./zkServer.sh start &> "$WORKDIR/logs/zookeeper.stdout"

wait_until_port_open "$ZOOKEEPER_PORT"
# Now, start global and local kafkas
cd "$WORKDIR" || {
    echo "Cannot enter $WORKDIR" >&2
    exit 3
}
unzip "$ARTIFACTDIR"/kafka* > /dev/null || {
    echo "Failed to unpack kafka" >&2
    exit 3
}

# Transform the provided config into global and local configs, and start services
cd "$WORKDIR"/kafka/config || {
    echo "Cannot enter $WORKDIR/kafka/config" >&2
    exit 3
}
chmod +x "$KFBASE/bin/kafka-server-start.sh"

# Global broker: registers with the ZooKeeper instance started above.
# random_port exits only its own subshell on failure, so check the status here.
KAFKA_GLOBAL_PORT=$(random_port "Kafka global") || exit 1
sed -e "s#log.dir=.*#log.dir=$KFGLOBALDATA#; s/port=.*/port=$KAFKA_GLOBAL_PORT/; s/zk.connect=localhost:2181/zk.connect=localhost:$ZOOKEEPER_PORT/" < server.properties > server-global.properties
"$KFBASE/bin/kafka-server-start.sh" "$KFBASE/config/server-global.properties" &> "$WORKDIR/logs/kafka-global.stdout" &
KFGLOBALPID=$!

wait_until_port_open "$KAFKA_GLOBAL_PORT"

# Local broker: same template, but with enable.zookeeper forced to false
KAFKA_LOCAL_PORT=$(random_port "Kafka local") || exit 1
sed -e "s#log.dir=.*#log.dir=$KFLOCALDATA#; s/port=.*/port=$KAFKA_LOCAL_PORT/; s/enable.zookeeper=.*/enable.zookeeper=false/; s/zk.connect=localhost:2181/zk.connect=localhost:$ZOOKEEPER_PORT/" < server.properties > server-local.properties
"$KFBASE/bin/kafka-server-start.sh" "$KFBASE/config/server-local.properties" &> "$WORKDIR/logs/kafka-local.stdout" &
KFLOCALPID=$!

wait_until_port_open "$KAFKA_LOCAL_PORT"

echo "Kafka Global = $KFGLOBALPID"
echo "Kafka Local = $KFLOCALPID"
# random_port exits only its own subshell on failure, so check the status here
MONGO_PORT=$(random_port "Mongo") || exit 1

# Start up mongo and set test token
cd "$MONGOBASE" || {
    echo "Cannot enter $MONGOBASE" >&2
    exit 3
}
tar --strip-components=1 -xvzf "$ARTIFACTDIR"/mongo* &> /dev/null || {
    echo "Failed to unpack mongo" >&2
    exit 3
}
"$MONGOBASE/bin/mongod" --port "$MONGO_PORT" --dbpath "$MONGODATA" --nojournal --nounixsocket --noauth --noprealloc &> "$WORKDIR/logs/mongo.stdout" &
MONGOPID=$!

wait_until_port_open "$MONGO_PORT"

# The root token is generated once per work directory and cached in
# root_token.txt so that a resumed run reuses it.
if [ ! -e "$WORKDIR"/root_token.txt ]; then
    echo "Retrieving new root token"
    # Capture the tool's output before filtering it: in a `java | tail`
    # pipeline the exit status is tail's, so a java failure would go unnoticed
    # and an unusable token file would be cached.
    # JAVA and REBEL_OPTS are intentionally unquoted so they split into words.
    TOKEN_OUTPUT=$($JAVA $REBEL_OPTS -jar "$RATATOSKR_ASSEMBLY" tokens -s "localhost:$MONGO_PORT" -d dev_auth_v1 -c) || {
        echo "Error retrieving new root token" >&2
        exit 3
    }
    # The token is the last line of the tool's output
    printf '%s\n' "$TOKEN_OUTPUT" | tail -n 1 > "$WORKDIR"/root_token.txt
fi

TOKENID=$(cat "$WORKDIR"/root_token.txt)
# FIXME: There's a potential for collisions here because we're
# assigning before actually starting services, but proper ordering
# would make things a bit more complicated and with bash's RNG this is
# low-risk
#
# random_port's `exit 1` only terminates the command-substitution subshell,
# so each assignment checks the status and aborts the script itself.
INGEST_PORT=$(random_port "Ingest") || exit 1
AUTH_PORT=$(random_port "Auth") || exit 1
ACCOUNTS_PORT=$(random_port "Accounts") || exit 1
JOBS_PORT=$(random_port "Jobs service") || exit 1
SHARD_PORT=$(random_port "Shard") || exit 1
# Set up ingest and bifrost services
#
# Each service config below is produced by piping the dev template from
# $BASEDIR through sed into $WORKDIR/configs, replacing the template's fixed
# ports, log directories, root key and host lists with the values chosen for
# this run. If a config sed fails, only a message is echoed to stdout and the
# script continues.
#
# auth: service port, root key, log directory, mongo host list
sed -e "s#port = 30062#port = $AUTH_PORT#; \
s#rootKey = .*#rootKey = \"$TOKENID\"#; \
s#/var/log#$WORKDIR/logs#; \
s#\[\"localhost\"\]#\[\"localhost:$MONGO_PORT\"\]#" < \
"$BASEDIR"/auth/configs/dev/dev-auth-v1.conf > \
"$WORKDIR"/configs/auth-v1.conf || echo "Failed to update auth config"
# auth logging config: redirect /var/log/precog to the run's log directory
sed -e "s#/var/log/precog#$WORKDIR/logs#" < \
"$BASEDIR"/auth/configs/dev/dev-auth-v1.logging.xml > \
"$WORKDIR"/configs/auth-v1.logging.xml
# accounts: service port, log directory, auth port, root key, mongo host
# list, email template directory, zookeeper hosts
sed -e "s#port = 30064#port = $ACCOUNTS_PORT#; \
s#/var/log#$WORKDIR/logs#; \
s#port = 30062#port = $AUTH_PORT#; \
s#rootKey = .*#rootKey = \"$TOKENID\"#; \
s#\[\"localhost\"\]#\[\"localhost:$MONGO_PORT\"\]#; \
s#/etc/precog/templates#$WORKDIR/configs/templates#; \
s#hosts = localhost:2181#hosts = localhost:$ZOOKEEPER_PORT#" < \
"$BASEDIR"/accounts/configs/dev/accounts-v1.conf > \
"$WORKDIR"/configs/accounts-v1.conf || echo "Failed to update accounts config"
# accounts logging config
sed -e "s#/var/log/precog#$WORKDIR/logs#" < \
"$BASEDIR"/accounts/configs/dev/accounts-v1.logging.xml > \
"$WORKDIR"/configs/accounts-v1.logging.xml
# Copy email templates for accounts
cp "$BASEDIR"/accounts/src/test/resources/reset.* "$WORKDIR"/configs/templates/
# jobs (dvergr): service port, log directory, auth port, root key, mongo host
# list, zookeeper hosts
sed -e "s#port = 30066#port = $JOBS_PORT#; \
s#/var/log#$WORKDIR/logs#; \
s#port = 30062#port = $AUTH_PORT#; \
s#rootKey = .*#rootKey = \"$TOKENID\"#; \
s#\[\"localhost\"\]#\[\"localhost:$MONGO_PORT\"\]#; \
s#hosts = localhost:2181#hosts = localhost:$ZOOKEEPER_PORT#" < \
"$BASEDIR"/dvergr/configs/dev/jobs-v1.conf > \
"$WORKDIR"/configs/jobs-v1.conf || echo "Failed to update jobs config"
# jobs logging config
sed -e "s#/var/log/precog#$WORKDIR/logs#" < \
"$BASEDIR"/dvergr/configs/dev/jobs-v1.logging.xml > \
"$WORKDIR"/configs/jobs-v1.logging.xml
# ingest: service port, log directory, auth/accounts/jobs/shard ports, root
# key, both kafka ports, zookeeper connect string.
# NOTE(review): the rootKey line below has no trailing backslash, so the sed
# script contains a literal newline at that point; sed presumably treats it
# as a command separator like the ';' -- confirm.
sed -e "s/port = 30060/port = $INGEST_PORT/; \
s#/var/log#$WORKDIR/logs#; \
s#port = 30062#port = $AUTH_PORT#; \
s#rootKey = .*#rootKey = \"$TOKENID\"#;
s#port = 30064#port = $ACCOUNTS_PORT#; \
s#port = 30066#port = $JOBS_PORT#; \
s#port = 30070#port = $SHARD_PORT#; \
s#port = 9082#port = $KAFKA_LOCAL_PORT#; \
s#port = 9092#port = $KAFKA_GLOBAL_PORT#; \
s#connect = localhost:2181#connect = localhost:$ZOOKEEPER_PORT#" < \
"$BASEDIR"/ingest/configs/dev/ingest-v2.conf > \
"$WORKDIR"/configs/ingest-v2.conf || echo "Failed to update ingest config"
# ingest logging config
sed -e "s#/var/log/precog#$WORKDIR/logs#" < "$BASEDIR"/ingest/configs/dev/ingest-v2.logging.xml > "$WORKDIR"/configs/ingest-v2.logging.xml
# bifrost (shard): service port, log directory, data directory, auth/accounts/
# jobs ports, root key, global kafka port, zookeeper hosts
sed -e "s#port = 30070#port = $SHARD_PORT#; \
s#/var/log#$WORKDIR/logs#; \
s#/opt/precog/bifrost#$WORKDIR/bifrost-data#; \
s#port = 30062#port = $AUTH_PORT#; \
s#rootKey = .*#rootKey = \"$TOKENID\"#; \
s#port = 30064#port = $ACCOUNTS_PORT#; \
s#port = 30066#port = $JOBS_PORT#; \
s#port = 9092#port = $KAFKA_GLOBAL_PORT#; \
s#hosts = localhost:2181#hosts = localhost:$ZOOKEEPER_PORT#" < \
"$BASEDIR"/bifrost/configs/dev/bifrost-v2.conf > \
"$WORKDIR"/configs/bifrost-v2.conf || echo "Failed to update bifrost config"
# bifrost logging config
sed -e "s#/var/log/precog#$WORKDIR/logs#" < \
"$BASEDIR"/bifrost/configs/dev/bifrost-v2.logging.xml > \
"$WORKDIR"/configs/bifrost-v2.logging.xml
# Later relative paths (e.g. bifrost.out) are resolved against BASEDIR
cd "$BASEDIR" || {
    echo "Cannot enter $BASEDIR" >&2
    exit 3
}

# Prior to ingest startup, we need to set an initial checkpoint if it's not already there
# initial_checkpoint.json is an empty marker file recording that this work
# directory has already been initialised.
if [ ! -e "$WORKDIR"/initial_checkpoint.json ]; then
    # JAVA and REBEL_OPTS are intentionally unquoted so they split into words
    $JAVA $REBEL_OPTS -jar "$RATATOSKR_ASSEMBLY" zk -z "localhost:$ZOOKEEPER_PORT" -uc "/precog-dev/bifrost/checkpoint/$(hostname):initial" &> "$WORKDIR/logs/checkpoint_init.stdout" || {
        echo "Couldn't set initial checkpoint!" >&2
        exit 3
    }
    touch "$WORKDIR"/initial_checkpoint.json
fi
# Launch the auth, accounts and jobs services in the background, each with
# its rendered config and logback file, then wait for all three ports.
# JAVA and REBEL_OPTS are intentionally unquoted so they split into words;
# every path is quoted so a work directory containing spaces still works.
echo "Starting auth service on $AUTH_PORT"
$JAVA $REBEL_OPTS -Dlogback.configurationFile="$WORKDIR"/configs/auth-v1.logging.xml -jar "$AUTH_ASSEMBLY" --configFile "$WORKDIR"/configs/auth-v1.conf &> "$WORKDIR/logs/auth-v1.stdout" &
AUTHPID=$!

echo "Starting accounts service on $ACCOUNTS_PORT"
$JAVA $REBEL_OPTS -Dlogback.configurationFile="$WORKDIR"/configs/accounts-v1.logging.xml -jar "$ACCOUNTS_ASSEMBLY" --configFile "$WORKDIR"/configs/accounts-v1.conf &> "$WORKDIR/logs/accounts-v1.stdout" &
ACCOUNTSPID=$!

echo "Starting jobs service on $JOBS_PORT"
$JAVA $REBEL_OPTS -Dlogback.configurationFile="$WORKDIR"/configs/jobs-v1.logging.xml -jar "$JOBS_ASSEMBLY" --configFile "$WORKDIR"/configs/jobs-v1.conf &> "$WORKDIR/logs/jobs-v1.stdout" &
JOBSPID=$!

wait_until_port_open "$AUTH_PORT"
wait_until_port_open "$ACCOUNTS_PORT"
wait_until_port_open "$JOBS_PORT"
# Now we need two accounts for testing: the root account and the test account
#
# account_token.txt doubles as the "already bootstrapped" marker: when it
# exists, the cached account id and token are read back instead of creating
# accounts again (ROOTACCOUNTID is not cached and stays unset in that case).
# NOTE(review): the email literals below read "[email protected]", which looks
# like address obfuscation introduced when this file was extracted -- restore
# the real addresses from the repository before relying on this section.
# NOTE(review): `set -e` inside $(...) presumably does not stop on a curl
# failure, since curl is not the last command of the pipeline -- confirm.
if [ ! -e "$WORKDIR"/account_token.txt ]; then
echo "Creating root account"
# POST the new account and pull a 10-digit account id out of the response
ROOTACCOUNTID=$(set -e; curl -S -s -H 'Content-Type: application/json' -d '{"email":"[email protected]","password":"1234"}' "http://localhost:$ACCOUNTS_PORT/accounts/v1/accounts/" | sed 's/.*\([0-9]\{10\}\).*/\1/')
echo "Created root account: $ROOTACCOUNTID"
echo "Updating root account with prior root APIKey"
# Point the root account at the root token by updating its apiKey directly
# in the accounts_v1 mongo database
echo -e "db.accounts.update({\"accountId\":\"$ROOTACCOUNTID\"},{\$set:{\"apiKey\":\"$TOKENID\"}})" | "$WORKDIR"/mongo/bin/mongo --port $MONGO_PORT accounts_v1
echo "Update of root account complete"
echo "Creating test account"
ACCOUNTID=$(set -e; curl -S -s -H 'Content-Type: application/json' -d '{"email":"[email protected]","password":"fooble"}' "http://localhost:$ACCOUNTS_PORT/accounts/v1/accounts/" | sed 's/.*\([0-9]\{10\}\).*/\1/')
echo "Created test account: $ACCOUNTID"
echo $ACCOUNTID > "$WORKDIR"/account_id.txt
# Fetch the test account's details with basic auth and extract its apiKey
ACCOUNTTOKEN=$(set -e; curl -S -s -u '[email protected]:fooble' -H 'Content-Type: application/json' -G "http://localhost:$ACCOUNTS_PORT/accounts/v1/accounts/$ACCOUNTID" | grep apiKey | sed 's/.*apiKey"[^"]*"\([^"]*\)".*/\1/')
echo "Account token is $ACCOUNTTOKEN"
echo $ACCOUNTTOKEN > "$WORKDIR"/account_token.txt
else
# Resume path: reuse the values cached by a previous run in this workdir
ACCOUNTID=$(cat "$WORKDIR"/account_id.txt)
ACCOUNTTOKEN=$(cat "$WORKDIR"/account_token.txt)
fi
# Launch the ingest and bifrost services in the background.
# JAVA and REBEL_OPTS are intentionally unquoted so they split into words;
# every path is quoted so a work directory containing spaces still works.
echo "Starting ingest service on $INGEST_PORT"
$JAVA $REBEL_OPTS -Dlogback.configurationFile="$WORKDIR"/configs/ingest-v2.logging.xml -jar "$INGEST_ASSEMBLY" --configFile "$WORKDIR"/configs/ingest-v2.conf &> "$WORKDIR/logs/ingest-v2.stdout" &
INGESTPID=$!

echo "Starting bifrost service on $SHARD_PORT"
$JAVA $REBEL_OPTS -Dlogback.configurationFile="$WORKDIR"/configs/bifrost-v2.logging.xml -jar "$SHARD_ASSEMBLY" --configFile "$WORKDIR"/configs/bifrost-v2.conf &> "$WORKDIR/logs/bifrost-v2.stdout" &
SHARDPID=$!

# Let the ingest/bifrost services startup in parallel
wait_until_port_open "$INGEST_PORT"
wait_until_port_open "$SHARD_PORT"
# Record the chosen ports as NAME=value lines in the work directory
cat > "$WORKDIR/ports.txt" <<EOF
MONGO_PORT=$MONGO_PORT
KAFKA_LOCAL_PORT=$KAFKA_LOCAL_PORT
KAFKA_GLOBAL_PORT=$KAFKA_GLOBAL_PORT
ZOOKEEPER_PORT=$ZOOKEEPER_PORT
INGEST_PORT=$INGEST_PORT
AUTH_PORT=$AUTH_PORT
ACCOUNTS_PORT=$ACCOUNTS_PORT
JOBS_PORT=$JOBS_PORT
SHARD_PORT=$SHARD_PORT
EOF

# Human-readable summary on stdout
echo "Startup complete, running in $WORKDIR"
echo "============================================================"
echo "Root token: $TOKENID"
echo "Root account ID: $ROOTACCOUNTID"
echo "Test account ID: $ACCOUNTID"
echo "Test account token: $ACCOUNTTOKEN"
echo "Base path: $WORKDIR"
cat <<EOF
MONGO_PORT: $MONGO_PORT
KAFKA_LOCAL_PORT: $KAFKA_LOCAL_PORT
KAFKA_GLOBAL_PORT: $KAFKA_GLOBAL_PORT
ZOOKEEPER_PORT: $ZOOKEEPER_PORT
INGEST_PORT: $INGEST_PORT
AUTH_PORT: $AUTH_PORT
ACCOUNTS_PORT: $ACCOUNTS_PORT
JOBS_PORT: $JOBS_PORT
SHARD_PORT: $SHARD_PORT
EOF
echo "============================================================"

# Summary of the run as "key value" lines, written to bifrost.out in the
# current directory
cat > bifrost.out <<EOF
basedir $WORKDIR
id $ACCOUNTID
token $ACCOUNTTOKEN
accounts $ACCOUNTS_PORT
auth $AUTH_PORT
ingest $INGEST_PORT
jobs $JOBS_PORT
bifrost $SHARD_PORT
EOF
# Run an analytics query against the local bifrost service as the test account.
# Arguments: $1 - query text, sent URL-encoded as parameter "q"
# Globals:   SHARD_PORT, ACCOUNTID, ACCOUNTTOKEN (read)
# Outputs:   the raw HTTP response body on stdout
function query() {
    local endpoint="http://localhost:$SHARD_PORT/analytics/v1/analytics/fs/$ACCOUNTID"
    local -a params=(
        --data-urlencode "q=$1"
        --data-urlencode "apiKey=$ACCOUNTTOKEN"
    )
    curl -s -G "${params[@]}" "$endpoint"
}
# Print the result of count(//xyz) with the '[' and ']' characters of the
# response removed.
function count() {
    tr -d '[]' < <(query "count(//xyz)")
}
# Wait until at least one row is visible.
# Arguments: $1 - timeout in seconds, passed through to wait_til_n_rows
# Returns:   the status of wait_til_n_rows
function wait_til_nonzero() {
    wait_til_n_rows 1 $1
}
# Print the current time as seconds since the epoch.
function now() {
    date '+%s'
}
# Report whether the current time is past a deadline.
# Arguments: $1 - deadline in epoch seconds
# Outputs:   "1" when now > $1, otherwise "0"
# Returns:   0 when "1" is printed, 1 when "0" is printed
function check_time() {
    local current
    current=$(now)
    if (( current > $1 )); then
        echo 1
    else
        echo 0
        return 1
    fi
}
# Poll count() until it reports at least N rows or the timeout elapses.
# A response that is empty or not a plain integer (for example an error
# payload) counts as "not there yet" instead of ending the wait as a success.
# Arguments: $1 - minimum number of rows to wait for
#            $2 - timeout in seconds
# Outputs:   one "!!! count returned ..." line per poll on stdout
# Returns:   0 once enough rows are seen, 1 on timeout
function wait_til_n_rows() {
    local want=$1
    local deadline rows
    local -r integer_re='^[[:space:]]*[0-9]+[[:space:]]*$'

    deadline=$(( $(now) + $2 ))
    rows=$( count )
    echo "!!! count returned $rows"

    until [[ "$rows" =~ $integer_re ]] && [ "$rows" -ge "$want" ]; do
        sleep 0.05
        [ "$(check_time "$deadline")" -eq 1 ] && return 1
        rows=$( count )
        echo "!!! count returned $rows"
    done
    return 0
}
# Print the number of lines in file $1 (first field of `wc -l` output).
function count_lines() {
    awk '{print $1}' < <(wc -l $1)
}
# Dataset used by the ingest consistency check and where to fetch it from
TESTJSON="n100k.json"
TESTURL="http://ops.reportgrid.com.s3.amazonaws.com/datasets/$TESTJSON"

# Download the test dataset into the current directory with wget.
# Exits: with status 3 (message on stderr) when the download fails
function download_testjson() {
    echo "downloading json"
    if ! wget "$TESTURL"; then
        echo "Failed to download $TESTURL" >&2
        exit 3
    fi
    echo "done"
}
# First pass of the ingest consistency check (-Z): ingest the test dataset,
# and as soon as any rows are queryable kill the services abruptly so that
# the second pass can verify that ingest resumes.
if [ -n "$TESTQUIT" ]; then
    # Re-download unless a readable copy with exactly 100000 lines is present
    ( [ -r "$TESTJSON" ] && [ "$(count_lines "$TESTJSON")" -eq 100000 ] ) || download_testjson

    echo ";;; ingesting $TESTJSON"
    curl -o /dev/null -v \
        -H 'Content-Type: application/json' \
        --data-bin "@$TESTJSON" \
        "http://localhost:$INGEST_PORT/ingest/v1/fs/$ACCOUNTID/xyz?apiKey=$ACCOUNTTOKEN"

    echo ";;; polling for rows via count()"
    wait_til_nonzero 60
    # Save the poll result immediately: any later command, including the
    # trap reset below, overwrites $?.
    POLL_STATUS=$?

    # on_exit is invoked explicitly below, so disarm the EXIT trap to avoid
    # running it a second time.
    trap - EXIT

    if [ "$POLL_STATUS" -eq 0 ]; then
        echo ";;; ingest rows detected--killing service now!"
        # SIGKILL on purpose: this simulates a crash in the middle of ingest
        kill -9 $INGESTPID
        kill -9 $SHARDPID
        kill -9 $ACCOUNTSPID
        kill -9 $JOBSPID
        kill -9 $AUTHPID
        on_exit
        exit 0
    else
        echo ";;; no rows ingested after 60s--failed!"
        on_exit
        exit 1
    fi
fi
# Second pass of the ingest consistency check (-R): after restarting on the
# data left by the first pass, wait until every row of the dataset is
# queryable.
if [ -n "$TESTRESUME" ]; then
    NROWS=$(count_lines "$TESTJSON")

    echo ";;; verifying that bifrost resumes ingest"
    wait_til_n_rows "$NROWS" 60
    # Save the wait result immediately: any later command overwrites $?, which
    # would make the timeout branch unreachable.
    RESUME_STATUS=$?

    # on_exit is invoked explicitly below, so disarm the EXIT trap to avoid
    # running it a second time.
    trap - EXIT

    if [ "$RESUME_STATUS" -eq 0 ]; then
        echo ";;; resume succeeded (found $NROWS rows)"
        echo ";;; ok"
        on_exit
        exit 0
    else
        echo ";;; resume failed (timed out before seeing $NROWS rows)"
        echo ";;; ERROR!"
        on_exit
        exit 1
    fi
fi
# Wait forever until the user Ctrl-C's the system
# (the EXIT trap then shuts the services down)
while :; do
    sleep 30
done