forked from alexrashed/hackathon202304
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun.sh
executable file
·55 lines (48 loc) · 1.63 KB
/
run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
#!/usr/bin/env bash
#
# Deploys the Terraform stack, sends the sample movie dataset to the ingest
# function one document at a time, and finally runs a sample search query.
#
# Usage: run.sh [aws]
#   aws         use the plain `terraform` / `aws` CLIs
#   (otherwise) use the LocalStack wrappers `tflocal` / `awslocal`

# Abort on errors, on unset variables, and when any stage of a pipeline fails.
set -euo pipefail

# Exactly one argument equal to "aws" selects the real CLIs. The quoted
# comparison inside [[ ]] stays well-formed for empty or multi-word arguments.
if [[ $# -eq 1 && "$1" == "aws" ]]; then
  echo "Deploying on AWS."
else
  echo "Deploying on LocalStack."
  # Route both CLIs through their LocalStack wrappers. Functions are used
  # instead of aliases because aliases are expanded when a command is read,
  # not when it is executed, which makes them depend on how the script is
  # laid out; functions are resolved at call time.
  aws() { awslocal "$@"; }
  terraform() { tflocal "$@"; }
fi
# Deployment: initialise the working directory, show the plan, then apply it
# without an interactive confirmation prompt.
terraform init
terraform plan
terraform apply --auto-approve

# Read the two Terraform outputs used by the rest of the script.
ingest_function_url="$(terraform output --raw ingest_lambda_url)"
elasticsearch_endpoint="$(terraform output --raw elasticsearch_endpoint)"
# Download the dataset into a throw-away working directory.
# `-d` is the short option understood by both GNU and BSD mktemp.
temp_dir=$(mktemp -d)
# Remove the working directory on every exit path (success or failure);
# `:?` refuses to run the rm if the variable is ever empty.
trap 'rm -rf -- "${temp_dir:?}"' EXIT

echo "Downloading Movie Dataset..."
movie_dataset_url="https://docs.aws.amazon.com/opensearch-service/latest/developerguide/samples/sample-movies.zip"
# --fail makes an HTTP error abort the script instead of silently saving the
# server's error page as the archive.
curl --fail -L -o "$temp_dir/sample-movies.zip" "$movie_dataset_url"
unzip "$temp_dir/sample-movies.zip" -d "$temp_dir/"

# Remove the bulk insert instructions (lines starting with index info) from
# the bulk import file: the data is streamed document by document instead of
# being sent through the bulk import.
echo "Pre-processing Movie Dataset..."
# Filter into a sibling file and move it into place rather than using
# `sed -i`, whose syntax differs between GNU and BSD sed.
sed '/^{ "index"/d' "$temp_dir/sample-movies.bulk" > "$temp_dir/sample-movies.bulk.tmp"
mv -- "$temp_dir/sample-movies.bulk.tmp" "$temp_dir/sample-movies.bulk"
#######################################
# POSTs each line of a file to a URL, one request per line, with the line as
# the JSON request body. Prints one progress dot per line.
# Arguments:
#   $1 - path of the line-delimited input file
#   $2 - URL that receives the POST requests
# Outputs:
#   One "." per processed line on stdout; response bodies are discarded.
# Returns:
#   Non-zero if the input file cannot be opened.
#######################################
ingest_movies() {
  local movies_file=$1
  local target_url=$2
  local line
  # `IFS=` and `-r` keep every line verbatim: without them, leading/trailing
  # whitespace is trimmed and backslash escapes (e.g. \" inside JSON strings)
  # are consumed. The `|| [[ -n ... ]]` clause also processes a final line
  # that has no trailing newline.
  while IFS= read -r line || [[ -n "$line" ]]; do
    printf '.'
    # printf '%s' with a quoted expansion passes the document through
    # unchanged (no word splitting, no glob expansion, no option parsing).
    printf '%s' "$line" \
      | curl -s -X POST "$target_url" \
        -H 'Content-Type: application/json' \
        -d @- > /dev/null
  done < "$movies_file"
}

echo "Invoking function for each movie..."
ingest_movies "$temp_dir/sample-movies.bulk" "$ingest_function_url"
echo ""
echo "Testing a search query:"
# Sample fuzzy query: matches "Tarantino" against the title, directors and
# actors fields with automatic fuzziness.
search_query='{
"query": {
"multi_match": {
"fields": [ "title", "directors", "actors" ],
"query": "Tarantino",
"fuzziness": "AUTO",
"type": "best_fields"
}
}
}'
# The endpoint is quoted so the URL is always passed as a single argument.
# `jq .` names the identity filter explicitly instead of relying on jq's
# implicit default program.
curl -X POST "${elasticsearch_endpoint}/movies/_search" \
  -H "Content-Type: application/json" \
  -d "$search_query" \
  | jq .