-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathingest_all.sh
executable file
·31 lines (29 loc) · 1.14 KB
/
ingest_all.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
#!/bin/bash
#
# Settings consumed by the ingest loop further down in this script.

# Root directory holding one sub-directory per dataset.
# The tilde is left unquoted on purpose so the shell expands it.
DATA_DIR=~/data/d3m

# Elasticsearch endpoint and the name of the metadata index.
ES_ENDPOINT='http://localhost:9200'
METADATA_INDEX='datasets'

# Dataset identifiers; each is used both as a sub-directory name under
# DATA_DIR and as the value of --es-data-index.
DATASETS=(
  r_26 r_27 r_32 r_60
  o_185 o_196 o_313 o_38 o_4550
)

# Per-dataset input files. Each value starts with '/' and is appended
# after "$DATA_DIR/<dataset>/" when the ingest command line is built.
SCHEMA='/data/mergedDataSchema.json'
MERGED='/data/merged.csv'
CLASSIFICATION='/data/classification.json'
SUMMARY='/data/summary.json'
SUMMARY_MACHINE='/data/summary-machine.json'
IMPORTANCE='/data/importance.json'
# Run the distil-ingest tool once for every entry in DATASETS.
#
# The tool is started with `go run cmd/distil-ingest/main.go`, a relative
# path, so this script has to be launched from the directory that contains
# cmd/. Every input path is built as "$DATA_DIR/<dataset>/<file>".
#
# A failing ingest does not stop the loop: the remaining datasets are still
# processed. Failures are recorded, reported on stderr, and make the script
# exit with status 1 so callers can tell that something went wrong.
FAILED_DATASETS=()
for DATASET in "${DATASETS[@]}"
do
  echo "--------------------------------------------------------------------------------"
  echo " Ingesting $DATASET dataset"
  echo "--------------------------------------------------------------------------------"
  # NOTE(review): --clear-existing presumably drops previously ingested data
  # for this index before loading; confirm against distil-ingest's flags.
  if ! go run cmd/distil-ingest/main.go \
    --es-endpoint="$ES_ENDPOINT" \
    --es-metadata-index="$METADATA_INDEX" \
    --es-data-index="$DATASET" \
    --schema="$DATA_DIR/$DATASET/$SCHEMA" \
    --dataset="$DATA_DIR/$DATASET/$MERGED" \
    --classification="$DATA_DIR/$DATASET/$CLASSIFICATION" \
    --summary="$DATA_DIR/$DATASET/$SUMMARY" \
    --summary-machine="$DATA_DIR/$DATASET/$SUMMARY_MACHINE" \
    --importance="$DATA_DIR/$DATASET/$IMPORTANCE" \
    --clear-existing \
    --include-raw-dataset
  then
    echo "ERROR: ingest failed for $DATASET dataset" >&2
    FAILED_DATASETS+=("$DATASET")
  fi
done

# Surface any failure through the exit status instead of only reflecting
# the result of the last dataset.
if [ "${#FAILED_DATASETS[@]}" -gt 0 ]
then
  echo "ERROR: ingest failed for ${#FAILED_DATASETS[@]} dataset(s): ${FAILED_DATASETS[*]}" >&2
  exit 1
fi