stellar · sreuland · Aug 17, 2022 · Aug 1, 2022 · Aug 4, 2022 · Aug 13, 2022
diff --git a/.github/workflows/horizon.yml b/.github/workflows/horizon.yml
@@ -134,14 +134,27 @@ jobs:
  # Any range should do for basic testing, this range was chosen pretty early in history so that it only takes a few mins to run
  run: |
  chmod 755 ./exp/lighthorizon/build/build.sh
- ./exp/lighthorizon/build/build.sh ledgerexporter stellar latest false
- docker run -e ARCHIVE_TARGET=file:https:///ledgerexport-test\
+ mkdir $PWD/ledgerexport
+ mkdir $PWD/index
+
+ ./exp/lighthorizon/build/build.sh all stellar latest false
+ docker run -e ARCHIVE_TARGET=file:https:///ledgerexport\
  -e START=5\
- -e END=50\
+ -e END=150\
  -e NETWORK_PASSPHRASE="Test SDF Network ; September 2015"\
  -e CAPTIVE_CORE_CONFIG="/captive-core-testnet.cfg"\
  -e HISTORY_ARCHIVE_URLS="https://history.stellar.org/prd/core-testnet/core_testnet_001,https://history.stellar.org/prd/core-testnet/core_testnet_002"\
+ -v $PWD/ledgerexport:/ledgerexport\
  stellar/lighthorizon-ledgerexporter
+
+ # run map job
+ docker run -e NETWORK_PASSPHRASE='testnet' -e JOB_INDEX_ENV=AWS_BATCH_JOB_ARRAY_INDEX -e AWS_BATCH_JOB_ARRAY_INDEX=0 -e BATCH_SIZE=64 -e FIRST_CHECKPOINT=64 \
+ -e WORKER_COUNT=1 -e RUN_MODE=map -v $PWD/ledgerexport:/ledgermeta -e TXMETA_SOURCE=file:https:///ledgermeta -v $PWD/index:/index -e INDEX_TARGET=file:https:///index stellar/lighthorizon-index-batch
+
+ # run reduce job
+ docker run -e NETWORK_PASSPHRASE='testnet' -e JOB_INDEX_ENV=AWS_BATCH_JOB_ARRAY_INDEX -e AWS_BATCH_JOB_ARRAY_INDEX=0 -e MAP_JOB_COUNT=1 -e REDUCE_JOB_COUNT=1 \
+ -e WORKER_COUNT=1 -e RUN_MODE=reduce -v $PWD/index:/index -e INDEX_SOURCE_ROOT=file:https:///index -e INDEX_TARGET=file:https:///index stellar/lighthorizon-index-batch
+
  # Push images
  - if: github.ref == 'refs/heads/master' || github.ref == 'refs/heads/lighthorizon'
  name: Login to DockerHub

diff --git a/exp/lighthorizon/build/index-batch/README.md b/exp/lighthorizon/build/index-batch/README.md
@@ -0,0 +1,7 @@
+# `stellar/lighthorizon-index-batch`
+
+This Docker image contains the ledger/checkpoint indexing executables. It allows running multiple instances of `map`/`reduce` on a single machine or running them in [AWS Batch](https://aws.amazon.com/batch/).
+
+## Env variables
+
+See the [package documentation](../../index/cmd/batch/doc.go) for more details.
diff --git a/exp/lighthorizon/build/index-batch/start b/exp/lighthorizon/build/index-batch/start
@@ -5,7 +5,6 @@ set -e
 
 export TRACY_NO_INVARIANT_CHECK=1
 NETWORK_PASSPHRASE="${NETWORK_PASSPHRASE:=Public Global Stellar Network ; September 2015}"
-
 if [ "$RUN_MODE" == "reduce" ]; then
  echo "Running Reduce, REDUCE JOBS: $REDUCE_JOB_COUNT MAP JOBS: $MAP_JOB_COUNT TARGET INDEX: $INDEX_TARGET"
  /reduce 

diff --git a/exp/lighthorizon/build/k8s/lighthorizon_batch_map_job.yml b/exp/lighthorizon/build/k8s/lighthorizon_batch_map_job.yml
@@ -0,0 +1,43 @@
+apiVersion: batch/v1
+kind: Job
+metadata:
+ name: 'batch-map-job'
+spec:
+ completions: 52 # total number of indexed pods to run to completion
+ parallelism: 10 # upper bound on pods running at the same time
+ completionMode: Indexed # Kubernetes exposes each pod's index as JOB_COMPLETION_INDEX
+ template:
+ spec:
+ restartPolicy: Never
+ containers:
+ - name: 'worker'
+ image: 'stellar/lighthorizon-index-batch'
+ imagePullPolicy: Always
+ envFrom:
+ - secretRef:
+ name: <reference to secret name here if needed for source/target>
+ env:
+ - name: RUN_MODE
+ value: "map" # presumably selects the map stage in the image's start script — confirm
+ - name: BATCH_SIZE
+ value: "10048" # presumably the number of ledgers handled per map job — confirm
+ - name: FIRST_CHECKPOINT
+ value: "41426080"
+ - name: WORKER_COUNT
+ value: "8" # presumably the number of parallel workers inside one pod — confirm
+ - name: TXMETA_SOURCE
+ value: "<url of txmeta source>"
+ - name: JOB_INDEX_ENV
+ value: "JOB_COMPLETION_INDEX" # name of the env variable the map binary reads its job index from
+ - name: NETWORK_PASSPHRASE
+ value: "pubnet"
+ - name: INDEX_TARGET
+ value: "url of target index"
+ resources:
+ limits:
+ cpu: 4
+ memory: 5Gi
+ requests:
+ cpu: 500m
+ memory: 500Mi
+
diff --git a/exp/lighthorizon/build/k8s/lighthorizon_batch_reduce_job copy.yml b/exp/lighthorizon/build/k8s/lighthorizon_batch_reduce_job copy.yml
@@ -0,0 +1,42 @@
+apiVersion: batch/v1
+kind: Job
+metadata:
+ name: 'batch-reduce-job'
+spec:
+ completions: 52 # total number of indexed pods; presumably should equal REDUCE_JOB_COUNT — confirm
+ parallelism: 10 # upper bound on pods running at the same time
+ completionMode: Indexed # Kubernetes exposes each pod's index as JOB_COMPLETION_INDEX
+ template:
+ spec:
+ restartPolicy: Never
+ containers:
+ - name: 'worker'
+ image: 'stellar/lighthorizon-index-batch'
+ imagePullPolicy: Always
+ envFrom:
+ - secretRef:
+ name: <reference to secret name here if needed for source/target>
+ env: # every value below must be a YAML string; Kubernetes rejects unquoted numbers in env values
+ - name: RUN_MODE
+ value: "reduce"
+ - name: MAP_JOB_COUNT
+ value: "52"
+ - name: REDUCE_JOB_COUNT
+ value: "52"
+ - name: WORKER_COUNT
+ value: "8"
+ - name: INDEX_SOURCE_ROOT
+ value: "<url of index location>"
+ - name: JOB_INDEX_ENV
+ value: "JOB_COMPLETION_INDEX" # name of the env variable the reduce binary reads its job index from
+ - name: INDEX_TARGET
+ value: "<url of index location>"
+ resources:
+ limits:
+ cpu: 4
+ memory: 5Gi
+ requests:
+ cpu: 500m
+ memory: 500Mi
+
+
diff --git a/exp/lighthorizon/index/backend/file.go b/exp/lighthorizon/index/backend/file.go
@@ -25,6 +25,12 @@ func NewFileBackend(dir string, parallel uint32) (*FileBackend, error) {
  parallel = 1
  }
 
+ err := os.MkdirAll(dir, fs.ModeDir|0755)
+ if err != nil {
+ log.Errorf("Unable to mkdir %s, %v", dir, err)
+ return nil, err
+ }
+
  return &FileBackend{
  dir: dir,
  parallel: parallel,

diff --git a/exp/lighthorizon/index/cmd/batch/map/main.go b/exp/lighthorizon/index/cmd/batch/map/main.go
@@ -24,7 +24,7 @@ type BatchConfig struct {
 
 const (
  batchSizeEnv = "BATCH_SIZE"
- jobIndexEnv  = "AWS_BATCH_JOB_ARRAY_INDEX"
+ jobIndexEnvName = "JOB_INDEX_ENV"
  firstCheckpointEnv = "FIRST_CHECKPOINT"
  txmetaSourceUrlEnv = "TXMETA_SOURCE"
  indexTargetUrlEnv = "INDEX_TARGET"
@@ -39,6 +39,10 @@ func NewBatchConfig() (*BatchConfig, error) {
  return nil, errors.New("required parameter: " + indexTargetUrlEnv)
  }
 
+ jobIndexEnv := os.Getenv(jobIndexEnvName)
+ if jobIndexEnv == "" {
+ return nil, errors.New("env variable can't be empty " + jobIndexEnvName)
+ }
  jobIndex, err := strconv.ParseUint(os.Getenv(jobIndexEnv), 10, 32)
  if err != nil {
  return nil, errors.Wrap(err, "invalid parameter "+jobIndexEnv)

diff --git a/exp/lighthorizon/index/cmd/batch/reduce/main.go b/exp/lighthorizon/index/cmd/batch/reduce/main.go
@@ -37,11 +37,16 @@ func ReduceConfigFromEnvironment() (*ReduceConfig, error) {
  mapJobsEnv = "MAP_JOB_COUNT"
  reduceJobsEnv = "REDUCE_JOB_COUNT"
  workerCountEnv = "WORKER_COUNT"
- jobIndexEnv  = "AWS_BATCH_JOB_ARRAY_INDEX"
+ jobIndexEnvName = "JOB_INDEX_ENV"
  indexRootSourceEnv = "INDEX_SOURCE_ROOT"
  indexTargetEnv = "INDEX_TARGET"
  )
 
+ jobIndexEnv := os.Getenv(jobIndexEnvName)
+ if jobIndexEnv == "" {
+ return nil, errors.New("env variable can't be empty " + jobIndexEnvName)
+ }
+
  jobIndex, err := strconv.ParseUint(strings.TrimSpace(os.Getenv(jobIndexEnv)), 10, 32)
  if err != nil {
  return nil, errors.Wrap(err, "invalid parameter "+jobIndexEnv)

diff --git a/exp/lighthorizon/index/cmd/map.sh b/exp/lighthorizon/index/cmd/map.sh
@@ -68,7 +68,7 @@ for (( i=0; i < $BATCH_COUNT; i++ ))
 do
  echo -n "Creating map job $i... "
 
- NETWORK_PASSPHRASE='testnet' MODULES='accounts_unbacked,transactions' \
+ NETWORK_PASSPHRASE='testnet' JOB_INDEX_ENV='AWS_BATCH_JOB_ARRAY_INDEX' MODULES='accounts_unbacked,transactions' \
  AWS_BATCH_JOB_ARRAY_INDEX=$i BATCH_SIZE=$BATCH_SIZE FIRST_CHECKPOINT=$FIRST \
  TXMETA_SOURCE=file:https://$1 INDEX_TARGET=file:https://$2 WORKER_COUNT=1 \
  ./map &

diff --git a/exp/lighthorizon/index/cmd/reduce.sh b/exp/lighthorizon/index/cmd/reduce.sh
@@ -47,7 +47,7 @@ for (( i=0; i < $REDUCE_JOB_COUNT; i++ ))
 do
  echo -n "Creating reduce job $i... "
 
- AWS_BATCH_JOB_ARRAY_INDEX=$i MAP_JOB_COUNT=$MAP_JOB_COUNT \
+ AWS_BATCH_JOB_ARRAY_INDEX=$i JOB_INDEX_ENV="AWS_BATCH_JOB_ARRAY_INDEX" MAP_JOB_COUNT=$MAP_JOB_COUNT \
  REDUCE_JOB_COUNT=$REDUCE_JOB_COUNT WORKER_COUNT=4 \
  INDEX_SOURCE_ROOT=file:https://$1 INDEX_TARGET=file:https://$2 \
  timeout -k 30s 10s ./reduce &