https://github.com/voldemort/voldemort
Raw File
Tip revision: ff7f3e3e87b29e61a47e3c4a5fbc356ec55e3dc2 authored by Bhavani Sudha Saktheeswaran on 03 October 2014, 22:37:48 UTC
Releasing Voldemort 1.9.1
Tip revision: ff7f3e3
rebalance-zone-expansion.sh
#!/bin/bash -e

#
#   Copyright 2013 LinkedIn, Inc
#
#  Licensed under the Apache License, Version 2.0 (the "License");
#  you may not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.

# This script generates a cluster.xml and a plan for the zone expansion.
# The final cluster is placed in output_dir/
# Argument = -c current_cluster -s current_stores -i interim_cluster -f final_stores
#            -o output dir

# This script uses getopts which means only single character switches are allowed.
# Using getopt would allow for multi charcter switch names but would come at a
# cost of not being cross compatible.

# Function to display usage
usage_and_exit() {
  echo "ERROR: $1."
  cat <<EOF
  
  Usage: $0 options 
  OPTIONS:
   -h     Show this message
   -c     Current cluster that describes the cluster
   -s     Current stores that describes the store. If you do not have info about the stores yet, look
          under 'voldemort_home/config/tools/' for some store examples.
   -i     Interim Cluster that corresponds to zone expansion.
   -f     Final Stores that corresponds to zone expansion.
   -o     Output dir where all interim and final files will be stored.
EOF
exit 1
}

# initialize  variables to an empty string
current_cluster=""
current_stores=""
interim_cluster=""
final_stores=""
output_dir=""

# Figure out voldemort home directory
dir="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )"
vold_home="$(dirname "$dir")"

# Parse options
while getopts “hc:s:i:f:o:” OPTION
do
  case $OPTION in
  h)
    usage_and_exit
    exit 1
    ;;
  c)
    current_cluster=$OPTARG
    echo "[rebalance-zone-expansion] Will rebalance on the cluster described in '$current_cluster'."
    ;;
  s)
    current_stores=$OPTARG
    echo "[rebalance-zone-expansion] Will rebalance on the stores described in '$current_stores'."
    ;;
  i)
    interim_cluster=$OPTARG
    echo "[rebalance-zone-expansion] Will rebalance on the interim cluster described in '$interim_cluster'."
    ;;
  f)
    final_stores=$OPTARG
    echo "[rebalance-zone-expansion] Will rebalance on the final stores described in '$final_stores'."
    ;;
  o)
    output_dir=$OPTARG
    output_dir=$(readlink -m $output_dir)
    mkdir -p $output_dir
    echo "[rebalance-zone-expansion] Using '$output_dir' for all interim and final files generated."
    ;;
  ?)
    usage_and_exit
  ;;
     esac
done

if  [[ -z $current_cluster ]] || [[ -z $current_stores ]] || [[ -z $interim_cluster ]] \
    || [[ -z $final_stores ]] || [[ -z $output_dir ]]
then
     printf "\n"
     echo "[rebalance-zone-expansion] Missing argument. Check again."
     usage_and_exit
     exit 1
fi

if [ ! -e $current_cluster ]; then
    usage_and_exit "File '$current_cluster' does not exist."
fi

if [ ! -e $current_stores ]; then
    usage_and_exit "File '$current_stores' does not exist."
fi

if [ ! -e $interim_cluster ]; then
    usage_and_exit "File '$interim_cluster' does not exist."
fi

if [ ! -e $final_stores ]; then
    usage_and_exit "File '$final_stores' does not exist."
fi


# The final cluster.xml for zone expansion is generated in three steps.
# Step 1 : In step 1 1000 separate iterations of the repartitioner is executed and the one 
#          with the minimal utility value is chose for step 2.
# Step 2: In step 2, the cluster.xml from step 1 is fed to the repartitioner along with random swap 
#         attempts. The repartitioner randomly swaps the partitions only in zone 2 
#         and tries to balance the ring.
# Step 3: Finally, a plan is generated on how to reach from the orignal cluster topology to
#         the one that is generated in step 2. 
#

step2_zoneid=2
step2_swap_attempts=1000
step2_overall_iterations=5


# Step 1
for i in {1..1000} 
do    
    mkdir -p $output_dir/step1/$i
    $vold_home/bin/run-class.sh voldemort.tools.RepartitionerCLI \
                                --current-cluster $current_cluster \
                                --current-stores $current_stores \
                                --interim-cluster $interim_cluster \
                                --final-stores $final_stores \
                                --attempts 1 \
                                --output-dir $output_dir/step1/$i
done

#find the run with the best (minimal) utility value 
bestUtil="$(grep "Utility" $output_dir/step1/*/final-cluster.xml.analysis | sort -nk 3 | head -n 1 | cut -f1 -d ' ')"
remove=".analysis:Utility"
path_to_bestUtil=${bestUtil%%$remove}

if [ ! -e $path_to_bestUtil ]; then
    usage_and_exit "final cluster.xml from step1 does not exist"
fi

# Step 2
$vold_home/bin/run-class.sh voldemort.tools.RepartitionerCLI \
                            --current-cluster $path_to_bestUtil \
                            --current-stores $final_stores \
                            --output-dir $output_dir/step2 \
                            --enable-random-swaps \
                            --random-swap-zoneids $step2_zoneid \
                            --attempts $step2_overall_iterations \
                            --random-swap-attempts $step2_swap_attempts \

# Step 3
mkdir -p $output_dir/step3/
$vold_home/bin/run-class.sh voldemort.tools.RebalancePlanCLI \
                             --current-cluster $current_cluster \
                             --current-stores $current_stores \
                             --final-cluster $output_dir/step2/final-cluster.xml \
                             --final-stores $final_stores \
                             --output-dir $output_dir/step3/
                             
echo "[rebalance-zone-expansion] Placing final-cluster.xml in '$output_dir'"
cp $output_dir/step3/final-cluster.xml $output_dir/final-cluster.xml
echo "[rebalance-zone-expansion] Placing plan.out in '$output_dir'"
cp $output_dir/step3/plan.out $output_dir/plan.out
echo "[rebalance-zone-expansion] Placing final-cluster.xml.analysis in '$output_dir'"
cp $output_dir/step2/final-cluster.xml $output_dir/final-cluster.xml.analysis
back to top