#!/usr/bin/env bash
#  vim:ts=4:sts=4:sw=4:et
#
#  Author: Hari Sekhon
#  Date: 2019-11-27 16:09:34 +0000 (Wed, 27 Nov 2019)
#
#  https://github.com/harisekhon/bash-tools
#
#  License: see accompanying Hari Sekhon LICENSE file
#
#  If you're using my code you're welcome to connect with me on LinkedIn and optionally send me feedback
#
#  https://www.linkedin.com/in/harisekhon
#

# Lists HDFS files that have replication factor 1, optionally resetting them
# to replication factor 3.
#
# Arguments:
#   HDFS file / directory paths, passed straight through to 'hdfs dfs -ls -R'
#
# Environment variables (any non-empty value enables):
#   DEBUG                    - trace commands with 'set -x'
#   SKIP_ZERO_BYTE_FILES     - drop files whose size column is 0
#   SET_REPLICATION_FACTOR_3 - run 'hdfs dfs -setrep 3' on the files found
#                              instead of just printing their paths

set -euo pipefail
[ -n "${DEBUG:-}" ] && set -x

# Prints the help text to stdout and exits with status 3
usage(){
    cat <<EOF
Recurses the given HDFS path arguments and prints every file that has replication factor 1

Environment variables (set to any non-empty value to enable):

    SKIP_ZERO_BYTE_FILES        do not list files of zero bytes
    SET_REPLICATION_FACTOR_3    run 'hdfs dfs -setrep 3' on each file found instead of only listing it

usage: ${0##*/} <file_or_directory_paths>

EOF
    exit 3
}

# any switch-like first argument (eg. -h / --help) just shows the usage
if [[ "${1:-}" =~ ^- ]]; then
    usage
fi

# Stream filter over 'hdfs dfs -ls' lines (stdin -> stdout):
# drops lines whose 5th column (size) is 0 when SKIP_ZERO_BYTE_FILES is set,
# otherwise passes everything through untouched
skip_zero_byte_files(){
    if [ -n "${SKIP_ZERO_BYTE_FILES:-}" ]; then
        awk '{if($5 != 0) print }'
    else
        cat
    fi
}

# Stream sink over file paths, one per line (stdin -> stdout):
# when SET_REPLICATION_FACTOR_3 is set, runs 'hdfs dfs -setrep 3' on the paths,
# otherwise just prints them
set_replication_factor_3(){
    if [ -n "${SET_REPLICATION_FACTOR_3:-}" ]; then
        # -d '\n' => exactly one path per input line, so file names containing
        # spaces, quotes or backslashes reach hdfs intact instead of being
        # split / unquoted by xargs default parsing
        # (GNU xargs is already required by --no-run-if-empty)
        xargs -d '\n' --no-run-if-empty hdfs dfs -setrep 3
    else
        cat
    fi
}

# sed instead of 'grep -v' to drop directory lines: grep exits 1 when it selects
# nothing (eg. empty listing or directories only), which would fail the whole
# script under 'set -eo pipefail' even though nothing went wrong
#
# awk keeps lines whose 2nd column (replication factor) is 1 and removes the
# first 7 whitespace separated columns from a copy of the raw line, rather than
# blanking \$1..\$7, because assigning to fields makes awk rebuild the record
# with single spaces, which corrupts file names containing runs of whitespace
hdfs dfs -ls -R "$@" |
sed '/^d/d' |
skip_zero_byte_files |
awk '
    $2 == 1 {
        path = $0
        for (i = 0; i < 7; i++) {
            sub(/^[ \t]*[^ \t]+/, "", path)
        }
        sub(/^[ \t]+/, "", path)
        print path
    }
' |
set_replication_factor_3