Sha256: 9d99fc7efd9c2c64344bff7a798029f6de24f2f6c6392eac2a92e776ff82a9c2

Contents?: true

Size: 1.26 KB

Versions: 46

Compression:

Stored size: 1.26 KB

Contents

#! /bin/bash

NUMBER_OF_SPLIT_LINES=10000
SPLIT_FILE_PREFIX='small-'
BIG_FILE_PATH=master.csv
SPLIT_FILES=$SPLIT_FILE_PREFIX*

COMMAND_COLOR='\033[0;36m'
HIGHLIGHT_COLOR='\033[0;33m'
NO_COLOR='\033[0m' # No Color

# cd_split_folder () {
#   cd regions/
# }

split_big_csv_into_small_chunks () {
  header=$(head -1 $BIG_FILE_PATH)
  echo -e "Parsing the HEADER"
  echo -e "${HIGHLIGHT_COLOR}$header${NO_COLOR}"

  # Separate the data from the header
  echo -e "\nMoving the data file out"
  echo -e "${COMMAND_COLOR}tail -n +2 $BIG_FILE_PATH > output.data${NO_COLOR}"
  tail -n +2 $BIG_FILE_PATH > output.data

  echo -e "\nSplit $BIG_FILE_PATH file into small chunks with size $NUMBER_OF_SPLIT_LINES lines..."
  echo -e "${COMMAND_COLOR}split -l $NUMBER_OF_SPLIT_LINES output.data $SPLIT_FILE_PREFIX${NO_COLOR}"
  split -l $NUMBER_OF_SPLIT_LINES output.data $SPLIT_FILE_PREFIX
}

add_header_row_split_files () {
  for part in `ls -1 $SPLIT_FILE_PREFIX*`
  do
    printf "%s\n%s" "$header" "`cat $part`" > $part
  done
}

add_csv_extension_to_split_files () {
  for part in `ls -1 $SPLIT_FILE_PREFIX*`
  do
    mv ${part} ${part}.csv
  done
}

# cd_split_folder
split_big_csv_into_small_chunks
add_header_row_split_files
add_csv_extension_to_split_files

echo -e "\nCleaning ...."
rm output.data

Version data entries

46 entries across 46 versions & 2 rubygems

Version Path
kuppayam-0.2.12.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.11.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.10.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.9.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.8.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.7.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.6.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.5.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.4.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.3.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.2.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.1.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.2.0.pre.materialize db/test_data/split_files/split_csv.sh
kuppayam-0.1.39 db/test_data/split_files/split_csv.sh
kuppayam-0.1.38 db/test_data/split_files/split_csv.sh
kuppayam-0.1.37 db/test_data/split_files/split_csv.sh
kuppayam-0.1.36 db/test_data/split_files/split_csv.sh
kuppayam-0.1.35 db/test_data/split_files/split_csv.sh
kuppayam-0.1.34 db/test_data/split_files/split_csv.sh
kuppayam-0.1.33 db/test_data/split_files/split_csv.sh