Processing/bin/downloadFiles.sh

#!/bin/bash
#---------------------------------------------------------------------------------------------------
# Download a list of files
#
# Usage:
#   downloadFiles.sh <dataDir> <book> <dataset> <target> <condorOutput> <first> <last>
#
# Selects lines <first>..<last> (inclusive) of
#   <condorOutput>/<book>/<dataset>/fileList.txt
# and, for every selected entry, runs the downloadFile.sh helper found on the PATH as
#   downloadFile.sh <dataDir>/<book>/<dataset>/<file> <target>/<book>/<dataset>/<file>
#
# Every line of fileList.txt is split on blanks: field 1 is exported as 'size' before the helper
# is started, field 2 is the file (only its basename is used). A line with a single field is
# used as the file name itself.
#
# Exit status:
#   0  after the download loop (failed downloads are reported but do not change the status) and
#      when the requested file range is rejected
#   1  when downloadFile.sh or the file list cannot be found
#---------------------------------------------------------------------------------------------------

# read the arguments
echo ""
echo "downloadFiles.sh  $*"
echo ""
dataDir=$1;      shift
book=$1;         shift
dataset=$1;      shift
target=$1;       shift
condorOutput=$1; shift
first=$1;        shift
last=$1;         shift

# prepare environment
echo " "
echo " Process dataset: $dataset  of book: $book"
echo "   in directory : $dataDir"
echo "   to target    : $target"
echo "   condor output: $condorOutput"
echo "   file range   : $first  -- $last"

workDir="$condorOutput/$book/$dataset"
fileList="$workDir/fileList.txt"
mkdir -p "$workDir"

# Without the helper an empty command name would make the shell try to execute the data file
# path itself, so stop right here.
script=$(command -v downloadFile.sh)
if [ -z "$script" ]
then
  echo " ERROR - downloadFile.sh not found in PATH" >&2
  exit 1
fi

if [ ! -r "$fileList" ]
then
  echo " ERROR - cannot read file list: $fileList" >&2
  exit 1
fi

# make sure the request is good
# (reading from stdin keeps the file name out of the wc output; the arithmetic expansion strips
#  the blank padding some wc implementations add)
nFiles=$(( $(wc -l < "$fileList") ))

requestOk=1
case "$first" in ''|*[!0-9]*) requestOk=0 ;; esac
case "$last"  in ''|*[!0-9]*) requestOk=0 ;; esac
if [ "$requestOk" -eq 1 ]
then
  if [ "$first" -gt "$nFiles" ] || [ "$last" -gt "$nFiles" ] || [ "$first" -gt "$last" ]
  then
    requestOk=0
  fi
fi
if [ "$requestOk" -ne 1 ]
then
  echo "Request makes no sense: nFiles=$nFiles but first=$first and last=$last"
  # status 0 is kept from the original script for a rejected request
  exit 0
fi

# force base 10 so that zero padded values (e.g. 08) are not taken as octal numbers
first=$((10#$first))
last=$((10#$last))

# see how many we do in this job
nFilesPerJob=$((last - first + 1))
selection=$(head -n "$last" "$fileList" | tail -n "$nFilesPerJob")

fList=$(printf '%s\n' "$selection" | cut -d' ' -f 2)
# shellcheck disable=SC2086 # word splitting is intended: print all names on a single line
echo LIST $fList

# spread the jobs out by a bit
sleep "$first"

# loop through our list now
# The size is taken from the very line that names the file, so no second lookup in the list is
# needed. The list is fed through descriptor 3 to leave the stdin of the helper untouched.
while read -r size path rest <&3
do
  # skip empty lines
  [ -n "$size" ] || continue
  # a line with a single field is the file name itself
  [ -n "$path" ] || path=$size
  file=$(basename -- "$path")
  # 'size' is handed over through the environment; presumably downloadFile.sh reads it
  export size
  # now run the download
  echo "$script $dataDir/$book/$dataset/$file $target/$book/$dataset/$file"
  "$script" "$dataDir/$book/$dataset/$file" "$target/$book/$dataset/$file" \
    || echo " ERROR - download failed for $file" >&2
done 3<<< "$selection"

exit 0
Revision:	1.3
Committed:	Thu Jan 6 22:30:07 2011 UTC (14 years, 3 months ago) by paus
Content type:	application/x-sh
Branch:	MAIN
CVS Tags:	Mit_020pre1, Mit_018
Changes since 1.2:	+0 -1 lines
Log Message:	Adding more powerful copy.
#	User	Rev	Content
1	paus	1.1	#!/bin/bash
2			#---------------------------------------------------------------------------------------------------
3			# Download a list of files
4			#---------------------------------------------------------------------------------------------------
5
6			# read the arguments
7			echo ""
8			echo "downloadFiles.sh $*"
9			echo ""
10			dataDir=$1; shift
11			book=$1; shift
12			dataset=$1; shift
13			target=$1; shift
14			condorOutput=$1; shift
15			first=$1; shift
16			last=$1; shift
17
18			# prepare environment
19			echo " "
20			echo " Process dataset: $dataset of book: $book"
21			echo " in directory : $dataDir"
22			echo " to target : $target"
23			echo " condor output: $condorOutput"
24	ceballos	1.2	echo " file range : $first -- $last"
25	paus	1.1
26			mkdir -p $condorOutput/$book/$dataset
27			script=`which downloadFile.sh`
28
29			# make sure the request is good
30	ceballos	1.2	nFiles=`wc -l $condorOutput/$book/$dataset/fileList.txt \| cut -d ' ' -f 1`
31	paus	1.1	if [ $first -gt $nFiles ] \|\| [ $last -gt $nFiles ]
32			then
33			echo "Request makes no sense: nFiles=$nFile but first=$first and last=$last"
34			exit 0
35			fi
36
37			# see how many we do in this job
38			nFilesPerJob=$(($last - $first + 1))
39			fList=`head -$last $condorOutput/$book/$dataset/fileList.txt \| tail -$nFilesPerJob \| cut -d' ' -f 2`
40
41	ceballos	1.2	echo LIST $fList
42
43	paus	1.1	# spread the jobs out by a bit
44			sleep $first
45
46			# loop through our list now
47			for file in $fList
48			do
49			file=`basename $file`
50			# find the line to this dataset and do further analysis
51			line=`grep $file $condorOutput/$book/$dataset/fileList.txt`
52			# find potential JSON file
53			export size=`echo $line \| tr -s ' ' \| cut -d ' ' -f 1`
54			# now run the download
55			echo "$script $dataDir/$book/$dataset/$file $target/$book/$dataset/$file"
56			$script $dataDir/$book/$dataset/$file $target/$book/$dataset/$file
57			done
58
59			exit 0