dailenspencer · May 14, 2018 23:15
diff --git a/run.sh b/run.sh
 # -- OVERVIEW --
 # This script handles the execution of the CraigsList Jobs Scrapy crawler
 # (the "jobs" spider), which gathers job listing contents. The results are
 # then uploaded to an S3 bucket.
 #
 # Failure handling:
 #   - If the scrapy command exits non-zero, nothing is uploaded.
 #   - If the upload exits non-zero, the local results file is kept so the
 #     crawl output is not lost.
 #   - In both cases the script exits with status 1.

 # name the results file with the timestamp prepended
 timestamp=$(date +%Y-%m-%d_%H-%M-%S)
 filename="${timestamp}_results.json"

 # execute scrapy and store results in json file
 if ! scrapy crawl jobs -o "$filename"; then
   printf 'error: scrapy crawl failed; nothing was uploaded\n' >&2
   exit 1
 fi

 # copy results to s3 bucket
 if ! aws s3 cp "$filename" "s3://craigslist-jobs-app/scrapy-results/$filename"; then
   printf 'error: upload to s3 failed; results kept in %s\n' "$filename" >&2
   exit 1
 fi

 # remove the local json file only after the upload has succeeded
 rm -- "$filename"
	# -- OVERVIEW --
	# This script handles the execution of the CraigsList Jobs Scrapy crawler
	# (the "jobs" spider), which gathers job listing contents. The results are
	# then uploaded to an S3 bucket.
	#
	# Failure handling:
	#   - If the scrapy command exits non-zero, nothing is uploaded.
	#   - If the upload exits non-zero, the local results file is kept so the
	#     crawl output is not lost.
	#   - In both cases the script exits with status 1.

	# name the results file with the timestamp prepended
	timestamp=$(date +%Y-%m-%d_%H-%M-%S)
	filename="${timestamp}_results.json"

	# execute scrapy and store results in json file
	if ! scrapy crawl jobs -o "$filename"; then
		printf 'error: scrapy crawl failed; nothing was uploaded\n' >&2
		exit 1
	fi

	# copy results to s3 bucket
	if ! aws s3 cp "$filename" "s3://craigslist-jobs-app/scrapy-results/$filename"; then
		printf 'error: upload to s3 failed; results kept in %s\n' "$filename" >&2
		exit 1
	fi

	# remove the local json file only after the upload has succeeded
	rm -- "$filename"
No results found