%sh
# Generate every2SecsRndWordsInFiles.sh in the current directory and print it.
#
# The script text is written through a *quoted* here-document ('EOF'), so the
# shell running this cell copies it verbatim. Building it with double-quoted
# echo strings let this shell expand `$!` (PID of the last background job)
# inside the sed program, silently dropping or replacing the `$!` address.
rm -f every2SecsRndWordsInFiles.sh
cat > every2SecsRndWordsInFiles.sh <<'EOF'
#!/bin/bash
# Every 2 seconds, write one line of the form
#   <timestamp>; <word> <word>
# to logsEvery2Secs/<MM_SS>.log, where the two words are random lines of
# animals.txt (read from the current directory; it must already exist).
# File names contain only minute and second, so they repeat every hour.
rm -rf logsEvery2Secs
mkdir -p logsEvery2Secs
while true; do
  # cat emits the timestamp line followed by the two shuffled lines; sed then
  # joins them with spaces: N appends the next line, s replaces the newline,
  # ta loops while a substitution happened. `$!` skips the join when the
  # first line is already the last one.
  echo "$(date --rfc-3339=second);" \
    | cat - <(shuf -n2 animals.txt) \
    | sed '$!{:a;N;s/\n/ /;ta}' > "logsEvery2Secs/$(date '+%M_%S.log')"
  sleep 2
done
EOF
cat every2SecsRndWordsInFiles.sh
#!/bin/bash
# Every 2 seconds, write one line of the form
#   <timestamp>; <word> <word>
# to logsEvery2Secs/<MM_SS>.log, where the two words are random lines of
# animals.txt (read from the current directory; it must already exist).
# File names contain only minute and second, so they repeat every hour.
rm -rf logsEvery2Secs
mkdir -p logsEvery2Secs
while true; do
  # cat emits the timestamp line followed by the two shuffled lines; sed then
  # joins them with spaces: N appends the next line, s replaces the newline,
  # ta loops while a substitution happened. `$!` skips the join when the
  # first line is already the last one.
  echo "$(date --rfc-3339=second);" \
    | cat - <(shuf -n2 animals.txt) \
    | sed '$!{:a;N;s/\n/ /;ta}' > "logsEvery2Secs/$(date '+%M_%S.log')"
  sleep 2
done
var a = 0; // not read by the loop below; kept so the notebook-level `a` stays defined

// Repeatedly copy the log files generated on the driver's local file system
// (logsEvery2Secs) into the distributed file system under
// /datasets/streamingFiles/. Files are copied, not moved: the local originals
// stay in place and are copied again on every round.
//
// 60*60/5 = 720 rounds with a 5 second pause each, i.e. about one hour.
// You may need to replace 60*60/5 by a smaller number like 10 or 20 in the CE,
// depending on how many files of your quota you have used up already.
for (_ <- 1 to 60*60/5) {
  // third argument `true` asks dbutils.fs.cp to copy the directory recursively
  dbutils.fs.cp("file:///databricks/driver/logsEvery2Secs/", "/datasets/streamingFiles/", true)
  Thread.sleep(5000L) // sleep 5 seconds
}
Cancelled
SDS-2.x, Scalable Data Engineering Science
Last refresh: Never