Skip to content

Commit

Permalink
Use /data dir instead of ~/Data dir
Browse files (browse the repository at this point in the history)
  • Loading branch information
inchiosa committed Aug 7, 2017
1 parent 4266f49 commit 2c64cf8
Showing 1 changed file with 6 additions and 9 deletions.
15 changes: 6 additions & 9 deletions Scripts/DSVM_Customization_Script.sh
Original file line number | Diff line number | Diff line change
Expand Up @@ -36,9 +36,9 @@ dotnet Microsoft.RServer.Utils.AdminUtil/Microsoft.RServer.Utils.AdminUtil.dll -
# Copy data to VM
#######################################################################################################################################

# NOTE(review): this fragment is a rendered diff whose +/- markers were lost,
# so old and new lines appear back to back. The hunk is 9 lines long on both
# sides, which fits the next three commands being the removed (pre-commit)
# setup that staged downloads in a Data directory under /home/remoteuser ...
cd /home/remoteuser
mkdir Data
cd Data
# ... and these three being their replacement, which stages the downloads in
# /data/airline instead -- confirm against the repository history.
cd /data
mkdir airline
cd airline

# Airline data
# Fetch the weather subset archive into the current working directory.
wget http://cdspsparksamples.blob.core.windows.net/data/Airline/WeatherSubsetCsv.tar.gz
Expand All @@ -47,19 +47,16 @@ wget http://cdspsparksamples.blob.core.windows.net/data/Airline/AirlineSubsetCsv
# NOTE(review): this fragment is a rendered diff whose +/- markers were lost.
# Where two near-identical commands follow each other, the first looks like
# the removed (pre-commit) line and the second like its replacement -- confirm
# against the repository history.

# Unpack both downloaded archives in the current directory.
tar -xzf WeatherSubsetCsv.tar.gz
tar -xzf AirlineSubsetCsv.tar.gz

# Delete the archives once unpacked. Old form: every *.gz in the directory.
# New form: only the two archives named above (presumably so that unrelated
# files in the directory are left alone -- TODO confirm).
rm *.gz
rm WeatherSubsetCsv.tar.gz AirlineSubsetCsv.tar.gz

# Make hdfs directories
# Old form calls `hadoop fs`, new form calls `hdfs dfs`; the -mkdir -p
# arguments and the target path are the same in both.
/opt/hadoop/current/bin/hadoop fs -mkdir -p /user/RevoShare/remoteuser/Data
/opt/hadoop/current/bin/hdfs dfs -mkdir -p /user/RevoShare/remoteuser/Data

# Copy data to HDFS
# Old form uploads everything in the current directory (`*`); new form
# uploads only the two extracted data sets by name.
/opt/hadoop/current/bin/hadoop fs -copyFromLocal * /user/RevoShare/remoteuser/Data
/opt/hadoop/current/bin/hdfs dfs -copyFromLocal WeatherSubsetCsv AirlineSubsetCsv /user/RevoShare/remoteuser/Data

# Remove the local extracted copies after the upload to HDFS.
rm -rf WeatherSubsetCsv AirlineSubsetCsv

# NOTE(review): the three directory commands below look like removed
# (pre-commit) lines; the line counts of this hunk only add up if they are
# deletions -- confirm against the repository history.
cd /data
mkdir airline
cd airline
# Fetch the airline_20MM.csv data set into the current working directory.
wget http://strata2017r.blob.core.windows.net/airline/airline_20MM.csv

# Data directory for movie sentiment analysis
Expand Down

0 comments on commit 2c64cf8

Please sign in to comment.