Skip to content
18 changes: 17 additions & 1 deletion 02_activities/assignments/assignment.sh
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ cd newproject

# Lay out the project skeleton: an analysis/ directory holding an empty
# main.py entry point, and an output/ directory.
mkdir analysis output

# The redirection creates README.md on its own, so no separate touch is needed.
echo "# Project Name: DSI Consulting Inc." > README.md
touch analysis/main.py

# download client data
Expand All @@ -28,21 +29,36 @@ unzip -q rawdata.zip
# Complete assignment here

# 1. Create a directory named data
mkdir data

# 2. Move the ./rawdata directory to ./data/raw
mv ./rawdata ./data/raw

# 3. List the contents of the ./data/raw directory
ls -al ./data/raw

# 4. In ./data/processed, create the following directories: server_logs, user_logs, and event_logs
# A single mkdir -p creates ./data/processed together with its three
# subdirectories; the paths are spelled out (no brace expansion) so the line
# behaves the same under any POSIX shell.
mkdir -p \
  ./data/processed/server_logs \
  ./data/processed/user_logs \
  ./data/processed/event_logs

# 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs
cp ./data/raw/*server*.log ./data/processed/server_logs

# 6. Repeat the above step for user logs and event logs
cp ./data/raw/*user*.log ./data/processed/user_logs
cp ./data/raw/*event*.log ./data/processed/event_logs

# 7. For user privacy, remove all files containing IP addresses (files with "ipaddr" in the filename) from ./data/raw and ./data/processed/user_logs
# -print writes each matching path to stdout before -delete removes it, so the
# removed files are still listed while the trees are only walked once.
find ./data/raw ./data/processed/user_logs -type f -name '*ipaddr*' -print -delete

# 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed
# The redirection creates (or truncates) inventory.txt itself. ls -R writes a
# "directory:" header followed by that directory's entries for each level.
ls -R ./data/processed/ > ./data/inventory.txt

###########################################

Expand Down