diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh
index 4b48cec8b..ff4e2d421 100644
--- a/02_activities/assignments/assignment.sh
+++ b/02_activities/assignments/assignment.sh
@@ -28,23 +28,35 @@ unzip -q rawdata.zip
 # Complete assignment here
 
 # 1. Create a directory named data
-
+# -p: succeed even when the directory already exists
+mkdir -p ./data
 # 2. Move the ./rawdata directory to ./data/raw (eg. move it into ./data and rename it to raw)
-
+mv rawdata ./data/raw
 # 3. List the contents of the ./data/raw directory
-
+ls ./data/raw
 # 4. Create the directory ./data/processed,
 # then create the following sub-directories within it: server_logs, user_logs, and event_logs
-
+mkdir -p ./data/processed
+mkdir -p ./data/processed/server_logs
+mkdir -p ./data/processed/user_logs
+mkdir -p ./data/processed/event_logs
 # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs
-
+cp ./data/raw/*server*.log ./data/processed/server_logs
 # 6. Repeat the above step for user logs and event logs
-
+cp ./data/raw/*user*.log ./data/processed/user_logs
+cp ./data/raw/*event*.log ./data/processed/event_logs
 # 7. For user privacy, remove all files containing IP addresses (files with "ipaddr" in the filename) from ./data/raw and ./data/processed/user_logs
-
+rm ./data/raw/*ipaddr* ./data/processed/user_logs/*ipaddr*
 # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed
-
+# The redirection creates (or truncates) inventory.txt, so no separate touch is needed
+find ./data/processed -type f | sort > ./data/inventory.txt
 
 ###########################################
 
 echo "Project setup is complete!"
+
+# NOTE(review): the git steps below look like interactive workflow commands;
+# confirm they are meant to run as part of this script.
+git pull https://github.com/UofT-DSI/shell coworker-changes --no-rebase
+git status
+git commit -m "Coworkers"
diff --git a/newproject/README.md b/newproject/README.md
new file mode 100644
index 000000000..e69de29bb
diff --git a/newproject/analysis/main.py b/newproject/analysis/main.py
new file mode 100644
index 000000000..e69de29bb