From e976b55a5c2a83f4f2ab1221ea228c9b8737db4f Mon Sep 17 00:00:00 2001 From: Simeon Wong Date: Thu, 14 Nov 2024 20:32:09 -0500 Subject: [PATCH 01/26] delete ip logs... WARNING UNTESTED! --- 02_activities/assignments/assignment.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index d81e9a77b..001291867 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -33,6 +33,7 @@ unzip rawdata.zip # 6. Repeat the above step for user logs and event logs # 7. For user privacy, remove all files containing IP addresses (files with "ipaddr" in the filename) from ./data/raw and ./data/processed/user_logs +rf -rf ./data # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed From ea20676d33161a6f4d0fcd3c4f7aa5360f0f4309 Mon Sep 17 00:00:00 2001 From: Simeon Wong Date: Thu, 14 Nov 2024 20:55:44 -0500 Subject: [PATCH 02/26] initialize README file with company name --- 02_activities/assignments/assignment.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 001291867..f2bfd22bd 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -11,6 +11,7 @@ set -x mkdir analysis output touch README.md +echo "# Project Name: DSI Consulting Inc." > README.md touch analysis/main.py # download client data From 3fdb468f1d503c27119c5f23bb9659bdfd4ea366 Mon Sep 17 00:00:00 2001 From: anadub Date: Thu, 10 Apr 2025 16:55:00 -0400 Subject: [PATCH 03/26] Finished question 1 on assignment --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 2fbb9c81d..7c62dec20 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -21,7 +21,7 @@ unzip -q rawdata.zip # Complete assignment here # 1. Create a directory named data - +mkdir data # 2. Move the ./rawdata directory to ./data/raw # 3. List the contents of the ./data/raw directory From 72b0c85798e3046a1513f30248423c64eff0e23a Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 01:19:32 -0400 Subject: [PATCH 04/26] Finish question 2 on assignment --- 02_activities/assignments/assignment.sh | 26 ++++++++++++++++++------- 1 file changed, 19 insertions(+), 7 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 7c62dec20..0996401b3 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -23,19 +23,31 @@ unzip -q rawdata.zip # 1. Create a directory named data mkdir data # 2. Move the ./rawdata directory to ./data/raw - +cd data +mkdir raw +cd .. +mv rawdata.zip ./data/raw/ +cd data/raw/ +unzip -oq rawdata.zip # 3. List the contents of the ./data/raw directory - +# ls # 4. In ./data/processed, create the following directories: server_logs, user_logs, and event_logs - +# cd .. +# mkdir processed +# cd processed +# mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs - +# cd .. +# cp raw/rawdata/*server*.log processed/server_logs/ # 6. Repeat the above step for user logs and event logs - +# cp raw/rawdata/*user*.log processed/user_logs/ +# cp raw/rawdata/*event*.log processed/event_logs/ # 7. For user privacy, remove all files containing IP addresses (files with "ipaddr" in the filename) from ./data/raw and ./data/processed/user_logs - +# rm raw/rawdata/*ipaddr* +# rm processed/user_logs/*ipaddr* # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed - +# touch ./inventory.txt +# ls processed/*/* >> inventory.txt ########################################### From 380f39d4115418d0463d78d09ab4c3a0b2bdb65c Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 07:48:30 -0400 Subject: [PATCH 05/26] Finished question 2 on assignment --- 02_activities/assignments/assignment.sh | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 0996401b3..af316a0ea 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -23,12 +23,17 @@ unzip -q rawdata.zip # 1. Create a directory named data mkdir data # 2. Move the ./rawdata directory to ./data/raw +unzip -oq rawdata.zip cd data mkdir raw cd .. -mv rawdata.zip ./data/raw/ -cd data/raw/ -unzip -oq rawdata.zip +mv rawdata ./data/raw/ +# cd data +# mkdir raw +# cd .. +# mv rawdata.zip ./data/raw/ +# cd data/raw/ +# unzip -oq rawdata.zip # 3. List the contents of the ./data/raw directory # ls # 4. In ./data/processed, create the following directories: server_logs, user_logs, and event_logs From 5ac15b49b2924eba1ae6b5853882b21cc97cab18 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 07:54:11 -0400 Subject: [PATCH 06/26] Finished question 3 on assignment --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index af316a0ea..9e5c47c9e 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -35,7 +35,7 @@ mv rawdata ./data/raw/ # cd data/raw/ # unzip -oq rawdata.zip # 3. List the contents of the ./data/raw directory -# ls +ls # 4. In ./data/processed, create the following directories: server_logs, user_logs, and event_logs # cd .. # mkdir processed From 85677f89593b4e554424429f55f4be51e78b4220 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 08:08:31 -0400 Subject: [PATCH 07/26] Finished question 3 on assignment --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 9e5c47c9e..eea69ac54 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -35,7 +35,7 @@ mv rawdata ./data/raw/ # cd data/raw/ # unzip -oq rawdata.zip # 3. List the contents of the ./data/raw directory -ls +ls ./data/raw/ # 4. In ./data/processed, create the following directories: server_logs, user_logs, and event_logs # cd .. # mkdir processed From 962f1b482795f6baa358abe5a7696c7de8ae9583 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 08:18:03 -0400 Subject: [PATCH 08/26] Finished question 4 on assignment --- 02_activities/assignments/assignment.sh | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index eea69ac54..5920501e8 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -37,10 +37,10 @@ mv rawdata ./data/raw/ # 3. List the contents of the ./data/raw directory ls ./data/raw/ # 4. In ./data/processed, create the following directories: server_logs, user_logs, and event_logs -# cd .. -# mkdir processed -# cd processed -# mkdir server_logs user_logs event_logs +cd data +mkdir processed +cd processed +mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs # cd .. # cp raw/rawdata/*server*.log processed/server_logs/ From 84aa4ad41faba0a4fb4406e7a11e3025df2503d8 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 08:24:38 -0400 Subject: [PATCH 09/26] Finished question 5 on assignment --- 02_activities/assignments/assignment.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 5920501e8..87ba8ce4e 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -42,8 +42,8 @@ mkdir processed cd processed mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs -# cd .. -# cp raw/rawdata/*server*.log processed/server_logs/ +cd .. +cp raw/rawdata/*server*.log processed/server_logs/ # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ # cp raw/rawdata/*event*.log processed/event_logs/ From 10cef34342ad98fea1c3673185947ec4e151d303 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 08:39:50 -0400 Subject: [PATCH 10/26] Finished question 5 on assignment --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 87ba8ce4e..ef5ac7f7b 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -43,7 +43,7 @@ cd processed mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs cd .. -cp raw/rawdata/*server*.log processed/server_logs/ +cp ./raw/rawdata/*server*.log ./processed/server_logs/ # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ # cp raw/rawdata/*event*.log processed/event_logs/ From bb870d2d33926816c2cc9fe92fb4aa28d1630712 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 08:44:08 -0400 Subject: [PATCH 11/26] Finished question 5 on assignment --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index ef5ac7f7b..fce253efe 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -42,7 +42,7 @@ mkdir processed cd processed mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs -cd .. +cd data cp ./raw/rawdata/*server*.log ./processed/server_logs/ # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ From 1da079d45e830d33e7c7a7e90c06118cb612e3d7 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 09:46:02 -0400 Subject: [PATCH 12/26] Finished Question 5 --- 02_activities/assignments/assignment.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index fce253efe..0a352a775 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -44,6 +44,7 @@ mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs cd data cp ./raw/rawdata/*server*.log ./processed/server_logs/ +# new try # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ # cp raw/rawdata/*event*.log processed/event_logs/ From 2c06fab11d68fdb5099764acca29ba4fb72c41ac Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 10:42:49 -0400 Subject: [PATCH 13/26] Finish Q5 --- 02_activities/assignments/assignment.sh | 1 - 1 file changed, 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 0a352a775..fce253efe 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -44,7 +44,6 @@ mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs cd data cp ./raw/rawdata/*server*.log ./processed/server_logs/ -# new try # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ # cp raw/rawdata/*event*.log processed/event_logs/ From c2771051c251b3ed4aab2c24f5ec0e9e1b22414a Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 10:52:03 -0400 Subject: [PATCH 14/26] Finish Q5 --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index fce253efe..c1ec06c28 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -23,7 +23,7 @@ unzip -q rawdata.zip # 1. Create a directory named data mkdir data # 2. Move the ./rawdata directory to ./data/raw -unzip -oq rawdata.zip +#unzip -oq rawdata.zip cd data mkdir raw cd .. From ac24ac66d9b4392e5c2e250abfd00ca9d556b49d Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 11:23:12 -0400 Subject: [PATCH 15/26] Q 5 --- 02_activities/assignments/assignment.sh | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index c1ec06c28..5d4e5f2ec 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -42,8 +42,9 @@ mkdir processed cd processed mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs -cd data -cp ./raw/rawdata/*server*.log ./processed/server_logs/ +cd .. +ls +cp ./raw/*server*.log ./processed/server_logs/ # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ # cp raw/rawdata/*event*.log processed/event_logs/ From 872c1f53570eeb36d44ec444ceb3ed0060789fe6 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 11:59:55 -0400 Subject: [PATCH 16/26] Q 5 --- 02_activities/assignments/assignment.sh | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 5d4e5f2ec..5392d260a 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -27,7 +27,8 @@ mkdir data cd data mkdir raw cd .. -mv rawdata ./data/raw/ +# I wrote ./rawdata instead of rawdata +mv ./rawdata ./data/raw/ # cd data # mkdir raw # cd .. @@ -42,9 +43,9 @@ mkdir processed cd processed mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs -cd .. -ls -cp ./raw/*server*.log ./processed/server_logs/ +# mkdir -p data/processed/server_logs data/processed/user_logs data/processed/event_logs +cp ../raw/*server*.log ./server_logs/ +#cp ./data/raw/*server*.log ./data/processed/server_logs/ # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ # cp raw/rawdata/*event*.log processed/event_logs/ From 2a9486eec9815720b76b8ef8421b97c72ee322cf Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 12:50:54 -0400 Subject: [PATCH 17/26] Q 5 --- 02_activities/assignments/assignment.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 5392d260a..9d02eb18e 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -44,7 +44,8 @@ cd processed mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs # mkdir -p data/processed/server_logs data/processed/user_logs data/processed/event_logs -cp ../raw/*server*.log ./server_logs/ +#cp ../raw/*server*.log ./server_logs/ +cp ../raw/rawdata/*server*.log ./server_logs/ #cp ./data/raw/*server*.log ./data/processed/server_logs/ # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ From 6e071660921006e2666e743f93d8cc4c30f8a71d Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 13:00:38 -0400 Subject: [PATCH 18/26] Q 5 --- 02_activities/assignments/assignment.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 9d02eb18e..f0679741a 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -28,7 +28,8 @@ cd data mkdir raw cd .. # I wrote ./rawdata instead of rawdata -mv ./rawdata ./data/raw/ +#mv ./rawdata ./data/raw/ +mv ./rawdata/* ./data/raw/ # cd data # mkdir raw # cd .. From d5f8ce2e713d0382daba050dd3d762f544a44352 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 14:13:02 -0400 Subject: [PATCH 19/26] Q5 --- 02_activities/assignments/assignment.sh | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index f0679741a..367afc183 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -24,12 +24,12 @@ unzip -q rawdata.zip mkdir data # 2. Move the ./rawdata directory to ./data/raw #unzip -oq rawdata.zip -cd data -mkdir raw -cd .. +#cd data +#mkdir raw +#cd .. # I wrote ./rawdata instead of rawdata #mv ./rawdata ./data/raw/ -mv ./rawdata/* ./data/raw/ +mv ./rawdata ./data # cd data # mkdir raw # cd .. From 8320723eba5d957e77cd659b7fa9841873dca6fa Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 14:35:36 -0400 Subject: [PATCH 20/26] Q 5 --- 02_activities/assignments/assignment.sh | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 367afc183..1cb4b33eb 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -24,12 +24,11 @@ unzip -q rawdata.zip mkdir data # 2. Move the ./rawdata directory to ./data/raw #unzip -oq rawdata.zip -#cd data -#mkdir raw -#cd .. +cd data +mkdir raw +cd .. # I wrote ./rawdata instead of rawdata -#mv ./rawdata ./data/raw/ -mv ./rawdata ./data +mv ./rawdata ./data/raw/ # cd data # mkdir raw # cd .. @@ -46,7 +45,8 @@ mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs # mkdir -p data/processed/server_logs data/processed/user_logs data/processed/event_logs #cp ../raw/*server*.log ./server_logs/ -cp ../raw/rawdata/*server*.log ./server_logs/ +mv ../raw/rawdata/* ../raw/ +cp ../raw/*server*.log ./server_logs/ #cp ./data/raw/*server*.log ./data/processed/server_logs/ # 6. Repeat the above step for user logs and event logs # cp raw/rawdata/*user*.log processed/user_logs/ From 2e12b6af3dbe4c3d618c93c005fb4abdc4e9c7da Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 14:40:56 -0400 Subject: [PATCH 21/26] Q 6 --- 02_activities/assignments/assignment.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 1cb4b33eb..17eeacc1c 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -49,8 +49,8 @@ mv ../raw/rawdata/* ../raw/ cp ../raw/*server*.log ./server_logs/ #cp ./data/raw/*server*.log ./data/processed/server_logs/ # 6. Repeat the above step for user logs and event logs -# cp raw/rawdata/*user*.log processed/user_logs/ -# cp raw/rawdata/*event*.log processed/event_logs/ +cp ../raw/*user*.log ./user_logs/ +cp ../raw/*event*.log ./event_logs/ # 7. For user privacy, remove all files containing IP addresses (files with "ipaddr" in the filename) from ./data/raw and ./data/processed/user_logs # rm raw/rawdata/*ipaddr* # rm processed/user_logs/*ipaddr* From abb2fbc43020b6893ea524202dc0a86c8b5ecf05 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 14:45:25 -0400 Subject: [PATCH 22/26] Q 7 --- 02_activities/assignments/assignment.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 17eeacc1c..d77b5a95e 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -52,8 +52,8 @@ cp ../raw/*server*.log ./server_logs/ cp ../raw/*user*.log ./user_logs/ cp ../raw/*event*.log ./event_logs/ # 7. For user privacy, remove all files containing IP addresses (files with "ipaddr" in the filename) from ./data/raw and ./data/processed/user_logs -# rm raw/rawdata/*ipaddr* -# rm processed/user_logs/*ipaddr* +rm ../raw/*ipaddr* +rm ./user_logs/*ipaddr* # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed # touch ./inventory.txt # ls processed/*/* >> inventory.txt From 89bf99c11b3d715e6a73119e9e518438fddb6afe Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 14:58:01 -0400 Subject: [PATCH 23/26] Q 8 --- 02_activities/assignments/assignment.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index d77b5a95e..137c30cf3 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -55,8 +55,8 @@ cp ../raw/*event*.log ./event_logs/ rm ../raw/*ipaddr* rm ./user_logs/*ipaddr* # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed -# touch ./inventory.txt -# ls processed/*/* >> inventory.txt +touch ../inventory.txt +ls processed/*/* >> inventory.txt ########################################### From fef7e4a89834412a6da1d3d7dae9d199f232ce0a Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 15:04:55 -0400 Subject: [PATCH 24/26] Q 8 --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 137c30cf3..b81ece1eb 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -56,7 +56,7 @@ rm ../raw/*ipaddr* rm ./user_logs/*ipaddr* # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed touch ../inventory.txt -ls processed/*/* >> inventory.txt +ls processed/*/* >> ../inventory.txt ########################################### From 20ea56b5d789bca849c19f4440631fa1f7bd21d3 Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 15:10:57 -0400 Subject: [PATCH 25/26] Q 8 --- 02_activities/assignments/assignment.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index b81ece1eb..02373f8f9 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -56,7 +56,7 @@ rm ../raw/*ipaddr* rm ./user_logs/*ipaddr* # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed touch ../inventory.txt -ls processed/*/* >> ../inventory.txt +ls ./*/* >> ../inventory.txt ########################################### From f04857321b31cbe87115645f5797a8bca6e7940e Mon Sep 17 00:00:00 2001 From: anadub Date: Sat, 12 Apr 2025 15:15:17 -0400 Subject: [PATCH 26/26] Q 8 --- 02_activities/assignments/assignment.sh | 13 +------------ 1 file changed, 1 insertion(+), 12 deletions(-) diff --git a/02_activities/assignments/assignment.sh b/02_activities/assignments/assignment.sh index 02373f8f9..04cac1900 100644 --- a/02_activities/assignments/assignment.sh +++ b/02_activities/assignments/assignment.sh @@ -23,18 +23,10 @@ unzip -q rawdata.zip # 1. Create a directory named data mkdir data # 2. Move the ./rawdata directory to ./data/raw -#unzip -oq rawdata.zip cd data mkdir raw cd .. -# I wrote ./rawdata instead of rawdata mv ./rawdata ./data/raw/ -# cd data -# mkdir raw -# cd .. -# mv rawdata.zip ./data/raw/ -# cd data/raw/ -# unzip -oq rawdata.zip # 3. List the contents of the ./data/raw directory ls ./data/raw/ # 4. In ./data/processed, create the following directories: server_logs, user_logs, and event_logs @@ -43,11 +35,8 @@ mkdir processed cd processed mkdir server_logs user_logs event_logs # 5. Copy all server log files (files with "server" in the name AND a .log extension) from ./data/raw to ./data/processed/server_logs -# mkdir -p data/processed/server_logs data/processed/user_logs data/processed/event_logs -#cp ../raw/*server*.log ./server_logs/ mv ../raw/rawdata/* ../raw/ cp ../raw/*server*.log ./server_logs/ -#cp ./data/raw/*server*.log ./data/processed/server_logs/ # 6. Repeat the above step for user logs and event logs cp ../raw/*user*.log ./user_logs/ cp ../raw/*event*.log ./event_logs/ @@ -55,7 +44,7 @@ cp ../raw/*event*.log ./event_logs/ rm ../raw/*ipaddr* rm ./user_logs/*ipaddr* # 8. Create a file named ./data/inventory.txt that lists all the files in the subfolders of ./data/processed -touch ../inventory.txt +# touch ../inventory.txt ls ./*/* >> ../inventory.txt ###########################################