From 43761d0680cadc3be94af8c30c57a82978ecd689 Mon Sep 17 00:00:00 2001 From: Aas1kk <152005759+aa-sikkkk@users.noreply.github.com> Date: Wed, 18 Sep 2024 11:54:59 +0545 Subject: [PATCH 1/5] Update django.yml --- .github/workflows/django.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/django.yml b/.github/workflows/django.yml index e22bc29..207544e 100644 --- a/.github/workflows/django.yml +++ b/.github/workflows/django.yml @@ -24,7 +24,7 @@ jobs: working-directory: web run: | python -m pip install --upgrade pip - pip install -r web/requirements.txt + pip install -r requirements.txt - name: Run migrations working-directory: web From 29f97926d0f6add38447fc5fdcfe5b50e15c06bf Mon Sep 17 00:00:00 2001 From: Aas1kk <152005759+aa-sikkkk@users.noreply.github.com> Date: Wed, 18 Sep 2024 11:56:41 +0545 Subject: [PATCH 2/5] Update requirements.txt --- requirements.txt | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/requirements.txt b/requirements.txt index 1f78253..b06ce2e 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,3 +1,4 @@ +django==5.1.1 async-generator==1.10 attrs==21.4.0 beautifulsoup4==4.10.0 @@ -22,4 +23,4 @@ trio-websocket==0.9.2 urllib3==1.26.8 wcwidth==0.2.5 wsproto==1.1.0 -html5lib==1.1 \ No newline at end of file +html5lib==1.1 From 5b5c96cc1e414142e3586da56f8862a269b5d43b Mon Sep 17 00:00:00 2001 From: Aas1kk <152005759+aa-sikkkk@users.noreply.github.com> Date: Wed, 18 Sep 2024 11:56:56 +0545 Subject: [PATCH 3/5] Update requirements.txt --- web/requirements.txt | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/web/requirements.txt b/web/requirements.txt index 17fa697..9b5e2fd 100644 --- a/web/requirements.txt +++ b/web/requirements.txt @@ -1,3 +1,4 @@ +django==5.1.1 async-generator==1.10 attrs==21.4.0 beautifulsoup4==4.10.0 @@ -21,4 +22,4 @@ trio==0.20.0 trio-websocket==0.9.2 urllib3==1.26.8 wcwidth==0.2.5 -wsproto==1.1.0 \ No newline at end of file +wsproto==1.1.0 From 
ccc89612811dfff94ae39ae8fe7635a390a66744 Mon Sep 17 00:00:00 2001 From: Aas1kk <152005759+aa-sikkkk@users.noreply.github.com> Date: Wed, 18 Sep 2024 11:58:19 +0545 Subject: [PATCH 4/5] Update django.yml From 205c014a757516d2fbcf12252e2b08dcd966eebc Mon Sep 17 00:00:00 2001 From: Aas1kk <152005759+aa-sikkkk@users.noreply.github.com> Date: Wed, 18 Sep 2024 12:17:01 +0545 Subject: [PATCH 5/5] Update README.md --- README.md | 12 ++++++++++-- 1 file changed, 10 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 5ee3596..37e6537 100644 --- a/README.md +++ b/README.md @@ -13,6 +13,7 @@ WebScrape is a simple yet powerful Python-based web scraping tool that allows us - Displays existing scraped websites in a user-friendly table format. - Allows alias names for websites to manage and store scraped data. - Handles multiple websites and retains a history of scrapes. +- Available as both a web version and a CLI version. ## Google Collab You can find the google notebook from: [link](https://colab.research.google.com/drive/1t03WODhStp3oYeFthi4r9gZuNXCR31lE?usp=sharing) @@ -41,7 +42,8 @@ python scrap.py ## Data Storage -![1_poXvWu--59Gd64sRktAQGQ](https://github.com/user-attachments/assets/15011f46-de61-487c-85b2-c433c433b9a5) + + ``` @@ -67,8 +69,14 @@ Data Storage ``` +## Web Version of the Project +The web version of the project is powered by Django. + +![Screenshot 2024-09-18 120647](https://github.com/user-attachments/assets/389721fb-4a19-4c0c-9c90-e0dbab49c959) +![Screenshot 2024-09-18 120628](https://github.com/user-attachments/assets/06ec5a10-7210-4e00-b9c3-5c8a749048b5) + ## License -This project is licensed under the MIT License. See the LICENSE file for more details. +This project is licensed under the [MIT License](LICENSE). See the LICENSE file for more details. ## Contributing Feel free to fork the project and submit pull requests! If you encounter any issues, you can open an issue on the repository.