Skip to content
This repository was archived by the owner on Jun 29, 2024. It is now read-only.
Prev Previous commit
Next Next commit
create task2
  • Loading branch information
meghanak124 committed May 23, 2024
commit 62573f1dac60f68f732c70e1aded5b1b5c8aa099
5 changes: 5 additions & 0 deletions MeghanaK/output1.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
Title
S,e,a,r,c,h, ,c,o,d,e,",", ,r,e,p,o,s,i,t,o,r,i,e,s,",", ,u,s,e,r,s,",", ,i,s,s,u,e,s,",", ,p,u,l,l, ,r,e,q,u,e,s,t,s,.,.,.
P,r,o,v,i,d,e, ,f,e,e,d,b,a,c,k
S,a,v,e,d, ,s,e,a,r,c,h,e,s
L,e,t,’,s, ,b,u,i,l,d, ,f,r,o,m, ,h,e,r,e
48 changes: 48 additions & 0 deletions MeghanaK/task2.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,48 @@
import requests
from bs4 import BeautifulSoup
import csv
import json

def scrape_website(url, timeout=10):
    """Download a web page and return the text of each ``<h1>`` element.

    Args:
        url: Address of the page to fetch.
        timeout: Seconds to wait for the server before giving up. Without
            an explicit timeout ``requests`` can wait indefinitely on a
            server that never answers.

    Returns:
        A list of strings, one per ``<h1>`` tag found, each with leading
        and trailing whitespace removed.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server responds with a 4xx/5xx status code.
    """
    response = requests.get(url, timeout=timeout)
    # Fail loudly on HTTP errors rather than scraping headings from an
    # error page and saving them as if they were the requested content.
    response.raise_for_status()

    soup = BeautifulSoup(response.text, 'html.parser')
    return [heading.text.strip() for heading in soup.find_all('h1')]

def save_to_csv(data, filename):
    """Write scraped titles to a CSV file under a single ``Title`` header.

    Args:
        data: Iterable of titles. Each plain string becomes one single-column
            row; items that are already sequences (lists/tuples) are written
            as rows unchanged.
        filename: Path of the CSV file to create or overwrite.
    """
    # csv.writer treats every row as an iterable of fields, so handing it a
    # bare string would emit one field per character ("S,e,a,r,c,h,...").
    # Wrap strings in a one-element list to keep each title in a single cell.
    rows = ([item] if isinstance(item, str) else item for item in data)

    with open(filename, 'w', newline='', encoding='utf-8') as csvfile:
        writer = csv.writer(csvfile)
        writer.writerow(['Title'])
        writer.writerows(rows)

def save_to_json(data, filename):
    """Serialize ``data`` as JSON into ``filename``.

    The file is created or overwritten, encoded as UTF-8, and the JSON is
    pretty-printed with a four-space indent.
    """
    with open(filename, mode='w', encoding='utf-8') as out_handle:
        json.dump(obj=data, fp=out_handle, indent=4)

def main():
    """Run the interactive scraper: prompt, fetch, and save the titles.

    Asks for a URL and an output format ('csv' or 'json'), scrapes the page
    with ``scrape_website``, then asks for a base filename and writes the
    result with ``save_to_csv`` or ``save_to_json``. An unrecognized format
    prints a message and returns before any network request is made.
    """
    # Strip stray whitespace so input such as "csv " or " https://..." is
    # accepted instead of being rejected or passed on verbatim.
    url = input("Enter the URL of the website you want to scrape: ").strip()

    output_format = input("Enter 'csv' or 'json' to choose the output format: ").strip().lower()

    # One saver per supported format; the key doubles as the file extension,
    # which removes the previously duplicated csv/json branches.
    savers = {'csv': save_to_csv, 'json': save_to_json}
    save = savers.get(output_format)
    if save is None:
        print("Invalid output format. Please enter 'csv' or 'json'.")
        return

    extracted_data = scrape_website(url)

    base_name = input("Enter the filename to store the data (without extension): ").strip()
    filename = f"{base_name}.{output_format}"
    save(extracted_data, filename)
    print(f"Data has been saved to {filename}")


# Only start the interactive prompt when executed as a script, not on import.
if __name__ == "__main__":
    main()