Skip to content

PyWebScrape #1

@MohammadRijwan

Description

@MohammadRijwan

import requests
from bs4 import BeautifulSoup

def news():
    """Print the news snippets from the Hindustan Times top-news page.

    Fetches the page with an HTTP GET, parses it with Python's built-in
    HTML parser, and prints the text of every ``<div class="para-txt">``
    located inside the first ``<div>`` of the document.

    Prints ``"Error"`` when the request fails (connection problem,
    timeout, ...) or when the server answers with a status other than 200.

    Returns:
        None. All output is written to stdout.
    """
    # The target page we want to open.
    url = 'http://www.hindustantimes.com/top-news'

    # Open with the GET method. A timeout keeps the script from hanging
    # forever on an unresponsive server; network failures are reported the
    # same way as a bad status code.
    try:
        resp = requests.get(url, timeout=10)
    except requests.RequestException:
        print("Error")
        return

    # HTTP status 200 means OK; anything else is treated as a failure.
    if resp.status_code != 200:
        print("Error")
        return

    print("Successfully opened the web page")
    print("The news are as follow :-\n")

    # Python's built-in HTML parser is enough for this page.
    soup = BeautifulSoup(resp.text, 'html.parser')

    # The search is scoped to the first <div> of the document. find()
    # returns None when the page has no <div> at all, in which case there
    # is nothing to print.
    container = soup.find("div")
    if container is None:
        return

    # Print only the text part of each matching news element.
    for item in container.find_all("div", {"class": "para-txt"}):
        print(item.text)

# Run the scraper once when this script is executed.
news()

Metadata

Metadata

Assignees

No one assigned

    Labels

    No labels
    No labels

    Projects

    No projects

    Milestone

    No milestone

    Relationships

    None yet

    Development

    No branches or pull requests

    Issue actions