I want to remove a specific <tr> block, together with its text, from my scraped output. When I run my script the output is almost perfect, but there is one problem: it also scrapes the header row <tr><td>Domain</td><td>Last Resolved Date</td></tr>
I don't want this row in my output, so how can I remove it? My code is below.
Update: I found a fix.
Old Code
Python
x
15
15
1
# Original attempt from the question: fetch the reverse-IP lookup page and
# print the text of every <td> that has no "align" attribute.
# As the question reports, this output also contains the header cells
# ("Domain", "Last Resolved Date"); that is the behaviour being asked about.
import requests
from bs4 import BeautifulSoup


# Send a browser-like User-Agent with the request.
headers = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
url = "https://viewdns.info/reverseip/?host=github.com&t=1"
text = requests.get(url, headers=headers).text
soup = BeautifulSoup(text, 'html.parser')

# The first table on the page with border="1" is taken as the results table.
table = soup.find('table', attrs={'border':'1'})
# attrs={'align': None} matches only <td> tags WITHOUT an align attribute.
domain = table.findAll('td', attrs={'align':None})

for line in domain:
    print(line.text)
15
Fixed
Python
1
15
15
1
# Fixed version: same scrape as before, but the header cells are dropped
# so that only the data cells are printed.
import requests
from bs4 import BeautifulSoup


# Send a browser-like User-Agent with the request.
headers = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
url = "https://viewdns.info/reverseip/?host=github.com&t=1"
text = requests.get(url, headers=headers).text
soup = BeautifulSoup(text, 'html.parser')

# The first table on the page with border="1" is taken as the results table.
table = soup.find('table', attrs={'border': '1'})
# attrs={'align': None} matches only <td> tags WITHOUT an align attribute.
# The first two matches are the header cells ("Domain" and
# "Last Resolved Date"), so slice them off with [2:].
# find_all is the current Beautiful Soup name for the legacy findAll alias.
domain = table.find_all('td', attrs={'align': None})[2:]

for line in domain:
    print(line.text)
15
Advertisement
Answer
Try the code below; it leaves out the header row (Domain / Last Resolved Date) and prints only the data cells.
Python
1
15
15
1
"""Print the cells of the viewdns.info reverse-IP result table, without the header row."""
import sys

import requests
from bs4 import BeautifulSoup


# Send a browser-like User-Agent with the request.
headers = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
url = "https://viewdns.info/reverseip/?host=github.com&t=1"

# A timeout stops the script from hanging on a stalled connection, and
# raise_for_status() turns HTTP error responses into an exception instead of
# silently parsing an error page.
response = requests.get(url, headers=headers, timeout=30)
response.raise_for_status()
text = response.text
soup = BeautifulSoup(text, 'html.parser')

# The first table on the page with border="1" is taken as the results table.
table = soup.find('table', attrs={'border': '1'})
if table is None:
    # soup.find returns None when nothing matches; fail with a clear message
    # rather than an AttributeError on the next line.
    sys.exit("Result table not found: the page layout may have changed "
             "or the request was blocked.")

# Skip the first <tr> (assumed to be the header row holding "Domain" and
# "Last Resolved Date") instead of slicing off a fixed number of cells, so the
# script keeps working if the header gains or loses a column.
# attrs={'align': None} matches only <td> tags WITHOUT an align attribute.
domain = [
    cell
    for row in table.find_all('tr')[1:]
    for cell in row.find_all('td', attrs={'align': None})
]

for line in domain:
    print(line.text)
15