32 lines
746 B
Python
Executable File
32 lines
746 B
Python
Executable File
#!/usr/bin/env python3
|
|
import sys
|
|
from bs4 import BeautifulSoup
|
|
|
|
# Load the HTML to scan. The single command-line argument is either an
# http(s) URL to download or the path of a local file to read.
if len(sys.argv) < 2:
    # Fail with a usage message instead of an IndexError traceback.
    sys.exit("usage: {} <url-or-file>".format(sys.argv[0]))

if sys.argv[1].startswith(("http://", "https://")):
    # Imported here so that scanning a local file does not need requests.
    import requests

    # requests has no default timeout; without one an unresponsive server
    # would block this script indefinitely.
    response = requests.get(sys.argv[1], timeout=30)
    data = response.content
else:
    # ISO-8859-1 assigns a character to every byte value, so reading the
    # file as text cannot fail with a decode error.
    with open(sys.argv[1], 'rt', encoding='ISO-8859-1') as f:
        data = f.read()

# Parse with lxml and serialize the tree back to one string; the link scan
# further down works on this text.
page = str(BeautifulSoup(data, features="lxml"))
|
|
|
|
def getURL(page):
    """Return the first double-quoted value that follows ``a href`` in *page*.

    The search is purely textual: it looks for the literal ``a href`` and
    then for the next pair of double quotes after it.

    Args:
        page: The HTML text to search.

    Returns:
        A ``(url, end)`` tuple. ``url`` is the text between the quotes and
        ``end`` is the index of the closing quote in *page*, so a caller can
        continue the search from ``page[end:]``. ``(None, 0)`` is returned
        when ``a href`` does not occur, or when it is not followed by a
        complete pair of double quotes.
    """
    start_link = page.find("a href")
    if start_link == -1:
        return None, 0

    start_quote = page.find('"', start_link)
    if start_quote == -1:
        # No opening quote. Left unchecked, the next search would restart
        # from index 0 and the slice would return unrelated text.
        return None, 0

    end_quote = page.find('"', start_quote + 1)
    if end_quote == -1:
        # Unterminated value. Left unchecked, slicing up to -1 would drop the
        # last character and hand the caller a negative offset.
        return None, 0

    return page[start_quote + 1:end_quote], end_quote
|
|
|
|
|
|
# Print every link found in the page, one per line, consuming the page text
# from the front after each hit.
while True:
    url, n = getURL(page)
    # None means no further link. A non-positive offset would leave the page
    # unconsumed (or cut it from the wrong end), so it also ends the scan
    # rather than risk looping forever on the same text.
    if url is None or n <= 0:
        break
    page = page[n:]
    # An empty href="" yields an empty string. Skip printing it, but keep
    # scanning: testing only the truthiness of url would stop at the first
    # empty link and miss every link after it.
    if url:
        print(url)
|