mirror of
https://github.com/d0zingcat/NotionNext.git
synced 2026-05-14 15:09:22 +00:00
19 lines
577 B
Python
19 lines
577 B
Python
import re
|
|
import ssl
|
|
import requests
|
|
import argparse
|
|
|
|
|
|
def extract_locations(sitemap_xml):
    """Return the text of every ``<loc>`` element found in *sitemap_xml*.

    Args:
        sitemap_xml: The sitemap document as a decoded string.

    Returns:
        A list of the ``<loc>`` contents in document order, each with
        surrounding whitespace removed. Empty when no ``<loc>`` is present.
    """
    # re.S lets '.' span newlines so pretty-printed <loc> elements still
    # match; strip() then drops the indentation/newlines captured with them.
    return [
        loc.strip()
        for loc in re.findall(r'<loc>(.*?)</loc>', sitemap_xml, re.S)
    ]


def main():
    """Fetch ``<url>/sitemap.xml`` and print each ``<loc>`` entry on its own line.

    The site URL is read from the single positional command-line argument.

    Raises:
        SystemExit: If the sitemap cannot be downloaded (connection error,
            timeout, or a non-success HTTP status).
    """
    # NOTE(review): this patches the stdlib default HTTPS context (used by
    # urllib / http.client) to skip certificate verification. `requests` does
    # not consult this hook, so it looks like a no-op for the download below;
    # kept only to preserve the existing side effect -- confirm and remove.
    ssl._create_default_https_context = ssl._create_unverified_context

    parser = argparse.ArgumentParser(description='parse sitemap')
    parser.add_argument('url', help='The url of your website')
    args = parser.parse_args()

    # Drop trailing slashes so 'https://host/' does not become
    # 'https://host//sitemap.xml'.
    url = f"{args.url.rstrip('/')}/sitemap.xml"

    try:
        # A timeout keeps the script from hanging forever on a dead host.
        result = requests.get(url, timeout=30)
        # Fail loudly on 4xx/5xx instead of regex-scanning an error page.
        result.raise_for_status()
    except requests.RequestException as err:
        raise SystemExit(f'failed to fetch {url}: {err}') from err

    for loc in extract_locations(result.content.decode('utf-8')):
        print(loc)


if __name__ == '__main__':
    main()