"""
@time: 2021/9/1 13:48
"""
from urllib.parse import urlparse, urlunparse, parse_qs, urlencode
def replace_field(url, name, value):
    """Return *url* with the query parameter *name* set to *value*.

    If *name* is already present in the query string, all of its existing
    values are replaced; otherwise the parameter is appended. Every other
    URL component (scheme, host, path, params, fragment) is carried over
    unchanged.

    Args:
        url: The URL whose query string should be modified.
        name: Name of the query parameter to set.
        value: New value for the parameter. A sequence of values is
            expanded into repeated ``name=item`` pairs (``doseq=True``).

    Returns:
        The rebuilt URL as a string. Note that the query string is
        re-encoded by ``urlencode``, so its percent-encoding may be
        normalized compared to the input.
    """
    parts = urlparse(url)
    # keep_blank_values=True so that unrelated parameters with an empty
    # value (e.g. "?flag=&after=x") are not silently dropped from the URL.
    params = parse_qs(parts.query, keep_blank_values=True)
    params[name] = value
    # doseq=True expands the value lists produced by parse_qs back into
    # individual key=value pairs instead of encoding the list's repr.
    new_query = urlencode(params, doseq=True)
    return urlunparse(parts._replace(query=new_query))
if __name__ == '__main__':
    # Demo: set the 'after' paging parameter on URLs where it is missing,
    # empty, already populated, or followed by another parameter.
    url_list = [
        'https://xxx.com/articlelist?category=technology',
        'https://xxx.com/articlelist?category=technology&after=',
        'https://xxx.com/articlelist?category=technology&after=asdrtJKSAZFD',
        'https://xxx.com/articlelist?category=technology&after=asdrtJKSAZFD&other=abc',
    ]
    for sample_url in url_list:
        print(replace_field(sample_url, 'after', '0000000'))