# Print every image URL that lives under the weathernews topics image
# directory.
#
# The pattern is a raw string with the host dots escaped so that "." only
# matches a literal dot, and it is compiled once instead of on every iteration.
topic_image_re = re.compile(r'https://smtgvs\.weathernews\.jp/s/topics/img/.+')

for image in images:
    # NOTE(review): assumes each item supports .get() (bs4 Tag or dict).
    # Indexing with image['src'] raises KeyError for an <img> that has no
    # src attribute, so such tags are skipped instead of aborting the loop.
    src = image.get('src')
    if src is None:
        continue
    # Resolve a possibly relative src against the page URL before matching.
    imageURL = topic_image_re.findall(urljoin(baseURL, src))
    if imageURL:
        print(imageURL)
# Print topics image URLs with their trailing numeric query string removed.
#
# The capture group keeps everything before "?<digits>", so findall() returns
# only the URL part. The pattern is a raw string: in a normal string literal
# "\?" is an invalid escape sequence that triggers a warning on modern Python.
# The host dots are escaped so they match only a literal ".".
topic_image_path_re = re.compile(
    r"(https://smtgvs\.weathernews\.jp/s/topics/img/[0-9]+/.+)\?[0-9]+"
)

for image in images:
    # NOTE(review): assumes each item supports .get() (bs4 Tag or dict).
    # Indexing with image['src'] raises KeyError for an <img> that has no
    # src attribute, so such tags are skipped instead of aborting the loop.
    src = image.get('src')
    if src is None:
        continue
    # Resolve a possibly relative src against the page URL before matching.
    imageURL = topic_image_path_re.findall(urljoin(baseURL, src))
    if imageURL:
        print(imageURL)
编辑:要获取 data-original 属性的值,而不是 src 字段:
# Parse the page and print the data-original attribute of every <img> tag.
# Tags that do not carry the attribute print None, because .get() returns
# None for a missing attribute.
soup = BeautifulSoup(html_doc, 'html.parser')
original_sources = (
    img_tag.get("data-original") for img_tag in soup.find_all("img")
)
for original_source in original_sources:
    print(original_source)