import re
from urllib.parse import quote
from urllib.request import urlopen

from bs4 import BeautifulSoup
# Fetch the Chinese Wikipedia main page and print every internal link as
# "<link text> <-----> <absolute URL>", skipping links whose href ends in
# ".jpg" / ".JPG".

# Site origin; the hrefs matched below are site-relative ("/wiki/...").
BASE_URL = "https://zh.wikipedia.org"

# The page title contains non-ASCII characters. urlopen() sends the request
# line as ASCII and raises UnicodeEncodeError on a raw title, so the path is
# percent-encoded first. ":" is kept literal so the namespace prefix stays
# readable in the final URL.
START_URL = BASE_URL + quote("/wiki/Wikipedia:首页", safe="/:")

# Compiled once, outside the loop. Raw string so that "\." reaches the regex
# engine as an escaped dot instead of being an invalid string escape.
JPG_SUFFIX = re.compile(r"\.(jpg|JPG)$")

# The context manager closes the HTTP response as soon as the body is read.
with urlopen(START_URL) as response:
    resp = response.read().decode("utf-8")

soup = BeautifulSoup(resp, "html.parser")

# Every <a> tag whose href starts with "/wiki/".
listUrl = soup.find_all("a", href=re.compile(r"^/wiki/"))

for link in listUrl:
    href = link["href"]
    if JPG_SUFFIX.search(href):
        # Link to a JPEG file rather than a page: skip it.
        continue
    print(link.get_text(), "<----->", BASE_URL + href)