爬蟲 BeautifulSoup 蛋殼公寓租房

import re

import requests
from bs4 import BeautifulSoup
def get_page_info(page=1):
    """Fetch one listing page and print the discount text of every listing.

    The page is downloaded with ``requests``, parsed with BeautifulSoup's
    ``html.parser`` backend, and each listing container is inspected for its
    title, link, price, station description, area text and discount label.
    Only the discount label is printed; the other fields are extracted but
    not used further.

    NOTE(review): in the published snippet the base URL is an empty string
    and the values of ``headers=`` and of every ``attrs=`` argument are
    missing (the dict literals were lost). The empty dicts below are
    placeholders that only keep the function syntactically valid -- fill in
    the real URL, request headers and CSS-class selectors before running.

    Args:
        page: Page number appended to the base URL. Defaults to 1.

    Returns:
        None. The discount text of each listing is written to stdout.
    """
    # TODO: base URL is empty in SOURCE; requests will reject it as-is.
    url = "" + str(page)
    # TODO: request headers (presumably a User-Agent) are missing in SOURCE.
    headers = {}
    r = requests.get(url, headers=headers)
    soup = BeautifulSoup(r.text, 'html.parser')

    # TODO: selector for the per-listing container is missing in SOURCE.
    house_list = soup.find_all("div", attrs={})
    for once in house_list:
        # TODO: each attrs={} below stands in for a selector lost in SOURCE.
        house_name = once.find("div", attrs={}).a.attrs['title']
        house_url = once.find("div", attrs={}).a.attrs['href']
        house_price = once.find("span", attrs={}).text.strip()
        # The station description is the first node inside the matched div.
        house_station_info = once.find("div", attrs={}).next_element.strip()

        # First text node containing the square-metre sign, whitespace removed.
        house_info4 = once.find(text=re.compile("㎡"))
        house_info4 = re.sub(r"\s", '', house_info4)

        try:
            house_discount = once.find("div", attrs={}).text
            # Strip all whitespace, then drop the trailing two characters.
            house_discount = re.sub(r"\s", '', house_discount)[:-2]
        except AttributeError:
            # find() returned None: this listing has no discount element.
            house_discount = "暫無優惠"
        print(house_discount)
# Scrape listing pages 1 through 4 (the upper bound of range() is exclusive).
for page in range(1, 5):
    get_page_info(page)
# import re
# str1="距5號環中線,10號線五和站400公尺"
# str2="距3號龍崗線六約站250公尺"
# str3="距1號羅寶線,3號龍崗線購物公園站850公尺"
# str4="距2號蛇口線,9號線景田站500公尺"
# str5="距9號線香梅站200公尺"
# regex="距(?:(\d+)號([\u4e00-\u9fa5]*)線,)?(\d+)號([\u4e00-\u9fa5]*)線([\u4e00-\u9fa5]*)站(\d+)公尺"
# print(re.search(regex,str1).groups())
# print(re.search(regex,str2).groups())
# print(re.search(regex,str3).groups())
# print(re.search(regex,str4).groups())
# print(re.search(regex,str5).groups())

c:\anaconda3\python.exe d: /ai/ 01-ai基礎/ai- 3-python高階/ 01爬蟲ppt/day3_lxml和動態請求/demo1-蛋殼公寓beautifulsoup.py 暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠暫無優惠

process finished with exit code 0

爬蟲 BeautifulSoup 蛋殼公寓租房

爬蟲 BeautifulSoup 模組

爬蟲beautifulsoup實踐

爬蟲資料 Beautiful Soup

爬蟲 BeautifulSoup 蛋殼公寓租房

爬蟲 BeautifulSoup 模組

爬蟲beautifulsoup實踐

爬蟲資料 Beautiful Soup

相關推薦