import requests
from bs4 import BeautifulSoup
def getpage(url):
    """Download *url* and return its HTML parsed into a BeautifulSoup tree.

    Args:
        url: Address of the page to fetch.

    Returns:
        A ``BeautifulSoup`` object built from the response text with the
        ``lxml`` parser.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # requests applies no timeout by default; without one a stalled server
    # would block the caller forever.
    response = requests.get(url, timeout=10)
    # Fail loudly on 4xx/5xx instead of parsing an error page as if it were
    # the requested content.
    response.raise_for_status()
    return BeautifulSoup(response.text, 'lxml')
def getlinks(link_url):
    """Collect the link target found inside every ``div.pic-panel`` of a page.

    Args:
        link_url: Address of the page to scan.

    Returns:
        A list of ``href`` strings in document order, one for each
        ``<div class="pic-panel">`` whose first ``<a>`` tag carries a
        non-empty ``href`` attribute. Panels without such a link are skipped.
    """
    # Reuse the shared fetch-and-parse helper rather than duplicating it.
    page = getpage(link_url)

    links = []
    for panel in page.find_all('div', class_='pic-panel'):
        anchor = panel.a
        # A panel with no <a> inside would otherwise raise AttributeError on
        # ``None.get`` and abort the whole scan.
        if anchor is None:
            continue
        href = anchor.get('href')
        # An anchor without an href has no usable target; leave it out
        # instead of returning None entries.
        if href:
            links.append(href)
    return links
# Listing index URL. No live code in this section uses it; presumably it is
# the intended argument for getlinks() -- confirm before removing.
url = 'https://bj.lianjia.com/zufang/'
# URL of one individual listing page; handed to get_house_info() by the
# script code at the bottom of this section.
house_url = 'https://bj.lianjia.com/zufang/101102926709.html'
def get_house_info(house_url):
    """Scrape one listing page into a dict of display-ready strings.

    The page is fetched with ``getpage``. The price and unit come from the
    ``span.total`` and ``span.unit`` elements; the remaining fields are cut
    out of the first seven ``<p>`` elements of the page by fixed character
    offsets (presumably to drop a leading label -- verify against the live
    page markup if the site layout changes).

    Args:
        house_url: Address of the listing detail page.

    Returns:
        A dict with these keys, in this order: '面積' (area), '分布' (layout),
        '樓層' (floor), '方向' (direction), '價格' (price), '單價' (unit),
        '地鐵' (location), '小區' (community location), '時間' (creation
        time). Any field whose source element is absent from the page is
        returned as an empty string instead of raising.
    """
    soup = getpage(house_url)

    def _span_text(css_class):
        # Text of the first <span> with the given class, or '' when the page
        # has no such element (find() returns None in that case).
        node = soup.find('span', class_=css_class)
        return node.text if node is not None else ''

    paragraphs = soup.find_all('p')

    def _paragraph_slice(index, start, stop=None):
        # Slice of the index-th <p> text, or '' when the page has fewer
        # paragraphs than expected.
        if index >= len(paragraphs):
            return ''
        return paragraphs[index].text[start:stop]

    price = _span_text('total')
    unit = _span_text('unit').strip()

    # Key order is preserved from the original dict literal because callers
    # iterate the result for display.
    return {
        '面積': _paragraph_slice(0, 3),
        '分布': _paragraph_slice(1, 5),
        '樓層': _paragraph_slice(2, 3),
        '方向': _paragraph_slice(3, 5),
        '價格': price,
        '單價': unit,
        '地鐵': _paragraph_slice(4, 3),
        # Only characters 3..6 of this paragraph are kept.
        '小區': _paragraph_slice(5, 3, 7),
        '時間': _paragraph_slice(6, 3),
    }
# Scrape the sample listing and print every field as "key:value", one per
# line, in the order the dict was built.
house = get_house_info(house_url)
for label in house:
    print('{}:{}'.format(label, house[label]))
# 免責聲明:本站發布的內容(圖片、視頻和文字)以原創、轉載和分享為主,文章觀點不代表本網站立場,如果涉及侵權請聯繫站長郵箱:is@yisu.com進行舉報,並提供相關證據,一經查實,將立刻刪除涉嫌侵權內容。