!pip install openpyxl
import requests
from bs4 import BeautifulSoup
from openpyxl import Workbook
def get_search_list(keyword=None, page=1, timeout=10):
    """Request one page of merchant search results and print the outcome.

    Sends a GET request to the business-listing URL and prints the final
    request URL followed by the HTTP status code. Nothing is returned.

    Args:
        keyword: Search term, sent as the ``keyword`` query parameter.
        page: Page number, sent as the ``pageid`` query parameter.
        timeout: Seconds to wait for the server before ``requests`` raises
            a timeout error. Pass ``None`` to wait indefinitely, which is
            what happened before this parameter existed.
    """
    url = 'http://www.mailiangwang.com/biz/list'
    payload = {'keyword': keyword, 'pageid': page}
    # requests never times out on its own; without an explicit timeout an
    # unresponsive server would block this call forever.
    response = requests.get(url, params=payload, timeout=timeout)
    # The URL shown includes the encoded query string built from `payload`.
    print(response.url)
    print(response.status_code)
# Probe the first result page for the keyword 玉米 (corn).
get_search_list(keyword=u'玉米', page=1)

# Module-level accumulators filled by the scraping version of
# get_search_list; each scraped row appends one entry to every list.
name_total, caption_total, addr_total, category_total = [], [], [], []
def get_search_list(keyword=None, page=1, timeout=10):
    """Scrape one page of merchant search results into the module-level lists.

    Fetches the business-listing page for ``keyword`` / ``page``, parses the
    HTML with BeautifulSoup, and for every result row appends the link title,
    caption, address and category to ``name_total``, ``caption_total``,
    ``addr_total`` and ``category_total`` respectively. Nothing is returned.

    Args:
        keyword: Search term, sent as the ``keyword`` query parameter.
        page: Page number, sent as the ``pageid`` query parameter.
        timeout: Seconds to wait for the server before ``requests`` raises
            a timeout error. Pass ``None`` to wait indefinitely.
    """
    url = 'http://www.mailiangwang.com/biz/list'
    payload = {'keyword': keyword, 'pageid': page}
    # requests never times out on its own; without an explicit timeout an
    # unresponsive server would block this call forever.
    response = requests.get(url, params=payload, timeout=timeout)
    soup = BeautifulSoup(response.text, 'lxml')

    # All four selectors must walk the same container chain
    # (div.wrap > div.merchantList > div.p_dataList > div.p_dataItem).
    # A misspelled or missing level makes select() return an empty list,
    # and zip() below would then silently yield no rows at all.
    links = soup.select('body>div.wrap >div.merchantList >div.p_dataList >div.p_dataItem >span.n1 >a')
    captions = soup.select('body > div.wrap > div.merchantList > div.p_dataList > div.p_dataItem > span.n4')
    addrs = soup.select('body > div.wrap >div.merchantList >div.p_dataList >div.p_dataItem > span.n5')
    categories = soup.select('body > div.wrap >div.merchantList >div.p_dataList >div.p_dataItem >span.n6')

    # zip() stops at the shortest list, so the four accumulators always grow
    # by the same number of entries.
    for link, caption, addr, category in zip(links, captions, addrs, categories):
        # NOTE(review): link.get('title') is None when the attribute is
        # absent, in which case .strip() raises AttributeError.
        name_total.append(link.get('title').strip())
        caption_total.append(caption.text)
        addr_total.append(addr.text)
        category_total.append(category.text)
# Scrape the first result page for 玉米 (corn), then show what was collected.
get_search_list(keyword='玉米', page=1)
for collected in (name_total, caption_total):
    print(collected)
!pip install openpyxl
import requests
from bs4 import BeautifulSoup
from openpyxl import Workbook
def get_search_list(keyword=None, page=1, timeout=10):
    """Request one page of merchant search results and print the outcome.

    Sends a GET request to the business-listing URL and prints the final
    request URL followed by the HTTP status code. Nothing is returned.

    Args:
        keyword: Search term, sent as the ``keyword`` query parameter.
        page: Page number, sent as the ``pageid`` query parameter.
        timeout: Seconds to wait for the server before ``requests`` raises
            a timeout error. Pass ``None`` to wait indefinitely, which is
            what happened before this parameter existed.
    """
    url = 'http://www.mailiangwang.com/biz/list'
    payload = {'keyword': keyword, 'pageid': page}
    # requests never times out on its own; without an explicit timeout an
    # unresponsive server would block this call forever.
    response = requests.get(url, params=payload, timeout=timeout)
    # The URL shown includes the encoded query string built from `payload`.
    print(response.url)
    print(response.status_code)
# Probe the first result page for the keyword 玉米 (corn).
get_search_list(keyword=u'玉米', page=1)

# Fresh module-level accumulators for the scraper defined next; every
# scraped row contributes one entry to each of the four lists.
name_total, caption_total = [], []
addr_total, category_total = [], []
def get_search_list(keyword=None, page=1, timeout=10):
    """Scrape one page of merchant search results into the module-level lists.

    Fetches the business-listing page for ``keyword`` / ``page``, parses the
    HTML with BeautifulSoup, and for every result row appends the link title,
    caption, address and category to ``name_total``, ``caption_total``,
    ``addr_total`` and ``category_total`` respectively. Nothing is returned.

    Args:
        keyword: Search term, sent as the ``keyword`` query parameter.
        page: Page number, sent as the ``pageid`` query parameter.
        timeout: Seconds to wait for the server before ``requests`` raises
            a timeout error. Pass ``None`` to wait indefinitely, which is
            what happened before this parameter existed.
    """
    url = 'http://www.mailiangwang.com/biz/list'
    payload = {'keyword': keyword, 'pageid': page}
    # requests never times out on its own; without an explicit timeout an
    # unresponsive server would block this call forever.
    response = requests.get(url, params=payload, timeout=timeout)
    soup = BeautifulSoup(response.text, 'lxml')

    # Each selector walks the same container chain and differs only in the
    # final <span> class that holds the field.
    links = soup.select('body>div.wrap >div.merchantList >div.p_dataList >div.p_dataItem >span.n1 >a')
    captions = soup.select('body > div.wrap > div.merchantList > div.p_dataList > div.p_dataItem > span.n4')
    addrs = soup.select('body > div.wrap > div.merchantList >div.p_dataList >div.p_dataItem > span.n5')
    categories = soup.select('body > div.wrap > div.merchantList >div.p_dataList >div.p_dataItem >span.n6')

    # zip() stops at the shortest list, so the four accumulators always grow
    # by the same number of entries.
    for link, caption, addr, category in zip(links, captions, addrs, categories):
        # NOTE(review): link.get('title') is None when the attribute is
        # absent, in which case .strip() raises AttributeError.
        name_total.append(link.get('title').strip())
        caption_total.append(caption.text)
        addr_total.append(addr.text)
        category_total.append(category.text)
# Scrape the first result page for 玉米 (corn), then show what was collected.
get_search_list(keyword='玉米', page=1)
for collected in (name_total, caption_total):
    print(collected)