Commit c37739a2 by lichenggang

add testmart

parent 2919eafc
Showing with 3 additions and 3 deletions
from utils.base import Module_Base
from utils.proxy_util import proxies
-domain = 'http:'
+domain = 'https://www.testmart.cn'
headers = {
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/72.0.3626.121 Safari/537.36",
}
......@@ -23,7 +23,7 @@ def get_levels(level1_doms):
for level1_dom in level1_doms:
level1 = dict()
level1['cat_name'] = level1_dom[0].xpath('.//a[1]/text()')[0].strip()
-level1['url'] = level1_dom[0].xpath('.//a[1]/@href')[0]
+level1['url'] = domain + level1_dom[0].xpath('.//a[1]/@href')[0]
level1['level'] = 1
level1['islast'] = 0
level1['parent_id'] = 0
......@@ -32,7 +32,7 @@ def get_levels(level1_doms):
for level2_dom in level1_dom[1].xpath('.//a'):
level2 = {}
level2['cat_name'] = level2_dom.xpath('./text()')[0].strip()
-level2['url'] = level2_dom.xpath('./@href')[0]
+level2['url'] = domain + level2_dom.xpath('./@href')[0]
level2['level'] = 2
level2['islast'] = 1
level1['level2_list'].append(level2)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment