Why does scrapy still report "not recognized as an internal or external command" even after adding it to the environment variables?

I added it to Path under the system variables in the system settings, and to Path under the user variables as well; neither worked.
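
One quick diagnostic, assuming scrapy was installed with pip on Windows: check which interpreter is actually being used and whether the scrapy executable is visible on PATH. A minimal sketch:

    # PATH sanity check (assumes scrapy was installed with pip)
    import shutil
    import sys

    print(sys.executable)          # the Python interpreter currently in use
    print(shutil.which("scrapy"))  # None means scrapy's Scripts folder is not on PATH

If `shutil.which` returns None, the `Scripts` folder next to that interpreter is what needs to be on Path, and a new terminal must be opened afterwards, since an already-open console does not pick up PATH changes. As a workaround, recent Scrapy versions should also run as `python -m scrapy version` without relying on PATH at all.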

Not sure whether your problem has been solved yet; if not:
  • The section "Goal: scrape all theme-market products listed in the Mogujie homepage directory" of this blog post, scrapy: scraping the clothing under every market on Mogujie --- seize the chance to go shopping while protecting your wallet, may solve your problem; read the content below carefully, or jump straight to the original post:
    • Group by theme market
    • For each market, the recommended-title categories
      • Product image
      • Product link
      • Product price
      • Product title
    • Write the results to Excel (see the pipeline sketch after the code below)
    • Set up the Excel sheet and analyze the data

    The code is as follows (scrapy):

    # -*- coding: utf-8 -*-
    import collections
    import json
    import re
    from copy import deepcopy
    from pprint import pprint

    import scrapy
    
    
    class MushroomSpider(scrapy.Spider):
        name = 'mushroom'
        allowed_domains = ['www.mogu.com', 'list.mogu.com']
        start_urls = ['https://www.mogu.com/']
        # Source repo: https://gitee.com/hanzhou521/pachongxiangmu
        def parse(self, response):
            # Grab the name of every theme market
            theme_bazaar = response.xpath('//div[@class="cate-item-wrap"]/a/h3/text()').extract()
            # Theme market URLs; the first link is skipped
            theme_bazaar_url = response.xpath('//div[@class="cate-item-wrap"]/a/@href').extract()[1:]
            # zip() pairs names with URLs; list.index() would misbehave on duplicate names
            for name, url in zip(theme_bazaar, theme_bazaar_url):
                item = collections.OrderedDict()
                # Theme market name
                item['theme_bazaar'] = name
                # Theme market URL
                item['theme_bazaar_url'] = url
                # The market-detail endpoint returns JSON
                bazaar = url.split("/")[4]
                bazaar_url = "https://list.mogu.com/sync/menu?&action={}"
                # Market-detail URL captured by inspecting network traffic
                item["bazaar_details_url"] = bazaar_url.format(bazaar)
                yield scrapy.Request(
                    item['bazaar_details_url'],
                    callback=self.bazaar_details,
                    meta={"item": deepcopy(item)},
                )
    
        def bazaar_details(self, response):
            """Market details."""
            # Template for the per-category product listing URL
            jios_url = "https://list.mogu.com/search?cKey=15&page=1&fcid={}&action={}"
            # Extract the market name from the current URL
            bazaar = response.url.split("/")[4]
            item = response.meta["item"]
            data = json.loads(response.text)
            # pprint(data)
            for tree in data['data']['cateTree'].values():
                # Main recommended title
                item['recommend'] = tree['p']['title']
                for sub in tree['c']:
                    # Sub-category title
                    item['classify_title'] = sub['title']
                    # Sub-category URL
                    item['classify_url'] = "https://list.mogu.com" + sub['link']
                    # Sub-category id
                    item['classify_fcid'] = sub['fcid']
                    # Page counter, used for pagination later
                    item["index"] = 1
                    # Build the full listing URL, e.g.
                    # https://list.mogu.com/search?cKey=15&page=1&fcid=20004357&action=accessories
                    details_url = jios_url.format(item['classify_fcid'], bazaar)
                    yield scrapy.Request(
                        details_url,
                        callback=self.classify_details,
                        meta={"item": deepcopy(item)},
                        dont_filter=True
                    )
    
        def classify_details(self, response):
            """
            Handle product details: title, price, image.
            URL pattern: https://list.mogu.com/search?cKey=15&page=1&fcid=50243&action=clothing
            """
            item = response.meta["item"]
            response_ = json.loads(response.text)
            # Skip responses that carry no product wall
            docs = response_.get('result', {}).get('wall', {}).get('docs')
            if docs:
                for doc in docs:
                    # Product title
                    item['commodity_title'] = doc['title']
                    # Product image URL
                    item['commodity_img'] = doc['img']
                    # Product URL
                    item['commodity_link'] = doc['link']
                    # Original price
                    item['commodity_orgPrice'] = doc['orgPrice']
                    # Current price
                    item['commodity_price'] = doc['price']
                    # Yield a copy per product; yielding once after the loop
                    # would keep only the last product of each page
                    yield deepcopy(item)

                # Request the next page, capped at 100 pages per category
                item["index"] += 1
                if item["index"] <= 100:
                    next_url = re.sub(r"&page=(\d+)", "&page=%s" % item["index"], response.url)
                    yield scrapy.Request(
                        url=next_url,
                        callback=self.classify_details,
                        meta={"item": deepcopy(item)},
                    )
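
    The excerpt stops before the "write to Excel" step listed above. A minimal pipeline sketch follows, assuming openpyxl is available; the class name ExcelPipeline, the module path, and the output filename are all made up for illustration:

    # pipelines.py -- hypothetical Excel export built on openpyxl
    from openpyxl import Workbook

    FIELDS = ("theme_bazaar", "recommend", "classify_title", "commodity_title",
              "commodity_price", "commodity_orgPrice", "commodity_link", "commodity_img")


    class ExcelPipeline:
        def open_spider(self, spider):
            self.wb = Workbook()
            self.ws = self.wb.active
            # Header row mirroring the fields the spider collects
            self.ws.append(list(FIELDS))

        def process_item(self, item, spider):
            # One row per scraped product
            self.ws.append([item.get(k, "") for k in FIELDS])
            return item

        def close_spider(self, spider):
            self.wb.save("mogu_items.xlsx")

    Enable it via ITEM_PIPELINES = {"myproject.pipelines.ExcelPipeline": 300} in settings.py (the module path is an assumption), or skip the pipeline entirely and run scrapy crawl mushroom -o items.csv for a quick flat export.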
    

If you have already solved this problem, it would be great if you could share your solution as a blog post and put the link in the comments, to help more people ^-^