<!--

 111111111111111111111111111111111111111111111110000111111111111111111111111111111111111111111
 111111111111111111111111111111111111111111111000011111111111111111111111111111111111111111111
 111111111111111111111111111111111111111111100000011111111111111111111111111111111111111111111
 111111111111111111111111111111111111111110000001111000110000000000000001111111111111111111111
 111111111111111111111111111111110000000000000000000000000000000001111111111111111111111111111
 111111111111111111111111111111011100000000000000000000000000001111111111111111111111111111111
 111111111111111111111111111111111111100000000000000000000000000000000011111111111111111111111
 111111111111111111111111111111111000000000000000000000000000000011111111111111111111111111111
 111111111111111111111111111111110001110000000000000000000000000000011111111111111111111111111
 111111111111111111111111111110000011000000000001100000000000000000001111111111111111111111111
 111111111111111111111111111100000000000000010011110000000000000110000011111111111111111111111
 111111111111111111111111000000000000000000111011111000000000000011100001111111111111111111111
 111111111111111111111100000000000000000001111111110000000000000001111000111111111111111111111
 111111111111111111111000000001111111111111111111110000000000000000111110011111111111111111111
 111111111111111111111100000111111111111111111111000000000000000000111111111111111111111111111
 111111111111111111111111011111111111111111110000000000000000000000011111111111111111111111111
 111111111111111111111111111111000000000000000000000000000000000000011111111111111111111111111
 111111111111111111111111111111110000000000000000000000000000110000011111111111111111111111111
 111111111111111111111111111100000000000000000000000000000011110000011111111111111111111111111
 111111111111111111111111100000000000000000000000000000000111111000011111111111111111111111111
 111111111111111111111110000000000000000000000000000000111111111000011111111111111111111111111
 111111111111111111111000000000000000000000000000000011111111111000011111111111111111111111111
 111111111111111111110000000000000000000111000000111111111111111000111111111111111111111111111
 111111111111111111100000000000000001111111111111111111111111111001111111111111111111111111111
 111111111111111111000000000000000111111111111111110011111111111111111111111111111111111111111
 111111111111111110000000000000001111111111111111111110000111111111111111111111111111111111111
 111111111111111110000000000100011111111111111111111111100000111111111111111111111111111111111
 111111111111111100000000000110011111111111111111111111111000000011111111111111111111111111111
 111111111111111100000000000011101111111111110001111100001110000000111111111111111111111111111
 111111111111111100000000000001111111111111111100011111000000000000001111111111111111111111111
 111111111111111100000000000000001111111111111100000000000000000000000011111111111111111111111
 111111111111111100100000000000000000111111111000000000000000000000000000111111111111111111111
 111111111111111110011000000000000111111111000000000000000011100000000000011111111111111111111
 111111111111111111011000000000000000000000000000000000011111111111000000001111111111111111111
 111111111111111111111000000000000000000000000000000000111111111111110000000111111111111111111
 111111111111111111111000001000000000000000000110000000011101111111111000000111111111111111111
 111111111111111111111100011111000000000000011111000000000011111111111011000011111111111111111
 111111111111111111111000111111110001000000000111110000011111111111111111000011111111111111111
 111111111111111111111000111111111111111000000011111110000000011111111111100011111111111111111
 111111111111111111111100111111111111111111100000011111111111111111111111110001111111111111111

 -   ----------------------------------   神龙保佑，永无BUG   ------------------------------------   -
    Star me on Gitee - https://gitee.com/yadong.zhang/DBlog
    yadong.zhang (yadong.zhang0415#gmail.com)
    https://docs.zhyd.me
    如有问题请加QQ群(190886500)，备注：dblog
 -   ----------------------------------   神龙保佑，永无BUG   ------------------------------------   -
-->
<!DOCTYPE HTML>
<html lang="zh-CN">
<head>
    <meta charset="utf-8">
    <meta name="viewport" content="width=device-width, initial-scale=1">
    <meta http-equiv="X-UA-Compatible" content="IE=edge,chrome=1"/>
    <title>Python爬虫Scrapy | 咖啡豆日记</title>
    <meta name="author" content="咖啡豆(747277306@qq.com)">
    <meta name="keywords" content="Python,爬虫,Scrapy,咖啡豆日记"/>
    <meta name="description" content="1.简介
1.1Scrapy
Scrapy是一个用于Web数据抓取的强大开源框架，主要用于从网站上抓取结构化数据，如HTML和XML文件，或者API返回的数据。Scrapy使用Python语言编写，它不仅仅是一个简单的网页抓取工具，而是包含了自动化、灵活的数据处理、数据存储等功能的完整框架。Scrapy的设计理念是模块化和可扩展的，支持中间件、Item Pipelines、信号和事件，以及多种数据" id="meta_description">
    <link rel="canonical" href="https://lanzi.cyou/article/10" />
    <link href="https://lanzi.cyou/img/favicon.ico" rel="shortcut icon" type="image/x-icon">
        <link href="https://cdn.bootcdn.net/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" rel="stylesheet" type="text/css">
        <link href="https://cdn.bootcdn.net/ajax/libs/twitter-bootstrap/3.3.5/css/bootstrap.min.css" rel="stylesheet">
        <link href="https://cdn.bootcdn.net/ajax/libs/jquery-confirm/3.3.2/jquery-confirm.min.css" rel="stylesheet">
        <link href="https://cdn.bootcdn.net/ajax/libs/fancybox/2.1.5/jquery.fancybox.min.css" rel="stylesheet">
        <link href="https://cdn.bootcdn.net/ajax/libs/jquery.bootstrapvalidator/0.5.3/css/bootstrapValidator.min.css" rel="stylesheet">
        <link href="https://cdn.bootcdn.net/ajax/libs/nprogress/0.2.0/nprogress.min.css" rel="stylesheet">
    <link href="https://lanzi.cyou/css/zhyd.core.css" rel="stylesheet" type="text/css">
    <link href="https://lanzi.cyou/css/zhyd.comment.css" rel="stylesheet" type="text/css">
        <link href="https://cdn.jsdelivr.net/npm/simplemde@1.11.2/dist/simplemde.min.css" rel="stylesheet">
        <link href="https://cdn.jsdelivr.net/npm/github-markdown-css@2.10.0/github-markdown.min.css" rel="stylesheet">
        <link href="https://cdn.jsdelivr.net/npm/highlight.js@9.12.0/styles/github.min.css" rel="stylesheet">
    <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/social-share.js@1.0.16/dist/css/share.min.css" />

    <style type="text/css">
        
    </style>
</head>
<body>
<nav id="topmenu" class="navbar navbar-default navbar-fixed-top">
    <div class="menu-box">
        <div class="pull-left">
            <ul class="list-unstyled list-inline">
                <li><span id="currentTime"></span></li>
            </ul>
            <div class="clear"></div>
        </div>
        <div class="menu-topmenu-container pull-right">
            <ul class="list-unstyled list-inline pull-left">
                <li><a href="https://lanzi.cyou/about" class="menu_a" title="关于博客" data-toggle="tooltip" data-placement="bottom">关于本站</a></li>
                <li><a href="https://lanzi.cyou/links" class="menu_a" title="友情链接" data-toggle="tooltip" data-placement="bottom">友情链接</a></li>
            </ul>
                <ul class="list-unstyled list-inline pull-left">
                    <li><a href="javascript:;;" data-toggle="modal" data-target="#oauth" rel="nofollow" title="授权登录">登录</a></li>
                </ul>
        </div>
    </div>
</nav>
<div class="modal" id="oauth" tabindex="-1" role="dialog" aria-labelledby="oauthTitle">
    <div class="modal-dialog" role="document">
        <div class="modal-content">
            <div class="modal-header">
                <button type="button" class="close" data-dismiss="modal" aria-label="Close"><span aria-hidden="true">&times;</span></button>
                <ul class="list-inline">
                    <li><h4 class="modal-title" id="oauthTitle">登录</h4></li>
                    <li><a href="javascript:$.alert.info('没用，别点了！我就没打算开发这个功能。Just to show you~~~');"><h4 class="modal-title" id="myModalLabel">注册</h4></a></li>
                </ul>
            </div>
            <div class="modal-body">
                <div class="oauth">
                    <ul class="list-unstyled list-inline oauth-list" style="text-align: center;">
                                <li>
                                    稍等一下，博主正在快马加鞭地配置~~
                                </li>
                    </ul>
                    <div class="oauth-line">
                        <span style="font-size: 12px">
                            Powered by <a href="https://gitee.com/fujieid/jap" target="_blank">JustAuthPlus(JAP)</a>
                        </span>
                    </div>
                </div>
            </div>
        </div>
    </div>
</div>
<nav id="mainmenu" class="navbar navbar-default navbar-fixed-top" role="navigation">
    <div class="menu-box">
        <div class="navbar-header">
            <span class="pull-right nav-search toggle-search" data-toggle="modal" data-target=".nav-search-box"><i class="fa fa-search"></i></span>
            <button class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false" aria-controls="navbar">
                <span class="sr-only">Toggle navigation</span>
                <span class="icon-bar"></span>
                <span class="icon-bar"></span>
                <span class="icon-bar"></span>
            </button>
            <a class="navbar-brand" href="#">
                <img alt="Brand" src="https://lanzi.cyou/img/favicon.ico">咖啡豆日记
            </a>
        </div>
        <div id="navbar" class="navbar-collapse collapse">
            <div class="pull-left site-desc">
                <h1 class="auto-shake"><a href="https://lanzi.cyou" data-original-title="用代码研磨 Java 服务端技术的醇香，记录每一颗“咖啡豆”的成长与蜕变。☕️" data-toggle="tooltip" data-placement="bottom">咖啡豆日记</a></h1>
                <p class="site-description">用代码研磨 Java 服务端技术的醇香，记录每一颗“咖啡豆”的成长与蜕变。☕️</p>
            </div>
            <ul class="nav navbar-nav ">
                <li>
                    <a href="/" class="menu_a"><i class="fa fa-home"></i>首页</a>
                </li>
                                <li><a href="/type/6" class="menu_a"><i class="fa fa-linux"></i>Linux</a></li>
                                <li><a href="/type/5" class="menu_a"><i class="fa fa-envira"></i>微服务</a></li>
                                <li><a href="/type/4" class="menu_a"><i class="fa fa-database"></i>数据库</a></li>
                                <li><a href="/type/2" class="menu_a"><i class="fa fa-coffee"></i>后端技术</a></li>
                                <li><a href="/type/3" class="menu_a"><i class="fa fa-folder-open-o"></i>其他文章</a></li>
                <li><a href="/guestbook" class="menu_a"><i class="fa fa-comments-o"></i>留言板</a></li>
                <li><span class="pull-right nav-search main-search" data-toggle="modal" data-target=".nav-search-box"><i class="fa fa-search"></i></span></li>
            </ul>
        </div>
    </div>
</nav>
    <img src="https://lanzi.cyou:8890/blogFiles/oneblog/20240714074602181.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" style="display: none;" id="cover-img">
<div class="container custome-container">
    <nav class="breadcrumb">
        <a class="crumbs" title="返回首页" href="https://lanzi.cyou" data-toggle="tooltip" data-placement="bottom"><i class="fa fa-home"></i>首页</a>
        <i class="fa fa-angle-right"></i>
        <a href="https://lanzi.cyou/type/2" title="点击查看该分类文章" data-toggle="tooltip" data-placement="bottom">后端技术</a>
        <i class="fa fa-angle-right"></i>正文
    </nav>
    <div class="row article-body">
        <div class="col-sm-8 blog-main">
            <div class="blog-body overflow-initial fade-in">
                <div class="article-flag">
                        <span class="article-blockquote article-blockquote-green"></span>
                        <span class="article-original article-original-green">
                            <a href="https://lanzi.cyou/article/10"><i class="fa fa-check"></i> 原创</a>
                        </span>
                    <div class="blog-info-meta pull-right">
                        <ul class="list-unstyled list-inline">
                            <li><i class="fa fa-clock-o fa-fw"></i>2024-07-14</li>
                            <li><i class="fa fa-eye fa-fw"></i><a class="pointer" data-original-title="211人浏览了该文章" data-toggle="tooltip" data-placement="bottom">浏览 (<num>211</num>)</a></li>
                            <li><a href="#comment-box" data-original-title="0人评论了该文章" data-toggle="tooltip" data-placement="bottom"><i class="fa fa-comments-o fa-fw"></i>评论 (0)</a></li>
                        </ul>
                    </div>
                </div>
                <div class="blog-info overflow-initial">
                    <h1 class="blog-info-title">
                        <strong>Python爬虫Scrapy</strong>
                    </h1>
                    <div class="blog-info-body ">
                            <div class="ob-alert">
                                <div class="title">
                                    <i class="fa fa-bullhorn fa-fw"></i>
                                    <span class="text">温馨提示：</span>
                                </div>
                                <div class="content">
                                    本文最后更新于 2024年07月14日，已超过 327 天没有更新。若文章内的图片失效（无法正常加载），请留言反馈或直接<a href="mailto:747277306@qq.com" target="_blank" title="点击给我发邮件" rel="external nofollow"><i class="fa fa-envelope fa-fw"></i>联系我</a>。
                                </div>
                            </div>
                                <h1 style="line-height: 36px; margin: 26px 0px 10px;"><font face="微软雅黑" style="" size="6" color="#000000" id="hqb4j">1.简介</font></h1><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" size="5" color="#000000" id="p3dx9">1.1Scrapy</font></h2><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">Scrapy是一个用于Web数据抓取的强大开源框架，主要用于从网站上抓取结构化数据，如HTML和XML文件，或者API返回的数据。Scrapy使用Python语言编写，它不仅仅是一个简单的网页抓取工具，而是包含了自动化、灵活的数据处理、数据存储等功能的完整框架。Scrapy的设计理念是模块化和可扩展的，支持中间件、Item Pipelines、信号和事件，以及多种数据输出格式，如JSON、XML和CSV等。</font></p><p><font color="#000000" face="微软雅黑" size="4">Scrapy 官网：https://scrapy.org/<br/>Scrapy 文档：https://docs.scrapy.org/en/latest/<br/>GitHub：https://github.com/scrapy/scrapy/</font></p><p><font face="微软雅黑" size="4" color="#000000"><ne-clipboard></ne-clipboard></font></p><h2 style="line-height: 32px; margin-top: 21px; margin-bottom: 5px;"><font face="微软雅黑" size="5" color="#000000" id="ix0fq">1.2架构图</font></h2><font face="微软雅黑" size="4" color="#000000"><img src="https://lanzi.cyou:8890/blogFiles/oneblog/article/20240714073756187.png" alt="" style="max-width: 100%;height: auto;border-radius: 6px;"/></font><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">Scrapy的架构设计是模块化的，由多个组件构成，它们协同工作完成数据抓取任务。以下是Scrapy架构的主要组成部分：</font></p><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>Scrapy Engine（引擎）</strong>：</font></li></ol><ul style="margin: 0; padding-left: 23px; list-style: none"><ul style="margin: 0; padding-left: 23px; list-style: circle"><li><font face="微软雅黑" size="4" color="#000000">负责协调数据流在Scrapy的所有组件中流动，包括Spider、Item Pipeline、Downloader和Scheduler。</font></li></ul></ul><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>Scheduler（调度器）</strong>：</font></li></ol><ul style="margin: 0; padding-left: 23px; list-style: none"><ul style="margin: 0; 
padding-left: 23px; list-style: circle"><li><font face="微软雅黑" size="4" color="#000000">接收Scrapy Engine传来的Requests，并按照一定的顺序将它们入队，当Engine请求新的Requests时提供。</font></li></ul></ul><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>Downloader（下载器）</strong>：</font></li></ol><ul style="margin: 0; padding-left: 23px; list-style: none"><ul style="margin: 0; padding-left: 23px; list-style: circle"><li><font face="微软雅黑" size="4" color="#000000">负责下载由Scheduler提供的Requests，并返回Response对象。</font></li></ul></ul><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>Spiders（蜘蛛）</strong>：</font></li></ol><ul style="margin: 0; padding-left: 23px; list-style: none"><ul style="margin: 0; padding-left: 23px; list-style: circle"><li><font face="微软雅黑" size="4" color="#000000">Spider是定义如何从网站上抓取数据的核心组件，它负责解析响应，提取数据（Items），以及生成新的Requests。</font></li></ul></ul><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>Item Pipeline（项目管道）</strong>：</font></li></ol><ul style="margin: 0; padding-left: 23px; list-style: none"><ul style="margin: 0; padding-left: 23px; list-style: circle"><li><font face="微软雅黑" size="4" color="#000000">用于处理由Spider提取的Items，如数据清洗、验证、存储等。Pipelines按顺序执行，可以实现复杂的数据处理逻辑。</font></li></ul></ul><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>Downloader Middlewares（下载中间件）</strong>：</font></li></ol><ul style="margin: 0; padding-left: 23px; list-style: none"><ul style="margin: 0; padding-left: 23px; list-style: circle"><li><font face="微软雅黑" size="4" color="#000000">位于Scrapy Engine和Downloader之间的层，用于处理Request和Response对象，如添加headers、处理异常、限制速度等。</font></li></ul></ul><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>Spider Middlewares（蜘蛛中间件）</strong>：</font></li></ol><ul style="margin: 0; padding-left: 23px; list-style: none"><ul style="margin: 0; padding-left: 23px; 
list-style: circle"><li><font face="微软雅黑" size="4" color="#000000">位于Scrapy Engine和Spider之间的层，用于处理由Spider生成的Responses和Requests，如过滤重复的Requests。</font></li></ul></ul><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="0qdlh" size="5">1.3逻辑流程</font></h2><ol style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><strong>请求(Request)</strong>：Scrapy的爬虫会生成一个或多个Request对象，这些对象包含了待抓取页面的URL和其他相关信息，如headers和cookies。</font></li><li><font face="微软雅黑" size="4" color="#000000"><strong>下载(Download)</strong>：Scrapy的下载器(Downloader)会处理这些Request，下载页面的内容。</font></li><li><font face="微软雅黑" size="4" color="#000000"><strong>响应(Response)</strong>：下载完成后，下载器会生成一个Response对象，这个对象包含了页面的HTML源码或其他响应内容，以及请求的状态信息。</font></li><li><font face="微软雅黑" size="4" color="#000000"><strong>解析(Parse)</strong>：Scrapy的爬虫会处理Response对象，使用XPath、CSS选择器或正则表达式等方法从中抽取数据，生成Item对象或新的Request对象。</font></li><li><font face="微软雅黑" size="4" color="#000000"><strong>Item Pipeline</strong>：抽取的数据（Item对象）会被传递给Item Pipeline，进行进一步的处理，如数据清洗、验证、去重和存储到数据库等。</font></li><li><font face="微软雅黑" size="4" color="#000000"><strong>输出(Output)</strong>：最终，数据可以被导出到不同的格式，如JSON、XML、CSV等，也可以直接存储到数据库或通过API发送到其他服务。</font></li></ol><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="pbtli" size="5">1.4子命令</font></h2><ul style="margin: 0; padding-left: 23px"><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy startproject [project_name]</strong></code>：创建一个新的Scrapy项目。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy genspider [name] [domain]</strong></code>：生成一个新的爬虫模板。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: 
rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy crawl [spider_name]</strong></code>：运行指定的爬虫。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy settings</strong></code>：显示项目的配置设置。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy fetch [url]</strong></code>：下载指定URL的页面并显示响应信息。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy shell [url]</strong></code>：启动交互式的Scrapy Shell，用于调试XPath和CSS选择器。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy runspider [script.py]</strong></code>：运行一个独立的爬虫脚本，无需创建完整的项目。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy list</strong></code>：列出项目中的所有爬虫。</font></li><li><font face="微软雅黑" size="4" color="#000000"><code style="background-color: rgba(0, 0, 0, 0.06); border: 1px solid rgba(0, 0, 0, 0.08); border-radius: 2px; padding: 0px 2px;"><strong>scrapy check</strong></code>：检查爬虫是否有语法错误或引用了不存在的中间件或管道。</font></li></ul><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="9s6f3" size="5">1.5安装Scrapy库</font></h2><div><pre><code class="Bash"><xmp>pip install scrapy</xmp></code></pre></div><h1 style="line-height: 36px; margin: 26px 0px 10px;"><font face="微软雅黑" color="#000000" id="0oip6" 
size="6">2.代码编写</font></h1><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">编写代码爬取豆瓣电影Top250榜单数据</font></p><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="47im4" size="5">2.1.创建项目</font></h2><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">执行以下命令创建Scrapy项目，在当前目录会生成一个zscrapy目录，用于存放爬虫、中间件、管道、设置文件等组件。</font></p><pre><code class="Bash"><xmp>scrapy startproject zscrapy</xmp></code></pre><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">目录结构</font></p><p><font face="微软雅黑" size="4" color="#000000"><ne-clipboard></ne-clipboard></font></p><ul style="margin-top: 0px; margin-bottom: 0px; margin-left: 0px; padding-left: 23px;"><li><font face="微软雅黑" size="4" color="#000000">__init__.py: Python包的初始化文件。</font></li><li><font face="微软雅黑" size="4" color="#000000">items.py: 定义项目中使用的数据项（Items）的文件。</font></li><li><font face="微软雅黑" size="4" color="#000000">middlewares.py: 定义项目的中间件的文件。</font></li><li><font face="微软雅黑" size="4" color="#000000">pipelines.py: 定义项目的管道（Pipelines）的文件。</font></li><li><font face="微软雅黑" size="4" color="#000000">settings.py: 项目的配置文件，用于设置各种参数。</font></li><li><font face="微软雅黑" size="4" color="#000000">spiders: 存放爬虫文件的子目录</font></li></ul><font face="微软雅黑" size="4" color="#000000"><img src="https://lanzi.cyou:8890/blogFiles/oneblog/article/20240714073826867.png" alt="" style="max-width: 100%;height: auto;border-radius: 6px;"/></font><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="b28a7" size="5">2.2.定义Item</font></h2><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">在Scrapy中，Items用于定义你从网页上抓取的数据结构。Items本质上是包含字段的容器，这些字段通常代表了你想要从网页中提取的数据。</font></p><pre><code class="Python"><xmp>import scrapy

class DoubanItem(scrapy.Item):
    """Container for the fields collected for a single movie."""

    # Movie poster image
    pic = scrapy.Field()
    # Movie ranking
    ranking = scrapy.Field()
    # Movie title
    title = scrapy.Field()
    # Descriptive text about the movie: director, cast, genre and so on
    movieInfo = scrapy.Field()
    # Movie rating score
    star = scrapy.Field()
    # The movie's most classic, best-known line
    quote = scrapy.Field()

# 定义新闻数据的字段
class SinaNewsItem(scrapy.Item):
    title = scrapy.Field()  # 新闻标题
    ctime = scrapy.Field()  # 新闻发布时间
    url = scrapy.Field()  # 新闻原始url
    raw_key_words = scrapy.Field()  # 新闻关键词（爬取的关键词）
    content = scrapy.Field()  # 新闻的具体内容
    cate = scrapy.Field()  # 新闻类别　</xmp></code></pre><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="ecemc" size="5">2.3.编写爬虫脚本</font></h2><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">用于抓取豆瓣电影Top 250榜单的信息</font></p><pre><code class="Python"><xmp># 导入Scrapy模块和系统模块
import scrapy
# 导入Scrapy的Request类，用于发送HTTP请求
from scrapy.http import Request
# 导入Selector类，用于解析HTML和XML文档
from scrapy.selector import Selector
# 导入自定义的DoubanItem类，用于存储爬取到的数据
from zscrapy.items import DoubanItem
# 导入urljoin函数，用于拼接URL
from urllib.parse import urljoin
# 导入CrawlerProcess类，用于运行爬虫
from scrapy.crawler import CrawlerProcess
# 导入get_project_settings函数，用于获取项目的设置
from scrapy.utils.project import get_project_settings

# 定义了一个名为Douban的爬虫类，继承自scrapy.spiders.Spider
class Douban(scrapy.spiders.Spider):
    """Spider that scrapes the Douban movie Top 250 chart.

    Starts from the first chart page, yields one ``DoubanItem`` per movie
    entry and keeps following the "next page" link while one is present.
    """

    # Name used to launch the spider (e.g. ``process.crawl("douban")``).
    name = "douban"
    # Domains this spider is allowed to crawl.
    allowed_domains = ["douban.com"]
    # First page of the chart.
    start_urls = ['https://movie.douban.com/top250']

    def parse(self, response):
        """Extract every movie on a chart page, then queue the next page.

        Args:
            response: The downloaded chart page.

        Yields:
            DoubanItem: One newly created item per ``div.item`` entry.
            Request: A request for the following page when the page exposes
                a "next" link; it is handled by this same method.
        """
        for movie in response.xpath('//div[@class="item"]'):
            details = movie.xpath('div[@class="info"]/div[@class="bd"]')

            # Build a fresh item for every movie. Re-yielding one shared
            # instance would hand the same mutable object to every consumer,
            # so later movies would overwrite earlier ones.
            item = DoubanItem()
            item['pic'] = "".join(
                movie.xpath('div[@class="pic"]/a/img/@src').getall())
            # ``get(default="")`` returns the first match, or "" when the node
            # is missing, instead of raising IndexError and aborting the page.
            item['ranking'] = movie.xpath(
                'div[@class="pic"]/em/text()').get(default="")
            # The title is split across several <span> tags; join them as-is.
            item['title'] = "".join(movie.xpath(
                'div[@class="info"]/div[@class="hd"]/a/span/text()').getall())
            # First text node of the description, without the surrounding
            # newlines and spaces.
            item['movieInfo'] = details.xpath(
                'p/text()').get(default="").strip("\n ")
            # Rating score
            item['star'] = details.xpath(
                'div[@class="star"]/span/text()').get(default="")
            # Not every movie has a quote; fall back to an empty string.
            item['quote'] = details.xpath(
                'p[@class="quote"]/span/text()').get(default="")
            yield item

        # Pagination: follow the "next page" link if the page has one.
        next_href = response.xpath('//span[@class="next"]/link/@href').get()
        if next_href:
            # The href is relative, so resolve it against the current URL.
            yield Request(urljoin(response.url, next_href), callback=self.parse)

# 程序入口
if __name__ =="__main__":
    # 创建CrawlerProcess类对象并传入项目设置信息参数
    process = CrawlerProcess(get_project_settings())
    # 设置需要启动的爬虫名称
    process.crawl("douban")
    # 启动爬虫
    process.start()</xmp></code></pre><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="r7h1g" size="5">2.4.设置文件</font></h2><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">在settings.py文件中设置用户代理（User-Agent），设置的User-Agent字符串模拟了一个运行在Windows 7操作系统上特定版本的Safari浏览器。设置USER_AGENT是为了绕过网站的防爬机制。</font></p><pre><code class="Plain text"><xmp>USER_AGENT = 'Mozilla/5.0 (Windows; U; Windows NT 6.1; en-us) AppleWebKit/534.50 (KHTML, like Gecko) Version/5.1 Safari/534.50'</xmp></code></pre><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" id="er1j9" size="5">2.5.数据库</font></h2><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">创建数据库zscrapy，创建表douban</font></p><pre><code class="SQL"><xmp>create database zscrapy charset utf8mb4 collate utf8mb4_general_ci;

CREATE TABLE `douban`  (
  `id` int(0) NOT NULL AUTO_INCREMENT,
  `title` varchar(100) CHARACTER SET utf8mb4 COLLATE utf8mb4_general_ci NOT NULL DEFAULT '' COMMENT '电影名称',
  `pic` varchar(255) CHARACTER SET utf8mb4 COLLATE utf8mb4_general_ci NOT NULL DEFAULT '' COMMENT '电影图片',
  `movieInfo` varchar(1000) CHARACTER SET utf8mb4 COLLATE utf8mb4_general_ci NOT NULL DEFAULT '' COMMENT '描述信息',
  `star` float(3, 1) NOT NULL DEFAULT 0.0 COMMENT '电影评分',
  `quote` varchar(255) CHARACTER SET utf8mb4 COLLATE utf8mb4_general_ci NOT NULL DEFAULT '' COMMENT '经典语句',
  `ranking` int(0) NOT NULL DEFAULT 0 COMMENT '电影排名',
  PRIMARY KEY (`id`) USING BTREE
) ENGINE = InnoDB CHARACTER SET = utf8mb4 COLLATE = utf8mb4_general_ci ROW_FORMAT = Dynamic;</xmp></code></pre><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">安装pymysql库，pymysql是一个Python的MySQL数据库驱动，允许Python程序与MySQL数据库进行交互。</font></p><pre><code class="Bash"><xmp> pip install pymysql</xmp></code></pre><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">在settings.py中添加MySQL连接配置</font></p><pre><code class="Plain text"><xmp>MYSQL_HOST = 'localhost'  # 数据库地址
MYSQL_DBNAME = 'zscrapy'  # 数据库名字
MYSQL_USER = 'root'  # 数据库登录名
MYSQL_PASSWD = 'Video201@'  # 数据库登录密码

# 激活ZscrapyPipeline管道，优先级301（数值越小，优先级越高）
ITEM_PIPELINES = {
    'zscrapy.pipelines.ZscrapyPipeline': 301,
}
</xmp></code></pre><h2 style="line-height: 32px; margin: 21px 0px 5px;"><font face="微软雅黑" color="#000000" size="5">2.6.管道</font></h2><p style="margin: 0; padding: 0; min-height: 24px"><font face="微软雅黑" size="4" color="#000000">Item Pipelines负责接收从爬虫传递过来的item，并对这些item执行一系列的处理，比如清洗数据、验证数据、去重、持久化数据到数据库等。以下代码定义了一个Scrapy项目中的Item Pipeline，其目的是将爬取到的数据存储到MySQL数据库中。</font></p><pre><code class="Python"><xmp># 导入pymysql模块，这是一个Python的MySQL数据库驱动。
import pymysql
# 导入项目中定义的item模块，包含爬取数据的结构定义。
import zscrapy.items
# 从项目设置模块导入设置，用于获取数据库连接信息。
from zscrapy import settings

# 定义一个名为ZscrapyPipeline的类，继承自object，这是Item Pipeline的基本类
class ZscrapyPipeline(object):
    # 在Python中，self是一个指向实例本身的引用，它是类的方法中的第一个参数。
    # 定义初始化方法，当创建类的实例时自动调用
    def __init__(self):
        # 使用pymysql.connect()方法建立到MySQL数据库的连接
        self.connect = pymysql.connect(
            host=settings.MYSQL_HOST,
            db=settings.MYSQL_DBNAME,
            user=settings.MYSQL_USER,
            passwd=settings.MYSQL_PASSWD,
            charset='utf8',
            use_unicode=True)
        # 创建游标对象，用于执行SQL语句
        self.cursor = self.connect.cursor()

    # 定义process_item方法，该方法将由Scrapy调用，用于处理每个爬取到的item
    def process_item(self, item, spider):
        try:
            # 检查item是否是DoubanItem类型，如果是，执行插入到douban表的SQL语句。
            if isinstance(item, zscrapy.items.DoubanItem):
                # 执行SQL插入语句，参数是一个SQL字符串和一个元组，元组中的值将替换SQL字符串中的占位符
                self.cursor.execute(
                    """insert into douban(title,pic,ranking,movieInfo,star,quote)
                      value (%s,%s,%s,%s,%s,%s)""",
                    (item['title'],
                     item['pic'],
                     item['ranking'],
                     item['movieInfo'],
                     item['star'],
                     item['quote']))
            else:
                self.cursor.execute(
                    """insert into sina_news(title,ctime,url,raw_key_words,content,cate)
                      value (%s,%s,%s,%s,%s,%s)""",
                    (item['title'],
                     item['ctime'],
                     item['url'],
                     item['raw_key_words'],
                     item['content'],
                     item['cate']))
            # 提交事务，确保数据被持久化到数据库中
            self.connect.commit()
        except Exception as err:
            # 捕获在执行SQL语句或提交事务过程中可能出现的异常，并打印错误信息
            print("数据插入==>错误信息为：" + str(err))
        # 返回处理过的item，以便它可以被下一个Item Pipeline处理或直接传递给Scrapy的其他组件
        return item</xmp></code></pre>
                    </div>
                    <div class="separateline"><span>正文到此结束</span></div>
                    <div id="social" style="margin-bottom: 45px;">
                        <div class="social-main">
                            <span class="like">
                                <a href="javascript:;" data-id="10" title="点赞" ><i class="fa fa-thumbs-up"></i>赞 <i class="count"> 0</i> </a>
                            </span>
                            <div class="shang-p">
                                <div class="shang-empty"><span></span></div>
                                <span class="shang-s"><a onclick="PaymentUtils.show();" style="cursor:pointer">赏</a> </span>
                            </div>
                            <div class="share-sd">
                                <span class="share-s"><a href="javascript:void(0)" id="share-s" title="分享"><i class="fa fa-share-alt"></i>分享</a></span>
                                <div id="share" style="display: none">
                                    <div class="social-share" data-initialized="true">
                                        <a href="#" class="social-share-icon icon-twitter"></a>
                                        <a href="#" class="social-share-icon icon-google"></a>
                                        <a href="#" class="social-share-icon icon-facebook"></a>
                                        <a href="#" class="social-share-icon icon-douban"></a>
                                        <a href="#" class="social-share-icon icon-qzone"></a>
                                        <a href="#" class="social-share-icon icon-wechat"></a>
                                        <a href="#" class="social-share-icon icon-qq"></a>
                                        <a href="#" class="social-share-icon icon-weibo"></a>
                                    </div>
                                </div>
                            </div>
                            <div class="clear"></div>
                        </div>
                    </div>
                    <div class="article-footer overflow-initial">所属分类：<a href="https://lanzi.cyou/type/2" data-original-title="点击查看后端技术分类的文章" data-toggle="tooltip" data-placement="bottom">后端技术</a></div>
                </div>
            </div>
            <div class="blog-body article-tag">
                <div class="cat">
                    <ul class="list-unstyled">
                        <li>
                            <strong>本文标签：</strong>
                                        <a href="https://lanzi.cyou/tag/9" class="c-label" data-original-title="Python" data-toggle="tooltip" data-placement="bottom" target="_blank">Python</a>
                        </li>
                        <li>
                            <strong>本文链接：</strong>
                            https://lanzi.cyou/article/10
                        </li>
                        <li>
                            <strong>版权声明：</strong>
                            本文由<a href="https://lanzi.cyou" target="_blank" data-original-title="咖啡豆日记" data-toggle="tooltip" data-placement="bottom"><strong>咖啡豆</strong></a>原创发布，转载请遵循《<a href="https://creativecommons.org/licenses/by-nc-sa/4.0/deed.zh" target="_blank" rel="nofollow">署名-非商业性使用-相同方式共享 4.0 国际 (CC BY-NC-SA 4.0)</a>》许可协议授权
                        </li>
                    </ul>
                </div>
            </div>
            <div class="ad-mark" id="ARTICLE_BOTTOM" style="display: none"></div>
            <div class="blog-body prev-next">
                <nav class="nav-single wow" data-wow-delay="0.3s">
                        <a href="https://lanzi.cyou/article/9" rel="prev">
                            <span class="meta-nav" data-original-title="Python基础" data-toggle="tooltip" data-placement="bottom"><span class="post-nav"><i class="fa fa-angle-left"></i> 上一篇</span>
                                <br>Python基础
                            </span>
                        </a>
                        <a href="https://lanzi.cyou/article/11" rel="next">
                            <span class="meta-nav" data-original-title="Java诊断工具Arthas" data-toggle="tooltip" data-placement="bottom"><span class="post-nav">下一篇 <i class="fa fa-angle-right"></i></span>
                                <br>Java诊断工具Arthas
                            </span>
                        </a>
                    <div class="clear"></div>
                </nav>
            </div>
            <div class="blog-body clear overflow-initial">
                <h5 class="custom-title"><i class="fa fa-fire fa-fw icon"></i><strong>热门推荐</strong><small></small></h5>
                <ul class="list-unstyled">
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20241020223543450.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/16" data-original-title="248人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                SpringBoot集成Elasticsearch
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(248)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/16#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20240615150237427.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/4" data-original-title="227人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                树莓派5上部署博客系统
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(227)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/4#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20240713015315670.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/8" data-original-title="224人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                使用FRP实现内网穿透：通过公网访问树莓派上的服务
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(224)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/8#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20250102172223850.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/31" data-original-title="214人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                跨平台 ChatGPT应用：ChatGPT-Next-Web
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(214)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/31#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20240714074602181.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/10" data-original-title="212人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                Python爬虫Scrapy
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(212)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/10#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20241120232927172.png" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/33" data-original-title="207人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                Linux内核参数调优之TCP
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(207)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/33#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20240615150315859.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/3" data-original-title="207人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                树莓派5上安装Ubuntu Server 24
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(207)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/3#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20240620142312871.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/5" data-original-title="206人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                MySQL高级篇
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(206)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/5#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20241123234121379.png" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/25" data-original-title="206人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                开源远程控制软件RustDesk
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(206)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/25#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                            <li class="line-li">
                                <div class="line-container">
                                    <div class="line-left">
                                            <img class="lazy-img" src="https://lanzi.cyou:8890/blogFiles/oneblog/20240706020325406.jpg" onerror="this.src='https://lanzi.cyou/img/default.png'" width="50" height="50" rel="external nofollow"/>
                                    </div>
                                    <div class="line-right">
                                        <div class="text">
                                            <a href="https://lanzi.cyou/article/7" data-original-title="204人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                                发送邮件
                                            </a>
                                        </div>
                                        <div class="text">
                                            <span class="views" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章阅读次数"><i class="fa fa-eye fa-fw"></i>浏览(204)</span>
                                            <span class="comment" title="" data-toggle="tooltip" data-placement="bottom" data-original-title="文章评论次数">
                                                <a href="https://lanzi.cyou/article/7#comment-box" rel="external nofollow">
                                                    <i class="fa fa-comments-o fa-fw"></i>评论(0)
                                                </a>
                                            </span>
                                        </div>
                                    </div>
                                </div>
                            </li>
                </ul>
                <div class="clear"></div>
            </div>
            <div class="blog-body clear overflow-initial">
                <h5 class="custom-title"><i class="fa fa-google-wallet fa-fw icon"></i><strong>相关文章</strong><small></small></h5>
                <ul class="list-unstyled">
                        <li class="line-li">
                            <div class="line-container">
                                <div class="line-right">
                                    <div class="text">
                                        <a href="https://lanzi.cyou/article/10" data-original-title="212人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                            <i class="fa fa-book fa-fw"></i>Python爬虫Scrapy
                                        </a>
                                    </div>
                                </div>
                            </div>
                        </li>
                        <li class="line-li">
                            <div class="line-container">
                                <div class="line-right">
                                    <div class="text">
                                        <a href="https://lanzi.cyou/article/9" data-original-title="47人浏览了该文章" data-toggle="tooltip" data-placement="bottom">
                                            <i class="fa fa-book fa-fw"></i>Python基础
                                        </a>
                                    </div>
                                </div>
                            </div>
                        </li>
                </ul>
                <div class="clear"></div>
            </div>
            <div class="ad-mark" id="COMMENT_BOX_TOP" style="display: none"></div>
                    <div class="blog-body clear overflow-initial expansion">
                        <div id="comment-box" data-id="10"></div>
                    </div>
        </div>
<div class="col-sm-3 blog-sidebar">
        <div class="ad-mark" id="SIDEBAR_TOP" style="display: none"></div>
        <div class="sidebar-module" style="position: relative;">
            <h5 class="custom-title"><i class="fa fa-home fa-fw icon"></i><strong>关于我</strong><small></small></h5>
            <div class="widget">
                <div id="feed_widget">
                    <div class="feed-about">
                        <div class="about-main">
                            <div class="about-img"><a href="https://lanzi.cyou:8890/blogFiles/oneblog/20240615113733318.jpg" class="showImage" title="微信公众号"><img src="https://lanzi.cyou:8890/blogFiles/oneblog/20240615113733318.jpg" alt="微信公众号"></a></div>
                            <div class="about-name">咖啡豆日记</div>
                            <div class="about-the">用代码研磨 Java 服务端技术的醇香，记录每一颗“咖啡豆”的成长与蜕变。☕️</div>
                        </div>
                        <div class="clear"></div>
                        <!-- 方案一：图标展示 -->
                        <ul class="widget-icon">
                            <li class="weixin auto-shake" data-container="body"
                                data-toggle="popover" data-trigger="hover" data-placement="bottom" data-html="true" data-content="<img src='https://lanzi.cyou:8890/blogFiles/oneblog/20240615113733318.jpg' style='width: 130px;' alt='QR Code'>">
                                <a class="tag-icon" title="微信" rel="external nofollow"><i class="fa fa-weixin"></i></a>
                            </li>
                            <li class="tqq auto-shake">
                                <a class="tag-icon" href="javascript:window.open('tencent://message/?uin=747277306&Site=www.lanzi.cyou&Menu=yes')" title="点击QQ联系我" target="blank" rel="external nofollow"><i class="fa fa-qq"></i></a>
                            </li>
                            <li class="tsina auto-shake">
                                <a class="tag-icon" href="" title="点击查看我的微博" target="_blank" rel="external nofollow"><i class="fa fa-weibo"></i></a>
                            </li>
                            <li class="github auto-shake">
                                <a class="tag-icon" href="" title="点击查看我的github" target="_blank" rel="external nofollow"><i class="fa fa-github"></i></a>
                            </li>
                        </ul>
                        <!-- 方案二：列表展示 -->
                    </div>
                </div>
            </div>
        </div>
    <div class="sidebar-module article-module hide" style="top: 0;">
        <h5 class="custom-title"><i class="fa fa-book fa-fw icon"></i><strong>本文目录</strong><i class="fa fa-close pull-right close-article-menu hide pointer"></i><small></small></h5>
        <div id="article-menu" style="overflow:auto">
            <ul class="list-unstyled"></ul>
        </div>
    </div>
    <div class="sidebar-module">
        <h5 class="custom-title"><i class="fa fa-tags fa-fw icon"></i><strong>标签云</strong><small></small></h5>
                    <a style="font-size: 11.41px;margin: 5px;" href="https://lanzi.cyou/tag/1" title="Linux" data-toggle="tooltip" data-placement="bottom">
                        Linux
                    </a>
                    <a style="font-size: 11.46px;margin: 5px;" href="https://lanzi.cyou/tag/2" title="Java" data-toggle="tooltip" data-placement="bottom">
                        Java
                    </a>
                    <a style="font-size: 11.06px;margin: 5px;" href="https://lanzi.cyou/tag/3" title="Spring" data-toggle="tooltip" data-placement="bottom">
                        Spring
                    </a>
                    <a style="font-size: 10.53px;margin: 5px;" href="https://lanzi.cyou/tag/4" title="Spring Boot" data-toggle="tooltip" data-placement="bottom">
                        Spring Boot
                    </a>
                    <a style="font-size: 12px;margin: 5px;" href="https://lanzi.cyou/tag/5" title="其他" data-toggle="tooltip" data-placement="bottom">
                        其他
                    </a>
                    <a style="font-size: 13.7px;margin: 5px;" href="https://lanzi.cyou/tag/6" title="MySQL" data-toggle="tooltip" data-placement="bottom">
                        MySQL
                    </a>
                    <a style="font-size: 14.59px;margin: 5px;" href="https://lanzi.cyou/tag/7" title="Spring Cloud Alibaba" data-toggle="tooltip" data-placement="bottom">
                        Spring Cloud Alibaba
                    </a>
                    <a style="font-size: 11.17px;margin: 5px;" href="https://lanzi.cyou/tag/9" title="Python" data-toggle="tooltip" data-placement="bottom">
                        Python
                    </a>
                    <a style="font-size: 14.39px;margin: 5px;" href="https://lanzi.cyou/tag/10" title="分布式" data-toggle="tooltip" data-placement="bottom">
                        分布式
                    </a>
                    <a style="font-size: 10.91px;margin: 5px;" href="https://lanzi.cyou/tag/11" title="工具" data-toggle="tooltip" data-placement="bottom">
                        工具
                    </a>
                    <a style="font-size: 15.81px;margin: 5px;" href="https://lanzi.cyou/tag/12" title="Web" data-toggle="tooltip" data-placement="bottom">
                        Web
                    </a>
                    <a style="font-size: 13.94px;margin: 5px;" href="https://lanzi.cyou/tag/13" title="密码" data-toggle="tooltip" data-placement="bottom">
                        密码
                    </a>
                    <a style="font-size: 13.95px;margin: 5px;" href="https://lanzi.cyou/tag/14" title="Linux内核调优" data-toggle="tooltip" data-placement="bottom">
                        Linux内核调优
                    </a>
                    <a style="font-size: 12.26px;margin: 5px;" href="https://lanzi.cyou/tag/15" title="云原生" data-toggle="tooltip" data-placement="bottom">
                        云原生
                    </a>
                    <a style="font-size: 10.99px;margin: 5px;" href="https://lanzi.cyou/tag/16" title="C#" data-toggle="tooltip" data-placement="bottom">
                        C#
                    </a>
                    <a style="font-size: 14.76px;margin: 5px;" href="https://lanzi.cyou/tag/17" title="微信公众号" data-toggle="tooltip" data-placement="bottom">
                        微信公众号
                    </a>
    </div>
    <div class="sidebar-module">
        <ul class="nav nav-tabs sidebar-tabs" role="tablist">
            <li role="presentation" class="active"><a href="#profile" aria-controls="profile" role="tab" data-toggle="tab"><i class="fa fa-list"></i>近期文章</a></li>
            <li role="presentation"><a href="#home" aria-controls="home" role="tab" data-toggle="tab"><i class="fa fa-thumbs-o-up"></i>站长推荐</a></li>
            <li role="presentation"><a href="#messages" aria-controls="messages" role="tab" data-toggle="tab"><i class="fa fa-hand-peace-o"></i>随机文章</a></li>
        </ul>
        <div class="tab-content">
            <div role="tabpanel" class="tab-pane active" id="profile">
                <ol class="list-unstyled">
                                <li>
                                    <a href="https://lanzi.cyou/article/48" title="搭建个人微信公众号" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 搭建个人微信公众号
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/47" title="Kubernetes基本概念" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> Kubernetes基本概念
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/46" title="从零开始理解容器化技术" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 从零开始理解容器化技术
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/45" title="轻量级标记语言Markdown" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 轻量级标记语言Markdown
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/44" title="利用Wake-on-LAN技术实现远程唤醒" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 利用Wake-on-LAN技术实现远程唤醒
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/43" title="什么是云原生" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 什么是云原生
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/42" title="使用Inno Setup制作专业级Windows安装包" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 使用Inno Setup制作专业级Windows安装包
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/41" title="告别单点故障！MySQL Group Replication如何重塑金融级数据库架构" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 告别单点故障！MySQL Group Replication如何重塑金融级数据库架构
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/40" title="利用Docker Swarm与SSL加密实现安全高效的PXC集群部署" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 利用Docker Swarm与SSL加密实现安全高效的PXC集群部署
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/39" title="从零开始：基于Ubuntu的Kubernetes集群部署全攻略（含国内加速配置）" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 从零开始：基于Ubuntu的Kubernetes集群部署全攻略（含国内加速配置）
                                    </a>
                                </li>
                </ol>
            </div>
            <div role="tabpanel" class="tab-pane" id="home">
                <ol class="list-unstyled">
                            <li class="empty-list">
                                <i class="fa fa-bookmark-o fa-fw"></i> 暂无相关文章
                            </li>
                </ol>
            </div>
            <div role="tabpanel" class="tab-pane" id="messages">
                <ol class="list-unstyled">
                                <li>
                                    <a href="https://lanzi.cyou/article/18" title="OAuth2服务端" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> OAuth2服务端
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/20" title="SSH移动端ServerBox" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> SSH移动端ServerBox
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/7" title="发送邮件" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 发送邮件
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/28" title="Nginx" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> Nginx
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/26" title="JavaCV开源计算机视觉库" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> JavaCV开源计算机视觉库
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/39" title="从零开始：基于Ubuntu的Kubernetes集群部署全攻略（含国内加速配置）" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 从零开始：基于Ubuntu的Kubernetes集群部署全攻略（含国内加速配置）
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/6" title="SpringCloud第一篇：Nacos" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> SpringCloud第一篇：Nacos
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/42" title="使用Inno Setup制作专业级Windows安装包" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 使用Inno Setup制作专业级Windows安装包
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/11" title="Java诊断工具Arthas" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> Java诊断工具Arthas
                                    </a>
                                </li>
                                <li>
                                    <a href="https://lanzi.cyou/article/4" title="树莓派5上部署博客系统" data-toggle="tooltip" data-placement="bottom">
                                        <i class="fa fa-book fa-fw"></i> 树莓派5上部署博客系统
                                    </a>
                                </li>
                </ol>
            </div>
        </div>
    </div>
    <div class="clear"></div>
    <div class="sidebar-module">
        <h5 class="custom-title"><i class="fa fa-info fa-fw icon"></i><strong>网站信息</strong><small></small></h5>
        <ul class="ul-default site-info">
                <li> <i class="fa fa-file fa-fw"></i>  文章总数：41 篇</li>
                <li> <i class="fa fa-tags fa-fw"></i> 标签总数：16 个</li>
                <li> <i class="fa fa-folder-open fa-fw"></i> 分类总数：5 个</li>
                <li> <i class="fa fa-comments fa-fw"></i> 留言数量：0 条</li>
                <li> <i class="fa fa-users fa-fw"></i> 在线人数：<span class="online">1</span>人</li>
                <li> <i class="fa fa-calendar fa-fw"></i> 运行天数：357天</li>
                <li> <i class="fa fa-pencil-square fa-fw"></i> 最后更新：2024年06月14日23点</li>
                <li> <i class="fa fa-vine fa-fw"></i>  系统版本：v3.0.0</li>
        </ul>
    </div>
    <div class="ad-mark" id="SIDEBAR_BOTTOM" style="display: none"></div>
</div>
    </div>
</div>
<div id="lockModal" class="modal fade" tabindex="-1" role="dialog" aria-labelledby="myModalLabel" aria-hidden="true" data-keyboard="false">
    <div class="modal-dialog" role="document">
        <div class="modal-content">
            <div class="modal-header">
                <button type="button" class="close" data-dismiss="modal" aria-label="Close"><span aria-hidden="true">&times;</span></button>
                <h4 class="modal-title" id="myModalLabel">输入密码查看文章详情</h4>
            </div>
            <div class="modal-body">
                <input type="text" name="password" id="password" class="form-control" placeholder="请输入文章密码">
            </div>
            <div class="modal-footer">
                <button type="button" class="btn btn-primary" id="verifyPassword">确定</button>
            </div>
        </div>
    </div>
</div>
<div class="modal fade nav-search-box" tabindex="-1" role="dialog" aria-labelledby="navSearchModalLabel">
    <div class="modal-dialog modal-lg" role="document">
        <div class="modal-content">
            <div class="modal-header" style="padding: 5px 15px;">
                <button type="button" class="close" data-dismiss="modal" aria-label="Close" style="margin-top: 10px;"><span aria-hidden="true">&times;</span></button>
                <h4 id="navSearchModalLabel"><i class="fa fa-search"></i> 搜索文章</h4>
            </div>
            <div class="modal-body">
                <form action="/" method="post" class="form-horizontal searchForm" id="searchForm">
                    <input type="hidden" name="pageNumber" value="1">
                    <div class="input-group bottom-line">
                        <input type="text" class="form-control br-none" name="keywords" value="" required="required" placeholder="输入搜索内容">
                        <span class="input-group-btn">
                        <button class="btn btn-default br-none nav-search-btn pointer" type="submit"><i class="fa fa-search"></i> 搜索</button>
                    </span>
                    </div>
                    <div class="clear"></div>
                    <ul class="list-unstyled list-inline search-hot">
                        <li><strong style="position: relative;top: 2px;color: #999999;">热门搜索：</strong></li>
                                    <li><a class="pointer" rel="external nofollow"><span class="label label-info">Java</span></a></li>
                                    <li><a class="pointer" rel="external nofollow"><span class="label label-info">SpringBoot</span></a></li>
                    </ul>
                </form>
            </div>
        </div>
    </div>
</div>
<!--评论弹框-->
<div class="modal fade bs-example-modal-sm" id="comment-detail-modal" tabindex="-1" role="dialog" aria-labelledby="comment-detail-modal-label">
    <div class="modal-dialog" role="document">
        <div class="modal-content">
            <div class="modal-header">
                <button type="button" class="close" data-dismiss="modal" aria-label="Close"><span aria-hidden="true">&times;</span></button>
                <h4 class="modal-title" id="comment-detail-modal-label">评论信息框</h4>
                <small><i class="fa fa-lightbulb-o fa-fw"></i>可以通过QQ号实时获取昵称和头像</small>
            </div>
            <div class="modal-body">
                <form id="detail-form">
                    <input type="hidden" name="avatar">
                    <div class="form-group input-logo">
                        <input type="text" class="form-control" name="qq" placeholder="选填" value="">
                        <img class="pull-left hide" alt="">
                        <span class="fa fa-qq pull-left" aria-hidden="true">QQ</span>
                    </div>
                    <div class="form-group input-logo">
                        <input type="text" class="form-control" name="nickname" placeholder="必填" value="匿名">
                        <span class="fa fa-user pull-left" aria-hidden="true">昵称</span>
                    </div>
                    <div class="form-group input-logo">
                        <input type="text" class="form-control" name="email" placeholder="选填">
                        <span class="fa fa-envelope pull-left" aria-hidden="true">邮箱</span>
                    </div>
                    <div class="form-group input-logo">
                        <input type="text" class="form-control" name="url" placeholder="选填">
                        <span class="fa fa-globe pull-left" aria-hidden="true">网址</span>
                    </div>
                    <div class="form-group">
                        <button type="button" class="btn btn-default btn-sm" id="detail-form-btn"><i class="fa fa-smile-o"></i>提交评论</button>
                    </div>
                </form>
            </div>
        </div>
    </div>
</div>
<div class="modal fade" id="reward" tabindex="-1" role="dialog">
    <div class="modal-dialog">
        <div class="modal-content">
            <div class="modal-header">
                <button type="button" class="close" data-dismiss="modal" aria-label="Close"><span aria-hidden="true">&times;</span></button>
                <h4 class="modal-title">山无棱江水为竭，冬雷震震夏雨雪，才敢请君舍</h4>
            </div>
            <div class="modal-body">
                <div class="rewardType" align="center">
                    <ul class="list-unstyled list-inline">
                        <li style="margin-right: 20px;">
                            <input type="radio" name="type" id="alipay" onclick="PaymentUtils.change(0)" data-index="0" checked="checked" ><span style="margin-left: 5px;">支付宝</span>
                        </li>
                        <li style="margin-right: 20px;">
                            <input type="radio" name="type" id="wechat" onclick="PaymentUtils.change(1)" data-index="1"><span style="margin-left: 5px;">微信</span>
                        </li>
                    </ul>
                </div>
                <div id="qrcode-container" align="center" style="margin-top: 10px;"></div>
                <div style="width: 100%;color: #a3a3a3;font-size: 16px;font-family: 'Microsoft YaHei';text-align: center;">
                    转账时请备注“<strong>博客赞助</strong>”
                </div>
            </div>
        </div>
        <small class="font-bold"></small>
    </div>
    <small class="font-bold"> </small>
</div>
<div id="loading">
    <div class="filter"></div>
    <div class="loader">
        <div class="loading-1"></div>
        <div class="loading-2">Loading...</div>
    </div>
</div>
        <footer class="footer">
            <div class="container">
                <div class="row">
                    <div class="col col-xs-12 col-md-12 col-lg-12">
                        <ul class="list-unstyled list-inline">
                            <li>其他链接：</li>
                            <li><a href="https://lanzi.cyou/sitemap.html" target="_blank" title="网站地图" data-toggle="tooltip" data-placement="bottom"><i class="fa fa-map-o fa-fw"></i>网站地图</a></li>
                            <li><a href="https://lanzi.cyou/recommended" title="站长推荐" data-toggle="tooltip" data-placement="bottom"><i class="fa fa-thumbs-o-up fa-fw"></i>站长推荐</a></li>
                            <li><a href="https://lanzi.cyou/updateLog" title="更新记录" data-toggle="tooltip" data-placement="bottom"><i class="fa fa-file-o fa-fw"></i>更新记录</a></li>
                            <li><a href="https://lanzi.cyou/archives" title="归档目录" data-toggle="tooltip" data-placement="bottom"><i class="fa fa-folder-o fa-fw"></i>归档目录</a></li>
                            <li><a href="https://lanzi.cyou/disclaimer" title="免责声明" data-toggle="tooltip" data-placement="bottom"><i class="fa fa-file-o fa-fw"></i>免责声明</a></li>
                        </ul>
                        <p>托管于<a href="https://promotion.aliyun.com/ntms/act/ambassador/sharetouser.html?userCode=wylo59db" target="_blank" title="阿里云-为了无法计算的价值" data-toggle="tooltip" data-placement="bottom" rel="external nofollow">阿里云</a> & <a href="https://portal.qiniu.com/signup?code=3l8yx2v0f21ci" target="_blank" title="七牛云-国内领先的企业级云服务商" data-toggle="tooltip" data-placement="bottom" rel="external nofollow">七牛云</a></p>
                    </div>
                    <div class="col col-md-4"></div>
                </div>
            </div>
        </footer>
    <footer class="footer">
        <div class="container">
            <div class="row">
                <div class="col col-xs-12 col-md-12 col-lg-12">
                    <p>© 2024 lanzi.cyou. Content is licensed under a <a href="https://creativecommons.org/licenses/by/3.0/" title="创作共用署名 3.0" data-toggle="tooltip" data-placement="right" target="_blank" style="color: #4286ca;font-weight: 600;">Creative Commons Attribution 3.0 Unported License</a>.</p>

                </div>
            </div>
        </div>
    </footer>
<a class="to-top" title="点击返回顶部" data-toggle="tooltip" data-placement="bottom"></a>
    <script type="text/javascript" src="https://cdn.staticfile.org/jquery/1.11.1/jquery.min.js"></script>
    <script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.5/js/bootstrap.min.js"></script>
    <script type="text/javascript" src="https://cdn.staticfile.org/jquery.lazyload/1.9.1/jquery.lazyload.min.js"></script>
    <script type="text/javascript" src="https://cdn.staticfile.org/jquery-confirm/3.3.2/jquery-confirm.min.js"></script>
    <script type="text/javascript" src="https://cdn.staticfile.org/fancybox/2.1.5/jquery.fancybox.min.js"></script>
    <script type="text/javascript" src="https://cdn.staticfile.org/bootstrap-validator/0.5.3/js/bootstrapValidator.min.js"></script>
    <script type="text/javascript" src="https://cdn.staticfile.org/nprogress/0.2.0/nprogress.min.js"></script>
    <script type="text/javascript" src="https://cdn.staticfile.org/js-xss/0.3.3/xss.min.js"></script>
    <script type="text/javascript" src="https://cdn.staticfile.org/mustache.js/2.3.0/mustache.min.js"></script>
<script type="text/javascript">
    // Page-level configuration exposed as globals.
    // NOTE(review): presumably read by the site scripts loaded after this
    // block (zhyd.core.js / zhyd.comment.js / zhyd.js) - confirm before renaming
    // any key. Declared with `var` on purpose so the names stay global.
    var appConfig = {
        siteName: "咖啡豆日记",
        wwwPath: "https://lanzi.cyou",
        cmsPath: "https://lanzi.cyou:8889",
        staticPath: "https://lanzi.cyou",
        lazyloadPath: "",
        fileStoragePath: "https://lanzi.cyou:8890/blogFiles/",
        // QR-code images for the reward dialog. The former `|| default.png`
        // fallbacks were dead code: a non-empty string literal is always truthy.
        wxPraiseCode: "https://lanzi.cyou:8890/blogFiles/oneblog/qrcode/20250108014802406.jpg",
        zfbPraiseCode: "https://lanzi.cyou:8890/blogFiles/oneblog/qrcode/20250108014802572.jpg",
        anonymous: "1",
        editorPlaceholder: "说点什么吧",
        editorAlert: "讲文明、要和谐",
        dynamicTitle: "您有一条新消息",
        bubbleWord: ""
    };

    // Details of the logged-in user; all empty in this rendering of the page.
    var oauthConfig = {
        loginUserId: "",
        loginUserName: "",
        loginUserAvatar: ""
    };
</script>
<script type="text/javascript" src="https://lanzi.cyou/js/zhyd.core.js"></script>
<script type="text/javascript" src="https://lanzi.cyou/js/zhyd.comment.js"></script>
<script type="text/javascript" src="https://lanzi.cyou/js/zhyd.js"></script>
<script type="text/javascript" id="customJs">
    
</script>

    <script type="text/javascript" src="https://cdn.jsdelivr.net/npm/highlight.js@9.12.0/lib/highlight.min.js"></script>
	<script type="text/javascript" src="https://cdn.jsdelivr.net/npm/simplemde@1.11.2/dist/simplemde.min.js"></script>
    <script type="text/javascript" src="https://cdn.jsdelivr.net/npm/social-share.js@1.0.16/dist/js/social-share.min.js"></script>
    <script src="https://res.wx.qq.com/open/js/jweixin-1.6.0.js" type="text/javascript"></script>

    <script>
        // Inline script for the article page. It does three things:
        //   1. opens the password dialog when the article is flagged private,
        //   2. wires the dialog's confirm button to the password check endpoint,
        //   3. configures the WeChat JS-SDK share cards once the DOM is ready.
        // Relies on the globals `$` (jQuery) and `wx` (WeChat JS-SDK) loaded by
        // earlier <script> tags.

        // NOTE(review): presumably rendered non-empty by the server for
        // password-protected articles - confirm against the template.
        var isPrivate = '';
        // Any non-empty value opens the dialog (same truthiness test as before;
        // the extra `== 'true'` comparison was redundant).
        if (isPrivate) {
            $("#lockModal").modal('show');
        }

        // Submit the entered password; on a 200 status the returned content
        // replaces the article body and the dialog is closed.
        $("#verifyPassword").click(function () {
            var password = $("#password").val();
            var articleId = "10";
            $.post("/api/verifyArticlePassword", {articleId: articleId, password: password}, function (json) {
                // Response is first handed to the site's $.alert.ajaxSuccess
                // helper (defined outside this block).
                $.alert.ajaxSuccess(json);
                if (json.status === 200) {
                    $(".blog-info-body").html(json.data);
                    $("#lockModal").modal('hide');
                }
            });
        });

        $(function () {
            // URL of the current page without the hash fragment.
            var url = location.href.split("#")[0];
            // NOTE(review): $.post form-encodes data values itself, so the server
            // receives this already-encoded string - confirm the backend decodes
            // it before computing the signature.
            var encodeUrl = encodeURIComponent(url);

            var title = "Python爬虫Scrapy";
            // Line breaks must be written as \n escapes: a raw newline inside a
            // quoted string literal is a SyntaxError that stops this whole
            // <script> block from running.
            var desc = "1.简介\n1.1Scrapy\nScrapy是一个用于Web数据抓取的强大开源框架，主要用于从网站上抓取结构化数据，如HTML和XML文件，或者API返回的数据。Scrapy使用Python语言编写，它不仅仅是一个简单的网页抓取工具，而是包含了自动化、灵活的数据处理、数据存储等功能的完整框架。Scrapy的设计理念是模块化和可扩展的，支持中间件、Item Pipelines、信号和事件，以及多种数据";
            var imgUrl = "https://lanzi.cyou:8890/blogFiles/oneblog/20240714074602181.jpg";

            $.post("/api/jssdkGetSignature", {url: encodeUrl}, function (json) {
                // Without a successful signature response there is nothing to configure.
                if (json.status !== 200) {
                    return;
                }

                var signData = json.data;

                wx.config({
                    debug: false, // true: debug mode - every API result is alert()ed on the client; on a PC the passed parameters are logged instead
                    appId: signData.appid, // required: unique id of the official account
                    timestamp: signData.timestamp, // required: timestamp used to generate the signature
                    nonceStr: signData.noncestr, // required: random string used to generate the signature
                    signature: signData.signature, // required: the signature itself
                    jsApiList: ["updateAppMessageShareData", "updateTimelineShareData"] // required: JS APIs this page uses
                });

                // Runs when config validation fails (e.g. an expired signature);
                // details are in `res`, or enable debug mode above.
                wx.error(function (res) {
                    console.log(JSON.stringify(res));
                });

                var mTitle = title + '| 蜂唤信息公众号';
                wx.ready(function () {
                    // Must be called before the user can tap the share button:
                    // customises the "share to Moments" / "share to QQ Zone" card.
                    wx.updateTimelineShareData({
                        title: mTitle, // share title
                        link: url, // share link; domain/path must match the account's JS-safe domain
                        imgUrl: imgUrl, // share icon
                        success: function () {
                            // share data set successfully
                        }
                    });
                });

                var nTitle = '您有新消息| ' + title + '| 蜂唤信息公众号';
                wx.ready(function () {
                    // Must be called before the user can tap the share button:
                    // customises the "send to friend" / "share to QQ" card.
                    wx.updateAppMessageShareData({
                        title: nTitle, // share title
                        desc: desc, // share description
                        link: url, // share link; domain/path must match the account's JS-safe domain
                        imgUrl: imgUrl, // share icon
                        success: function () {
                            // share data set successfully
                        }
                    });
                });
            });
        });
    </script>

    </body>
</html>