array(2) {
  ["docs"]=>
  array(10) {
    [0]=>
    array(10) {
      ["id"]=>
      string(3) "428"
      ["text"]=>
      string(77) "Visual Studio 2017 单独启动MSDN帮助（Microsoft Help Viewer）的方法"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(8) "DonetRen"
      ["tagsname"]=>
      string(55) "Visual Studio 2017|MSDN帮助|C#程序|.NET|Help Viewer"
      ["tagsid"]=>
      string(23) "[401,402,403,"300",404]"
      ["catesname"]=>
      string(0) ""
      ["catesid"]=>
      string(2) "[]"
      ["createtime"]=>
      string(10) "1511400964"
      ["_id"]=>
      string(3) "428"
    }
    [1]=>
    array(10) {
      ["id"]=>
      string(3) "427"
      ["text"]=>
      string(42) "npm -v；报错 cannot find module "wrapp""
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(4) "zzty"
      ["tagsname"]=>
      string(50) "node.js|npm|cannot find module &quot;wrapp“|node"
      ["tagsid"]=>
      string(19) "[398,"239",399,400]"
      ["catesname"]=>
      string(0) ""
      ["catesid"]=>
      string(2) "[]"
      ["createtime"]=>
      string(10) "1511400760"
      ["_id"]=>
      string(3) "427"
    }
    [2]=>
    array(10) {
      ["id"]=>
      string(3) "426"
      ["text"]=>
      string(54) "说说css中pt、px、em、rem都扮演了什么角色"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(12) "zhengqiaoyin"
      ["tagsname"]=>
      string(0) ""
      ["tagsid"]=>
      string(2) "[]"
      ["catesname"]=>
      string(0) ""
      ["catesid"]=>
      string(2) "[]"
      ["createtime"]=>
      string(10) "1511400640"
      ["_id"]=>
      string(3) "426"
    }
    [3]=>
    array(10) {
      ["id"]=>
      string(3) "425"
      ["text"]=>
      string(83) "深入学习JS执行--创建执行上下文（变量对象，作用域链，this）"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(7) "Ry-yuan"
      ["tagsname"]=>
      string(33) "Javascript|Javascript执行过程"
      ["tagsid"]=>
      string(13) "["169","191"]"
      ["catesname"]=>
      string(0) ""
      ["catesid"]=>
      string(2) "[]"
      ["createtime"]=>
      string(10) "1511399901"
      ["_id"]=>
      string(3) "425"
    }
    [4]=>
    array(10) {
      ["id"]=>
      string(3) "424"
      ["text"]=>
      string(30) "C# 排序技术研究与对比"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(9) "vveiliang"
      ["tagsname"]=>
      string(0) ""
      ["tagsid"]=>
      string(2) "[]"
      ["catesname"]=>
      string(8) ".Net Dev"
      ["catesid"]=>
      string(5) "[199]"
      ["createtime"]=>
      string(10) "1511399150"
      ["_id"]=>
      string(3) "424"
    }
    [5]=>
    array(10) {
      ["id"]=>
      string(3) "423"
      ["text"]=>
      string(72) "【算法】小白的算法笔记：快速排序算法的编码和优化"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(9) "penghuwan"
      ["tagsname"]=>
      string(6) "算法"
      ["tagsid"]=>
      string(7) "["344"]"
      ["catesname"]=>
      string(0) ""
      ["catesid"]=>
      string(2) "[]"
      ["createtime"]=>
      string(10) "1511398109"
      ["_id"]=>
      string(3) "423"
    }
    [6]=>
    array(10) {
      ["id"]=>
      string(3) "422"
      ["text"]=>
      string(64) "JavaScript数据可视化编程学习（二）Flotr2，雷达图"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(7) "chengxs"
      ["tagsname"]=>
      string(28) "数据可视化|前端学习"
      ["tagsid"]=>
      string(9) "[396,397]"
      ["catesname"]=>
      string(18) "前端基本知识"
      ["catesid"]=>
      string(5) "[198]"
      ["createtime"]=>
      string(10) "1511397800"
      ["_id"]=>
      string(3) "422"
    }
    [7]=>
    array(10) {
      ["id"]=>
      string(3) "421"
      ["text"]=>
      string(36) "C#表达式目录树（Expression）"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(4) "wwym"
      ["tagsname"]=>
      string(0) ""
      ["tagsid"]=>
      string(2) "[]"
      ["catesname"]=>
      string(4) ".NET"
      ["catesid"]=>
      string(7) "["119"]"
      ["createtime"]=>
      string(10) "1511397474"
      ["_id"]=>
      string(3) "421"
    }
    [8]=>
    array(10) {
      ["id"]=>
      string(3) "420"
      ["text"]=>
      string(47) "数据结构 队列_队列实例：事件处理"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(7) "idreamo"
      ["tagsname"]=>
      string(40) "C语言|数据结构|队列|事件处理"
      ["tagsid"]=>
      string(23) "["246","247","248",395]"
      ["catesname"]=>
      string(12) "数据结构"
      ["catesid"]=>
      string(7) "["133"]"
      ["createtime"]=>
      string(10) "1511397279"
      ["_id"]=>
      string(3) "420"
    }
    [9]=>
    array(10) {
      ["id"]=>
      string(3) "419"
      ["text"]=>
      string(47) "久等了,博客园官方Android客户端发布"
      ["intro"]=>
      string(288) "目录

ECharts
异步加载


ECharts
数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。
chart.setOption({
    color: [
        "
      ["username"]=>
      string(3) "cmt"
      ["tagsname"]=>
      string(0) ""
      ["tagsid"]=>
      string(2) "[]"
      ["catesname"]=>
      string(0) ""
      ["catesid"]=>
      string(2) "[]"
      ["createtime"]=>
      string(10) "1511396549"
      ["_id"]=>
      string(3) "419"
    }
  }
  ["count"]=>
  int(200)
}
<!DOCTYPE html>
<html lang="zh-CN">
<head>
<meta charset="utf-8" />
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<meta http-equiv="content-language" content="zh-CN" />
<meta http-equiv="X-UA-Compatible" content="IE=edge" /> 
    <title>TensorFlow 入门之手写识别CNN 三 - 爱码网</title>
     
<meta name="keywords" content="TensorFlow 入门之手写识别CNN 三" />
<meta name="description" content="目录ECharts异步加载ECharts数据可视化在过去几年中取得了巨大进展。开发人员对可视化产品的期望不再是简单的图表创建工具，而是在交互、性能、数据处理等方面有更高的要求。chart.setOption({    color: [" />
<meta name="viewport" content="width=device-width, initial-scale=1.0" />
<link rel="stylesheet" type="text/css" href="/statics/css/base.css?v=2.7" />
<script src="/statics/js/detail.min.js?v=2.2"></script>   
<script>
   $(document).ready(function () { 
		$("img").error(function () {
			$(this).hide();
		}); 
	}); 
</script>
</head>
<body class="home-template dtpg">
<nav class="main-nav clearfix">
    <div class="inner">
        <ul class="nav">
            <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/" title="爱码网">首页</a></li>
                        <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/nav/1.html" title="前端技术">前端技术</a></li>
                        <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/nav/9.html" title="编程语言">编程语言</a></li>
                        <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/nav/31.html" title="人工智能">人工智能</a></li>
                        <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/nav/41.html" title="运维知识">运维知识</a></li>
                        <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/nav/52.html" title="资源下载">资源下载</a></li>
                        <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/nav/68.html" title="常用小工具">常用小工具</a></li>
                        <li class="menu-item menu-item-type-custom menu-item-object-custom current-menu-item current_page_item menu-item-home menu-item-886"><a href="/nav/72.html" title="技术问答">技术问答</a></li>
                    </ul>            
	 
    </div>
</nav><div class="site-wrapper">
 
    <header style="height: auto;padding: 10px 0px;" class="main-header">
        <div style="max-width:910px" class="main-header-content inner">
                        <h1 class="page-title"><a href="/show-307861093.html" title="TensorFlow 入门之手写识别CNN 三">TensorFlow 入门之手写识别CNN 三</a></h1>
            
        </div>

    </header>
    <main class="content" role="main">
	

        <div class="leftbox">
    <article class="post tag-uifont tag-webview">
        <header class="post-header">
            <footer class="tc">  
                <time class="post-date" datetime="2022-12-23">2022-12-23</time>
            </footer>
        </header>
        <section class="post-content">
            <div class="contentbef">  
                  
                              </div>

            
                                    <div style='font-family: "Helvetica Neue", Helvetica, Tahoma, Arial, "Hiragino Sans GB", STHeiti, "Microsoft YaHei", "微软雅黑", "WenQuanYi Micro Hei", STXihei, "华文细黑", Heiti, "黑体", SimSun, "宋体", Song, sans-serif; font-size: 18px; line-height: 1.33; font-weight: 100; color: rgba(47, 47, 47, 1)'>
	<div class="preview html_preview">
<div class="story_tags" style="margin: 0 0 1.2em">
<div class="tag blue label" style="display: inline-block; vertical-align: baseline; line-height: 1; margin: 0.125em; background-color: rgba(102, 128, 153, 0.07); border-color: rgba(102, 128, 153, 0.07); background-image: none; padding: 0.6em 0.8em; color: rgba(0, 0, 0, 0.6); text-transform: none; font-weight: bold; border-radius: 0.2857rem; box-sizing: border-box; font-size: 0.7428rem">MNIST</div>
<div class="tag blue label" style="display: inline-block; vertical-align: baseline; line-height: 1; margin: 0.125em; background-color: rgba(102, 128, 153, 0.07); border-color: rgba(102, 128, 153, 0.07); background-image: none; padding: 0.6em 0.8em; color: rgba(0, 0, 0, 0.6); text-transform: none; font-weight: bold; border-radius: 0.2857rem; box-sizing: border-box; font-size: 0.7428rem"> 卷积神经网络</div>
<div class="tag blue label" style="display: inline-block; vertical-align: baseline; line-height: 1; margin: 0.125em; background-color: rgba(102, 128, 153, 0.07); border-color: rgba(102, 128, 153, 0.07); background-image: none; padding: 0.6em 0.8em; color: rgba(0, 0, 0, 0.6); text-transform: none; font-weight: bold; border-radius: 0.2857rem; box-sizing: border-box; font-size: 0.7428rem"> Fly</div>
</div>
<p style="margin: 0 0 1.1em; line-height: 1.6"></p>
<div class="toc"><ul style="padding: 0; margin: 0 0 10px 35px; list-style: none"><li>
<a href="#e5a49ae5b182e58db7e7a7afe7bd91e7bb9c_1" style="color: rgba(0, 136, 204, 1); text-decoration: none">多层卷积网络</a><ul style="padding: 0; margin: 0 0 0 35px; list-style: none">
<li><a href="#e5a49ae5b182e58db7e7a7afe7bd91e7bb9ce79a84e59fbae69cace79086e8aeba_2" style="color: rgba(0, 136, 204, 1); text-decoration: none">多层卷积网络的基本理论</a></li>
<li>
<a href="#e69e84e5bbbae4b880e4b8aae5a49ae5b182e58db7e7a7afe7bd91e7bb9c_3" style="color: rgba(0, 136, 204, 1); text-decoration: none">构建一个多层卷积网络</a><ul style="padding: 0; margin: 0 0 0 35px; list-style: none">
<li><a href="#e69d83e580bce5889de5a78be58c96_4" style="color: rgba(0, 136, 204, 1); text-decoration: none">权值初始化</a></li>
<li>
<a href="#e58db7e7a7afe5928ce6b1a0e58c96_5" style="color: rgba(0, 136, 204, 1); text-decoration: none">卷积和池化</a><ul style="padding: 0; margin: 0 0 0 35px; list-style: none">
<li><a href="#e7acace4b880e5b182e58db7e7a7af_6" style="color: rgba(0, 136, 204, 1); text-decoration: none">第一层卷积</a></li>
<li><a href="#e7acace4ba8ce5b182e58db7e7a7af_7" style="color: rgba(0, 136, 204, 1); text-decoration: none">第二层卷积</a></li>
</ul>
</li>
<li><a href="#e5af86e99b86e5b182e8bf9ee68ea5_8" style="color: rgba(0, 136, 204, 1); text-decoration: none">密集层连接</a></li>
<li><a href="#dropout_9" style="color: rgba(0, 136, 204, 1); text-decoration: none">Dropout</a></li>
<li><a href="#e8be93e587bae5b182_10" style="color: rgba(0, 136, 204, 1); text-decoration: none">输出层</a></li>
</ul>
</li>
<li><a href="#e8aeade7bb83e5928ce8af84e4bcb0e6a8a1e59e8b_11" style="color: rgba(0, 136, 204, 1); text-decoration: none">训练和评估模型</a></li>
</ul>
</li></ul></div>
<p style="margin: 0 0 1.1em; line-height: 1.6"></p>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e5a49ae5b182e58db7e7a7afe7bd91e7bb9c_1" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h2 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.6; color: inherit; text-rendering: optimizelegibility; font-size: 38.5px">多层卷积网络</h2>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e5a49ae5b182e58db7e7a7afe7bd91e7bb9ce79a84e59fbae69cace79086e8aeba_2" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 31.5px">多层卷积网络的基本理论</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">卷积神经网络(Convolutional Neural Network,CNN) 是一种前馈神经网络, 它的人工神经元可以响应一部分覆盖范围内的周围单元，对于大型图像处理有出色表现。它包括卷积层(alternating convolutional layer)和池化层(pooling layer)。</p>
<p style="margin: 0 0 1.1em; line-height: 1.6">多层卷积网络的基本可以参看下面这篇博文。</p>
<blockquote style="padding: 0 0 0 15px; margin: 0 0 20px; border-left: 5px solid rgba(221, 221, 221, 1)">
<ul style="padding: 0; margin: 0 0 10px 35px">
<li><a href="http://apinetree.blog.51cto.com/714152/1629641/" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow">Convolutional Neural Networks  卷积神经网络 </a></li>
<li><a href="http://dataunion.org/11692.html" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow">一文读懂卷积神经网络CNN</a></li>
</ul>
</blockquote>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e69e84e5bbbae4b880e4b8aae5a49ae5b182e58db7e7a7afe7bd91e7bb9c_3" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 31.5px">构建一个多层卷积网络</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">在前面一个笔记中，手写识别的正确率大概在91%左右，并不高。这里我们将使用卷积神经网络来改善效果，准确率会比前面高很多。</p>
<p style="margin: 0 0 1.1em; line-height: 1.6">为了创建这个模型，我们需要创建大量的权重和偏置项。这个模型中的权重在初始化时应该加入少量的噪声来打破对称性以及避免0梯度。由于我们使用的是ReLU神经元，因此比较好的做法是用一个较小的正数来初始化偏置项，以避免神经元节点输出恒为0的问题（dead neurons ）。</p>
<blockquote style="padding: 0 0 0 15px; margin: 0 0 20px; border-left: 5px solid rgba(221, 221, 221, 1)">
<p style="margin: 0; font-size: 16px; font-weight: 300; line-height: 25px">需要说明的是，<span class="mark" style="border: 0; background-color: rgba(221, 243, 231, 0.4); border-radius: 4px; color: rgba(41, 117, 77, 1); font-size: 90%; padding: 2px 4px">ReLU</span>就是类似<span class="mark" style="border: 0; background-color: rgba(221, 243, 231, 0.4); border-radius: 4px; color: rgba(41, 117, 77, 1); font-size: 90%; padding: 2px 4px">sigmoid</span>的函数。而且有研究表明，ReLU函数更加接近人体大脑的表现形式。</p>
</blockquote>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e69d83e580bce5889de5a78be58c96_4" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 24.5px">权值初始化</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">为了不在建立模型的时候反复做初始化操作，我们定义两个函数用于初始化。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-function" style="overflow: visible !important; color: rgba(6, 182, 239, 1)"><span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">def</span> <span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">weight_variable</span><span class="hljs-params" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">(shape)</span>:</span> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    initial = tf.truncated_normal(shape, stddev = <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">0.1</span>) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="3" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    <span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">return</span> tf.Variable(initial) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="4" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">     <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="5" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-function" style="overflow: visible !important; color: rgba(6, 182, 239, 1)"><span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">def</span> <span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">bias_variable</span><span class="hljs-params" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">(shape)</span>:</span> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="6" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    initial = tf.constant(<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">0.1</span>, shape = shape) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="7" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    <span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">return</span> tf.Variable(initial) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="8" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">     <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e58db7e7a7afe5928ce6b1a0e58c96_5" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 24.5px">卷积和池化</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">TensorFlow在卷积和池化上有很强的灵活性。我们怎么处理边界？步长应该设多大？在这个实例里，我们会一直使用vanilla版本。我们的卷积使用1步长（stride size），0边距（padding size）的模板，保证输出和输入是同一个大小。我们的池化用简单传统的2x2大小的模板做max pooling。为了代码更简洁，我们把这部分抽象成一个函数。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-function" style="overflow: visible !important; color: rgba(6, 182, 239, 1)"><span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">def</span> <span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">conv2d</span><span class="hljs-params" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">(x, W)</span>:</span> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    <span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">return</span> tf.nn.conv2d(x, W, strides=[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>], padding=<span class="hljs-string" style="overflow: visible !important; color: rgba(72, 182, 133, 1)">'SAME'</span>) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="3" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">     <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="4" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-function" style="overflow: visible !important; color: rgba(6, 182, 239, 1)"><span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">def</span> <span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">max_pool_2x2</span><span class="hljs-params" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">(x)</span>:</span> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="5" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-function" style="overflow: visible !important; color: rgba(6, 182, 239, 1)">    <span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">return</span> <span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">tf</span>.<span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">nn</span>.<span class="hljs-title" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">max_pool</span><span class="hljs-params" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">(x, ksize=[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">2</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">2</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>],strides=[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">2</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">2</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>], padding=<span class="hljs-string" style="overflow: visible !important; color: rgba(72, 182, 133, 1)">'SAME'</span>)</span></span> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="6" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-function" style="overflow: visible !important; color: rgba(6, 182, 239, 1)"></span> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e7acace4b880e5b182e58db7e7a7af_6" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h4 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 20px; color: inherit; text-rendering: optimizelegibility; font-size: 17.5px">第一层卷积</h4>
<p style="margin: 0 0 1.1em; line-height: 1.6">定义了卷积方式之后，我们就可以来实现<span class="mark" style="border: 0; background-color: rgba(221, 243, 231, 0.4); border-radius: 4px; color: rgba(41, 117, 77, 1); font-size: 90%; padding: 2px 4px">CNN</span>的第一层了。它是由一个卷积接一个池化来完成的。卷积在每个5x5的patch中算出32个特征，卷积的权重张量形状是[5, 5, 1, 32]，前两个维度是patch大小，接着是输入的通道数目，最后是输出的通道数目。同时每个输出通道还有一个对应的偏置量。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">W_conv1 = weight_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">5</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">5</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">32</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">b_conv1 = bias_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">32</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="3" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="4" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-comment" style="overflow: visible !important; color: rgba(119, 110, 113, 1)">#为了用这一层，我们把x变成一个4d向量，其第2、第3维对应图片的宽、高，最后一维代表图片的颜色通道数(因为是灰度图所以这里的通道数为1，如果是rgb彩色图，则为3)。</span> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="5" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="6" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">x_image = tf.reshape(x, [<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">-1</span>,<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">28</span>,<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">28</span>,<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="7" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="8" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">h_conv1 = tf.nn.relu(conv2d(x_image, W_conv1) + b_conv1) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="9" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">h_pool1 = max_pool_2x2(h_conv1) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="10" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e7acace4ba8ce5b182e58db7e7a7af_7" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h4 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 20px; color: inherit; text-rendering: optimizelegibility; font-size: 17.5px">第二层卷积</h4>
<p style="margin: 0 0 1.1em; line-height: 1.6">为了构建一个更深的网络，我们会把几个类似的层堆叠起来。第二层中，每个5x5的patch会得到64个特征。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">W_conv2 = weight_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">5</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">5</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">32</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">64</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">b_conv2 = bias_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">64</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="3" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="4" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">h_conv2 = tf.nn.relu(conv2d(h_pool1, W_conv2) + b_conv2) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="5" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">h_pool2 = max_pool_2x2(h_conv2) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="6" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e5af86e99b86e5b182e8bf9ee68ea5_8" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 24.5px">密集层连接</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">现在，图片尺寸减小到7x7，我们加入一个有1024个神经元的全连接层，用于处理整个图片。我们把池化层输出的张量reshape成一些向量，乘上权重矩阵，加上偏置，然后对其使用ReLU。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">W_fc1 = weight_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">7</span> * <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">7</span> * <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">64</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1024</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">b_fc1 = bias_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1024</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="3" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="4" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">h_pool2_flat = tf.reshape(h_pool2, [<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">-1</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">7</span>*<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">7</span>*<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">64</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="5" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat, W_fc1) + b_fc1) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="6" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="dropout_9" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 24.5px">Dropout</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">为了减少过拟合，我们在输出层之前加入dropout。我们用一个placeholder来代表一个神经元的输出在dropout中保持不变的概率。这样我们可以在训练过程中启用dropout，在测试过程中关闭dropout。 TensorFlow的tf.nn.dropout操作除了可以屏蔽神经元的输出外，还会自动处理神经元输出值的scale。所以用dropout的时候可以不用考虑scale。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">keep_prob = tf.placeholder(tf.float32) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">h_fc1_drop = tf.nn.dropout(h_fc1, keep_prob) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e8be93e587bae5b182_10" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 24.5px">输出层</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">最后添加一个softmax层。这与前面的softmax回归是一样的。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">W_fc2 = weight_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1024</span>, <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">10</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">b_fc2 = bias_variable([<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">10</span>]) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="3" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="4" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">y_conv=tf.nn.softmax(tf.matmul(h_fc1_drop, W_fc2) + b_fc2) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="5" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
<div class="xiaoshujiang_element xsj_anchor">
  <a name="e8aeade7bb83e5928ce8af84e4bcb0e6a8a1e59e8b_11" class="blank_anchor_name" target="_blank" style="color: rgba(0, 136, 204, 1); text-decoration: none" rel="nofollow" href="/default/index/url?u=aHR0cHM6Ly93d3cuY25ibG9ncy5jb20="></a><a></a>
</div>
<h3 style="margin: 1em 0 0.6em; font-family: inherit; font-weight: 500; line-height: 1.1; color: inherit; text-rendering: optimizelegibility; font-size: 24.5px">训练和评估模型</h3>
<p style="margin: 0 0 1.1em; line-height: 1.6">为了进行训练和评估，我们使用与之前简单的单层SoftMax神经网络模型几乎相同的一套代码，只是我们会用更加复杂的ADAM优化器来做梯度最速下降，在feed_dict中加入额外的参数keep_prob来控制dropout比例。然后每100次迭代输出一次日志。</p>
<div class="xiaoshujiang_code_container" style="margin: 1em 0; position: relative; padding-bottom: 2em"><div class="xiaoshujiang_pre" style="line-height: initial !important; word-wrap: break-word; word-break: break-all; tab-size: 4; font-family: monospace; white-space: pre"><div class="language-python hljs code_linenums xiaoshujiang_code" style="border: 0; border-radius: 4px; font-size: 90%; overflow: visible !important; position: relative; display: block; overflow-x: auto; background: rgba(231, 233, 219, 1); color: rgba(79, 66, 76, 1); padding: 0.5em; -webkit-text-size-adjust: none"><ol start="1" class="ol_linenums" style="counter-reset: lines 0; padding: 0; margin: 0 0 0 30px; overflow: visible !important; border-left: 1px solid rgba(224, 224, 224, 1)">
<li class="li_linenum  li_list_style" date-linenum="1" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">cross_entropy = tf.reduce_mean(-tf.reduce_sum(y_ * tf.log(y_conv), reduction_indices=[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>])) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="2" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="3" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">train_step = tf.train.AdamOptimizer(<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1e-4</span>).minimize(cross_entropy) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="4" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="5" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">correct_prediction = tf.equal(tf.argmax(y_conv,<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>), tf.argmax(y_,<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>)) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="6" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="7" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32)) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="8" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="9" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">sess.run(tf.initialize_all_variables()) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="10" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="11" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">
<span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">for</span> i <span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">in</span> range(<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">20000</span>): <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="12" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">  batch = mnist.train.next_batch(<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">50</span>) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="13" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">  <span class="hljs-keyword" style="overflow: visible !important; color: rgba(129, 91, 164, 1)">if</span> i%<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">100</span> == <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">0</span>: <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="14" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    train_accuracy = accuracy.eval(feed_dict={ <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="15" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">        x:batch[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">0</span>], y_: batch[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>], keep_prob: <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1.0</span>}) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="16" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    print(<span class="hljs-string" style="overflow: visible !important; color: rgba(72, 182, 133, 1)">"step %d, training accuracy %g"</span>%(i, train_accuracy)) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="17" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">  train_step.run(feed_dict={x: batch[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">0</span>], y_: batch[<span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1</span>], keep_prob: <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">0.5</span>}) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="18" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1"> <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="19" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">print(<span class="hljs-string" style="overflow: visible !important; color: rgba(72, 182, 133, 1)">"test accuracy %g"</span>%accuracy.eval(feed_dict={ <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
<li class="li_linenum  li_list_style" date-linenum="20" style="overflow: visible !important; line-height: 20px; margin-left: 5px; counter-increment: lines 1">    x: mnist.test.images, y_: mnist.test.labels, keep_prob: <span class="hljs-number" style="overflow: visible !important; color: rgba(249, 155, 21, 1)">1.0</span>})) <hr class="code_line_break_hack" style="margin: 0; border: 0; overflow: visible !important">
</li>
</ol></div></div></div>
</div>
</div> 
                    
            
                <div style="margin-top: 10px;">
                  </div> 
        </section>
	 
        <footer class="post-footer">
            <section class="author">
                                            </section>
        </footer>
        <p class="mt10">相关文章：</p>
        <div style="width: 100%;" class="contentcard">
      
            <div style="width: 100%;height: auto;" class="carditem litem clearfix"> 
                    <ul style="padding-left: 0rem;" class="cardcont">
                                            </ul>
               </div>   
         </div>
    </article>

  
</div>

<div class="rigthbox contentcard mt10">
 
          <div style="height: auto;" class="carditem litem">
    <div class="cardtit">猜你喜欢 </div>
        <ul class="cardcont">
                        </ul>
   </div> 

<div style="height: auto;" class="carditem litem">
    <div class="cardtit">相关资源 </div>
        <ul class="cardcont">
              
                            </ul>
   </div>
   
    <div style="height: auto;" class="carditem litem">
     <div class="cardtit">相似解决方案 </div>
         <ul class="cardcont">
                          </ul>
    </div>
  
   <div style="height: auto;background-color: #ddd;text-align: center;" class="carditem litem">
    <ins class="adsbygoogle" style="display:block" data-ad-client="ca-pub-5446233687289962" data-ad-slot="2607637140"  data-ad-format="auto"  data-full-width-responsive="true"></ins><script>(adsbygoogle = window.adsbygoogle || []).push({});</script>
</div> 
   <div  style="height: auto;" class="carditem litem mt20">
    <div class="cardtit">热门标签  </div>
    <div class="tagbox">
                    <a target="_blank" title="Java" href="/default/index/tags?cid=164&cname=Java" >Java</a>
                        <a target="_blank" title="Python" href="/default/index/tags?cid=367&cname=Python" >Python</a>
                        <a target="_blank" title="linux" href="/default/index/tags?cid=274&cname=linux" >linux</a>
                        <a target="_blank" title="javascript" href="/default/index/tags?cid=169&cname=javascript" >javascript</a>
                        <a target="_blank" title="Mysql" href="/default/index/tags?cid=237&cname=Mysql" >Mysql</a>
                        <a target="_blank" title="C#" href="/default/index/tags?cid=187&cname=C%23" >C#</a>
                        <a target="_blank" title="Docker" href="/default/index/tags?cid=243&cname=Docker" >Docker</a>
                        <a target="_blank" title="算法" href="/default/index/tags?cid=344&cname=%E7%AE%97%E6%B3%95" >算法</a>
                        <a target="_blank" title="前端" href="/default/index/tags?cid=160&cname=%E5%89%8D%E7%AB%AF" >前端</a>
                        <a target="_blank" title="SpringBoot" href="/default/index/tags?cid=168&cname=SpringBoot" >SpringBoot</a>
                        <a target="_blank" title="Redis" href="/default/index/tags?cid=227&cname=Redis" >Redis</a>
                        <a target="_blank" title="Vue" href="/default/index/tags?cid=236&cname=Vue" >Vue</a>
                        <a target="_blank" title="spring" href="/default/index/tags?cid=696&cname=spring" >spring</a>
                        <a target="_blank" title="设计模式" href="/default/index/tags?cid=632&cname=%E8%AE%BE%E8%AE%A1%E6%A8%A1%E5%BC%8F" >设计模式</a>
                        <a target="_blank" title=".net core" href="/default/index/tags?cid=381&cname=.net+core" >.net core</a>
                        <a target="_blank" title=".net" href="/default/index/tags?cid=300&cname=.net" >.net</a>
                        <a target="_blank" title="kubernetes" href="/default/index/tags?cid=2179&cname=kubernetes" >kubernetes</a>
                        <a target="_blank" title="c++" href="/default/index/tags?cid=312&cname=c%2B%2B" >c++</a>
                        <a target="_blank" title="数据库" href="/default/index/tags?cid=284&cname=%E6%95%B0%E6%8D%AE%E5%BA%93" >数据库</a>
                        <a target="_blank" title="数据结构" href="/default/index/tags?cid=247&cname=%E6%95%B0%E6%8D%AE%E7%BB%93%E6%9E%84" >数据结构</a>
                        <a target="_blank" title="大数据" href="/default/index/tags?cid=888&cname=%E5%A4%A7%E6%95%B0%E6%8D%AE" >大数据</a>
                        <a target="_blank" title="js" href="/default/index/tags?cid=159&cname=js" >js</a>
                        <a target="_blank" title="机器学习" href="/default/index/tags?cid=171&cname=%E6%9C%BA%E5%99%A8%E5%AD%A6%E4%B9%A0" >机器学习</a>
                        <a target="_blank" title="微服务" href="/default/index/tags?cid=832&cname=%E5%BE%AE%E6%9C%8D%E5%8A%A1" >微服务</a>
                        <a target="_blank" title="Android" href="/default/index/tags?cid=282&cname=Android" >Android</a>
                        <a target="_blank" title="Go" href="/default/index/tags?cid=839&cname=Go" >Go</a>
                        <a target="_blank" title="程序员" href="/default/index/tags?cid=327&cname=%E7%A8%8B%E5%BA%8F%E5%91%98" >程序员</a>
                        <a target="_blank" title="面试" href="/default/index/tags?cid=637&cname=%E9%9D%A2%E8%AF%95" >面试</a>
                        <a target="_blank" title="JVM" href="/default/index/tags?cid=727&cname=JVM" >JVM</a>
                        <a target="_blank" title="ASP.net core" href="/default/index/tags?cid=179&cname=ASP.net+core" >ASP.net core</a>
                        <a target="_blank" title="云原生" href="/default/index/tags?cid=22056&cname=%E4%BA%91%E5%8E%9F%E7%94%9F" >云原生</a>
                        <a target="_blank" title="人工智能" href="/default/index/tags?cid=270&cname=%E4%BA%BA%E5%B7%A5%E6%99%BA%E8%83%BD" >人工智能</a>
                        <a target="_blank" title="后端" href="/default/index/tags?cid=1089&cname=%E5%90%8E%E7%AB%AF" >后端</a>
                        <a target="_blank" title="PHP" href="/default/index/tags?cid=281&cname=PHP" >PHP</a>
                        <a target="_blank" title="git" href="/default/index/tags?cid=226&cname=git" >git</a>
                        <a target="_blank" title="CSS" href="/default/index/tags?cid=817&cname=CSS" >CSS</a>
                        <a target="_blank" title="golang" href="/default/index/tags?cid=409&cname=golang" >golang</a>
                        <a target="_blank" title="k8s" href="/default/index/tags?cid=5067&cname=k8s" >k8s</a>
                        <a target="_blank" title="Nginx" href="/default/index/tags?cid=373&cname=Nginx" >Nginx</a>
                        <a target="_blank" title="Django" href="/default/index/tags?cid=634&cname=Django" >Django</a>
                        <a target="_blank" title="mybatis" href="/default/index/tags?cid=720&cname=mybatis" >mybatis</a>
                        <a target="_blank" title="深度学习" href="/default/index/tags?cid=345&cname=%E6%B7%B1%E5%BA%A6%E5%AD%A6%E4%B9%A0" >深度学习</a>
                        <a target="_blank" title="多线程" href="/default/index/tags?cid=986&cname=%E5%A4%9A%E7%BA%BF%E7%A8%8B" >多线程</a>
                        <a target="_blank" title="React" href="/default/index/tags?cid=560&cname=React" >React</a>
                        <a target="_blank" title="架构" href="/default/index/tags?cid=2070&cname=%E6%9E%B6%E6%9E%84" >架构</a>
                        <a target="_blank" title="devops" href="/default/index/tags?cid=2662&cname=devops" >devops</a>
                        <a target="_blank" title="爬虫" href="/default/index/tags?cid=905&cname=%E7%88%AC%E8%99%AB" >爬虫</a>
                        <a target="_blank" title="云计算" href="/default/index/tags?cid=361&cname=%E4%BA%91%E8%AE%A1%E7%AE%97" >云计算</a>
                        <a target="_blank" title="Spring Boot" href="/default/index/tags?cid=201&cname=Spring+Boot" >Spring Boot</a>
                        <a target="_blank" title="LeetCode" href="/default/index/tags?cid=342&cname=LeetCode" >LeetCode</a>
                </div>
       
   </div>
   
        <div id="rightadbox" style="height: 300px;background-color: #ddd;text-align: center;" class="carditem litem">
            <ins class="adsbygoogle" style="display:block" data-ad-client="ca-pub-5446233687289962" data-ad-slot="2607637140"  data-ad-format="auto"  data-full-width-responsive="true"></ins><script>(adsbygoogle = window.adsbygoogle || []).push({});</script>
        </div> 
</div>
<div class="clearfix"></div>
</main>
    
<div class="yllinks alink"></div>
 

<footer class="site-footer clearfix">
<section class="copyright">By &copy; 2026 <a href="/" title="www.likecs.com">likecs</a> 版权所有,<br/>本站所有数据收集于网络如有侵犯到您的权益请联系 进行下架处理。 </section>
<section class="poweredby">  <a target="_blank" href="https://beian.miit.gov.cn/">粤ICP备22038628号</a>Powered By  WordPress </section>
<script charset="UTF-8" id="LA_COLLECT" src="//sdk.51.la/js-sdk-pro.min.js"></script>
<script>LA.init({id: "Je3PjbvUssp6BbvY",ck: "Je3PjbvUssp6BbvY"})</script>
<script>
var _hmt = _hmt || [];
(function() {
  var hm = document.createElement("script");
  hm.src = "https://hm.baidu.com/hm.js?2eb031e42d29b7c1a1f16948d2ae2a9f";
  var s = document.getElementsByTagName("script")[0]; 
  s.parentNode.insertBefore(hm, s);
})();
</script>
</footer>  
</div>
<script>
    $(function(){
                    $(".post-content").append('<p style="padding: 20px;color: #cacaca;">原文链接：https://www.cnblogs.com/flyu6/p/7691004.html</p>')  
            }) 
</script> 
</body>
</html>