You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
675 lines
28 KiB
675 lines
28 KiB
6 years ago
|
|
||
|
<!DOCTYPE HTML>
|
||
|
<html lang="zh-Hans">
|
||
|
<head>
|
||
|
<meta charset="UTF-8">
|
||
|
<meta content="text/html; charset=utf-8" http-equiv="Content-Type">
|
||
|
<title>特征工程 · GitBook</title>
|
||
|
<meta http-equiv="X-UA-Compatible" content="IE=edge" />
|
||
|
<meta name="description" content="">
|
||
|
<meta name="generator" content="GitBook 3.2.3">
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
<link rel="stylesheet" href="../gitbook/style.css">
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
<link rel="stylesheet" href="../gitbook/gitbook-plugin-katex/katex.min.css">
|
||
|
|
||
|
|
||
|
|
||
|
<link rel="stylesheet" href="../gitbook/gitbook-plugin-highlight/website.css">
|
||
|
|
||
|
|
||
|
|
||
|
<link rel="stylesheet" href="../gitbook/gitbook-plugin-search/search.css">
|
||
|
|
||
|
|
||
|
|
||
|
<link rel="stylesheet" href="../gitbook/gitbook-plugin-fontsettings/website.css">
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
<meta name="HandheldFriendly" content="true"/>
|
||
|
<meta name="viewport" content="width=device-width, initial-scale=1, user-scalable=no">
|
||
|
<meta name="apple-mobile-web-app-capable" content="yes">
|
||
|
<meta name="apple-mobile-web-app-status-bar-style" content="black">
|
||
|
<link rel="apple-touch-icon-precomposed" sizes="152x152" href="../gitbook/images/apple-touch-icon-precomposed-152.png">
|
||
|
<link rel="shortcut icon" href="../gitbook/images/favicon.ico" type="image/x-icon">
|
||
|
|
||
|
|
||
|
<link rel="next" href="fit and predict.html" />
|
||
|
|
||
|
|
||
|
<link rel="prev" href="EDA.html" />
|
||
|
|
||
|
|
||
|
</head>
|
||
|
<body>
|
||
|
|
||
|
<div class="book">
|
||
|
<div class="book-summary">
|
||
|
|
||
|
|
||
|
<div id="book-search-input" role="search">
|
||
|
<input type="text" placeholder="Type to search" />
|
||
|
</div>
|
||
|
|
||
|
|
||
|
<nav role="navigation">
|
||
|
|
||
|
|
||
|
|
||
|
<ul class="summary">
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
<li class="chapter " data-level="1.1" data-path="../">
|
||
|
|
||
|
<a href="../">
|
||
|
|
||
|
|
||
|
简介
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.2" data-path="../machine_learning.html">
|
||
|
|
||
|
<a href="../machine_learning.html">
|
||
|
|
||
|
|
||
|
机器学习概述
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.3" data-path="../algorithm.html">
|
||
|
|
||
|
<a href="../algorithm.html">
|
||
|
|
||
|
|
||
|
常见机器学习算法
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
<ul class="articles">
|
||
|
|
||
|
|
||
|
<li class="chapter " data-level="1.3.1" data-path="../kNN.html">
|
||
|
|
||
|
<a href="../kNN.html">
|
||
|
|
||
|
|
||
|
近朱者赤近墨者黑-kNN
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.3.2" data-path="../linear_regression.html">
|
||
|
|
||
|
<a href="../linear_regression.html">
|
||
|
|
||
|
|
||
|
最简单的回归算法-线性回归
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.3.3" data-path="../logistic_regression.html">
|
||
|
|
||
|
<a href="../logistic_regression.html">
|
||
|
|
||
|
|
||
|
使用回归的思想进行分类-逻辑回归
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.3.4" data-path="../decision_tree.html">
|
||
|
|
||
|
<a href="../decision_tree.html">
|
||
|
|
||
|
|
||
|
最接近人类思维的算法-决策树
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.3.5" data-path="../random_forest.html">
|
||
|
|
||
|
<a href="../random_forest.html">
|
||
|
|
||
|
|
||
|
群众的力量是伟大的-随机森林
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.3.6" data-path="../kMeans.html">
|
||
|
|
||
|
<a href="../kMeans.html">
|
||
|
|
||
|
|
||
|
物以类聚人以群分-kMeans
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.3.7" data-path="../AGNES.html">
|
||
|
|
||
|
<a href="../AGNES.html">
|
||
|
|
||
|
|
||
|
以距离为尺-AGNES
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
|
||
|
</ul>
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.4" data-path="../metrics.html">
|
||
|
|
||
|
<a href="../metrics.html">
|
||
|
|
||
|
|
||
|
模型评估指标
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
<ul class="articles">
|
||
|
|
||
|
|
||
|
<li class="chapter " data-level="1.4.1" data-path="../classification_metrics.html">
|
||
|
|
||
|
<a href="../classification_metrics.html">
|
||
|
|
||
|
|
||
|
分类性能评估指标
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.4.2" data-path="../regression_metrics.html">
|
||
|
|
||
|
<a href="../regression_metrics.html">
|
||
|
|
||
|
|
||
|
回归性能评估指标
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.4.3" data-path="../cluster_metrics.html">
|
||
|
|
||
|
<a href="../cluster_metrics.html">
|
||
|
|
||
|
|
||
|
聚类性能评估指标
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
|
||
|
</ul>
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.5" data-path="../sklearn.html">
|
||
|
|
||
|
<a href="../sklearn.html">
|
||
|
|
||
|
|
||
|
使用sklearn进行机器学习
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.6" >
|
||
|
|
||
|
<span>
|
||
|
|
||
|
|
||
|
综合实战案例
|
||
|
|
||
|
</span>
|
||
|
|
||
|
|
||
|
|
||
|
<ul class="articles">
|
||
|
|
||
|
|
||
|
<li class="chapter " data-level="1.6.1" >
|
||
6 years ago
|
|
||
|
<span>
|
||
|
|
||
|
|
||
|
泰坦尼克生还预测
|
||
|
|
||
|
</span>
|
||
|
|
||
|
|
||
|
|
||
|
<ul class="articles">
|
||
|
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.1.1" data-path="introduction.html">
|
||
6 years ago
|
|
||
|
<a href="introduction.html">
|
||
|
|
||
|
|
||
|
简介
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.1.2" data-path="EDA.html">
|
||
6 years ago
|
|
||
|
<a href="EDA.html">
|
||
|
|
||
|
|
||
|
探索性数据分析(EDA)
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter active" data-level="1.6.1.3" data-path="feature engerning.html">
|
||
6 years ago
|
|
||
|
<a href="feature engerning.html">
|
||
|
|
||
|
|
||
|
特征工程
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.1.4" data-path="fit and predict.html">
|
||
6 years ago
|
|
||
|
<a href="fit and predict.html">
|
||
|
|
||
|
|
||
|
构建模型进行预测
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.1.5" data-path="tuning.html">
|
||
6 years ago
|
|
||
|
<a href="tuning.html">
|
||
|
|
||
|
|
||
|
调参
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
|
||
|
</ul>
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.2" >
|
||
6 years ago
|
|
||
|
<span>
|
||
|
|
||
|
|
||
|
使用强化学习玩乒乓球游戏
|
||
|
|
||
|
</span>
|
||
|
|
||
|
|
||
|
|
||
|
<ul class="articles">
|
||
|
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.2.1" data-path="../pingpong/what is reinforce learning.html">
|
||
6 years ago
|
|
||
|
<a href="../pingpong/what is reinforce learning.html">
|
||
|
|
||
|
|
||
|
什么是强化学习
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.2.2" data-path="../pingpong/Policy Gradient.html">
|
||
6 years ago
|
|
||
|
<a href="../pingpong/Policy Gradient.html">
|
||
|
|
||
|
|
||
|
Policy Gradient原理
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
6 years ago
|
<li class="chapter " data-level="1.6.2.3" data-path="../pingpong/coding.html">
|
||
6 years ago
|
|
||
|
<a href="../pingpong/coding.html">
|
||
|
|
||
|
|
||
|
使用Policy Gradient玩乒乓球游戏
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
|
||
|
</ul>
|
||
|
|
||
|
</li>
|
||
|
|
||
|
|
||
6 years ago
|
</ul>
|
||
|
|
||
|
</li>
|
||
|
|
||
|
<li class="chapter " data-level="1.7" data-path="../recommand.html">
|
||
|
|
||
|
<a href="../recommand.html">
|
||
|
|
||
|
|
||
|
实训推荐
|
||
|
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</li>
|
||
|
|
||
|
|
||
6 years ago
|
|
||
|
|
||
|
<li class="divider"></li>
|
||
|
|
||
|
<li>
|
||
|
<a href="https://www.gitbook.com" target="_blank" rel="noopener noreferrer" class="gitbook-link">
|
||
|
Published with GitBook
|
||
|
</a>
|
||
|
</li>
|
||
|
</ul>
|
||
|
|
||
|
|
||
|
</nav>
|
||
|
|
||
|
|
||
|
</div>
|
||
|
|
||
|
<div class="book-body">
|
||
|
|
||
|
<div class="body-inner">
|
||
|
|
||
|
|
||
|
|
||
|
<div class="book-header" role="navigation">
|
||
|
|
||
|
|
||
|
<!-- Title -->
|
||
|
<h1>
|
||
|
<i class="fa fa-circle-o-notch fa-spin"></i>
|
||
|
<a href=".." >特征工程</a>
|
||
|
</h1>
|
||
|
</div>
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
<div class="page-wrapper" tabindex="-1" role="main">
|
||
|
<div class="page-inner">
|
||
|
|
||
|
<div id="book-search-results">
|
||
|
<div class="search-noresults">
|
||
|
|
||
|
<section class="normal markdown-section">
|
||
|
|
||
|
<h1 id="特征工程">特征工程</h1>
|
||
|
<p>什么是特征工程?其实每当我们拿到数据时,并不是所有的特征都是有用的,可能有许多冗余的特征需要删掉,或者根据 EDA 的结果,我们可以根据已有的特征来添加新的特征,这其实就是特征工程。</p>
|
||
|
<p>接下来我们来尝试对一些特征进行处理。</p>
|
||
|
<h2 id="年龄离散化">年龄离散化</h2>
|
||
|
<p>年龄是一个连续型的数值特征,有的机器学习算法对于连续型数值特征不太友好,例如决策树、随机森林等 tree-based model。所以我们可以考虑将年龄转换成年龄段。例如将年龄不超过 16 岁的船客置为 0,大于 16 岁且不超过 32 岁的置为 1 等。</p>
|
||
|
<pre><code class="lang-python">data[<span class="hljs-string">'Age_band'</span>]=<span class="hljs-number">0</span>
|
||
|
data.loc[data[<span class="hljs-string">'Age'</span>]<=<span class="hljs-number">16</span>,<span class="hljs-string">'Age_band'</span>]=<span class="hljs-number">0</span>
|
||
|
data.loc[(data[<span class="hljs-string">'Age'</span>]><span class="hljs-number">16</span>)&(data[<span class="hljs-string">'Age'</span>]<=<span class="hljs-number">32</span>),<span class="hljs-string">'Age_band'</span>]=<span class="hljs-number">1</span>
|
||
|
data.loc[(data[<span class="hljs-string">'Age'</span>]><span class="hljs-number">32</span>)&(data[<span class="hljs-string">'Age'</span>]<=<span class="hljs-number">48</span>),<span class="hljs-string">'Age_band'</span>]=<span class="hljs-number">2</span>
|
||
|
data.loc[(data[<span class="hljs-string">'Age'</span>]><span class="hljs-number">48</span>)&(data[<span class="hljs-string">'Age'</span>]<=<span class="hljs-number">64</span>),<span class="hljs-string">'Age_band'</span>]=<span class="hljs-number">3</span>
|
||
|
data.loc[data[<span class="hljs-string">'Age'</span>]><span class="hljs-number">64</span>,<span class="hljs-string">'Age_band'</span>]=<span class="hljs-number">4</span>
|
||
|
</code></pre>
|
||
|
<p><img src="../img/52.jpg" alt=""></p>
|
||
|
<p>我们可以看一下转换成年龄段后,年龄段与生还率的关系。</p>
|
||
|
<pre><code class="lang-python">sns.factorplot(<span class="hljs-string">'Age_band'</span>,<span class="hljs-string">'Survived'</span>,data=data,col=<span class="hljs-string">'Pclass'</span>)
|
||
|
plt.show()
|
||
|
</code></pre>
|
||
|
<p><img src="../img/53.jpg" alt="按船舱等级(Pclass)分列的年龄段(Age_band)与生还率(Survived)关系图"></p>
|
||
|
<p>可以看出和我们之前 EDA 的结果相符,年龄越大,生还率越低。</p>
|
||
|
<h2 id="家庭成员数量与是否孤身一人">家庭成员数量与是否孤身一人</h2>
|
||
|
<p>由于家庭成员数量和是否孤身一人好像对于是否生还有影响,所以我们不妨添加新的特征。</p>
|
||
|
<pre><code class="lang-python">data[<span class="hljs-string">'Family_Size'</span>]=<span class="hljs-number">0</span>
|
||
|
data[<span class="hljs-string">'Family_Size'</span>]=data[<span class="hljs-string">'Parch'</span>]+data[<span class="hljs-string">'SibSp'</span>]
|
||
|
data[<span class="hljs-string">'Alone'</span>]=<span class="hljs-number">0</span>
|
||
|
data.loc[data.Family_Size==<span class="hljs-number">0</span>,<span class="hljs-string">'Alone'</span>]=<span class="hljs-number">1</span>
|
||
|
</code></pre>
|
||
|
<p>然后再可视化看一下</p>
|
||
|
<pre><code class="lang-python">f,ax=plt.subplots(<span class="hljs-number">1</span>,<span class="hljs-number">2</span>,figsize=(<span class="hljs-number">18</span>,<span class="hljs-number">6</span>))
|
||
|
sns.factorplot(<span class="hljs-string">'Family_Size'</span>,<span class="hljs-string">'Survived'</span>,data=data,ax=ax[<span class="hljs-number">0</span>])
|
||
|
ax[<span class="hljs-number">0</span>].set_title(<span class="hljs-string">'Family_Size vs Survived'</span>)
|
||
|
sns.factorplot(<span class="hljs-string">'Alone'</span>,<span class="hljs-string">'Survived'</span>,data=data,ax=ax[<span class="hljs-number">1</span>])
|
||
|
ax[<span class="hljs-number">1</span>].set_title(<span class="hljs-string">'Alone vs Survived'</span>)
|
||
|
plt.close(<span class="hljs-number">2</span>)
|
||
|
plt.close(<span class="hljs-number">3</span>)
|
||
|
plt.show()
|
||
|
</code></pre>
|
||
|
<p><img src="../img/54.jpg" alt="家庭成员数量(Family_Size)与生还率、是否孤身一人(Alone)与生还率的关系图"></p>
|
||
|
<p>从图中可以很明显地看出,如果你是一个人,那么生还的几率比较低,而且对于人数大于 4 人的家庭来说生还率也比较低。这可能也是一个比较好的特征,可以再深入地看一下。</p>
|
||
|
<pre><code class="lang-python">sns.factorplot(<span class="hljs-string">'Alone'</span>,<span class="hljs-string">'Survived'</span>,data=data,hue=<span class="hljs-string">'Sex'</span>,col=<span class="hljs-string">'Pclass'</span>)
|
||
|
plt.show()
|
||
|
</code></pre>
|
||
|
<p><img src="../img/55.jpg" alt="按船舱等级(Pclass)分列、按性别(Sex)区分的是否孤身一人(Alone)与生还率关系图"></p>
|
||
|
<p>可以看出,除了三等舱中孤身一人的女性生还率比有家人同行的女性高以外,孤身一人并不是什么好事。</p>
|
||
|
<h2 id="花费离散化">花费离散化</h2>
|
||
|
<p>和年龄一样,花费也是一个连续型的数值特征,所以我们不妨将其离散化。</p>
|
||
|
<pre><code class="lang-python">data[<span class="hljs-string">'Fare_cat'</span>]=<span class="hljs-number">0</span>
|
||
|
data.loc[data[<span class="hljs-string">'Fare'</span>]<=<span class="hljs-number">7.91</span>,<span class="hljs-string">'Fare_cat'</span>]=<span class="hljs-number">0</span>
|
||
|
data.loc[(data[<span class="hljs-string">'Fare'</span>]><span class="hljs-number">7.91</span>)&(data[<span class="hljs-string">'Fare'</span>]<=<span class="hljs-number">14.454</span>),<span class="hljs-string">'Fare_cat'</span>]=<span class="hljs-number">1</span>
|
||
|
data.loc[(data[<span class="hljs-string">'Fare'</span>]><span class="hljs-number">14.454</span>)&(data[<span class="hljs-string">'Fare'</span>]<=<span class="hljs-number">31</span>),<span class="hljs-string">'Fare_cat'</span>]=<span class="hljs-number">2</span>
|
||
|
data.loc[(data[<span class="hljs-string">'Fare'</span>]><span class="hljs-number">31</span>)&(data[<span class="hljs-string">'Fare'</span>]<=<span class="hljs-number">513</span>),<span class="hljs-string">'Fare_cat'</span>]=<span class="hljs-number">3</span>
|
||
|
|
||
|
sns.factorplot(<span class="hljs-string">'Fare_cat'</span>,<span class="hljs-string">'Survived'</span>,data=data,hue=<span class="hljs-string">'Sex'</span>)
|
||
|
plt.show()
|
||
|
</code></pre>
|
||
|
<p><img src="../img/56.jpg" alt="按性别(Sex)区分的花费区间(Fare_cat)与生还率关系图"></p>
|
||
|
<p>很明显,花费越多生还率越高,金钱决定命运。</p>
|
||
|
<h2 id="将字符串特征转换为数值型特征">将字符串特征转换为数值型特征</h2>
|
||
|
<p>由于我们的机器学习模型不支持字符串,所以需要将一些有用的字符串类型的特征转换成数值型的特征,比如:性别,口岸,姓名前缀。</p>
|
||
|
<pre><code class="lang-python">data[<span class="hljs-string">'Sex'</span>].replace([<span class="hljs-string">'male'</span>,<span class="hljs-string">'female'</span>],[<span class="hljs-number">0</span>,<span class="hljs-number">1</span>],inplace=<span class="hljs-keyword">True</span>)
|
||
|
data[<span class="hljs-string">'Embarked'</span>].replace([<span class="hljs-string">'S'</span>,<span class="hljs-string">'C'</span>,<span class="hljs-string">'Q'</span>],[<span class="hljs-number">0</span>,<span class="hljs-number">1</span>,<span class="hljs-number">2</span>],inplace=<span class="hljs-keyword">True</span>)
|
||
|
data[<span class="hljs-string">'Initial'</span>].replace([<span class="hljs-string">'Mr'</span>,<span class="hljs-string">'Mrs'</span>,<span class="hljs-string">'Miss'</span>,<span class="hljs-string">'Master'</span>,<span class="hljs-string">'Other'</span>],[<span class="hljs-number">0</span>,<span class="hljs-number">1</span>,<span class="hljs-number">2</span>,<span class="hljs-number">3</span>,<span class="hljs-number">4</span>],inplace=<span class="hljs-keyword">True</span>)
|
||
|
</code></pre>
|
||
|
<h2 id="删掉没多大用处的特征">删掉没多大用处的特征</h2>
|
||
|
<ul>
|
||
|
<li>姓名:难道姓名和生死有关系?这也太玄乎了,我不信,所以把它删掉(其中有用的姓名前缀已经保存在 Initial 特征中)。</li>
|
||
|
<li>年龄:由于已经根据年龄生成了新的特征“年龄段”,所以这个特征也需要删除。</li>
|
||
|
<li>票:票这个特征感觉是一堆随机的字符串,所以删掉。</li>
|
||
|
<li>花费:和年龄一样,由于已经根据花费生成了新的特征 Fare_cat,所以这个特征也删掉。</li>
|
||
|
<li>船舱:由于有很多缺失值,不好填充,所以可以考虑删掉。</li>
|
||
|
<li>船客ID:ID和生死应该没啥关系,所以删掉。</li>
|
||
|
</ul>
|
||
|
<pre><code class="lang-python">data.drop([<span class="hljs-string">'Name'</span>,<span class="hljs-string">'Age'</span>,<span class="hljs-string">'Ticket'</span>,<span class="hljs-string">'Fare'</span>,<span class="hljs-string">'Cabin'</span>,<span class="hljs-string">'PassengerId'</span>],axis=<span class="hljs-number">1</span>,inplace=<span class="hljs-keyword">True</span>)
|
||
|
</code></pre>
|
||
|
|
||
|
|
||
|
</section>
|
||
|
|
||
|
</div>
|
||
|
<div class="search-results">
|
||
|
<div class="has-results">
|
||
|
|
||
|
<h1 class="search-results-title"><span class='search-results-count'></span> results matching "<span class='search-query'></span>"</h1>
|
||
|
<ul class="search-results-list"></ul>
|
||
|
|
||
|
</div>
|
||
|
<div class="no-results">
|
||
|
|
||
|
<h1 class="search-results-title">No results matching "<span class='search-query'></span>"</h1>
|
||
|
|
||
|
</div>
|
||
|
</div>
|
||
|
</div>
|
||
|
|
||
|
</div>
|
||
|
</div>
|
||
|
|
||
|
</div>
|
||
|
|
||
|
|
||
|
|
||
|
<a href="EDA.html" class="navigation navigation-prev " aria-label="Previous page: 探索性数据分析(EDA)">
|
||
|
<i class="fa fa-angle-left"></i>
|
||
|
</a>
|
||
|
|
||
|
|
||
|
<a href="fit and predict.html" class="navigation navigation-next " aria-label="Next page: 构建模型进行预测">
|
||
|
<i class="fa fa-angle-right"></i>
|
||
|
</a>
|
||
|
|
||
|
|
||
|
|
||
|
</div>
|
||
|
|
||
|
<script>
|
||
|
var gitbook = gitbook || [];
|
||
|
gitbook.push(function() {
|
||
6 years ago
|
gitbook.page.hasChanged({"page":{"title":"特征工程","level":"1.6.1.3","depth":3,"next":{"title":"构建模型进行预测","level":"1.6.1.4","depth":3,"path":"titanic/fit and predict.md","ref":"./titanic/fit and predict.md","articles":[]},"previous":{"title":"探索性数据分析(EDA)","level":"1.6.1.2","depth":3,"path":"titanic/EDA.md","ref":"./titanic/EDA.md","articles":[]},"dir":"ltr"},"config":{"gitbook":"*","theme":"default","variables":{},"plugins":["katex"],"pluginsConfig":{"katex":{},"highlight":{},"search":{},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"fontsettings":{"theme":"white","family":"sans","size":2},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":false}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"}},"file":{"path":"titanic/feature engerning.md","mtime":"2019-07-05T01:24:43.597Z","type":"markdown"},"gitbook":{"version":"3.2.3","time":"2019-07-06T07:31:21.537Z"},"basePath":"..","book":{"language":""}});
|
||
6 years ago
|
});
|
||
|
</script>
|
||
|
</div>
|
||
|
|
||
|
|
||
|
<script src="../gitbook/gitbook.js"></script>
|
||
|
<script src="../gitbook/theme.js"></script>
|
||
|
|
||
|
|
||
|
<script src="../gitbook/gitbook-plugin-search/search-engine.js"></script>
|
||
|
|
||
|
|
||
|
|
||
|
<script src="../gitbook/gitbook-plugin-search/search.js"></script>
|
||
|
|
||
|
|
||
|
|
||
|
<script src="../gitbook/gitbook-plugin-lunr/lunr.min.js"></script>
|
||
|
|
||
|
|
||
|
|
||
|
<script src="../gitbook/gitbook-plugin-lunr/search-lunr.js"></script>
|
||
|
|
||
|
|
||
|
|
||
|
<script src="../gitbook/gitbook-plugin-sharing/buttons.js"></script>
|
||
|
|
||
|
|
||
|
|
||
|
<script src="../gitbook/gitbook-plugin-fontsettings/fontsettings.js"></script>
|
||
|
|
||
|
|
||
|
|
||
|
</body>
|
||
|
</html>
|
||
|
|