From e10541d3163c3c0dbf6d0b511433d80b6436a6f8 Mon Sep 17 00:00:00 2001
From: baniasbaabe <baniasbaabe@users.noreply.github.com>
Date: Sun, 4 Feb 2024 11:37:36 +0000
Subject: [PATCH] deploy: dccdefcd7ba1a7fa7861588a37cd8260448fdd59

---
 _sources/book/cooltools/Chapter.ipynb         | 39 ++++++++++++
 .../machinelearning/outlierdetection.ipynb    | 59 +++++++++++++++++++
 _sources/book/pandas/Chapter.ipynb            | 48 +++++++++++++++
 _sources/book/pythontricks/Chapter.ipynb      | 10 +++-
 book/cooltools/Chapter.html                   | 27 +++++++++
 book/machinelearning/outlierdetection.html    | 44 ++++++++++++++
 book/pandas/Chapter.html                      | 30 ++++++++++
 book/pythontricks/Chapter.html                |  4 ++
 searchindex.js                                |  2 +-
 9 files changed, 261 insertions(+), 2 deletions(-)

diff --git a/_sources/book/cooltools/Chapter.ipynb b/_sources/book/cooltools/Chapter.ipynb
index feec4ec..ffea5a4 100644
--- a/_sources/book/cooltools/Chapter.ipynb
+++ b/_sources/book/cooltools/Chapter.ipynb
@@ -1665,6 +1665,45 @@
     "        }\n",
     "    )"
    ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## SQL Query Builder in Python"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "You can build SQL queries in Python with pypika.\n",
+    "\n",
+    "pypika provides a simple interface to build SQL queries with an easy syntax.\n",
+    "\n",
+    "It supports nearly every SQL command."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from pypika import Tables, Query\n",
+    "\n",
+    "history, customers = Tables('history', 'customers')\n",
+    "q = Query \\\n",
+    "    .from_(history) \\\n",
+    "    .join(customers) \\\n",
+    "    .on(history.customer_id == customers.id) \\\n",
+    "    .select(history.star) \\\n",
+    "    .where(customers.id == 5)\n",
+    "    \n",
+    "q.get_sql()\n",
+    "# SELECT \"history\".* FROM \"history\" JOIN \"customers\" \n",
+    "# ON \"history\".\"customer_id\"=\"customers\".\"id\" WHERE \"customers\".\"id\"=5"
+   ]
   }
  ],
  "metadata": {
diff --git a/_sources/book/machinelearning/outlierdetection.ipynb b/_sources/book/machinelearning/outlierdetection.ipynb
index 1022f7e..3092056 100644
--- a/_sources/book/machinelearning/outlierdetection.ipynb
+++ b/_sources/book/machinelearning/outlierdetection.ipynb
@@ -83,6 +83,65 @@
     "    \n",
     "majority_vote(labels)"
    ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Robust Outlier Detection with `puncc`"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Outlier Detection is notoriously hard.\n",
+    "\n",
+    "But it doesn't have to be.\n",
+    "\n",
+    "`puncc` offers outlier detection, powered by Conformal Prediction, where the detection threshold will be calibrated.\n",
+    "\n",
+    "So, false alarms are reduced."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "!pip install puncc"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from sklearn.ensemble import IsolationForest\n",
+    "from deel.puncc.anomaly_detection import SplitCAD\n",
+    "from deel.puncc.api.prediction import BasePredictor\n",
+    "\n",
+    "# We need to redefine the predict to output the nonconformity scores.\n",
+    "class ADPredictor(BasePredictor):\n",
+    "    def predict(self, X):\n",
+    "        return -self.model.score_samples(X)\n",
+    "\n",
+    "# Wrap Isolation Forest in a predictor\n",
+    "if_predictor = ADPredictor(IsolationForest())\n",
+    "\n",
+    "# Instantiate CAD on top of IF predictor\n",
+    "if_cad = SplitCAD(if_predictor, train=True)\n",
+    "\n",
+    "\n",
+    "if_cad.fit(z=dataset, fit_ratio=0.7)\n",
+    "\n",
+    "# Maximum false detection rate\n",
+    "alpha = 0.01\n",
+    "\n",
+    "results = if_cad.predict(new_data, alpha=alpha)"
+   ]
   }
  ],
  "metadata": {
diff --git a/_sources/book/pandas/Chapter.ipynb b/_sources/book/pandas/Chapter.ipynb
index 4fead7e..aabb881 100644
--- a/_sources/book/pandas/Chapter.ipynb
+++ b/_sources/book/pandas/Chapter.ipynb
@@ -189,6 +189,54 @@
     "data = {'Value': [1.2343129, 5.8956701, 6.224289]}\n",
     "df = pd.DataFrame(data)"
    ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Faster I/O with Parquet"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Whenever you work with bigger datasets, please avoid using CSV format (or similar).\n",
+    "\n",
+    "CSV files are text files, which are human-readable, and therefore a popular option to store data.\n",
+    "\n",
+    "For small datasets, this is not a big issue.\n",
+    "\n",
+    "But, what if your data has millions of rows?\n",
+    "\n",
+    "It can get really slow to do read/write operations on them.\n",
+    "\n",
+    "On the other hand, binary files exist too.\n",
+    "\n",
+    "They consist of 0s and 1s and are not meant to be human-readable but to be used by programs that know how to interpret them.\n",
+    "\n",
+    "Because of that, binary files are more compact and consume less space.\n",
+    "\n",
+    "Parquet is a popular binary file format that is more storage-efficient than CSV."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import pandas as pd\n",
+    "\n",
+    "# Shape: (100000000, 5)\n",
+    "df = pd.DataFrame(...)\n",
+    "\n",
+    "# Time: 1m 58s\n",
+    "df.to_csv(\"data.csv\")\n",
+    "\n",
+    "# Time: 8s\n",
+    "df.to_parquet(\"data.parquet\")"
+   ]
   }
  ],
  "metadata": {
diff --git a/_sources/book/pythontricks/Chapter.ipynb b/_sources/book/pythontricks/Chapter.ipynb
index 0e64bb5..3b1ef79 100644
--- a/_sources/book/pythontricks/Chapter.ipynb
+++ b/_sources/book/pythontricks/Chapter.ipynb
@@ -961,7 +961,15 @@
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": []
+   "source": [
+    "One cool feature in Python 3.12:\n",
+    "\n",
+    "The new built-in syntax for Type Variables.\n",
+    "\n",
+    "You can use them to parametrize generic classes and functions.\n",
+    "\n",
+    "See below for a small example where our generic class is parametrized by T, which we indicate with [T]."
+   ]
   },
   {
    "cell_type": "code",
diff --git a/book/cooltools/Chapter.html b/book/cooltools/Chapter.html
index 9eb3d65..e06f1fd 100644
--- a/book/cooltools/Chapter.html
+++ b/book/cooltools/Chapter.html
@@ -449,6 +449,7 @@ <h2> Contents </h2>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#better-alternative-to-requests">2.1.32. Better Alternative to <code class="docutils literal notranslate"><span class="pre">requests</span></code></a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#managing-configurations-with-python-dotenv">2.1.33. Managing Configurations with <code class="docutils literal notranslate"><span class="pre">python-dotenv</span></code></a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#work-with-notion-via-python-with">2.1.34. Work with Notion via Python with</a></li>
+<li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#sql-query-builder-in-python">2.1.35. SQL Query Builder in Python</a></li>
 </ul>
             </nav>
         </div>
@@ -1462,6 +1463,31 @@ <h2><span class="section-number">2.1.34. </span>Work with Notion via Python with
 </div>
 </div>
 </section>
+<section id="sql-query-builder-in-python">
+<h2><span class="section-number">2.1.35. </span>SQL Query Builder in Python<a class="headerlink" href="#sql-query-builder-in-python" title="Permalink to this heading">#</a></h2>
+<p>You can build SQL queries in Python with pypika.</p>
+<p>pypika provides a simple interface to build SQL queries with an easy syntax.</p>
+<p>It supports nearly every SQL command.</p>
+<div class="cell docutils container">
+<div class="cell_input docutils container">
+<div class="highlight-python notranslate"><div class="highlight"><pre><span></span><span class="kn">from</span> <span class="nn">pypika</span> <span class="kn">import</span> <span class="n">Tables</span><span class="p">,</span> <span class="n">Query</span>
+
+<span class="n">history</span><span class="p">,</span> <span class="n">customers</span> <span class="o">=</span> <span class="n">Tables</span><span class="p">(</span><span class="s1">&#39;history&#39;</span><span class="p">,</span> <span class="s1">&#39;customers&#39;</span><span class="p">)</span>
+<span class="n">q</span> <span class="o">=</span> <span class="n">Query</span> \
+    <span class="o">.</span><span class="n">from_</span><span class="p">(</span><span class="n">history</span><span class="p">)</span> \
+    <span class="o">.</span><span class="n">join</span><span class="p">(</span><span class="n">customers</span><span class="p">)</span> \
+    <span class="o">.</span><span class="n">on</span><span class="p">(</span><span class="n">history</span><span class="o">.</span><span class="n">customer_id</span> <span class="o">==</span> <span class="n">customers</span><span class="o">.</span><span class="n">id</span><span class="p">)</span> \
+    <span class="o">.</span><span class="n">select</span><span class="p">(</span><span class="n">history</span><span class="o">.</span><span class="n">star</span><span class="p">)</span> \
+    <span class="o">.</span><span class="n">where</span><span class="p">(</span><span class="n">customers</span><span class="o">.</span><span class="n">id</span> <span class="o">==</span> <span class="mi">5</span><span class="p">)</span>
+    
+<span class="n">q</span><span class="o">.</span><span class="n">get_sql</span><span class="p">()</span>
+<span class="c1"># SELECT &quot;history&quot;.* FROM &quot;history&quot; JOIN &quot;customers&quot; </span>
+<span class="c1"># ON &quot;history&quot;.&quot;customer_id&quot;=&quot;customers&quot;.&quot;id&quot; WHERE &quot;customers&quot;.&quot;id&quot;=5</span>
+</pre></div>
+</div>
+</div>
+</div>
+</section>
 </section>
 
     <script type="text/x-thebe-config">
@@ -1565,6 +1591,7 @@ <h2><span class="section-number">2.1.34. </span>Work with Notion via Python with
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#better-alternative-to-requests">2.1.32. Better Alternative to <code class="docutils literal notranslate"><span class="pre">requests</span></code></a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#managing-configurations-with-python-dotenv">2.1.33. Managing Configurations with <code class="docutils literal notranslate"><span class="pre">python-dotenv</span></code></a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#work-with-notion-via-python-with">2.1.34. Work with Notion via Python with</a></li>
+<li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#sql-query-builder-in-python">2.1.35. SQL Query Builder in Python</a></li>
 </ul>
   </nav></div>
 
diff --git a/book/machinelearning/outlierdetection.html b/book/machinelearning/outlierdetection.html
index 1bee12c..2ad9507 100644
--- a/book/machinelearning/outlierdetection.html
+++ b/book/machinelearning/outlierdetection.html
@@ -416,6 +416,7 @@ <h2> Contents </h2>
             <nav aria-label="Page">
                 <ul class="visible nav section-nav flex-column">
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#ensembling-for-outlier-detection">5.6.1. Ensembling for Outlier Detection</a></li>
+<li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#robust-outlier-detection-with-puncc">5.6.2. Robust Outlier Detection with <code class="docutils literal notranslate"><span class="pre">puncc</span></code></a></li>
 </ul>
             </nav>
         </div>
@@ -486,6 +487,48 @@ <h2><span class="section-number">5.6.1. </span>Ensembling for Outlier Detection<
 </div>
 </div>
 </section>
+<section id="robust-outlier-detection-with-puncc">
+<h2><span class="section-number">5.6.2. </span>Robust Outlier Detection with <code class="docutils literal notranslate"><span class="pre">puncc</span></code><a class="headerlink" href="#robust-outlier-detection-with-puncc" title="Permalink to this heading">#</a></h2>
+<p>Outlier Detection is notoriously hard.</p>
+<p>But it doesn’t have to be.</p>
+<p><code class="docutils literal notranslate"><span class="pre">puncc</span></code> offers outlier detection, powered by Conformal Prediction, where the detection threshold will be calibrated.</p>
+<p>So, false alarms are reduced.</p>
+<div class="cell docutils container">
+<div class="cell_input docutils container">
+<div class="highlight-python notranslate"><div class="highlight"><pre><span></span>!pip install puncc
+</pre></div>
+</div>
+</div>
+</div>
+<div class="cell docutils container">
+<div class="cell_input docutils container">
+<div class="highlight-python notranslate"><div class="highlight"><pre><span></span><span class="kn">from</span> <span class="nn">sklearn.ensemble</span> <span class="kn">import</span> <span class="n">IsolationForest</span>
+<span class="kn">from</span> <span class="nn">deel.puncc.anomaly_detection</span> <span class="kn">import</span> <span class="n">SplitCAD</span>
+<span class="kn">from</span> <span class="nn">deel.puncc.api.prediction</span> <span class="kn">import</span> <span class="n">BasePredictor</span>
+
+<span class="c1"># We need to redefine the predict to output the nonconformity scores.</span>
+<span class="k">class</span> <span class="nc">ADPredictor</span><span class="p">(</span><span class="n">BasePredictor</span><span class="p">):</span>
+    <span class="k">def</span> <span class="nf">predict</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">X</span><span class="p">):</span>
+        <span class="k">return</span> <span class="o">-</span><span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">score_samples</span><span class="p">(</span><span class="n">X</span><span class="p">)</span>
+
+<span class="c1"># Wrap Isolation Forest in a predictor</span>
+<span class="n">if_predictor</span> <span class="o">=</span> <span class="n">ADPredictor</span><span class="p">(</span><span class="n">IsolationForest</span><span class="p">())</span>
+
+<span class="c1"># Instantiate CAD on top of IF predictor</span>
+<span class="n">if_cad</span> <span class="o">=</span> <span class="n">SplitCAD</span><span class="p">(</span><span class="n">if_predictor</span><span class="p">,</span> <span class="n">train</span><span class="o">=</span><span class="kc">True</span><span class="p">)</span>
+
+
+<span class="n">if_cad</span><span class="o">.</span><span class="n">fit</span><span class="p">(</span><span class="n">z</span><span class="o">=</span><span class="n">dataset</span><span class="p">,</span> <span class="n">fit_ratio</span><span class="o">=</span><span class="mf">0.7</span><span class="p">)</span>
+
+<span class="c1"># Maximum false detection rate</span>
+<span class="n">alpha</span> <span class="o">=</span> <span class="mf">0.01</span>
+
+<span class="n">results</span> <span class="o">=</span> <span class="n">if_cad</span><span class="o">.</span><span class="n">predict</span><span class="p">(</span><span class="n">new_data</span><span class="p">,</span> <span class="n">alpha</span><span class="o">=</span><span class="n">alpha</span><span class="p">)</span>
+</pre></div>
+</div>
+</div>
+</div>
+</section>
 </section>
 
     <script type="text/x-thebe-config">
@@ -556,6 +599,7 @@ <h2><span class="section-number">5.6.1. </span>Ensembling for Outlier Detection<
   <nav class="bd-toc-nav page-toc">
     <ul class="visible nav section-nav flex-column">
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#ensembling-for-outlier-detection">5.6.1. Ensembling for Outlier Detection</a></li>
+<li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#robust-outlier-detection-with-puncc">5.6.2. Robust Outlier Detection with <code class="docutils literal notranslate"><span class="pre">puncc</span></code></a></li>
 </ul>
   </nav></div>
 
diff --git a/book/pandas/Chapter.html b/book/pandas/Chapter.html
index db999ab..7e87bb0 100644
--- a/book/pandas/Chapter.html
+++ b/book/pandas/Chapter.html
@@ -420,6 +420,7 @@ <h2> Contents </h2>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#change-the-plotting-backend">8.1.3. Change the Plotting Backend</a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#style-your-dataframes">8.1.4. Style your DataFrames</a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#set-precision-of-displayed-floats">8.1.5. Set Precision of Displayed Floats</a></li>
+<li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#faster-i-o-with-parquet">8.1.6. Faster I/O with Parquet</a></li>
 </ul>
             </nav>
         </div>
@@ -534,6 +535,34 @@ <h2><span class="section-number">8.1.5. </span>Set Precision of Displayed Floats
 </div>
 </div>
 </section>
+<section id="faster-i-o-with-parquet">
+<h2><span class="section-number">8.1.6. </span>Faster I/O with Parquet<a class="headerlink" href="#faster-i-o-with-parquet" title="Permalink to this heading">#</a></h2>
+<p>Whenever you work with bigger datasets, please avoid using CSV format (or similar).</p>
+<p>CSV files are text files, which are human-readable, and therefore a popular option to store data.</p>
+<p>For small datasets, this is not a big issue.</p>
+<p>But, what if your data has millions of rows?</p>
+<p>It can get really slow to do read/write operations on them.</p>
+<p>On the other hand, binary files exist too.</p>
+<p>They consist of 0s and 1s and are not meant to be human-readable but to be used by programs that know how to interpret them.</p>
+<p>Because of that, binary files are more compact and consume less space.</p>
+<p>Parquet is a popular binary file format that is more storage-efficient than CSV.</p>
+<div class="cell docutils container">
+<div class="cell_input docutils container">
+<div class="highlight-ipython3 notranslate"><div class="highlight"><pre><span></span><span class="kn">import</span> <span class="nn">pandas</span> <span class="k">as</span> <span class="nn">pd</span>
+
+<span class="c1"># Shape: (100000000, 5)</span>
+<span class="n">df</span> <span class="o">=</span> <span class="n">pd</span><span class="o">.</span><span class="n">DataFrame</span><span class="p">(</span><span class="o">...</span><span class="p">)</span>
+
+<span class="c1"># Time: 1m 58s</span>
+<span class="n">df</span><span class="o">.</span><span class="n">to_csv</span><span class="p">(</span><span class="s2">&quot;data.csv&quot;</span><span class="p">)</span>
+
+<span class="c1"># Time: 8s</span>
+<span class="n">df</span><span class="o">.</span><span class="n">to_parquet</span><span class="p">(</span><span class="s2">&quot;data.parquet&quot;</span><span class="p">)</span>
+</pre></div>
+</div>
+</div>
+</div>
+</section>
 </section>
 
     <script type="text/x-thebe-config">
@@ -608,6 +637,7 @@ <h2><span class="section-number">8.1.5. </span>Set Precision of Displayed Floats
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#change-the-plotting-backend">8.1.3. Change the Plotting Backend</a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#style-your-dataframes">8.1.4. Style your DataFrames</a></li>
 <li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#set-precision-of-displayed-floats">8.1.5. Set Precision of Displayed Floats</a></li>
+<li class="toc-h2 nav-item toc-entry"><a class="reference internal nav-link" href="#faster-i-o-with-parquet">8.1.6. Faster I/O with Parquet</a></li>
 </ul>
   </nav></div>
 
diff --git a/book/pythontricks/Chapter.html b/book/pythontricks/Chapter.html
index 92ceca6..1fa4e3b 100644
--- a/book/pythontricks/Chapter.html
+++ b/book/pythontricks/Chapter.html
@@ -1014,6 +1014,10 @@ <h2><span class="section-number">10.1.23. </span>Modify Print Statements<a class
 </section>
 <section id="type-variables-in-python-3-12">
 <h2><span class="section-number">10.1.24. </span>Type Variables in Python 3.12<a class="headerlink" href="#type-variables-in-python-3-12" title="Permalink to this heading">#</a></h2>
+<p>One cool feature in Python 3.12:</p>
+<p>The new built-in syntax for Type Variables.</p>
+<p>You can use them to parametrize generic classes and functions.</p>
+<p>See below for a small example where our generic class is parametrized by T, which we indicate with [T].</p>
 <div class="cell docutils container">
 <div class="cell_input docutils container">
 <div class="highlight-python notranslate"><div class="highlight"><pre><span></span><span class="k">class</span> <span class="nc">Stack</span><span class="p">[</span><span class="n">T</span><span class="p">]:</span>
diff --git a/searchindex.js b/searchindex.js
index 4e30dcd..61d7532 100644
--- a/searchindex.js
+++ b/searchindex.js
@@ -1 +1 @@
-Search.setIndex({"docnames": ["README", "book/Miscellaneous/Chapter", "book/Miscellaneous/index", "book/codequality/automation", "book/codequality/cicd", "book/codequality/codestyle", "book/codequality/index", "book/codequality/memory", "book/codequality/security", "book/codequality/typing", "book/cooltools/Chapter", "book/cooltools/index", "book/documentation/Chapter", "book/documentation/index", "book/jupyternotebook/Chapter", "book/jupyternotebook/index", "book/llm/Chapter", "book/llm/index", "book/machinelearning/dataaugmentation", "book/machinelearning/eda", "book/machinelearning/featureselection", "book/machinelearning/getdata", "book/machinelearning/index", "book/machinelearning/modeltraining", "book/machinelearning/outlierdetection", "book/machinelearning/preprocessing", "book/machinelearning/timeseries", "book/numpy/Chapter", "book/numpy/index", "book/pandas/Chapter", "book/pandas/additionallibs", "book/pandas/index", "book/polars/Chapter", "book/polars/index", "book/pythontricks/Chapter", "book/pythontricks/index", "book/pythontricks/utility", "book/selenium/Chapter", "book/selenium/index", "book/streamlit/Chapter", "book/streamlit/index", "book/testing/Chapter", "book/testing/index"], "filenames": ["README.md", "book/Miscellaneous/Chapter.ipynb", "book/Miscellaneous/index.ipynb", "book/codequality/automation.ipynb", "book/codequality/cicd.ipynb", "book/codequality/codestyle.ipynb", "book/codequality/index.ipynb", "book/codequality/memory.ipynb", "book/codequality/security.ipynb", "book/codequality/typing.ipynb", "book/cooltools/Chapter.ipynb", "book/cooltools/index.ipynb", "book/documentation/Chapter.ipynb", "book/documentation/index.ipynb", "book/jupyternotebook/Chapter.ipynb", "book/jupyternotebook/index.ipynb", "book/llm/Chapter.ipynb", "book/llm/index.ipynb", "book/machinelearning/dataaugmentation.ipynb", "book/machinelearning/eda.ipynb", "book/machinelearning/featureselection.ipynb", "book/machinelearning/getdata.ipynb", 
"book/machinelearning/index.ipynb", "book/machinelearning/modeltraining.ipynb", "book/machinelearning/outlierdetection.ipynb", "book/machinelearning/preprocessing.ipynb", "book/machinelearning/timeseries.ipynb", "book/numpy/Chapter.ipynb", "book/numpy/index.ipynb", "book/pandas/Chapter.ipynb", "book/pandas/additionallibs.ipynb", "book/pandas/index.ipynb", "book/polars/Chapter.ipynb", "book/polars/index.ipynb", "book/pythontricks/Chapter.ipynb", "book/pythontricks/index.ipynb", "book/pythontricks/utility.ipynb", "book/selenium/Chapter.ipynb", "book/selenium/index.ipynb", "book/streamlit/Chapter.ipynb", "book/streamlit/index.ipynb", "book/testing/Chapter.ipynb", "book/testing/index.ipynb"], "titles": ["Delightful Data Science", "<span class=\"section-number\">14.1. </span>Miscellaneous", "<span class=\"section-number\">14. </span>Miscellaneous", "<span class=\"section-number\">1.1. </span>Automation", "<span class=\"section-number\">1.2. </span>CI/CD", "<span class=\"section-number\">1.3. </span>Code Style", "<span class=\"section-number\">1. </span>Code Quality", "<span class=\"section-number\">1.4. </span>Memory Optimization", "<span class=\"section-number\">1.5. </span>Security in Projects", "<span class=\"section-number\">1.6. </span>Typing", "<span class=\"section-number\">2.1. </span>Cool Tools", "<span class=\"section-number\">2. </span>Cool Tools", "<span class=\"section-number\">4.1. </span>Documentation", "<span class=\"section-number\">4. </span>Documentation", "<span class=\"section-number\">3.1. </span>Jupyter Notebook Tips and Tricks", "<span class=\"section-number\">3. </span>Jupyter Notebook Tricks and Tips", "<span class=\"section-number\">6.1. </span>LLM", "<span class=\"section-number\">6. </span>LLM", "<span class=\"section-number\">5.1. </span>Data Augmentation", "<span class=\"section-number\">5.2. </span>EDA", "<span class=\"section-number\">5.3. </span>Feature Selection", "<span class=\"section-number\">5.4. 
</span>Get Data", "<span class=\"section-number\">5. </span>Machine Learning", "<span class=\"section-number\">5.5. </span>Model Training", "<span class=\"section-number\">5.6. </span>Outlier Detection", "<span class=\"section-number\">5.8. </span>Preprocessing", "<span class=\"section-number\">5.7. </span>Time Series", "<span class=\"section-number\">7.1. </span>NumPy Tips and Tricks", "<span class=\"section-number\">7. </span>NumPy Tips and Tricks", "<span class=\"section-number\">8.1. </span>Pandas Tips and Tricks", "<span class=\"section-number\">8.2. </span>Utility Libraries for Pandas", "<span class=\"section-number\">8. </span>Pandas Tricks and Tips", "<span class=\"section-number\">9.1. </span>Polars Tips &amp; Tricks", "<span class=\"section-number\">9. </span>Polars", "<span class=\"section-number\">10.1. </span>Pure Python + Built-in libraries", "<span class=\"section-number\">10. </span>Python Tips and Tricks", "<span class=\"section-number\">10.2. </span>Utilities for Python", "<span class=\"section-number\">11.1. </span>Selenium Tips and Tricks", "<span class=\"section-number\">11. </span>Selenium Tips and Tricks", "<span class=\"section-number\">12.1. </span>Streamlit Tips and Tricks", "<span class=\"section-number\">12. </span>Streamlit Tips and Tricks", "<span class=\"section-number\">13.1. </span>Testing", "<span class=\"section-number\">13. 
</span>Testing in Python"], "terms": {"It": [0, 1, 4, 5, 8, 9, 10, 14, 16, 19, 20, 21, 23, 24, 25, 26, 27, 29, 30, 34, 36, 37, 41], "wa": [0, 1, 10, 23, 26, 34, 41], "decemb": [0, 21], "2022": [0, 8, 21], "when": [0, 1, 4, 5, 9, 10, 14, 16, 20, 25, 29, 34, 36, 37, 41], "i": [0, 7, 10, 16, 20, 23, 24, 34, 36, 41], "start": [0, 1, 8, 29, 34], "write": [0, 1, 5, 9, 10, 14, 19, 36], "daili": 0, "linkedin": [0, 21], "post": 0, "share": [0, 34], "one": [0, 5, 10, 14, 19, 23, 25, 27, 29, 30, 34, 36, 37, 39], "short": [0, 25], "python": [0, 3, 7, 8, 9, 12, 16, 18, 19, 20, 21, 23, 24, 25, 26, 37, 41], "tip": 0, "per": [0, 14, 23, 25], "dai": [0, 26, 36], "my": [0, 25], "main": [0, 4, 8, 10, 23, 36], "goal": 0, "what": [0, 1, 9, 10, 21, 23, 34, 36, 39, 41], "learnt": 0, "over": [0, 10, 18, 23, 26], "year": [0, 19], "am": 0, "current": [0, 5, 10, 23], "learn": [0, 10, 20], "other": [0, 5, 8, 10, 19, 21, 23, 27, 34, 41], "thought": 0, "s": [0, 1, 4, 8, 9, 10, 12, 14, 19, 20, 21, 26, 27, 29, 30, 34, 36, 37], "us": [0, 1, 3, 4, 5, 7, 8, 9, 10, 14, 16, 18, 20, 21, 24, 25, 26, 27, 29, 30, 36, 37, 39, 41], "me": [0, 25], "probabl": [0, 4, 10, 23, 34, 37], "peopl": 0, "too": [0, 4, 10, 19, 21, 23, 26, 34, 36], "As": 0, "time": [0, 1, 4, 5, 9, 10, 14, 23, 30, 36, 37, 41], "went": 0, "more": [0, 1, 5, 8, 9, 16, 19, 20, 23, 24, 25, 29, 36], "found": [0, 8, 10, 34], "soon": 0, "realiz": 0, "could": [0, 20, 21, 27], "compil": [0, 14, 23], "comprehens": 0, "guid": 0, "anyon": 0, "interest": [0, 41], "becom": 0, "better": [0, 23, 30], "scientist": [0, 32], "thu": [0, 21, 23], "idea": 0, "born": 0, "The": [0, 8, 10, 19, 20, 21, 23, 25, 34, 37, 41], "contain": [0, 10, 14, 23], "all": [0, 5, 10, 14, 16, 19, 20, 23, 25, 27, 30, 32, 34, 36, 41], "author": 0, "well": [0, 5, 10, 23], "mani": [0, 1, 10, 23, 34, 41], "come": [0, 8, 10, 21, 23, 26, 34, 36, 41], "futur": [0, 23, 26], "call": [0, 8, 10, 25, 34, 41], "becaus": [0, 5, 10, 23, 26], "aim": [0, 10, 23], "make": [0, 1, 4, 5, 7, 9, 14, 16, 
19, 20, 23, 30, 36, 37, 41], "your": [0, 1, 3, 4, 9, 18, 19, 21, 26, 27, 30, 32, 39], "journei": 0, "help": [0, 1, 9, 10, 14, 16, 19, 23, 41], "you": [0, 1, 3, 4, 5, 7, 8, 9, 10, 12, 14, 16, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 32, 34, 36, 37, 39, 41], "By": [0, 23, 29, 30, 37, 41], "incorpor": [0, 23], "trick": [0, 34], "workflow": [0, 23], "can": [0, 1, 3, 4, 5, 7, 8, 9, 10, 14, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 34, 36, 37, 39, 41], "project": [0, 3, 10, 12, 21, 27, 37, 41], "enjoy": 0, "success": 0, "add": [1, 9, 10, 14, 16, 23, 30], "8": [1, 3, 8, 19, 20, 23, 34, 36, 41], "work": [1, 8, 9, 14, 16, 18, 19, 20, 23, 26, 29, 34], "boost": [1, 18, 26], "product": [1, 9, 23, 29], "\ud835\udc0f\ud835\udc32\ud835\udc2d\ud835\udc21\ud835\udc28\ud835\udc27": 1, "\ud835\udc08\ud835\udc27\ud835\udc1d\ud835\udc1e\ud835\udc27\ud835\udc2d": 1, "sure": [1, 5, 9, 14, 41], "indent": [1, 34], "correct": [1, 10, 26], "everi": [1, 4, 8, 10, 14, 20, 21, 23, 24], "enter": [1, 34], "\ud835\udc0f\ud835\udc32\ud835\udc25\ud835\udc1a\ud835\udc27\ud835\udc1c\ud835\udc1e": 1, "A": [1, 3, 10, 12, 14, 18, 19, 20, 21, 23, 29, 34, 36, 41], "brainer": 1, "includ": [1, 8, 10, 19, 23, 24, 25, 26, 34, 36], "benefit": 1, "like": [1, 5, 8, 10, 14, 16, 19, 20, 21, 23, 24, 25, 26, 29, 32, 34, 37, 41], "paramet": [1, 36], "suggest": [1, 8], "code": [1, 3, 8, 9, 23, 29, 34, 39, 41], "navig": 1, "signatur": 1, "microsoft": [1, 16, 23], "declar": 1, "default": [1, 10, 23, 29, 30, 37, 41], "languag": [1, 10, 16, 21, 36], "server": [1, 14], "\ud835\udc06\ud835\udc22\ud835\udc2d\ud835\udc0b\ud835\udc1e\ud835\udc27\ud835\udc2c": 1, "provid": [1, 5, 8, 10, 14, 16, 19, 21, 23, 25, 26, 30, 34, 36, 41], "power": [1, 18, 20, 26], "featur": [1, 10], "git": [1, 14], "experi": 1, "see": [1, 3, 7, 9, 10, 14, 19, 20, 21, 23, 29, 34, 36, 37, 41], "specif": [1, 10, 14, 23, 34, 37], "line": [1, 3, 7, 8, 10, 14, 19, 23, 26, 29, 34, 39], "whom": 1, "which": [1, 7, 8, 9, 10, 20, 23, 26, 27, 34, 41], "pull": [1, 4], 
"request": [1, 5, 8, 36], "messag": [1, 10, 16, 36], "And": [1, 10, 16, 18, 19, 23, 29], "much": [1, 16, 23, 36], "\ud835\udc09\ud835\udc2e\ud835\udc29\ud835\udc32\ud835\udc2d\ud835\udc1e\ud835\udc2b": 1, "notebook": 1, "support": [1, 4, 5, 10, 16, 19, 20, 21, 23, 24, 25, 26], "allow": [1, 4, 10, 19, 23, 34, 41], "ani": [1, 8, 10, 23, 34, 41], "environ": [1, 3, 16], "jupyt": [1, 10], "kernel": 1, "\ud835\udc00\ud835\udc11\ud835\udc04\ud835\udc0f\ud835\udc0b": 1, "\ud835\udc1f\ud835\udc28\ud835\udc2b": 1, "automat": [1, 8, 19, 20, 23, 25, 30, 37, 41], "evalu": [1, 5, 26], "real": [1, 14, 21, 41], "type": [1, 5, 10, 19, 20, 23, 26, 30], "displai": [1, 26, 36], "variabl": [1, 5, 9, 10, 19, 23, 25, 26], "error": [1, 5, 9, 21, 23, 25, 34, 36], "readabl": [1, 25], "wai": [1, 3, 10, 14, 23, 25, 29, 30, 36, 37, 41], "onli": [1, 5, 9, 10, 14, 16, 19, 20, 23, 25, 26, 29, 30, 34, 36, 37], "3": [1, 3, 4, 7, 8, 9, 10, 14, 16, 19, 20, 21, 23, 24, 26, 27, 29, 37, 41], "7": [1, 3, 7, 8, 14, 19, 20, 23, 29, 34, 41], "\ud835\udc0f\ud835\udc1a\ud835\udc2d\ud835\udc21": 1, "gener": [1, 26, 27, 39, 41], "intern": [1, 10], "import": [1, 3, 7, 8, 9, 10, 14, 16, 18, 19, 21, 23, 24, 25, 26, 27, 29, 30, 32, 34, 36, 37, 39, 41], "statement": [1, 5, 16, 30, 41], "\ud835\udc13\ud835\udc1e\ud835\udc2c\ud835\udc2d": 1, "\ud835\udc04\ud835\udc31\ud835\udc29\ud835\udc25\ud835\udc28\ud835\udc2b\ud835\udc1e\ud835\udc2b": 1, "show": [1, 10, 19, 20, 23, 26, 29], "test": [1, 5, 8, 10, 14, 16, 23, 26, 32], "explor": 1, "without": [1, 9, 10, 12, 19, 23, 34, 41], "effort": [1, 21], "instead": [1, 4, 5, 9, 10, 20, 25, 26, 30, 34, 37, 41], "go": [1, 9, 10, 37], "through": [1, 8, 9, 10, 23, 37], "output": [1, 10, 16, 20, 21, 23, 25, 34, 36], "termin": [1, 34], "\ud835\udc1a\ud835\udc2e\ud835\udc2d\ud835\udc28\ud835\udc03\ud835\udc28\ud835\udc1c\ud835\udc2c\ud835\udc2d\ud835\udc2b\ud835\udc22\ud835\udc27\ud835\udc20": 1, "quickli": [1, 14, 23], "docstr": [1, 5], "function": [1, 5, 7, 8, 9, 14, 19, 21, 23, 25, 
26, 29, 30, 36, 41], "ar": [1, 4, 5, 10, 14, 16, 18, 20, 23, 26, 27, 34, 36, 37, 41], "new": [1, 4, 10, 14, 16, 23, 25, 34, 36, 37], "data": [1, 8, 14, 20, 24, 27, 29, 30, 34, 39], "scienc": [1, 27], "hassl": [1, 10], "set": [1, 3, 8, 14, 16, 19, 25, 26, 27, 36, 37, 41], "up": [1, 3, 5, 10, 16, 23, 26, 34, 41], "structur": [1, 14], "try": [1, 5, 7, 8, 9, 10, 12, 14, 16, 19, 20, 21, 23, 24, 25, 26, 29, 30, 36, 41], "command": [1, 8, 10, 14, 21, 34], "tool": [1, 3, 5, 8, 20, 23, 34], "creat": [1, 3, 8, 12, 16, 19, 23, 34, 36, 41], "thi": [1, 3, 5, 8, 10, 19, 20, 23, 25, 26, 27, 29, 30, 34, 36, 37, 41], "save": [1, 10, 16, 21, 30, 34, 36, 37, 41], "standard": [1, 3, 10, 21, 26, 34, 36], "There": [1, 10, 23], "ton": 1, "github": [1, 21], "sai": [1, 5, 10, 14, 29, 34], "goodby": [1, 5], "tediou": 1, "link": [1, 9, 23], "repositori": [1, 10], "http": [1, 4, 8, 10, 21, 23, 25, 34, 36, 37], "com": [1, 4, 10, 16, 21, 23, 25, 34, 37], "drivendata": 1, "do": [1, 3, 5, 8, 9, 10, 14, 16, 19, 20, 21, 23, 25, 26, 29, 30, 34, 36, 37, 39, 41], "want": [1, 3, 5, 7, 8, 9, 10, 12, 14, 16, 18, 19, 20, 21, 23, 25, 26, 30, 34, 36, 37, 39, 41], "someth": [1, 10, 34], "react": 1, "app": [1, 5, 23, 34, 39], "anyth": [1, 4], "ai": [1, 10, 23], "an": [1, 8, 9, 10, 14, 16, 19, 20, 23, 24, 25, 36, 41], "entir": 1, "codebas": [1, 10, 30], "base": [1, 10, 19, 20, 24, 25, 29, 30, 34, 36], "markdown": [1, 5], "file": [1, 3, 4, 8, 14, 25, 41], "describ": [1, 10, 26, 34], "kind": 1, "applic": [1, 8, 10, 16, 19, 23], "necessari": [1, 4], "boilerpl": 1, "clear": [1, 23], "But": [1, 5, 8, 9, 10, 20, 23, 26, 29, 34, 36, 37, 39, 41], "alwai": [1, 5, 20, 23], "easi": [1, 10, 14, 18, 21, 23, 24, 37], "team": [1, 23], "With": [1, 3, 4, 5, 10, 14, 19, 20, 23, 27, 34, 36, 39, 41], "get": [1, 5, 8, 9, 14, 30, 36, 37], "releas": [1, 23, 37], "manag": [1, 23], "design": 1, "defin": [1, 3, 4, 9, 10, 18, 19, 20, 23, 24, 29, 30, 34, 37, 41], "rule": 1, "bump": 1, "version": [1, 3, 4, 8, 9, 25, 37], "changelog": 1, 
"life": [1, 23], "easier": [1, 5, 26, 34], "enforc": [1, 5, 30], "descript": 1, "struggl": [3, 10], "rememb": [3, 10], "exact": [3, 23, 26], "seri": [3, 20, 23, 30], "need": [3, 4, 5, 8, 9, 10, 12, 14, 16, 20, 21, 23, 29, 30, 34], "build": [3, 4, 23, 25], "packag": [3, 8, 16, 21, 23, 26, 27, 30, 41], "Or": [3, 10], "manual": [3, 5, 10, 14, 19, 34, 36, 37], "run": [3, 4, 5, 7, 8, 9, 10, 12, 20, 23, 26, 41], "instal": [3, 4, 5, 7, 8, 9, 10, 12, 14, 16, 18, 19, 20, 21, 23, 24, 25, 26, 30, 32, 36, 37, 39, 41], "depend": [3, 19], "rescu": 3, "have": [3, 5, 10, 14, 20, 23, 25, 26, 29, 30, 32, 34, 36, 37, 41], "execut": [3, 14, 34, 41], "those": [3, 10, 34, 37], "below": [3, 4, 7, 8, 9, 10, 14, 19, 20, 21, 23, 24, 26, 29, 30, 34, 36, 37, 41], "how": [3, 5, 7, 9, 10, 14, 16, 19, 20, 21, 23, 25, 26, 29, 34, 36, 41], "we": [3, 8, 10, 14, 16, 20, 21, 23, 24, 34, 41], "our": [3, 16, 34], "format": [3, 10, 16, 19, 21, 25, 34, 36], "black": [3, 14, 25], "name": [3, 4, 8, 9, 10, 16, 20, 21, 23, 25, 29, 30, 36, 41], "echo": [3, 10, 34], "requir": [3, 4, 41], "pip": [3, 4, 5, 7, 8, 9, 12, 14, 16, 18, 19, 20, 21, 23, 24, 25, 26, 30, 32, 36, 37, 39, 41], "r": [3, 4, 8, 10, 20], "txt": [3, 4, 10], "quiet": 3, "pytest": 3, "against": [3, 8, 16, 20, 23], "multipl": [3, 10, 19, 20, 23, 24, 26], "hard": [3, 10], "step": [3, 4, 14, 19, 23, 27], "local": [3, 10], "custom": [3, 5, 10, 23], "session": [3, 10, 23], "script": [3, 7, 10, 23], "exampl": [3, 5, 8, 10, 21, 23, 24, 26, 30, 34, 36, 37, 41], "where": [3, 10, 20, 23, 34, 39, 41], "\ud835\udc2d\ud835\udc1e\ud835\udc2c\ud835\udc2d\ud835\udc2c": 3, "\ud835\udc27\ud835\udc28\ud835\udc31\ud835\udc1f\ud835\udc22\ud835\udc25\ud835\udc1e": 3, "\ud835\udc29\ud835\udc32": 3, "moreov": 3, "anoth": [3, 27], "\ud835\udc25\ud835\udc22\ud835\udc27\ud835\udc2d": 3, "flake8": [3, 5, 14], "highli": [3, 20, 25], "customiz": 3, "so": [3, 4, 9, 10, 14, 20, 23, 24, 34, 36, 37, 41], "check": [3, 5, 8, 16, 23, 30, 34, 37, 41], "out": [3, 5, 10, 14, 16, 19, 
23, 26], "document": [3, 10, 34, 41], "noxfil": 3, "py": [3, 4, 5, 7, 8, 9, 10, 12, 14, 41], "6": [3, 7, 10, 14, 19, 20, 23, 29, 34, 36, 41], "9": [3, 4, 7, 16, 19, 20, 23, 25, 29, 34], "def": [3, 5, 7, 9, 10, 14, 23, 29, 30, 34, 36, 41], "lint": 3, "don": [4, 5, 10, 14, 23, 26, 30, 32, 34, 36, 37, 41], "t": [4, 5, 10, 14, 21, 23, 26, 30, 32, 34, 36, 37, 41], "wast": [4, 5, 37], "commit": [4, 14], "push": [4, 14, 34], "chang": [4, 14, 20, 23, 30, 34, 37], "docker": 4, "imag": [4, 36, 41], "machin": [4, 20, 23], "curl": 4, "raw": [4, 10, 23], "githubusercont": [4, 23], "nekto": 4, "master": 4, "sh": 4, "sudo": 4, "bash": 4, "whenev": 4, "trigger": 4, "again": [4, 10, 20, 23, 30, 32, 41], "even": [4, 5, 9, 10, 25, 26, 30], "didn": 4, "small": [4, 10, 14, 16, 23, 30, 34], "snippet": [4, 5, 14], "skip": [4, 8], "next": [4, 21, 34, 36], "branch": 4, "job": [4, 5, 10], "ubuntu": 4, "latest": [4, 37], "checkout": 4, "v4": 4, "setup": 4, "poetri": [4, 10], "pipenv": 4, "unit": [4, 14, 30, 41], "python3": 4, "u": [4, 14], "m": [4, 7, 10, 19, 23, 26], "unittest": 4, "If": [5, 10, 12, 14, 19, 23, 25, 30, 32, 36, 41], "problemat": 5, "difficult": [5, 12, 20, 29], "read": [5, 10], "reduc": [5, 14, 16, 41], "perform": [5, 16, 19, 20, 26, 34, 36, 41], "interpret": [5, 20, 34], "ha": [5, 8, 10, 20, 26, 32, 34], "spend": 5, "less": [5, 26, 34], "unnecessari": [5, 30], "potenti": [5, 8], "issu": [5, 10, 23, 26], "aris": 5, "conflict": [5, 10], "clean": [5, 10, 14, 34, 41], "optim": [5, 10, 14, 20, 29], "also": [5, 8, 10, 16, 21, 23, 24, 26, 30, 34, 36, 37, 41], "fine": 5, "tune": 5, "process": [5, 8, 14, 20], "place": 5, "One": [5, 10, 14, 23, 34, 36], "aspect": 5, "qualiti": [5, 23, 30], "maintain": [5, 10], "In": [5, 8, 10, 14, 20, 21, 23, 26, 29, 30, 34, 41], "about": [5, 20, 23, 34], "method": [5, 10, 19, 20, 23, 24, 26], "class": [5, 10, 25, 26, 36, 41], "print": [5, 8, 9, 14, 20, 21, 23, 25, 26, 27, 30, 36], "coverag": [5, 23], "report": [5, 8, 19, 23, 39, 41], "poorli": 5, 
"v": [5, 41], "bigger": [5, 23], "look": [5, 10, 14, 18, 19, 23, 25, 41], "nasti": [5, 10], "order": 5, "them": [5, 8, 10, 14, 20, 23, 25, 34, 36, 41], "librari": [5, 8, 10, 12, 18, 19, 20, 21, 23, 24, 25, 26, 36, 39], "alphabet": [5, 10], "separ": 5, "section": [5, 23], "cli": [5, 8, 21], "avoid": [5, 9, 23], "focu": [5, 23], "high": [5, 8, 10, 20], "hand": 5, "tire": [5, 10, 36], "thei": [5, 8, 9, 10, 16, 20, 25, 34, 36, 41], "form": [5, 10], "sinc": [5, 8, 21, 23, 25, 26, 34, 41], "popular": [5, 23, 32, 39], "choic": [5, 23, 30], "config": [5, 10, 14, 23], "nice": [5, 10, 14, 21, 41], "catch": [5, 9], "befor": [5, 9, 23, 26], "caus": [5, 9, 23, 25], "problem": [5, 9, 10, 16, 19, 20, 23, 25, 36], "still": [5, 9, 10, 14, 19, 23], "pylint": 5, "10x": 5, "100x": 5, "faster": [5, 23, 26], "linter": 5, "written": [5, 9, 10], "rust": 5, "magnitud": 5, "than": [5, 8, 9, 16, 23, 24, 26, 29, 34, 36], "while": [5, 10, 19, 23, 34, 37], "integr": [5, 9, 23, 37], "some_fil": 5, "json": [5, 10, 19, 21], "divid": 5, "b": [5, 7, 10, 14, 19, 20, 29, 34, 36, 41], "result": [5, 8, 10, 14, 19, 20, 21, 25, 26, 27, 30, 34, 36, 41], "except": [5, 10, 20], "zerodivisionerror": 5, "e": [5, 10, 19, 23, 36], "infin": 5, "return": [5, 7, 9, 14, 16, 21, 23, 26, 29, 30, 34, 36, 41], "appli": [5, 18, 23, 29], "blacken": 5, "doc": [5, 10], "latex": 5, "restructuredtext": 5, "unformat": 5, "anymor": [5, 10, 27, 36], "md": 5, "typo": 5, "word": [5, 10, 19, 25], "sourc": [5, 10, 14, 19, 23], "touch": [5, 10], "nich": 5, "term": [5, 23], "fals": [5, 8, 10, 14, 23, 34, 37], "posit": [5, 19, 23], "directori": [5, 14, 41], "most": [7, 10, 23, 29, 30, 41], "amount": [7, 9, 14], "modul": [7, 8, 12, 21, 23, 27, 36], "analysi": 7, "consumpt": [7, 23], "within": [7, 10, 14, 39], "decor": [7, 9, 10, 23, 34], "profil": [7, 8, 14], "pass": [7, 9, 10, 23], "option": [7, 10, 23, 29, 30, 37, 41], "load": [7, 10, 14, 23, 26], "from": [7, 9, 16, 19, 20, 23, 24, 25, 26, 30, 36, 37, 39, 41], "my_func": 7, "1": [7, 
8, 10, 14, 16, 19, 20, 21, 23, 24, 25, 26, 29, 34, 36, 41], "10": [7, 8, 10, 14, 19, 20, 23, 25, 26, 29, 34, 36], "2": [7, 8, 10, 14, 19, 20, 21, 23, 25, 26, 29, 34, 36, 41], "del": 7, "mem": 7, "usag": [7, 16, 30], "increment": 7, "occurr": 7, "content": [7, 14, 16, 23, 25], "41": 7, "mib": 7, "4": [7, 8, 10, 14, 16, 19, 20, 23, 26, 29, 34, 37, 41], "5": [7, 8, 10, 14, 16, 19, 20, 21, 23, 25, 26, 29, 34, 41], "49": [7, 23], "102": 7, "rang": [7, 10, 14, 19, 20, 23, 24, 25, 26, 34, 36], "100": [7, 9, 10, 12, 16, 23, 30, 41], "194": 7, "145": 7, "0": [7, 8, 10, 14, 16, 19, 20, 23, 24, 25, 30, 34, 41], "22": [7, 26], "20": [7, 19, 20, 23, 25, 29, 41], "find": [8, 9, 26], "known": 8, "abstract": 8, "syntax": [8, 10, 36], "tree": [8, 20, 23, 34], "plugin": [8, 41], "produc": [8, 41], "ignor": [8, 14, 23, 34], "verifi": 8, "ssl": 8, "certif": 8, "\ud835\udc2f\ud835\udc1e\ud835\udc2b\ud835\udc22\ud835\udc1f\ud835\udc32": 8, "\ud835\udc05\ud835\udc1a\ud835\udc25\ud835\udc2c\ud835\udc1e": 8, "immedi": [8, 29, 34, 41], "identifi": [8, 10, 20, 26], "bandit_test": 8, "www": [8, 10, 36, 37], "googl": [8, 23, 34], "de": [8, 10, 21, 25, 34], "info": [8, 36], "none": [8, 34], "exclud": 8, "node_visitor": 8, "warn": [8, 10, 36], "unabl": 8, "qualifi": 8, "12": [8, 14, 20, 21, 23, 26], "23": [8, 36], "15": [8, 19, 20, 23], "32": [8, 23], "44": [8, 36], "650893": 8, "b501": 8, "request_with_no_cert_valid": 8, "disabl": 8, "sever": [8, 23], "confid": [8, 23], "cwe": 8, "295": 8, "mitr": 8, "org": [8, 10, 36], "definit": 8, "html": 8, "locat": [8, 19, 23], "readthedoc": 8, "io": 8, "en": [8, 10, 21, 25], "b501_request_with_no_cert_valid": 8, "status_cod": 8, "scan": 8, "total": [8, 10, 14, 23, 41], "nosec": 8, "metric": [8, 14, 23, 26, 32], "undefin": 8, "low": [8, 23], "medium": 8, "audit": 8, "advisori": 8, "databas": [8, 16, 41], "should": [8, 10, 34, 36, 41], "upgrad": [8, 41], "id": [8, 21, 34], "fix": [8, 23, 34], "flask": [8, 10], "pysec": 8, "2019": 8, "179": 8, "2018": 8, 
"66": 8, "setuptool": 8, "56": [8, 23], "ghsa": 8, "r9hx": 8, "vwmv": 8, "q579": 8, "65": 8, "almost": 8, "password": 8, "api": [8, 10, 16, 21, 36, 41], "kei": [8, 10, 16, 19, 23, 27, 34], "never": [8, 23, 25, 26], "plain": [8, 10, 36], "text": [8, 14, 23, 36], "would": [8, 16, 23, 26, 34], "trivial": 8, "access": [8, 36], "anybodi": 8, "who": 8, "To": [8, 10, 19, 20, 23, 24, 29, 34, 37, 41], "wrapper": [8, 21, 41], "around": [8, 41], "system": [8, 16, 23, 41], "maco": 8, "keychain": 8, "window": 8, "locker": 8, "etc": [8, 10, 19, 21, 23], "safer": 8, "retriev": [8, 21, 34], "easili": [8, 9, 10, 18, 19, 21, 23, 34], "field": [8, 34], "done": [8, 23, 34], "set_password": 8, "mydb": 8, "usernam": [8, 34], "get_password": 8, "hint": 9, "expect": [9, 16, 41], "wrong": 9, "awai": 9, "rais": [9, 10], "thing": [9, 12, 23, 41], "typecheck": 9, "say_hello": 9, "str": [9, 10, 34], "f": [9, 10, 14, 19, 30, 34, 36], "hello": [9, 10, 14, 16, 34], "checker": [9, 20], "analyz": [9, 10, 23, 26], "ensur": [9, 10, 16, 26, 34], "align": 9, "reliabl": 9, "bank": 9, "deposit": 9, "int": [9, 10, 30], "balanc": [9, 23], "withdraw": 9, "1000": [9, 20, 26, 29, 36], "wish": 9, "fast": [9, 10, 18, 23, 29, 30, 34, 41], "match": [9, 10, 34], "typescript": 9, "commun": [9, 32], "extra": [9, 34], "3x": [9, 16, 30], "5x": [9, 30], "og": 9, "whether": 9, "pleas": 9, "consid": [9, 23, 24, 41], "know": [10, 20, 21, 23, 29, 34], "headach": 10, "pycountri": 10, "iso": 10, "alpha_2": 10, "alpha_3": 10, "eur": 10, "freez": 10, "veri": [10, 20, 23, 41], "good": [10, 23], "virtual": 10, "encount": [10, 16], "follow": [10, 12, 14, 20, 37], "desir": 10, "unus": 10, "realli": [10, 25, 41], "y": [10, 14, 19, 20, 23, 26, 34, 41], "two": [10, 14, 20, 23, 25, 34], "pgeocod": 10, "just": [10, 14, 19, 23, 29, 30, 34], "specifi": [10, 19, 23, 25, 29, 34, 36, 41], "km": 10, "dist": 10, "geodist": 10, "query_postal_cod": 10, "10117": 10, "80331": 10, "ever": 10, "convers": 10, "manipul": [10, 36], "handl": [10, 20, 
21, 23, 25, 26, 34, 36], "physic": 10, "quantiti": [10, 34], "arithmet": 10, "keep": 10, "track": [10, 14], "accur": [10, 26], "initi": [10, 23], "registri": 10, "ureg": 10, "unitregistri": 10, "33": 10, "kilomet": 10, "feet": 10, "108267": 10, "71653543308": 10, "foot": 10, "oper": [10, 30], "speed": [10, 23, 26, 41], "hour": [10, 26, 30, 36], "198": 10, "steroid": [10, 23, 36], "cpu": [10, 41], "gpu": [10, 23], "memori": [10, 23, 34, 36], "bottleneck": 10, "propos": 10, "web": [10, 19, 25, 37], "gui": [10, 23], "my_modul": [10, 14], "repair": 10, "scrambl": 10, "occur": [10, 20], "encod": [10, 23], "decod": 10, "foreign": 10, "appear": 10, "correctli": [10, 41], "fix_text": 10, "doe": [10, 16, 25], "\u00e2": 10, "\u0153ftfy\u00e2": 10, "x9d": 10, "mean": [10, 14, 20, 23, 36], "\u00e2\u0153": 10, "mona": 10, "lisa": 10, "doesn\u00e3\u0192\u00e2": 10, "\u00e3": 10, "\u0161\u00e2": 10, "\u017e\u00e2": 10, "eyebrow": 10, "pre": [10, 23, 36, 41], "train": [10, 14, 16, 20, 25, 26], "model": [10, 16, 18, 20, 24, 25, 26], "cv2": [10, 18], "input_path": 10, "car": [10, 34], "jpg": [10, 18, 36], "output_path": 10, "car2": 10, "input_fil": 10, "imread": [10, 18], "output_fil": 10, "imwrit": 10, "clunki": 10, "intuit": [10, 23, 25, 36], "auto": [10, 26], "ditch": [10, 32], "argpars": 10, "hello_script": 10, "bye": 10, "__name__": [10, 36], "__main__": [10, 36], "john": [10, 16, 36], "annoi": [10, 37, 41], "few": [10, 19], "divers": [10, 41], "address": [10, 16, 23, 25, 36], "phone": [10, 16, 25], "email": [10, 16, 23, 25], "fr_fr": 10, "phone_numb": 10, "color": [10, 25, 29, 36], "offer": [10, 19, 23, 26, 34, 36], "beauti": [10, 14], "bore": 10, "url": [10, 21, 25, 34, 36], "25000000": 10, "\ud835\udc2d\ud835\udc2a\ud835\udc1d\ud835\udc26": 10, "set_descript": 10, "glob": 10, "sample_data": 10, "csv": [10, 19, 23, 26], "emoticon": 10, "give": [10, 23, 26, 30, 36], "insight": 10, "especi": [10, 29, 34, 37, 41], "sentiment": [10, 23], "emot_obj": 10, "core": 10, "love": 10, 
"watermark": 10, "same": [10, 14, 19, 34, 41], "endpoint": 10, "second": [10, 23, 25, 36], "delai": [10, 36], "take": [10, 16, 23, 34, 36, 41], "60": [10, 23], "httpbin": 10, "requests_cach": 10, "cachedsess": 10, "test_cach": 10, "string": [10, 19, 29, 30, 32, 34], "fuzzi": 10, "differ": [10, 18, 19, 21, 23, 26, 37], "variat": 10, "panda": [10, 19, 20, 21, 23, 25, 26, 32, 36], "pd": [10, 19, 20, 23, 25, 26, 30, 39], "util": [10, 14, 23, 24, 26], "unify_nam": 10, "deduplicate_list_str": 10, "read_csv": [10, 19, 23, 30, 39], "bairro": 10, "imovel": 10, "value_count": 10, "threshold_count": 10, "500": [10, 21, 23], "\ud835\udc25\ud835\udc22\ud835\udc27\ud835\udc24\ud835\udc1c\ud835\udc21\ud835\udc1e\ud835\udc1c\ud835\udc24\ud835\udc1e\ud835\udc2b": 10, "recurs": 10, "mai": [10, 20, 25], "harm": [10, 16, 20], "search": [10, 21, 36], "engin": [10, 23], "rank": [10, 20, 23], "linkcheck": 10, "bashplotlib": 10, "littl": 10, "basic": 10, "quick": [10, 14], "visual": [10, 14], "histogram": 10, "scatter": 10, "plot": [10, 14], "hist": 10, "stop": [10, 14, 34], "resolv": 10, "pipdeptre": 10, "possibl": [10, 23], "wrote": 10, "acrosort": 10, "tex": 10, "fun": 10, "sundai": 10, "publish": 10, "\ud835\udc82\ud835\udc84\ud835\udc93\ud835\udc90": 10, "\ud835\udc82\ud835\udc83\ud835\udc83\ud835\udc93\ud835\udc86\ud835\udc97\ud835\udc8a\ud835\udc82\ud835\udc95\ud835\udc8a\ud835\udc90\ud835\udc8f": 10, "\ud835\udc94\ud835\udc89\ud835\udc90\ud835\udc93\ud835\udc95\ud835\udc87\ud835\udc90\ud835\udc93\ud835\udc8e": 10, "\ud835\udc8d\ud835\udc90\ud835\udc8f\ud835\udc88\ud835\udc87\ud835\udc90\ud835\udc93\ud835\udc8e": 10, "begin": [10, 34], "lnkd": 10, "etf8qs5w": 10, "acrosort_tex": 10, "old": [10, 23, 34, 37], "pyfiglet": 10, "banner": 10, "introduc": [10, 34], "user": [10, 14, 16, 21], "font": 10, "ascii_art": 10, "figlet_format": 10, "world": [10, 14], "bubblehead": 10, "bulbhead": 10, "entiti": 10, "recognit": 10, "displaci": 10, "detect": [10, 16, 20, 21, 23], "super": [10, 23], 
"some": [10, 20, 23, 30, 34, 41], "sentenc": [10, 23], "span": 10, "chelsea": 10, "footbal": [10, 34], "club": 10, "english": 10, "profession": 10, "fulham": 10, "west": 10, "london": [10, 36], "1905": 10, "plai": [10, 34, 41], "home": 10, "game": [10, 41], "stamford": 10, "bridg": 10, "compet": 10, "premier": 10, "leagu": 10, "top": [10, 14, 23], "divis": 10, "won": 10, "first": [10, 23, 34], "major": [10, 23, 24], "honour": 10, "championship": 10, "1955": 10, "nlp": 10, "en_core_web_sm": 10, "render": 10, "style": [10, 19], "ent": 10, "true": [10, 14, 19, 23, 24, 25, 30], "paper": 10, "graphic": 10, "element": [10, 30, 34], "notori": 10, "No": [10, 12, 14], "worri": 10, "figur": [10, 19, 41], "tikzplotlib": 10, "insert": [10, 16], "pyplot": [10, 19, 26, 41], "plt": [10, 19, 26, 41], "numpi": [10, 14, 18, 19, 20, 23, 24, 25, 34], "np": [10, 14, 18, 19, 20, 23, 24, 25, 34], "ggplot": 10, "arang": 10, "sin": 10, "pi": 10, "s2": 10, "co": 10, "o": 10, "lw": 10, "xlabel": [10, 41], "ylabel": [10, 41], "voltag": 10, "mv": 10, "titl": [10, 19], "simpl": [10, 12, 23], "frac": 10, "alpha": [10, 23], "grid": [10, 19], "mytikz": 10, "For": [10, 19, 23, 25, 27], "pattern": [10, 25, 26, 34], "break": [10, 34], "down": 10, "complex": [10, 23, 25, 30, 34], "simpler": 10, "ones": [10, 23, 41], "combin": [10, 23, 24], "end": [10, 29, 34, 41], "either": [10, 30, 34], "ip": [10, 16], "digit": [10, 25], "port": [10, 23], "anylett": 10, "anydigit": 10, "anyfrom": 10, "quantifi": [10, 23], "atleastatmost": 10, "group": 10, "captur": [10, 19], "http_protocol": 10, "alphanum": 10, "domain_nam": 10, "n": [10, 26, 34], "61": [10, 20, 23], "tld": 10, "ip_octet": 10, "at_least_at_most": 10, "port_numb": 10, "sub": 10, "togeth": 10, "effortlessli": [10, 14], "extract": [10, 21, 23, 26, 34], "optic": 10, "charact": [10, 34], "built": [10, 26, 30, 36, 41], "pytorch": [10, 18, 26], "80": [10, 23], "latin": 10, "chines": 10, "arab": 10, "cyril": 10, "given": [10, 29, 41], "ps": 10, "recommend": 
[10, 23, 30], "reader": 10, "image_path": [10, 36], "english_imag": 10, "png": [10, 23], "readtext": 10, "draw": 10, "variou": [10, 19, 23, 24, 25, 26], "node": [10, 23, 34], "cloud": [10, 19], "aw": [10, 23], "azur": 10, "gcp": 10, "architectur": 10, "comput": [10, 14, 18, 34], "ec2": 10, "rd": 10, "network": [10, 21, 23], "elb": 10, "worker": 10, "direct": [10, 23], "tb": 10, "lb": 10, "worker1": 10, "worker2": 10, "worker3": 10, "worker4": 10, "worker5": 10, "event": 10, "program": [10, 36], "fail": [10, 41], "let": [10, 14, 19, 23, 26, 29, 34], "instabl": [10, 24], "internet": 10, "connect": [10, 37], "uncommon": 10, "usual": [10, 23], "mechan": 10, "isn": [10, 21], "behaviour": [10, 34], "condit": [10, 29, 34], "wait": [10, 23, 41], "coroutin": 10, "after": [10, 26, 34], "attempt": 10, "stop_after_attempt": 10, "stop_after_5_attempt": 10, "OR": 10, "stop_after_delai": 10, "stop_after_10_s_or_5_retri": 10, "x": [10, 14, 20, 23, 24, 26, 30, 34, 41], "wait_fix": 10, "wait_2_": 10, "retry_if_exception_typ": 10, "ioerror": 10, "might_io_error": 10, "forev": 10, "interfac": [10, 19, 23], "open": [10, 23], "c": [10, 14, 19, 20, 29, 34, 36], "due": [10, 23, 24, 29], "larger": [10, 27, 29], "research": [10, 16], "plotli": [10, 29], "neat": [10, 36], "tutori": 10, "purpos": [10, 36], "ig": 10, "g": [10, 23, 36], "es": 10, "width": [10, 34], "fig": [10, 19, 23, 29, 41], "ax": [10, 19], "subplot": [10, 19], "target": [10, 23, 25], "layout": [10, 19], "circl": 10, "vertex_color": 10, "steelblu": 10, "vertex_label": 10, "vcount": 10, "edge_width": 10, "edge_color": 10, "666": 10, "edge_background": 10, "white": 10, "bandwidth": [10, 37], "dot": [10, 36], "net": [10, 23], "orient": 10, "pure": 10, "lightweight": [10, 23], "perfect": 10, "hobbi": 10, "queri": [10, 19, 23, 29, 36], "db": 10, "path": [10, 23, 36, 37, 39, 41], "char": 10, "stai": [10, 23], "sloc": 10, "logic": 10, "lloc": 10, "estim": [10, 20, 23, 26], "cyclomat": 10, "correspond": [10, 19, 21, 25], "decis": 10, 
"count": [10, 21], "halstead": 10, "deriv": [10, 21], "distinct": 10, "operand": 10, "index": [10, 19, 26, 29], "measur": [10, 20, 41], "mix": 10, "abov": 10, "cc": 10, "httpx": 10, "similar": [10, 32, 34, 36], "advantag": 10, "asynchron": 10, "doesn": [10, 23], "lead": [10, 20, 23, 26], "improv": 10, "deal": 10, "concurr": 10, "yourself": [10, 14, 26], "put": 10, "valu": [10, 20, 23, 25, 26, 29, 36, 41], "delet": [10, 23, 41], "async": [10, 16], "asynccli": 10, "client": [10, 16], "await": 10, "pair": [10, 19, 34], "env": [10, 14], "api_kei": [10, 16], "mysupersecretapikei": 10, "domain": 10, "mydomain": 10, "load_dotenv": 10, "dotenv_valu": 10, "os": [10, 16, 37, 41], "getenv": 10, "dictionari": [10, 23], "did": [10, 23, 29, 34, 37], "interact": [10, 14, 16, 41], "sdk": 10, "item": [10, 19, 34], "page": [10, 12, 21], "notion_cli": 10, "notion_token": 10, "list": [10, 14, 20, 23, 34], "my_pag": 10, "database_id": 10, "897e5a76": 10, "ae52": 10, "4b48": 10, "9fdf": 10, "e71f5945d1af": 10, "filter": [10, 19, 21, 26], "properti": [10, 34], "landmark": 10, "rich_text": 10, "pdoc": 12, "cool": [12, 23, 34], "hierarchi": 12, "configur": [12, 23], "altern": [12, 14, 23, 36], "sphinx": 12, "preprocess": [12, 14, 23], "exactli": 14, "load_ext": 14, "magic": 14, "extens": [14, 25], "lprun": 14, "my_funct": [14, 30], "10000": [14, 29], "400": 14, "1e": 14, "timer": 14, "001": 14, "0160793": 14, "ipython": 14, "input": [14, 19, 23, 29], "18": 14, "790da5f104f0": 14, "hit": [14, 26], "9999": 14, "16": [14, 19, 23], "37": 14, "46": 14, "livelossplot": 14, "ad": [14, 34], "callback": 14, "tensorboard": 14, "its": [14, 21, 23, 24, 29, 30, 34, 36], "progress": 14, "kera": 14, "dataset": [14, 19, 20, 23, 25, 26, 29, 30], "mnist": 14, "to_categor": 14, "sequenti": [14, 23], "layer": [14, 23], "flatten": [14, 23, 36], "dens": [14, 23], "activ": [14, 23], "plotlosseskera": 14, "x_train": [14, 20, 23], "y_train": [14, 20, 23, 26], "x_test": [14, 20, 23], "y_test": [14, 20, 23, 26], 
"load_data": [14, 23], "reshap": 14, "28": [14, 19, 23], "astyp": 14, "float32": 14, "255": 14, "input_shap": [14, 23], "softmax": [14, 23], "rmsprop": 14, "categorical_crossentropi": 14, "accuraci": [14, 23], "plotloss": 14, "fit": [14, 20, 23, 24, 26], "epoch": 14, "validation_data": 14, "verbos": [14, 23, 25], "latexifi": 14, "math": 14, "solv": [14, 16, 19], "sqrt": 14, "diagram": 14, "switch": 14, "back": [14, 34], "sklearn": [14, 20, 25, 26], "make_pipelin": [14, 25], "imput": 14, "simpleimput": [14, 25], "compos": [14, 18, 23, 25], "columntransform": 14, "onehotencod": 14, "robustscal": [14, 25], "ensembl": [14, 26], "randomforestclassifi": [14, 23], "set_config": 14, "numeric_preprocessor": 14, "imputation_mean": 14, "missing_valu": 14, "nan": 14, "strategi": [14, 41], "scale": [14, 23], "categorical_preprocessor": 14, "imputation_const": 14, "fill_valu": 14, "miss": [14, 34, 41], "constant": [14, 23], "one_hot": 14, "handle_unknown": [14, 23], "preprocessor": 14, "categor": [14, 19], "state": [14, 27], "gender": 14, "numer": 14, "ag": [14, 20, 30, 36], "weight": 14, "pipe": [14, 23, 26], "reload": 14, "reimport": 14, "my_function1": 14, "my_function2": 14, "limit": [14, 16], "widespread": 14, "isort": 14, "incompat": 14, "nbqa": 14, "er": 14, "toolchain": 14, "my_notebook": 14, "ipynb": 14, "float": [14, 25], "heavi": 14, "jupyterlab": 14, "scratch": 14, "jupytertempl": 14, "eda": [14, 23, 39], "labextens": 14, "jupyterlab_templ": 14, "enabl": 14, "jupyter_notebook_config": 14, "jupyterlabtempl": 14, "allowed_extens": 14, "template_dir": 14, "include_default": 14, "include_core_path": 14, "larg": [14, 25, 30, 34], "strip": 14, "size": [14, 19, 23, 25], "risk": 14, "sensit": [14, 16], "genai": 14, "vendor": 14, "openai": [14, 16], "huggingfac": [14, 23], "anthrop": [14, 16], "ask": [14, 41], "provider_api_kei": 14, "your_api_key_her": 14, "jupyter_ai": 14, "chatgpt": 14, "here": [16, 34, 41], "cost": [16, 25], "often": [16, 24], "exceed": 16, "token": [16, 
25], "forget": 16, "context": 16, "pai": 16, "unimport": 16, "claim": 16, "achiev": [16, 23], "20x": [16, 26], "minim": [16, 20], "tri": [16, 30], "myself": 16, "notic": [16, 23], "cautiou": 16, "critic": [16, 36], "promptcompressor": 16, "your_prompt": 16, "llm_lingua": 16, "lgaalv": 16, "gpt2": 16, "dolli": 16, "compressed_prompt": 16, "compress_prompt": 16, "instruct": 16, "question": 16, "target_token": 16, "200": [16, 30], "turn": 16, "best": [16, 20, 23, 30], "origin_token": 16, "2430": 16, "compressed_token": 16, "261": 16, "ratio": [16, 20, 23], "gpt": 16, "consist": [16, 19], "stream": [16, 23], "respons": [16, 23, 36], "complet": [16, 19, 34], "openai_api_kei": 16, "anthropic_api_kei": 16, "mistral_api_kei": 16, "role": 16, "turbo": 16, "claud": 16, "instant": 16, "mistral": 16, "tini": 16, "unwant": 16, "behavior": [16, 41], "safe": 16, "between": [16, 19, 20, 21, 23], "inform": [16, 21, 34], "credit": 16, "card": 16, "number": [16, 27, 41], "sanit": 16, "toxic": 16, "inject": 16, "guard": 16, "llm_guard": 16, "scan_output": 16, "scan_prompt": 16, "input_scann": 16, "anonym": [16, 34], "promptinject": 16, "vault": 16, "openaikei": 16, "sql": [16, 19], "555": 16, "123": [16, 25, 36], "4567": 16, "192": 16, "168": 16, "8901": 16, "2345": 16, "6789": 16, "sanitized_prompt": 16, "results_valid": 16, "results_scor": 16, "chat": 16, "assist": 16, "redacted_person_1": 16, "redacted_email_address_1": 16, "redacted_phone_number_1": 16, "redacted_ip_address_1": 16, "redacted_credit_card_re_1": 16, "seamlessli": 18, "tensorflow": 18, "70": [18, 23], "transform": [18, 23, 34], "vision": 18, "horizontalflip": 18, "tograi": 18, "griddropout": 18, "verticalflip": 18, "channelshuffl": 18, "augmented_imag": 18, "arrai": [18, 19, 23, 34], "repetit": 19, "inspect": 19, "view": 19, "wide": [19, 25], "varieti": [19, 23], "excel": [19, 23], "bonu": 19, "export": 19, "dtale": 19, "df": [19, 20, 21, 25, 26, 29, 30, 32, 39], "datafram": [19, 20, 23, 25, 26, 32], "dict": [19, 23, 
29], "fan": 19, "background": [19, 29], "appropri": [19, 20], "dark_background": 19, "pyqt": 19, "lot": [19, 34, 37], "summari": 19, "statist": [19, 20, 26, 32], "bar": 19, "chart": [19, 23], "pokemon": 19, "nulliti": 19, "understand": [19, 23, 25, 26], "column": [19, 20, 23, 30, 36], "relat": 19, "heatmap": 19, "great": [19, 37], "pick": [19, 30], "relationship": [19, 20], "your_data": 19, "\u03d5k": 19, "beween": 19, "ordin": 19, "interv": 19, "non": [19, 20, 23], "linear": [19, 20, 23], "revert": 19, "pearson": 19, "bivari": 19, "normal": [19, 34], "distribut": [19, 25], "plot_correlation_matrix": 19, "resourc": 19, "fixtur": 19, "fake_insurance_data": 19, "gz": 19, "corr_matrix": 19, "phik_matrix": 19, "x_label": 19, "y_label": 19, "vmin": 19, "vmax": 19, "color_map": 19, "blue": [19, 25], "matrix": 19, "fontsize_factor": 19, "figsiz": 19, "tight_layout": 19, "ugli": [19, 36], "overlap": 19, "unread": 19, "label": [19, 24], "adjust": [19, 23, 34], "date": [19, 21, 36, 41], "mdate": 19, "datetim": [19, 25, 34], "2023": [19, 34, 36], "25": [19, 23, 25, 30, 36], "30": [19, 23, 24, 34], "35": 19, "object": [19, 23, 41], "xaxi": 19, "set_major_formatt": 19, "dateformatt": 19, "geo": 19, "fill": [19, 34], "area": 19, "bubbl": 19, "hexbin": 19, "express": [19, 23, 34], "px": 19, "gapmind": 19, "2007": 19, "scatter_geo": 19, "iso_alpha": 19, "pop": 19, "subplot_mosa": 19, "arrang": 19, "fashion": 19, "control": [19, 23, 29], "aae": 19, "constrained_layout": 19, "axd": 19, "set_titl": 19, "multicollinear": 20, "phenomenon": 20, "predictor": [20, 23], "regress": [20, 23], "correl": [20, 25, 26], "unstabl": 20, "inconsist": 20, "coeffici": 20, "\ud835\udc15\ud835\udc1a\ud835\udc2b\ud835\udc22\ud835\udc1a\ud835\udc27\ud835\udc1c\ud835\udc1e": 20, "\ud835\udc08\ud835\udc27\ud835\udc1f\ud835\udc25\ud835\udc1a\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 20, "\ud835\udc05\ud835\udc1a\ud835\udc1c\ud835\udc2d\ud835\udc28\ud835\udc2b": 20, "indic": 20, "present": 20, 
"formula": 20, "determin": [20, 23], "repeat": [20, 26], "each": [20, 23, 24, 26, 34, 36, 37], "compar": [20, 41], "contribut": [20, 23], "now": [20, 34, 36, 41], "drop": [20, 23, 30], "remain": 20, "\ud835\udc2c\ud835\udc2d\ud835\udc1a\ud835\udc2d\ud835\udc2c\ud835\udc26\ud835\udc28\ud835\udc1d\ud835\udc1e\ud835\udc25\ud835\udc2c": 20, "load_boston": 20, "statsmodel": [20, 26], "stat": 20, "outliers_influ": 20, "variance_inflation_factor": 20, "boston": 20, "feature_nam": [20, 25], "shape": [20, 23, 24], "crim": 20, "100373": 20, "zn": 20, "844013": 20, "indu": 20, "14": [20, 23], "485758": 20, "cha": 20, "152952": 20, "nox": 20, "73": 20, "894947": 20, "rm": [20, 41], "77": 20, "948283": 20, "21": [20, 34], "386850": 20, "di": 20, "699652": 20, "rad": 20, "167725": 20, "tax": 20, "227274": 20, "ptratio": 20, "85": 20, "029547": 20, "11": [20, 21], "104943": 20, "lstat": 20, "102025": 20, "algorithm": [20, 23, 24, 36], "catboost": [20, 23], "unknown": 20, "mismatch": 20, "beforehand": [20, 34], "categorymismatchtraintest": 20, "tabular": [20, 23], "train_test_valid": 20, "col1": 20, "col2": 20, "col3": 20, "d": [20, 29, 34, 36], "obtain": 20, "randomli": 20, "shuffl": [20, 23], "observ": 20, "comparison": 20, "eas": 20, "show_weight": 20, "hurt": 20, "permutationimport": 20, "svm": [20, 23], "svc": 20, "load_iri": [20, 23, 25], "model_select": [20, 23, 26], "train_test_split": [20, 23, 26], "iri": [20, 23], "target_nam": [20, 23], "perm": 20, "feature_1": [20, 23], "feature_2": 20, "feature_3": [20, 23], "feature_4": 20, "score": [20, 23, 24, 26], "pp": 20, "agnost": [20, 23], "ppscore": 20, "c_": [20, 25], "minimum": [20, 36], "redund": 20, "maximum": [20, 24, 34, 36], "relev": [20, 21], "smallest": [20, 30, 34, 41], "subset": [20, 29], "ml": [20, 26], "common": [20, 23, 32], "polar": [20, 30], "spark": [20, 26], "k": [20, 26, 41], "mrmr_select": 20, "make_classif": 20, "mrmr_classif": 20, "n_sampl": [20, 23, 26], "n_featur": [20, 23], "50": [20, 23, 26], 
"n_inform": 20, "n_redund": 20, "40": [20, 23, 25, 30], "selected_featur": 20, "restrict": 21, "social": [21, 23, 25], "servic": [21, 37], "hashtag": 21, "thread": 21, "platform": [21, 25], "instagram": [21, 37], "facebook": 21, "tweet": 21, "elon": 21, "musk": 21, "januari": 21, "simpli": [21, 26], "jsonl": 21, "max": [21, 23, 34, 36], "01": [21, 23, 36], "elonmusk": 21, "until": [21, 41], "scraper": [21, 37], "playstor": 21, "sort": [21, 23], "rate": 21, "countri": [21, 36], "google_play_scrap": 21, "_": [21, 23, 24, 34], "android": 21, "lang": [21, 25], "newest": 21, "filter_score_with": 21, "app_store_scrap": 21, "podcast": 21, "appl": [21, 34], "side": 21, "appstor": 21, "app_nam": 21, "app_id": 21, "id389801252": 21, "insta": 21, "389801252": 21, "how_mani": 21, "messi": [21, 34], "face": 21, "throw": [21, 34], "dialect": 21, "read_datafram": 21, "imdb": 21, "extractor": [21, 23], "crawl": 21, "download": [21, 37], "metadata": 21, "comment": [21, 23], "websit": [21, 25, 34, 41], "xml": 21, "fetch_url": 21, "adbar": 21, "output_format": 21, "imbal": 23, "higher": 23, "minor": 23, "lower": [23, 25], "loss": [23, 32], "misclassifi": 23, "compute_class_weight": 23, "tf": 23, "class_weight": 23, "uniqu": 23, "enumer": 23, "loop": 23, "backend": [23, 36], "clear_sess": 23, "bias": [23, 26], "\ud835\udc1d\ud835\udc1e\ud835\udc25": 23, "\ud835\udc26\ud835\udc28\ud835\udc1d\ud835\udc1e\ud835\udc25": 23, "clutter": 23, "increas": [23, 32], "create_model": 23, "noisi": 23, "centric": 23, "via": 23, "nearli": 23, "clf": 23, "n_estim": 23, "cl": 23, "classif": 23, "cleanlearn": 23, "label_issu": 23, "find_label_issu": 23, "is_label_issu": 23, "assess": [23, 26], "summar": 23, "precis": 23, "recal": 23, "f1": 23, "y_true": [23, 26], "y_pred": [23, 26], "00": [23, 29, 34, 36], "67": 23, "macro": 23, "avg": 23, "framework": 23, "care": [23, 34], "tupl": 23, "seed": [23, 27, 41], "sampler": 23, "tpesampl": 23, "trial": 23, "42": 23, "studi": 23, "create_studi": 23, "n_trial": 
23, "reason": 23, "doubt": 23, "closer": 23, "\ud835\udc0f\ud835\udc2b\ud835\udc28\ud835\udc1b\ud835\udc1a\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "\ud835\udc16\ud835\udc2b\ud835\udc28\ud835\udc27\ud835\udc20\ud835\udc0f\ud835\udc2b\ud835\udc1e\ud835\udc1d\ud835\udc22\ud835\udc1c\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "cannot": 23, "\ud835\udc03\ud835\udc22\ud835\udc2c\ud835\udc1a\ud835\udc20\ud835\udc2b\ud835\udc1e\ud835\udc1e\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "disagre": 23, "\ud835\udc11\ud835\udc1e\ud835\udc25\ud835\udc1a\ud835\udc2d\ud835\udc22\ud835\udc2f\ud835\udc1e\ud835\udc03\ud835\udc22\ud835\udc1f\ud835\udc1f\ud835\udc1e\ud835\udc2b\ud835\udc1e\ud835\udc27\ud835\udc1c\ud835\udc1e\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "rel": [23, 25], "doubtensembl": 23, "probareason": 23, "wrongpredictionreason": 23, "linear_model": [23, 26], "logisticregress": 23, "return_x_i": 23, "proba": 23, "wrong_pr": 23, "instanc": [23, 34], "predic": 23, "get_pred": 23, "stare": 23, "screen": [23, 34], "knockknock": 23, "notif": 23, "channel": 23, "slack": 23, "telegram": 23, "discord": 23, "ms": 23, "stick": 23, "email_send": 23, "recipient_email": 23, "coolmail": 23, "2coolmail": 23, "sender_email": 23, "anothercoolmail": 23, "train_model": 23, "torch": 23, "mymodel": 23, "nn": 23, "batch_siz": 23, "input_s": [23, 26], "depth": 23, "idx": 23, "param": 23, "conv2d": 23, "batchnorm2d": 23, "relu": 23, "maxpool2d": 23, "148": 23, "970": 23, "174": 23, "trainabl": 23, "mult": 23, "mb": [23, 25, 30], "05": 23, "forward": 23, "backward": 23, "06": 23, "honest": 23, "fastest": 23, "intelex": 23, "favourit": [23, 36], "vector": [23, 30], "regressor": 23, "lasso": 23, "dbscan": 23, "sklearnex": 23, "patch_sklearn": 23, "svr": 23, "make_regress": 23, "100000": 23, "nois": [23, 36], 
"\ud835\udc17\ud835\udc06\ud835\udc01\ud835\udc28\ud835\udc28\ud835\udc2c\ud835\udc2d": 23, "\ud835\udc05\ud835\udc1e\ud835\udc1a\ud835\udc2d\ud835\udc2e\ud835\udc2b\ud835\udc1e": 23, "\ud835\udc08\ud835\udc27\ud835\udc2d\ud835\udc1e\ud835\udc2b\ud835\udc1a\ud835\udc1c\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 23, "\ud835\udc02\ud835\udc28\ud835\udc27\ud835\udc2c\ud835\udc2d\ud835\udc2b\ud835\udc1a\ud835\udc22\ud835\udc27\ud835\udc2d\ud835\udc2c": 23, "feature_0": 23, "similarli": 23, "feature_5": 23, "feature_9": 23, "mind": 23, "regulatori": 23, "industri": 23, "compani": 23, "xgb": 23, "dmatrix": 23, "reg": 23, "squarederror": 23, "eval_metr": 23, "rmse": 23, "interaction_constraint": 23, "model_with_constraint": 23, "hear": 23, "develop": [23, 30], "remov": [23, 25, 41], "pain": [23, 37], "choos": 23, "lightgbm": [23, 26], "task": 23, "tradit": 23, "focus": 23, "overal": 23, "piec": [23, 34, 41], "food": 23, "staff": 23, "rude": 23, "neg": 23, "That": [23, 30, 36], "toward": 23, "batteri": 23, "camera": 23, "opinion": 23, "feel": 23, "feedback": 23, "review": 23, "media": [23, 25], "monitor": 23, "27": 23, "atepccheckpointmanag": 23, "get_aspect_extractor": 23, "checkpoint": 23, "multilingu": 23, "auto_devic": 23, "were": 23, "stuff": 23, "unfriendli": 23, "extract_aspect": 23, "inference_sourc": 23, "pred_senti": 23, "implement": [23, 26, 30], "xgbrfregressor": 23, "xgbrf": 23, "rand": [23, 27], "deep": [23, 30], "Near": 23, "duplic": 23, "blurri": 23, "odd": 23, "irregularli": 23, "dark": 23, "light": 23, "lack": 23, "crazi": 23, "wget": 23, "nc": 23, "public": 23, "s3": 23, "amazonaw": 23, "image_fil": 23, "zip": 23, "unzip": [23, 37], "q": [23, 25, 34], "imagelab": 23, "own": 23, "dataset_path": 23, "data_path": 23, "find_issu": 23, "preval": 23, "issue_summari": 23, "issue_typ": 23, "decreas": 23, "shouldn": 23, 
"\ud835\udc00\ud835\udc25\ud835\udc29\ud835\udc21\ud835\udc1a\ud835\udc12\ud835\udc1e\ud835\udc25\ud835\udc1e\ud835\udc1c\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 23, "curv": 23, "respond": 23, "lassocv": 23, "load_concret": 23, "alphaselect": 23, "cross": 23, "linspac": 23, "tensorflow_decision_forest": 23, "gbdt": 23, "tfdf": 23, "get_fil": 23, "adult": 23, "yggdrasil": 23, "yggdrasil_decision_forest": 23, "test_data": 23, "dataset_df": 23, "test_indic": 23, "len": [23, 24], "test_ds_pd": 23, "train_ds_pd": 23, "train_d": 23, "pd_dataframe_to_tf_dataset": 23, "incom": 23, "test_d": 23, "gradientboostedtreesmodel": 23, "multimod": 23, "covari": 23, "shift": 23, "quickstart": 23, "tabulardataset": 23, "tabularpredictor": 23, "train_data": 23, "inc": 23, "time_limit": 23, "240": 23, "leaderboard": 23, "maxpooling2d": 23, "64": 23, "pool_siz": 23, "layered_view": 23, "legend": 23, "to_fil": 23, "stratifiedkfold": 23, "fold": [23, 26], "repres": 23, "strata": 23, "case": [23, 26, 41], "stratyf": 23, "multilabelstratifiedkfold": 23, "iterstrat": 23, "ml_stratifi": 23, "mskf": 23, "n_split": [23, 26], "random_st": 23, "train_index": 23, "test_index": 23, "split": [23, 26], "nobodi": 23, "therefor": [23, 34], "crucial": 23, "point": [23, 34], "overcom": 23, "hurdl": 23, "lime": 23, "shap": 23, "category_encod": 23, "ordinalencod": 23, "lgbmregressor": [23, 26], "extratreesregressor": 23, "data_load": 23, "house_df": 23, "house_dict": 23, "house_pric": 23, "y_df": [23, 26], "salepric": 23, "to_fram": 23, "x_df": 23, "categorical_featur": 23, "col": [23, 32, 36], "dtype": [23, 30], "return_df": 23, "xtrain": 23, "xtest": 23, "ytrain": 23, "ytest": 23, "train_siz": 23, "75": [23, 25], "smartexplain": 23, "xpl": 23, "features_dict": 23, "y_target": 23, "run_app": 23, "title_stori": 23, "hous": 23, "price": 23, "8020": 23, "Not": 23, "huge": [23, 30], "solut": 23, "suit": 23, "detail": [23, 34, 41], "calcul": [23, 24, 32, 36], "bunch": 23, "drift": 23, "weak": 23, 
"segment": 23, "full_suit": 23, "iris_df": 23, "data_format": 23, "as_train_test": 23, "label_col": 23, "df_train": 23, "df_test": 23, "rf_clf": 23, "axi": [23, 41], "ds_train": 23, "cat_featur": 23, "ds_test": 23, "train_dataset": 23, "test_dataset": 23, "Its": 23, "plot_rank": 23, "individu": 23, "hover": 23, "dive": 23, "deeper": 23, "analys": 23, "criterion": 23, "gini": 23, "max_depth": 23, "suggest_int": 23, "mdpth": 23, "log": [23, 32, 34], "min_samples_split": 23, "mspl": 23, "min_samples_leaf": 23, "mlf": [23, 26], "min_weight_fraction_leaf": 23, "suggest_float": 23, "mwfr": 23, "max_featur": 23, "mft": 23, "max_leaf_nod": 23, "mnod": 23, "min_impurity_decreas": 23, "mid": 23, "maxim": [23, 24], "get_param_import": 23, "params_sort": 23, "kaggl": 23, "involv": [23, 34], "anomali": 23, "cluster": [23, 26], "categori": [23, 25], "cluster_comb": 23, "clustererensembl": 23, "kmean": 23, "n_cluster": 23, "minibatchkmean": 23, "agglomerativeclust": 23, "aligned_label": 23, "aligned_labels_": 23, "predicted_label": 23, "labels_": [23, 24], "varianc": [23, 25], "residualplot": 23, "exhibit": 23, "along": 23, "horizont": 23, "typic": 23, "suitabl": [23, 36], "wherea": 23, "dispers": 23, "residualsplot": 23, "multi": [23, 26], "hardwar": 23, "hyperopt": 23, "train_breast_canc": 23, "load_breast_canc": 23, "train_x": 23, "test_x": 23, "train_i": 23, "test_i": 23, "test_siz": [23, 26], "train_set": 23, "test_set": 23, "eval": 23, "evals_result": 23, "verbose_ev": 23, "mean_accuraci": 23, "binari": [23, 37], "logist": 23, "logloss": 23, "min_child_weight": 23, "subsampl": 23, "uniform": 23, "tuner": 23, "tune_config": 23, "tuneconfig": 23, "num_sampl": 23, "param_spac": 23, "get_best_result": 23, "mode": 23, "dl": 23, "why": [23, 24], "level": [23, 26, 36], "compat": 23, "neural": 23, "neuralnetclassifi": 23, "pipelin": [23, 37], "standardscal": 23, "mymodul": 23, "__init__": [23, 34, 41], "self": [23, 34], "num_unit": 23, "nonlin": 23, "dim": [23, 26], "kwarg": 23, 
"dropout": 23, "max_epoch": 23, "lr": 23, "iterator_train__shuffl": 23, "y_proba": 23, "predict_proba": 23, "fly": 23, "massiv": 23, "continu": 23, "updat": [23, 34, 37], "full": 23, "knn": [23, 24], "phish": 23, "predict_on": 23, "learn_on": 23, "mobilenet": 23, "swin": 23, "convnext": 23, "densenet": 23, "pretrain": 23, "list_model": 23, "densenet121": 23, "randn": 23, "224": 23, "uncertainti": 23, "mapieregressor": 23, "linearregress": [23, 26], "59": [23, 36], "mapie_regressor": 23, "y_pi": 23, "unsupervis": 24, "natur": 24, "suffer": 24, "pyod": 24, "densiti": 24, "averag": 24, "vote": 24, "detector": 24, "inlin": 24, "majority_vot": 24, "highest": 24, "sampl": [24, 26], "abod": 24, "iforest": 24, "generate_data": 24, "train_onli": 24, "n_model": 24, "zero": [24, 25], "gpl": 25, "cleantext": 25, "talk": 25, "send": [25, 34], "testmail": 25, "outlook": 25, "71112392": 25, "visit": 25, "testurl": 25, "free": 25, "u2018": 25, "u2019": 25, "minut": [25, 36], "fix_unicod": 25, "unicod": 25, "to_ascii": 25, "transliter": 25, "closest": 25, "ascii": 25, "lowercas": 25, "no_url": 25, "replac": [25, 30, 41], "special": [25, 34], "no_email": 25, "no_phone_numb": 25, "no_numb": 25, "no_digit": 25, "no_currency_symbol": 25, "currenc": 25, "symbol": 25, "no_punct": 25, "punctuat": 25, "german": 25, "pandas_dq": 25, "focuss": 25, "skew": 25, "dq_report": 25, "fix_dq": 25, "fdq": 25, "data_transform": 25, "fit_transform": 25, "whole": 25, "decim": [25, 36], "percentag": [25, 41], "note": [25, 34], "avail": [25, 34, 41], "spaci": 25, "text_1": 25, "twenti": 25, "five": 25, "dollar": 25, "text_2": 25, "hundr": 25, "fourti": 25, "three": 25, "thousand": 25, "four": 25, "text_3": 25, "nine": 25, "quarter": 25, "num_1": 25, "num_2": 25, "num_3": 25, "243421": 25, "integ": [25, 34, 36, 41], "fraction": 25, "big": [25, 34], "byte": 25, "naturals": 25, "1024000": 25, "equival": 25, "intword": 25, "123500000": 25, "million": 25, "dt": [25, 36], "naturaldelta": 25, "timedelta": 25, 
"1200": 25, "long": [25, 41], "eleg": [25, 36], "num_pipelin": 25, "knnimput": 25, "cat_pipelin": 25, "most_frequ": 25, "conveni": [25, 29, 30], "make_column_selector": 25, "regex": 25, "afterward": 25, "Will": [25, 34], "columns_with_featur": 25, "num_column": 25, "dtype_includ": 25, "tackl": 25, "dure": 25, "suffici": 25, "meaning": 25, "rarelabelencod": 25, "feature_engin": 25, "threshold": 25, "red": [25, 29], "green": [25, 29], "yellow": 25, "violet": 25, "rare_encod": 25, "tol": 25, "n_categori": 25, "df_encod": 25, "regularli": 26, "effect": 26, "period": 26, "check_season": 26, "infer": [26, 29], "air": 26, "passeng": 26, "monthli": 26, "frequenc": 26, "airpassengersdataset": 26, "ts": 26, "airpassangersdataset": 26, "is_season": 26, "partit": 26, "rest": 26, "both": [26, 34], "overfit": 26, "scikit": 26, "past": [26, 36], "cross_valid": 26, "gradientboostingregressor": 26, "ts_cv": 26, "cv": 26, "neg_mean_squared_error": 26, "gapleavepout": 26, "gapkfold": 26, "gaprollforward": 26, "min_train_s": 26, "gap_siz": 26, "max_test_s": 26, "nixtla": 26, "remot": 26, "rai": 26, "exogen": 26, "probabilist": 26, "lgb": 26, "lag": 26, "freq": 26, "predict": [26, 32], "exist": [26, 34], "pmdarima": 26, "autoarima": 26, "airpassengersdf": 26, "sf": 26, "season_length": 26, "h": [26, 36], "95": 26, "lazi": [26, 36], "backtest": 26, "splitter": 26, "llm": 26, "agent": 26, "pl": [26, 32], "mase": 26, "1mo": 26, "24": 26, "fh": 26, "beat": 26, "nbeat": 26, "nhit": 26, "y_train_df": 26, "ds": [26, 32], "1959": 26, "31": 26, "y_test_df": 26, "horizon": 26, "max_step": 26, "nf": 26, "y_hat_df": 26, "reset_index": 26, "tempor": 26, "feed": 26, "xgboost": 26, "singl": [26, 36], "multivari": 26, "flat": 26, "tp": 26, "sale": 26, "from_csv": 26, "sales_per_stor": 26, "add_index": 26, "store": [26, 34], "tick_calendar": 26, "work_dai": 26, "calendar_day_of_week": 26, "daily_revenu": 26, "revenu": [26, 29], "moving_sum": 26, "durat": 26, "off": 26, "approxim": 26, "matplotlib": 
[26, 29, 41], "rpt": 26, "signal": 26, "sigma": 26, "n_breakpoint": 26, "bkp": 26, "pw_constant": 26, "noise_std": 26, "algo": 26, "pelt": 26, "rbf": 26, "pen": 26, "construct": 27, "global": 27, "affect": [27, 34], "reset": 27, "undesir": 27, "unreproduc": 27, "across": 27, "reli": [27, 41], "subtl": 27, "rng": 27, "1234": 27, "sometim": [29, 41], "boolean": 29, "cython": 29, "under": [29, 41], "hood": 29, "filtered_df": 29, "might": 29, "tell": [29, 41], "datetimeindex": 29, "time_index": 29, "date_rang": 29, "2020": 29, "applymap": 29, "sales_data": 29, "5000": 29, "15000": 29, "sales_df": 29, "val": 29, "els": 29, "set_opt": 29, "2343129": 29, "8956701": 29, "224289": 29, "blindli": 30, "row": 30, "wise": 30, "obviou": 30, "\ud835\udc12\ud835\udc30\ud835\udc22\ud835\udc1f\ud835\udc2d\ud835\udc1e\ud835\udc2b": 30, "parallel": 30, "dask": 30, "swifter": 30, "capabl": 30, "input_valu": 30, "output_valu": 30, "lambda": 30, "drastic": 30, "effici": [30, 34], "diet": 30, "optimize_dtyp": 30, "report_on_datafram": 30, "proposed_df": 30, "new_df": 30, "origin": 30, "memory_usag": 30, "sum": 30, "1024": 30, "props": 30, "constraint": 30, "pa": 30, "schema": 30, "dataframeschema": 30, "element_wis": 30, "alic": 30, "bob": 30, "charli": 30, "alreadi": [30, 32], "think": 30, "mayb": 30, "gain": [30, 32], "rewrit": 32, "reimplement": 32, "levenshtein": 32, "roc": 32, "r2": 32, "l1": 32, "huber": 32, "polars_d": 32, "group_bi": 32, "dummy_group": 32, "agg": 32, "actual": [32, 34], "num_ext": 32, "l2_loss": 32, "alia": 32, "l2": 32, "bce": 32, "binary_metrics_combo": 32, "combo": 32, "unnest": 32, "underscor": 34, "1_000_000": 34, "consecut": 34, "big_numb": 34, "1_000_000_000_000": 34, "behav": 34, "made": 34, "happi": 34, "mood": 34, "diari": 34, "hl": 34, "gl": 34, "urlpars": 34, "parse_q": 34, "unequ": 34, "length": 34, "shortest": 34, "itertool": 34, "zip_longest": 34, "pad": 34, "shorter": 34, "lose": 34, "aa": 34, "bb": 34, "reusabl": 34, "letter": 34, "num": [34, 36], 
"citi": [34, 36], "code_1": 34, "lh1234": 34, "bln": 34, "code_2": 34, "lh7672": 34, "muc": 34, "\ud835\udc26\ud835\udc1a\ud835\udc2d\ud835\udc2b\ud835\udc22\ud835\udc31": 34, "\ud835\udc26\ud835\udc2e\ud835\udc25\ud835\udc2d\ud835\udc22\ud835\udc29\ud835\udc25\ud835\udc22\ud835\udc1c\ud835\udc1a\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 34, "matmul": 34, "nest": [34, 36], "techniqu": [34, 41], "block": 34, "earli": 34, "invalid": 34, "edg": [34, 41], "calculate_pric": 34, "price_per_unit": 34, "collect": 34, "secret": 34, "getpass": 34, "getus": 34, "overrid": 34, "__call__": 34, "example_inst": 34, "paragraph": 34, "lorem": 34, "ipsum": 34, "dolor": 34, "sit": 34, "amet": 34, "consectetur": 34, "adipisc": 34, "elit": 34, "nec": 34, "tellu": 34, "vita": 34, "turpi": 34, "tempu": 34, "porttitor": 34, "fusc": 34, "cursu": 34, "nisi": 34, "eu": 34, "urna": 34, "pharetra": 34, "congu": 34, "ex": [34, 37], "aliquet": 34, "quisqu": 34, "consequat": 34, "nulla": 34, "bibendum": 34, "risu": 34, "wrapped_text": 34, "lru_cach": 34, "maxsiz": 34, "128": 34, "fibonacci": 34, "onc": 34, "myclass": 34, "expensive_oper": 34, "expens": 34, "my_object": 34, "noth": 34, "fruit": 34, "orang": 34, "pear": 34, "banana": 34, "largest": 34, "\ud835\udc21\ud835\udc1e\ud835\udc1a\ud835\udc29\ud835\udc2a": 34, "satisfi": 34, "greater": 34, "equal": 34, "min": [34, 36], "children": 34, "heapq": 34, "nlargest": 34, "nsmallest": 34, "__\ud835\udc2c\ud835\udc2d\ud835\udc2b__": 34, "__\ud835\udc2b\ud835\udc1e\ud835\udc29\ud835\udc2b__": 34, "represent": 34, "intend": 34, "human": [34, 36], "unambigu": 34, "todai": 34, "repr": 34, "07": 34, "02": [34, 36, 41], "771969": 34, "unlik": 34, "unpack": 34, "dict_1": 34, "dict_2": 34, "re": 34, "match_exampl": 34, "assign": 34, "part": [34, 41], "kiwi": 34, "fruit_count": 34, "haven": 34, "been": 34, "yet": 34, "append": 34, "merced": 34, "anim": 34, "regular": 34, "p": 34, "mistak": 34, "among": 34, "insid": 34, "danger": 34, "increment_numb": 
34, "dynam": 34, "attribut": 34, "__\ud835\udc2c\ud835\udc25\ud835\udc28\ud835\udc2d\ud835\udc2c__": 34, "space": 34, "prevent": 34, "runtim": 34, "z": 34, "whatev": 34, "sport": 34, "basketbal": 34, "volleybal": 34, "tenni": 34, "handbal": 34, "stack": 34, "multiprocess": 36, "processor": 36, "process_imag": 36, "path1": 36, "path2": 36, "n_job": 36, "difficulti": 36, "friendli": 36, "timezon": 36, "daylight": 36, "to_iso8601_str": 36, "08t13": 36, "798316": 36, "now_in_london": 36, "europ": 36, "08t12": 36, "799317": 36, "subtract": 36, "diff_for_human": 36, "ago": 36, "delta": 36, "week": 36, "in_word": 36, "51": 36, "pretti": 36, "logger": 36, "debug": 36, "pseudo": 36, "determinist": [36, 41], "atmospher": 36, "rnd": 36, "sequenc": 36, "groupbi": 36, "Of": 36, "cours": 36, "\ud835\udc29\ud835\udc32\ud835\udc2d\ud835\udc21\ud835\udc28\ud835\udc27": 36, "\ud835\udc1b\ud835\udc1e\ud835\udc27\ud835\udc1e\ud835\udc1d\ud835\udc22\ud835\udc1c\ud835\udc2d": 36, "unstructur": 36, "my_dict": 36, "person": 36, "street": 36, "st": [36, 39, 41], "york": 36, "usa": 36, "chromedriv": 37, "driver": 37, "somehow": 37, "browser": 37, "straightforward": 37, "energi": 37, "ci": 37, "cd": 37, "chrome": 37, "webdriver_manag": 37, "chromedrivermanag": 37, "executable_path": 37, "your_vers": 37, "monei": 37, "chrome_opt": 37, "chromeopt": 37, "add_argu": 37, "blink": 37, "imagesen": 37, "frame": 39, "compon": 39, "pandas_profil": 39, "streamlit_pandas_profil": 39, "st_profile_report": 39, "profile_report": 39, "numprocess": 41, "random": 41, "addit": 41, "flag": 41, "cover": 41, "\ud835\udc1c\ud835\udc28\ud835\udc2f": 41, "src": 41, "90": 41, "stmt": 41, "module1": 41, "257": 41, "13": 41, "94": 41, "module2": 41, "359": 41, "97": 41, "nowadai": 41, "everyth": 41, "baselin": 41, "dif": 41, "mark": 41, "mpl_image_compar": 41, "testfil": 41, "test_plotting_lin": 41, "instafail": 41, "failur": 41, "chatti": 41, "tldr": 41, "smarter": 41, "uphold": 41, "uncov": 41, "unexpect": 41, "bug": 
41, "encourag": 41, "test_addition_commut": 41, "assert": 41, "essenti": 41, "softwar": 41, "isol": 41, "independ": 41, "cheap": 41, "fake": 41, "mimic": 41, "permiss": 41, "disk": 41, "unixf": 41, "staticmethod": 41, "filenam": 41, "test_unix_f": 41, "mocker": 41, "patch": 41, "assert_called_once_with": 41, "freeze_tim": 41, "2015": 41}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"delight": 0, "data": [0, 10, 18, 19, 21, 23, 25, 26, 32, 36], "scienc": [0, 32], "why": 0, "thi": 0, "book": 0, "exist": 0, "small": 0, "snippet": 0, "big": 0, "upgrad": 0, "miscellan": [1, 2], "must": 1, "have": 1, "vscode": 1, "extens": [1, 23], "python": [1, 4, 5, 10, 14, 34, 35, 36, 42], "project": [1, 8], "setup": 1, "from": [1, 10, 14, 21, 34], "templat": [1, 14], "cookiecutt": 1, "scaffold": 1, "smol": 1, "develop": 1, "well": 1, "commit": 1, "commitizen": 1, "autom": 3, "bash": 3, "command": 3, "makefil": 3, "test": [3, 4, 20, 41, 42], "nox": 3, "ci": 4, "cd": 4, "github": 4, "action": 4, "workflow": 4, "local": 4, "act": 4, "cach": [4, 10, 34], "depend": [4, 10, 41], "code": [5, 6, 10, 14, 19], "style": [5, 29], "remov": [5, 10, 14], "unus": 5, "line": [5, 30], "autoflak": 5, "ensur": 5, "document": [5, 12, 13], "interrog": 5, "sort": [5, 10], "your": [5, 7, 8, 10, 12, 14, 16, 20, 23, 25, 29, 34, 36, 37, 41], "import": [5, 20], "automat": [5, 10, 14, 26], "isort": 5, "format": [5, 29], "black": 5, "lint": 5, "yaml": 5, "file": [5, 10, 21], "yamllint": 5, "blazingli": 5, "fast": [5, 26], "ruff": 5, "correct": 5, "misspel": 5, "codebas": 5, "codespel": 5, "qualiti": [6, 14, 25], "memori": [7, 30], "optim": [7, 23, 34], "identifi": [7, 14, 23], "bottleneck": [7, 14], "regard": 7, "memory_profil": 7, "secur": 8, "detect": [8, 24, 25, 26], "common": 8, "issu": [8, 25], "bandit": 8, "vulner": 8, "environ": [8, 10], "store": [8, 21], "credenti": 8, "safe": 8, "keyr": 8, "type": [9, 34], "enforc": 9, "typeguard": 9, "static": 9, "check": [9, 10, 20, 26], "mypi": 9, 
"faster": 9, "pyright": 9, "cool": [10, 11], "tool": [10, 11, 14], "work": [10, 36], "countri": 10, "currenc": 10, "subdivis": 10, "more": [10, 21, 26, 34], "gener": [10, 12, 14, 23, 36], "better": [10, 34], "requir": 10, "pipreq": 10, "packag": 10, "its": [10, 25], "pip": 10, "autoremov": 10, "get": [10, 20, 21, 23, 29, 34, 41], "distanc": 10, "between": [10, 34], "postal": 10, "unit": 10, "pint": 10, "supercharg": 10, "profil": [10, 39], "scalen": 10, "fix": [10, 25], "unicod": 10, "error": [10, 41], "ftfy": 10, "background": 10, "imag": [10, 18, 23, 37], "rembg": 10, "build": 10, "modern": 10, "cli": 10, "app": [10, 21], "typer": 10, "realist": 10, "fake": 10, "faker": 10, "enrich": 10, "progress": 10, "bar": 10, "rich": 10, "set": [10, 20, 23, 29, 34], "descript": 10, "tqdm": 10, "convert": [10, 25], "emoji": 10, "text": [10, 21, 25, 34], "emot": 10, "print": [10, 34], "hardwar": 10, "inform": 10, "version": 10, "number": [10, 25, 34, 36], "request": 10, "unifi": 10, "messi": 10, "column": [10, 25], "unifynam": 10, "broken": 10, "link": 10, "websit": 10, "matplotlib": [10, 19], "termin": 10, "displai": [10, 14, 19, 29], "tree": 10, "latex": [10, 14], "acronym": 10, "make": [10, 25, 34], "ascii": 10, "art": 10, "ner": 10, "spaci": 10, "creat": [10, 14], "tikz": 10, "pictur": 10, "human": [10, 25], "readabl": [10, 29, 34], "regex": 10, "pregex": 10, "perform": [10, 23, 30], "ocr": 10, "easyocr": 10, "diagram": 10, "power": [10, 19, 21, 23, 36], "retri": 10, "function": [10, 16, 32, 34], "tenac": 10, "graph": 10, "analysi": [10, 23], "igraph": 10, "speedtest": 10, "via": 10, "minimalist": 10, "databas": 10, "tinydb": 10, "calcul": [10, 20], "metric": 10, "radon": 10, "altern": 10, "manag": [10, 37], "configur": 10, "dotenv": 10, "notion": 10, "auto": 12, "api": [12, 23], "jupyt": [14, 15], "notebook": [14, 15], "tip": [14, 15, 27, 28, 29, 31, 32, 35, 37, 38, 39, 40], "trick": [14, 15, 27, 28, 29, 31, 32, 35, 37, 38, 39, 40], "line_profil": 14, "render": 14, 
"live": 14, "loss": [14, 16], "deep": [14, 26], "learn": [14, 22, 23, 25, 26], "model": [14, 23], "express": 14, "scikit": [14, 23, 25], "pipelin": [14, 25], "html": 14, "autoreload": 14, "modul": [14, 41], "appli": [14, 30], "reus": 14, "juptyer": 14, "output": [14, 41], "cell": 14, "nbstripout": 14, "bring": 14, "llm": [14, 16, 17], "Into": 14, "ai": 14, "compress": 16, "prompt": 16, "With": [16, 30], "No": [16, 19], "llmlingua": 16, "One": [16, 30], "call": 16, "ani": 16, "litellm": 16, "safeguard": 16, "llmguard": 16, "augment": 18, "albument": 18, "eda": 19, "analyz": 19, "visual": [19, 23], "interact": [19, 23], "d": 19, "tale": 19, "us": [19, 23, 34], "dark": 19, "mode": 19, "pandasgui": 19, "miss": 19, "valu": [19, 34], "missingno": 19, "correl": 19, "phik": 19, "x": 19, "axi": 19, "time": [19, 26, 29], "seri": [19, 26, 29], "plot": [19, 23, 29, 41], "correctli": 19, "autofmt_xd": 19, "beauti": 19, "map": 19, "plotli": 19, "mosaic": 19, "featur": [20, 23, 25, 26], "select": [20, 23, 25], "varianc": 20, "inflat": 20, "factor": 20, "vif": 20, "new": 20, "categori": 20, "deepcheck": [20, 23], "permut": 20, "eli5": 20, "find": [20, 23], "most": 20, "predict": [20, 23], "variabl": [20, 34], "target": 20, "scale": 20, "mrmr": 20, "scrape": [21, 37], "twitter": 21, "youtub": 21, "snscrape": 21, "googl": 21, "plai": 21, "review": 21, "read": 21, "csv": 21, "without": 21, "problem": 21, "clevercsv": 21, "web": 21, "gather": 21, "trafilatura": 21, "machin": [22, 26], "train": 23, "comput": 23, "class": [23, 34], "weight": 23, "reset": 23, "tensorflow": 23, "kera": 23, "global": 23, "state": 23, "dirti": 23, "label": [23, 25], "cleanlab": 23, "evalu": 23, "classifi": 23, "sklearn": 23, "s": [23, 41], "classification_report": 23, "obtain": 23, "reproduc": [23, 27], "result": 23, "optuna": 23, "bad": 23, "doubtlab": 23, "notifi": 23, "when": 23, "finish": 23, "summari": 23, "pytorch": 23, "torchinfo": 23, "boost": [23, 30], "intel": 23, "incorport": 23, "domain": 23, 
"knowledg": 23, "xgboost": 23, "constraint": 23, "automl": 23, "flaml": 23, "aspect": 23, "base": [23, 41], "seniment": 23, "pyabsa": 23, "random": [23, 27, 36], "forest": 23, "problemat": 23, "cleanvis": 23, "regular": 23, "paramet": [23, 34], "decis": 23, "autogluon": 23, "visualkera": 23, "multilabel": 23, "stratifi": 23, "kfold": 23, "iter": [23, 34], "stratif": 23, "interpret": 23, "shapash": 23, "valid": [23, 26, 30], "high": 23, "ensembl": [23, 24], "combo": 23, "residu": 23, "yellowbrick": 23, "distribut": 23, "hyperparamet": 23, "rai": 23, "tune": 23, "skorch": 23, "onlin": 23, "ml": 23, "river": 23, "sota": 23, "vision": 23, "timm": 23, "guarante": 23, "interv": 23, "mapi": 23, "outlier": 24, "preprocess": [25, 26], "clean": 25, "natur": 25, "languag": 25, "numer": 25, "represent": 25, "date": 25, "friendli": 25, "cleaner": 25, "definit": 25, "easili": [25, 36], "rare": 25, "encod": 25, "engin": [25, 26], "season": 26, "dart": 26, "cross": 26, "timeseriessplit": 26, "tscv": 26, "forecast": 26, "mlforecast": 26, "lightn": 26, "statsforecast": 26, "polar": [26, 32, 33], "backend": [26, 29], "functim": 26, "neuralforecast": 26, "effici": 26, "temporian": 26, "chang": [26, 29], "point": 26, "ruptur": 26, "numpi": [27, 28], "achiev": 27, "np": 27, "randomst": 27, "panda": [29, 30, 31, 39], "filter": 29, "frequenc": 29, "pd": 29, "infer_freq": 29, "datafram": [29, 30], "precis": 29, "float": 29, "util": [30, 36], "librari": [30, 34], "speed": [30, 36, 37], "up": [30, 36, 37], "reduc": 30, "dtype_diet": 30, "pandera": 30, "modin": 30, "plugin": 32, "pure": 34, "built": 34, "queri": 34, "urllib": 34, "pars": 34, "zip": 34, "longest": 34, "improv": 34, "name": 34, "slice": 34, "wai": 34, "matrix": 34, "multipl": 34, "guard": 34, "claus": 34, "If": 34, "statement": 34, "hide": 34, "password": 34, "input": 34, "user": 34, "turn": 34, "callabl": 34, "wrap": 34, "textwrap": 34, "add": 34, "lru": 34, "method": 34, "functool": 34, "cached_properti": 34, "For": [34, 36, 
41], "els": 34, "loop": [34, 36], "heap": 34, "differ": 34, "__str__": 34, "__repr__": 34, "neat": 34, "merg": 34, "dictionari": [34, 36], "switch": 34, "case": 34, "walru": 34, "oper": 34, "count": 34, "occurr": 34, "an": 34, "counter": 34, "default": 34, "defaultdict": 34, "structur": [34, 36], "tupl": 34, "namedtupl": 34, "mutabl": 34, "argument": 34, "object": 34, "__slots__": 34, "modifi": 34, "3": 34, "12": 34, "joblib": 36, "parallel": [36, 41], "datetim": [36, 41], "pendulum": 36, "prettifi": 36, "pprint": 36, "easi": 36, "log": 36, "loguru": 36, "truli": 36, "benedict": 36, "selenium": [37, 38], "webdriv": 37, "disabl": 37, "load": 37, "streamlit": [39, 40], "emb": 39, "pytest": 41, "steroid": 41, "xdist": 41, "shuffl": 41, "order": 41, "randomli": 41, "coverag": 41, "cov": 41, "mpl": 41, "instantli": 41, "show": 41, "suit": 41, "limit": 41, "minimum": 41, "properti": 41, "hypothesi": 41, "mock": 41, "freez": 41, "freezegun": 41}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinxcontrib.bibtex": 9, "sphinx": 56}})
\ No newline at end of file
+Search.setIndex({"docnames": ["README", "book/Miscellaneous/Chapter", "book/Miscellaneous/index", "book/codequality/automation", "book/codequality/cicd", "book/codequality/codestyle", "book/codequality/index", "book/codequality/memory", "book/codequality/security", "book/codequality/typing", "book/cooltools/Chapter", "book/cooltools/index", "book/documentation/Chapter", "book/documentation/index", "book/jupyternotebook/Chapter", "book/jupyternotebook/index", "book/llm/Chapter", "book/llm/index", "book/machinelearning/dataaugmentation", "book/machinelearning/eda", "book/machinelearning/featureselection", "book/machinelearning/getdata", "book/machinelearning/index", "book/machinelearning/modeltraining", "book/machinelearning/outlierdetection", "book/machinelearning/preprocessing", "book/machinelearning/timeseries", "book/numpy/Chapter", "book/numpy/index", "book/pandas/Chapter", "book/pandas/additionallibs", "book/pandas/index", "book/polars/Chapter", "book/polars/index", "book/pythontricks/Chapter", "book/pythontricks/index", "book/pythontricks/utility", "book/selenium/Chapter", "book/selenium/index", "book/streamlit/Chapter", "book/streamlit/index", "book/testing/Chapter", "book/testing/index"], "filenames": ["README.md", "book/Miscellaneous/Chapter.ipynb", "book/Miscellaneous/index.ipynb", "book/codequality/automation.ipynb", "book/codequality/cicd.ipynb", "book/codequality/codestyle.ipynb", "book/codequality/index.ipynb", "book/codequality/memory.ipynb", "book/codequality/security.ipynb", "book/codequality/typing.ipynb", "book/cooltools/Chapter.ipynb", "book/cooltools/index.ipynb", "book/documentation/Chapter.ipynb", "book/documentation/index.ipynb", "book/jupyternotebook/Chapter.ipynb", "book/jupyternotebook/index.ipynb", "book/llm/Chapter.ipynb", "book/llm/index.ipynb", "book/machinelearning/dataaugmentation.ipynb", "book/machinelearning/eda.ipynb", "book/machinelearning/featureselection.ipynb", "book/machinelearning/getdata.ipynb", 
"book/machinelearning/index.ipynb", "book/machinelearning/modeltraining.ipynb", "book/machinelearning/outlierdetection.ipynb", "book/machinelearning/preprocessing.ipynb", "book/machinelearning/timeseries.ipynb", "book/numpy/Chapter.ipynb", "book/numpy/index.ipynb", "book/pandas/Chapter.ipynb", "book/pandas/additionallibs.ipynb", "book/pandas/index.ipynb", "book/polars/Chapter.ipynb", "book/polars/index.ipynb", "book/pythontricks/Chapter.ipynb", "book/pythontricks/index.ipynb", "book/pythontricks/utility.ipynb", "book/selenium/Chapter.ipynb", "book/selenium/index.ipynb", "book/streamlit/Chapter.ipynb", "book/streamlit/index.ipynb", "book/testing/Chapter.ipynb", "book/testing/index.ipynb"], "titles": ["Delightful Data Science", "<span class=\"section-number\">14.1. </span>Miscellaneous", "<span class=\"section-number\">14. </span>Miscellaneous", "<span class=\"section-number\">1.1. </span>Automation", "<span class=\"section-number\">1.2. </span>CI/CD", "<span class=\"section-number\">1.3. </span>Code Style", "<span class=\"section-number\">1. </span>Code Quality", "<span class=\"section-number\">1.4. </span>Memory Optimization", "<span class=\"section-number\">1.5. </span>Security in Projects", "<span class=\"section-number\">1.6. </span>Typing", "<span class=\"section-number\">2.1. </span>Cool Tools", "<span class=\"section-number\">2. </span>Cool Tools", "<span class=\"section-number\">4.1. </span>Documentation", "<span class=\"section-number\">4. </span>Documentation", "<span class=\"section-number\">3.1. </span>Jupyter Notebook Tips and Tricks", "<span class=\"section-number\">3. </span>Jupyter Notebook Tricks and Tips", "<span class=\"section-number\">6.1. </span>LLM", "<span class=\"section-number\">6. </span>LLM", "<span class=\"section-number\">5.1. </span>Data Augmentation", "<span class=\"section-number\">5.2. </span>EDA", "<span class=\"section-number\">5.3. </span>Feature Selection", "<span class=\"section-number\">5.4. 
</span>Get Data", "<span class=\"section-number\">5. </span>Machine Learning", "<span class=\"section-number\">5.5. </span>Model Training", "<span class=\"section-number\">5.6. </span>Outlier Detection", "<span class=\"section-number\">5.8. </span>Preprocessing", "<span class=\"section-number\">5.7. </span>Time Series", "<span class=\"section-number\">7.1. </span>NumPy Tips and Tricks", "<span class=\"section-number\">7. </span>NumPy Tips and Tricks", "<span class=\"section-number\">8.1. </span>Pandas Tips and Tricks", "<span class=\"section-number\">8.2. </span>Utility Libraries for Pandas", "<span class=\"section-number\">8. </span>Pandas Tricks and Tips", "<span class=\"section-number\">9.1. </span>Polars Tips &amp; Tricks", "<span class=\"section-number\">9. </span>Polars", "<span class=\"section-number\">10.1. </span>Pure Python + Built-in libraries", "<span class=\"section-number\">10. </span>Python Tips and Tricks", "<span class=\"section-number\">10.2. </span>Utilities for Python", "<span class=\"section-number\">11.1. </span>Selenium Tips and Tricks", "<span class=\"section-number\">11. </span>Selenium Tips and Tricks", "<span class=\"section-number\">12.1. </span>Streamlit Tips and Tricks", "<span class=\"section-number\">12. </span>Streamlit Tips and Tricks", "<span class=\"section-number\">13.1. </span>Testing", "<span class=\"section-number\">13. 
</span>Testing in Python"], "terms": {"It": [0, 1, 4, 5, 8, 9, 10, 14, 16, 19, 20, 21, 23, 24, 25, 26, 27, 29, 30, 34, 36, 37, 41], "wa": [0, 1, 10, 23, 26, 34, 41], "decemb": [0, 21], "2022": [0, 8, 21], "when": [0, 1, 4, 5, 9, 10, 14, 16, 20, 25, 29, 34, 36, 37, 41], "i": [0, 7, 10, 16, 20, 23, 24, 34, 36, 41], "start": [0, 1, 8, 29, 34], "write": [0, 1, 5, 9, 10, 14, 19, 29, 36], "daili": 0, "linkedin": [0, 21], "post": 0, "share": [0, 34], "one": [0, 5, 10, 14, 19, 23, 25, 27, 29, 30, 34, 36, 37, 39], "short": [0, 25], "python": [0, 3, 7, 8, 9, 12, 16, 18, 19, 20, 21, 23, 24, 25, 26, 37, 41], "tip": 0, "per": [0, 14, 23, 25], "dai": [0, 26, 36], "my": [0, 25], "main": [0, 4, 8, 10, 23, 36], "goal": 0, "what": [0, 1, 9, 10, 21, 23, 29, 34, 36, 39, 41], "learnt": 0, "over": [0, 10, 18, 23, 26], "year": [0, 19], "am": 0, "current": [0, 5, 10, 23], "learn": [0, 10, 20], "other": [0, 5, 8, 10, 19, 21, 23, 27, 29, 34, 41], "thought": 0, "s": [0, 1, 4, 8, 9, 10, 12, 14, 19, 20, 21, 26, 27, 29, 30, 34, 36, 37], "us": [0, 1, 3, 4, 5, 7, 8, 9, 10, 14, 16, 18, 20, 21, 24, 25, 26, 27, 29, 30, 36, 37, 39, 41], "me": [0, 25], "probabl": [0, 4, 10, 23, 34, 37], "peopl": 0, "too": [0, 4, 10, 19, 21, 23, 26, 29, 34, 36], "As": 0, "time": [0, 1, 4, 5, 9, 10, 14, 23, 30, 36, 37, 41], "went": 0, "more": [0, 1, 5, 8, 9, 16, 19, 20, 23, 24, 25, 29, 36], "found": [0, 8, 10, 34], "soon": 0, "realiz": 0, "could": [0, 20, 21, 27], "compil": [0, 14, 23], "comprehens": 0, "guid": 0, "anyon": 0, "interest": [0, 41], "becom": 0, "better": [0, 23, 30], "scientist": [0, 32], "thu": [0, 21, 23], "idea": 0, "born": 0, "The": [0, 8, 10, 19, 20, 21, 23, 25, 34, 37, 41], "contain": [0, 10, 14, 23], "all": [0, 5, 10, 14, 16, 19, 20, 23, 25, 27, 30, 32, 34, 36, 41], "author": 0, "well": [0, 5, 10, 23], "mani": [0, 1, 10, 23, 34, 41], "come": [0, 8, 10, 21, 23, 26, 34, 36, 41], "futur": [0, 23, 26], "call": [0, 8, 10, 25, 34, 41], "becaus": [0, 5, 10, 23, 26, 29], "aim": [0, 10, 23], "make": [0, 1, 
4, 5, 7, 9, 14, 16, 19, 20, 23, 30, 36, 37, 41], "your": [0, 1, 3, 4, 9, 18, 19, 21, 26, 27, 30, 32, 39], "journei": 0, "help": [0, 1, 9, 10, 14, 16, 19, 23, 41], "you": [0, 1, 3, 4, 5, 7, 8, 9, 10, 12, 14, 16, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 32, 34, 36, 37, 39, 41], "By": [0, 23, 29, 30, 37, 41], "incorpor": [0, 23], "trick": [0, 34], "workflow": [0, 23], "can": [0, 1, 3, 4, 5, 7, 8, 9, 10, 14, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 34, 36, 37, 39, 41], "project": [0, 3, 10, 12, 21, 27, 37, 41], "enjoy": 0, "success": 0, "add": [1, 9, 10, 14, 16, 23, 30], "8": [1, 3, 8, 19, 20, 23, 34, 36, 41], "work": [1, 8, 9, 14, 16, 18, 19, 20, 23, 26, 29, 34], "boost": [1, 18, 26], "product": [1, 9, 23, 29], "\ud835\udc0f\ud835\udc32\ud835\udc2d\ud835\udc21\ud835\udc28\ud835\udc27": 1, "\ud835\udc08\ud835\udc27\ud835\udc1d\ud835\udc1e\ud835\udc27\ud835\udc2d": 1, "sure": [1, 5, 9, 14, 41], "indent": [1, 34], "correct": [1, 10, 26], "everi": [1, 4, 8, 10, 14, 20, 21, 23, 24], "enter": [1, 34], "\ud835\udc0f\ud835\udc32\ud835\udc25\ud835\udc1a\ud835\udc27\ud835\udc1c\ud835\udc1e": 1, "A": [1, 3, 10, 12, 14, 18, 19, 20, 21, 23, 29, 34, 36, 41], "brainer": 1, "includ": [1, 8, 10, 19, 23, 24, 25, 26, 34, 36], "benefit": 1, "like": [1, 5, 8, 10, 14, 16, 19, 20, 21, 23, 24, 25, 26, 29, 32, 34, 37, 41], "paramet": [1, 36], "suggest": [1, 8], "code": [1, 3, 8, 9, 23, 29, 34, 39, 41], "navig": 1, "signatur": 1, "microsoft": [1, 16, 23], "declar": 1, "default": [1, 10, 23, 29, 30, 37, 41], "languag": [1, 10, 16, 21, 36], "server": [1, 14], "\ud835\udc06\ud835\udc22\ud835\udc2d\ud835\udc0b\ud835\udc1e\ud835\udc27\ud835\udc2c": 1, "provid": [1, 5, 8, 10, 14, 16, 19, 21, 23, 25, 26, 30, 34, 36, 41], "power": [1, 18, 20, 24, 26], "featur": [1, 10, 34], "git": [1, 14], "experi": 1, "see": [1, 3, 7, 9, 10, 14, 19, 20, 21, 23, 29, 34, 36, 37, 41], "specif": [1, 10, 14, 23, 34, 37], "line": [1, 3, 7, 8, 10, 14, 19, 23, 26, 29, 34, 39], "whom": 1, "which": [1, 7, 8, 9, 10, 20, 23, 26, 
27, 29, 34, 41], "pull": [1, 4], "request": [1, 5, 8, 36], "messag": [1, 10, 16, 36], "And": [1, 10, 16, 18, 19, 23, 29], "much": [1, 16, 23, 36], "\ud835\udc09\ud835\udc2e\ud835\udc29\ud835\udc32\ud835\udc2d\ud835\udc1e\ud835\udc2b": 1, "notebook": 1, "support": [1, 4, 5, 10, 16, 19, 20, 21, 23, 24, 25, 26, 34], "allow": [1, 4, 10, 19, 23, 34, 41], "ani": [1, 8, 10, 23, 34, 41], "environ": [1, 3, 16], "jupyt": [1, 10], "kernel": 1, "\ud835\udc00\ud835\udc11\ud835\udc04\ud835\udc0f\ud835\udc0b": 1, "\ud835\udc1f\ud835\udc28\ud835\udc2b": 1, "automat": [1, 8, 19, 20, 23, 25, 30, 37, 41], "evalu": [1, 5, 26], "real": [1, 14, 21, 41], "type": [1, 5, 10, 19, 20, 23, 26, 30], "displai": [1, 26, 36], "variabl": [1, 5, 9, 10, 19, 23, 25, 26], "error": [1, 5, 9, 21, 23, 25, 34, 36], "readabl": [1, 25], "wai": [1, 3, 10, 14, 23, 25, 29, 30, 36, 37, 41], "onli": [1, 5, 9, 10, 14, 16, 19, 20, 23, 25, 26, 29, 30, 34, 36, 37], "3": [1, 3, 4, 7, 8, 9, 10, 14, 16, 19, 20, 21, 23, 24, 26, 27, 29, 37, 41], "7": [1, 3, 7, 8, 14, 19, 20, 23, 24, 29, 34, 41], "\ud835\udc0f\ud835\udc1a\ud835\udc2d\ud835\udc21": 1, "gener": [1, 26, 27, 34, 39, 41], "intern": [1, 10], "import": [1, 3, 7, 8, 9, 10, 14, 16, 18, 19, 21, 23, 24, 25, 26, 27, 29, 30, 32, 34, 36, 37, 39, 41], "statement": [1, 5, 16, 30, 41], "\ud835\udc13\ud835\udc1e\ud835\udc2c\ud835\udc2d": 1, "\ud835\udc04\ud835\udc31\ud835\udc29\ud835\udc25\ud835\udc28\ud835\udc2b\ud835\udc1e\ud835\udc2b": 1, "show": [1, 10, 19, 20, 23, 26, 29], "test": [1, 5, 8, 10, 14, 16, 23, 26, 32], "explor": 1, "without": [1, 9, 10, 12, 19, 23, 34, 41], "effort": [1, 21], "instead": [1, 4, 5, 9, 10, 20, 25, 26, 30, 34, 37, 41], "go": [1, 9, 10, 37], "through": [1, 8, 9, 10, 23, 37], "output": [1, 10, 16, 20, 21, 23, 24, 25, 34, 36], "termin": [1, 34], "\ud835\udc1a\ud835\udc2e\ud835\udc2d\ud835\udc28\ud835\udc03\ud835\udc28\ud835\udc1c\ud835\udc2c\ud835\udc2d\ud835\udc2b\ud835\udc22\ud835\udc27\ud835\udc20": 1, "quickli": [1, 14, 23], "docstr": [1, 
5], "function": [1, 5, 7, 8, 9, 14, 19, 21, 23, 25, 26, 29, 30, 36, 41], "ar": [1, 4, 5, 10, 14, 16, 18, 20, 23, 24, 26, 27, 29, 34, 36, 37, 41], "new": [1, 4, 10, 14, 16, 23, 25, 34, 36, 37], "data": [1, 8, 14, 20, 24, 27, 29, 30, 34, 39], "scienc": [1, 27], "hassl": [1, 10], "set": [1, 3, 8, 14, 16, 19, 25, 26, 27, 36, 37, 41], "up": [1, 3, 5, 10, 16, 23, 26, 34, 41], "structur": [1, 14], "try": [1, 5, 7, 8, 9, 10, 12, 14, 16, 19, 20, 21, 23, 24, 25, 26, 29, 30, 36, 41], "command": [1, 8, 10, 14, 21, 34], "tool": [1, 3, 5, 8, 20, 23, 34], "creat": [1, 3, 8, 12, 16, 19, 23, 34, 36, 41], "thi": [1, 3, 5, 8, 10, 19, 20, 23, 25, 26, 27, 29, 30, 34, 36, 37, 41], "save": [1, 10, 16, 21, 30, 34, 36, 37, 41], "standard": [1, 3, 10, 21, 26, 34, 36], "There": [1, 10, 23], "ton": 1, "github": [1, 21], "sai": [1, 5, 10, 14, 29, 34], "goodby": [1, 5], "tediou": 1, "link": [1, 9, 23], "repositori": [1, 10], "http": [1, 4, 8, 10, 21, 23, 25, 34, 36, 37], "com": [1, 4, 10, 16, 21, 23, 25, 34, 37], "drivendata": 1, "do": [1, 3, 5, 8, 9, 10, 14, 16, 19, 20, 21, 23, 25, 26, 29, 30, 34, 36, 37, 39, 41], "want": [1, 3, 5, 7, 8, 9, 10, 12, 14, 16, 18, 19, 20, 21, 23, 25, 26, 30, 34, 36, 37, 39, 41], "someth": [1, 10, 34], "react": 1, "app": [1, 5, 23, 34, 39], "anyth": [1, 4], "ai": [1, 10, 23], "an": [1, 8, 9, 10, 14, 16, 19, 20, 23, 24, 25, 36, 41], "entir": 1, "codebas": [1, 10, 30], "base": [1, 10, 19, 20, 24, 25, 29, 30, 34, 36], "markdown": [1, 5], "file": [1, 3, 4, 8, 14, 25, 29, 41], "describ": [1, 10, 26, 34], "kind": 1, "applic": [1, 8, 10, 16, 19, 23], "necessari": [1, 4], "boilerpl": 1, "clear": [1, 23], "But": [1, 5, 8, 9, 10, 20, 23, 24, 26, 29, 34, 36, 37, 39, 41], "alwai": [1, 5, 20, 23], "easi": [1, 10, 14, 18, 21, 23, 24, 37], "team": [1, 23], "With": [1, 3, 4, 5, 10, 14, 19, 20, 23, 27, 34, 36, 39, 41], "get": [1, 5, 8, 9, 14, 30, 36, 37], "releas": [1, 23, 37], "manag": [1, 23], "design": 1, "defin": [1, 3, 4, 9, 10, 18, 19, 20, 23, 24, 29, 30, 34, 37, 41], "rule": 
1, "bump": 1, "version": [1, 3, 4, 8, 9, 25, 37], "changelog": 1, "life": [1, 23], "easier": [1, 5, 26, 34], "enforc": [1, 5, 30], "descript": 1, "struggl": [3, 10], "rememb": [3, 10], "exact": [3, 23, 26], "seri": [3, 20, 23, 30], "need": [3, 4, 5, 8, 9, 10, 12, 14, 16, 20, 21, 23, 24, 29, 30, 34], "build": [3, 4, 23, 25], "packag": [3, 8, 16, 21, 23, 26, 27, 30, 41], "Or": [3, 10], "manual": [3, 5, 10, 14, 19, 34, 36, 37], "run": [3, 4, 5, 7, 8, 9, 10, 12, 20, 23, 26, 41], "instal": [3, 4, 5, 7, 8, 9, 10, 12, 14, 16, 18, 19, 20, 21, 23, 24, 25, 26, 30, 32, 36, 37, 39, 41], "depend": [3, 19], "rescu": 3, "have": [3, 5, 10, 14, 20, 23, 24, 25, 26, 29, 30, 32, 34, 36, 37, 41], "execut": [3, 14, 34, 41], "those": [3, 10, 34, 37], "below": [3, 4, 7, 8, 9, 10, 14, 19, 20, 21, 23, 24, 26, 29, 30, 34, 36, 37, 41], "how": [3, 5, 7, 9, 10, 14, 16, 19, 20, 21, 23, 25, 26, 29, 34, 36, 41], "we": [3, 8, 10, 14, 16, 20, 21, 23, 24, 34, 41], "our": [3, 16, 34], "format": [3, 10, 16, 19, 21, 25, 34, 36], "black": [3, 14, 25], "name": [3, 4, 8, 9, 10, 16, 20, 21, 23, 25, 29, 30, 36, 41], "echo": [3, 10, 34], "requir": [3, 4, 41], "pip": [3, 4, 5, 7, 8, 9, 12, 14, 16, 18, 19, 20, 21, 23, 24, 25, 26, 30, 32, 36, 37, 39, 41], "r": [3, 4, 8, 10, 20], "txt": [3, 4, 10], "quiet": 3, "pytest": 3, "against": [3, 8, 16, 20, 23], "multipl": [3, 10, 19, 20, 23, 24, 26], "hard": [3, 10, 24], "step": [3, 4, 14, 19, 23, 27], "local": [3, 10], "custom": [3, 5, 10, 23], "session": [3, 10, 23], "script": [3, 7, 10, 23], "exampl": [3, 5, 8, 10, 21, 23, 24, 26, 30, 34, 36, 37, 41], "where": [3, 10, 20, 23, 24, 34, 39, 41], "\ud835\udc2d\ud835\udc1e\ud835\udc2c\ud835\udc2d\ud835\udc2c": 3, "\ud835\udc27\ud835\udc28\ud835\udc31\ud835\udc1f\ud835\udc22\ud835\udc25\ud835\udc1e": 3, "\ud835\udc29\ud835\udc32": 3, "moreov": 3, "anoth": [3, 27], "\ud835\udc25\ud835\udc22\ud835\udc27\ud835\udc2d": 3, "flake8": [3, 5, 14], "highli": [3, 20, 25], "customiz": 3, "so": [3, 4, 9, 10, 14, 20, 23, 24, 34, 36, 37, 
41], "check": [3, 5, 8, 16, 23, 30, 34, 37, 41], "out": [3, 5, 10, 14, 16, 19, 23, 26], "document": [3, 10, 34, 41], "noxfil": 3, "py": [3, 4, 5, 7, 8, 9, 10, 12, 14, 41], "6": [3, 7, 10, 14, 19, 20, 23, 29, 34, 36, 41], "9": [3, 4, 7, 16, 19, 20, 23, 25, 29, 34], "def": [3, 5, 7, 9, 10, 14, 23, 24, 29, 30, 34, 36, 41], "lint": 3, "don": [4, 5, 10, 14, 23, 26, 30, 32, 34, 36, 37, 41], "t": [4, 5, 10, 14, 21, 23, 24, 26, 30, 32, 34, 36, 37, 41], "wast": [4, 5, 37], "commit": [4, 14], "push": [4, 14, 34], "chang": [4, 14, 20, 23, 30, 34, 37], "docker": 4, "imag": [4, 36, 41], "machin": [4, 20, 23], "curl": 4, "raw": [4, 10, 23], "githubusercont": [4, 23], "nekto": 4, "master": 4, "sh": 4, "sudo": 4, "bash": 4, "whenev": [4, 29], "trigger": 4, "again": [4, 10, 20, 23, 30, 32, 41], "even": [4, 5, 9, 10, 25, 26, 30], "didn": 4, "small": [4, 10, 14, 16, 23, 29, 30, 34], "snippet": [4, 5, 14], "skip": [4, 8], "next": [4, 21, 34, 36], "branch": 4, "job": [4, 5, 10], "ubuntu": 4, "latest": [4, 37], "checkout": 4, "v4": 4, "setup": 4, "poetri": [4, 10], "pipenv": 4, "unit": [4, 14, 30, 41], "python3": 4, "u": [4, 14], "m": [4, 7, 10, 19, 23, 26], "unittest": 4, "If": [5, 10, 12, 14, 19, 23, 25, 30, 32, 36, 41], "problemat": 5, "difficult": [5, 12, 20, 29], "read": [5, 10, 29], "reduc": [5, 14, 16, 24, 41], "perform": [5, 16, 19, 20, 26, 34, 36, 41], "interpret": [5, 20, 29, 34], "ha": [5, 8, 10, 20, 26, 29, 32, 34], "spend": 5, "less": [5, 26, 29, 34], "unnecessari": [5, 30], "potenti": [5, 8], "issu": [5, 10, 23, 26, 29], "aris": 5, "conflict": [5, 10], "clean": [5, 10, 14, 34, 41], "optim": [5, 10, 14, 20, 29], "also": [5, 8, 10, 16, 21, 23, 24, 26, 30, 34, 36, 37, 41], "fine": 5, "tune": 5, "process": [5, 8, 14, 20], "place": 5, "One": [5, 10, 14, 23, 34, 36], "aspect": 5, "qualiti": [5, 23, 30], "maintain": [5, 10], "In": [5, 8, 10, 14, 20, 21, 23, 26, 29, 30, 34, 41], "about": [5, 20, 23, 34], "method": [5, 10, 19, 20, 23, 24, 26], "class": [5, 10, 24, 25, 26, 36, 41], 
"print": [5, 8, 9, 14, 20, 21, 23, 25, 26, 27, 30, 36], "coverag": [5, 23], "report": [5, 8, 19, 23, 39, 41], "poorli": 5, "v": [5, 41], "bigger": [5, 23, 29], "look": [5, 10, 14, 18, 19, 23, 25, 41], "nasti": [5, 10], "order": 5, "them": [5, 8, 10, 14, 20, 23, 25, 29, 34, 36, 41], "librari": [5, 8, 10, 12, 18, 19, 20, 21, 23, 24, 25, 26, 36, 39], "alphabet": [5, 10], "separ": 5, "section": [5, 23], "cli": [5, 8, 21], "avoid": [5, 9, 23, 29], "focu": [5, 23], "high": [5, 8, 10, 20], "hand": 5, "tire": [5, 10, 36], "thei": [5, 8, 9, 10, 16, 20, 25, 29, 34, 36, 41], "form": [5, 10], "sinc": [5, 8, 21, 23, 25, 26, 34, 41], "popular": [5, 23, 29, 32, 39], "choic": [5, 23, 30], "config": [5, 10, 14, 23], "nice": [5, 10, 14, 21, 41], "catch": [5, 9], "befor": [5, 9, 23, 26], "caus": [5, 9, 23, 25], "problem": [5, 9, 10, 16, 19, 20, 23, 25, 36], "still": [5, 9, 10, 14, 19, 23], "pylint": 5, "10x": 5, "100x": 5, "faster": [5, 23, 26], "linter": 5, "written": [5, 9, 10], "rust": 5, "magnitud": 5, "than": [5, 8, 9, 16, 23, 24, 26, 29, 34, 36], "while": [5, 10, 19, 23, 34, 37], "integr": [5, 9, 23, 37], "some_fil": 5, "json": [5, 10, 19, 21], "divid": 5, "b": [5, 7, 10, 14, 19, 20, 29, 34, 36, 41], "result": [5, 8, 10, 14, 19, 20, 21, 24, 25, 26, 27, 30, 34, 36, 41], "except": [5, 10, 20], "zerodivisionerror": 5, "e": [5, 10, 19, 23, 36], "infin": 5, "return": [5, 7, 9, 14, 16, 21, 23, 24, 26, 29, 30, 34, 36, 41], "appli": [5, 18, 23, 29], "blacken": 5, "doc": [5, 10], "latex": 5, "restructuredtext": 5, "unformat": 5, "anymor": [5, 10, 27, 36], "md": 5, "typo": 5, "word": [5, 10, 19, 25], "sourc": [5, 10, 14, 19, 23], "touch": [5, 10], "nich": 5, "term": [5, 23], "fals": [5, 8, 10, 14, 23, 24, 34, 37], "posit": [5, 19, 23], "directori": [5, 14, 41], "most": [7, 10, 23, 29, 30, 41], "amount": [7, 9, 14], "modul": [7, 8, 12, 21, 23, 27, 36], "analysi": 7, "consumpt": [7, 23], "within": [7, 10, 14, 39], "decor": [7, 9, 10, 23, 34], "profil": [7, 8, 14], "pass": [7, 9, 10, 23], 
"option": [7, 10, 23, 29, 30, 37, 41], "load": [7, 10, 14, 23, 26], "from": [7, 9, 16, 19, 20, 23, 24, 25, 26, 30, 36, 37, 39, 41], "my_func": 7, "1": [7, 8, 10, 14, 16, 19, 20, 21, 23, 24, 25, 26, 29, 34, 36, 41], "10": [7, 8, 10, 14, 19, 20, 23, 25, 26, 29, 34, 36], "2": [7, 8, 10, 14, 19, 20, 21, 23, 25, 26, 29, 34, 36, 41], "del": 7, "mem": 7, "usag": [7, 16, 30], "increment": 7, "occurr": 7, "content": [7, 14, 16, 23, 25], "41": 7, "mib": 7, "4": [7, 8, 10, 14, 16, 19, 20, 23, 26, 29, 34, 37, 41], "5": [7, 8, 10, 14, 16, 19, 20, 21, 23, 25, 26, 29, 34, 41], "49": [7, 23], "102": 7, "rang": [7, 10, 14, 19, 20, 23, 24, 25, 26, 34, 36], "100": [7, 9, 10, 12, 16, 23, 30, 41], "194": 7, "145": 7, "0": [7, 8, 10, 14, 16, 19, 20, 23, 24, 25, 30, 34, 41], "22": [7, 26], "20": [7, 19, 20, 23, 25, 29, 41], "find": [8, 9, 26], "known": 8, "abstract": 8, "syntax": [8, 10, 36], "tree": [8, 20, 23, 34], "plugin": [8, 41], "produc": [8, 41], "ignor": [8, 14, 23, 34], "verifi": 8, "ssl": 8, "certif": 8, "\ud835\udc2f\ud835\udc1e\ud835\udc2b\ud835\udc22\ud835\udc1f\ud835\udc32": 8, "\ud835\udc05\ud835\udc1a\ud835\udc25\ud835\udc2c\ud835\udc1e": 8, "immedi": [8, 29, 34, 41], "identifi": [8, 10, 20, 26], "bandit_test": 8, "www": [8, 10, 36, 37], "googl": [8, 23, 34], "de": [8, 10, 21, 25, 34], "info": [8, 36], "none": [8, 34], "exclud": 8, "node_visitor": 8, "warn": [8, 10, 36], "unabl": 8, "qualifi": 8, "12": [8, 14, 20, 21, 23, 26], "23": [8, 36], "15": [8, 19, 20, 23], "32": [8, 23], "44": [8, 36], "650893": 8, "b501": 8, "request_with_no_cert_valid": 8, "disabl": 8, "sever": [8, 23], "confid": [8, 23], "cwe": 8, "295": 8, "mitr": 8, "org": [8, 10, 36], "definit": 8, "html": 8, "locat": [8, 19, 23], "readthedoc": 8, "io": 8, "en": [8, 10, 21, 25], "b501_request_with_no_cert_valid": 8, "status_cod": 8, "scan": 8, "total": [8, 10, 14, 23, 41], "nosec": 8, "metric": [8, 14, 23, 26, 32], "undefin": 8, "low": [8, 23], "medium": 8, "audit": 8, "advisori": 8, "databas": [8, 16, 41], 
"should": [8, 10, 34, 36, 41], "upgrad": [8, 41], "id": [8, 10, 21, 34], "fix": [8, 23, 34], "flask": [8, 10], "pysec": 8, "2019": 8, "179": 8, "2018": 8, "66": 8, "setuptool": 8, "56": [8, 23], "ghsa": 8, "r9hx": 8, "vwmv": 8, "q579": 8, "65": 8, "almost": 8, "password": 8, "api": [8, 10, 16, 21, 24, 36, 41], "kei": [8, 10, 16, 19, 23, 27, 34], "never": [8, 23, 25, 26], "plain": [8, 10, 36], "text": [8, 14, 23, 29, 36], "would": [8, 16, 23, 26, 34], "trivial": 8, "access": [8, 36], "anybodi": 8, "who": 8, "To": [8, 10, 19, 20, 23, 24, 29, 34, 37, 41], "wrapper": [8, 21, 41], "around": [8, 41], "system": [8, 16, 23, 41], "maco": 8, "keychain": 8, "window": 8, "locker": 8, "etc": [8, 10, 19, 21, 23], "safer": 8, "retriev": [8, 21, 34], "easili": [8, 9, 10, 18, 19, 21, 23, 34], "field": [8, 34], "done": [8, 23, 34], "set_password": 8, "mydb": 8, "usernam": [8, 34], "get_password": 8, "hint": 9, "expect": [9, 16, 41], "wrong": 9, "awai": 9, "rais": [9, 10], "thing": [9, 12, 23, 41], "typecheck": 9, "say_hello": 9, "str": [9, 10, 34], "f": [9, 10, 14, 19, 30, 34, 36], "hello": [9, 10, 14, 16, 34], "checker": [9, 20], "analyz": [9, 10, 23, 26], "ensur": [9, 10, 16, 26, 34], "align": 9, "reliabl": 9, "bank": 9, "deposit": 9, "int": [9, 10, 30], "balanc": [9, 23], "withdraw": 9, "1000": [9, 20, 26, 29, 36], "wish": 9, "fast": [9, 10, 18, 23, 29, 30, 34, 41], "match": [9, 10, 34], "typescript": 9, "commun": [9, 32], "extra": [9, 34], "3x": [9, 16, 30], "5x": [9, 30], "og": 9, "whether": 9, "pleas": [9, 29], "consid": [9, 23, 24, 41], "know": [10, 20, 21, 23, 29, 34], "headach": 10, "pycountri": 10, "iso": 10, "alpha_2": 10, "alpha_3": 10, "eur": 10, "freez": 10, "veri": [10, 20, 23, 41], "good": [10, 23], "virtual": 10, "encount": [10, 16], "follow": [10, 12, 14, 20, 37], "desir": 10, "unus": 10, "realli": [10, 25, 29, 41], "y": [10, 14, 19, 20, 23, 26, 34, 41], "two": [10, 14, 20, 23, 25, 34], "pgeocod": 10, "just": [10, 14, 19, 23, 29, 30, 34], "specifi": [10, 19, 23, 
25, 29, 34, 36, 41], "km": 10, "dist": 10, "geodist": 10, "query_postal_cod": 10, "10117": 10, "80331": 10, "ever": 10, "convers": 10, "manipul": [10, 36], "handl": [10, 20, 21, 23, 25, 26, 34, 36], "physic": 10, "quantiti": [10, 34], "arithmet": 10, "keep": 10, "track": [10, 14], "accur": [10, 26], "initi": [10, 23], "registri": 10, "ureg": 10, "unitregistri": 10, "33": 10, "kilomet": 10, "feet": 10, "108267": 10, "71653543308": 10, "foot": 10, "oper": [10, 29, 30], "speed": [10, 23, 26, 41], "hour": [10, 26, 30, 36], "198": 10, "steroid": [10, 23, 36], "cpu": [10, 41], "gpu": [10, 23], "memori": [10, 23, 29, 34, 36], "bottleneck": 10, "propos": 10, "web": [10, 19, 25, 37], "gui": [10, 23], "my_modul": [10, 14], "repair": 10, "scrambl": 10, "occur": [10, 20], "encod": [10, 23], "decod": 10, "foreign": 10, "appear": 10, "correctli": [10, 41], "fix_text": 10, "doe": [10, 16, 25], "\u00e2": 10, "\u0153ftfy\u00e2": 10, "x9d": 10, "mean": [10, 14, 20, 23, 36], "\u00e2\u0153": 10, "mona": 10, "lisa": 10, "doesn\u00e3\u0192\u00e2": 10, "\u00e3": 10, "\u0161\u00e2": 10, "\u017e\u00e2": 10, "eyebrow": 10, "pre": [10, 23, 36, 41], "train": [10, 14, 16, 20, 24, 25, 26], "model": [10, 16, 18, 20, 24, 25, 26], "cv2": [10, 18], "input_path": 10, "car": [10, 34], "jpg": [10, 18, 36], "output_path": 10, "car2": 10, "input_fil": 10, "imread": [10, 18], "output_fil": 10, "imwrit": 10, "clunki": 10, "intuit": [10, 23, 25, 36], "auto": [10, 26], "ditch": [10, 32], "argpars": 10, "hello_script": 10, "bye": 10, "__name__": [10, 36], "__main__": [10, 36], "john": [10, 16, 36], "annoi": [10, 37, 41], "few": [10, 19], "divers": [10, 41], "address": [10, 16, 23, 25, 36], "phone": [10, 16, 25], "email": [10, 16, 23, 25], "fr_fr": 10, "phone_numb": 10, "color": [10, 25, 29, 36], "offer": [10, 19, 23, 24, 26, 34, 36], "beauti": [10, 14], "bore": 10, "url": [10, 21, 25, 34, 36], "25000000": 10, "\ud835\udc2d\ud835\udc2a\ud835\udc1d\ud835\udc26": 10, "set_descript": 10, "glob": 10, 
"sample_data": 10, "csv": [10, 19, 23, 26, 29], "emoticon": 10, "give": [10, 23, 26, 30, 36], "insight": 10, "especi": [10, 29, 34, 37, 41], "sentiment": [10, 23], "emot_obj": 10, "core": 10, "love": 10, "watermark": 10, "same": [10, 14, 19, 34, 41], "endpoint": 10, "second": [10, 23, 25, 36], "delai": [10, 36], "take": [10, 16, 23, 34, 36, 41], "60": [10, 23], "httpbin": 10, "requests_cach": 10, "cachedsess": 10, "test_cach": 10, "string": [10, 19, 29, 30, 32, 34], "fuzzi": 10, "differ": [10, 18, 19, 21, 23, 26, 37], "variat": 10, "panda": [10, 19, 20, 21, 23, 25, 26, 32, 36], "pd": [10, 19, 20, 23, 25, 26, 30, 39], "util": [10, 14, 23, 24, 26], "unify_nam": 10, "deduplicate_list_str": 10, "read_csv": [10, 19, 23, 30, 39], "bairro": 10, "imovel": 10, "value_count": 10, "threshold_count": 10, "500": [10, 21, 23], "\ud835\udc25\ud835\udc22\ud835\udc27\ud835\udc24\ud835\udc1c\ud835\udc21\ud835\udc1e\ud835\udc1c\ud835\udc24\ud835\udc1e\ud835\udc2b": 10, "recurs": 10, "mai": [10, 20, 25], "harm": [10, 16, 20], "search": [10, 21, 36], "engin": [10, 23], "rank": [10, 20, 23], "linkcheck": 10, "bashplotlib": 10, "littl": 10, "basic": 10, "quick": [10, 14], "visual": [10, 14], "histogram": 10, "scatter": 10, "plot": [10, 14], "hist": 10, "stop": [10, 14, 34], "resolv": 10, "pipdeptre": 10, "possibl": [10, 23], "wrote": 10, "acrosort": 10, "tex": 10, "fun": 10, "sundai": 10, "publish": 10, "\ud835\udc82\ud835\udc84\ud835\udc93\ud835\udc90": 10, "\ud835\udc82\ud835\udc83\ud835\udc83\ud835\udc93\ud835\udc86\ud835\udc97\ud835\udc8a\ud835\udc82\ud835\udc95\ud835\udc8a\ud835\udc90\ud835\udc8f": 10, "\ud835\udc94\ud835\udc89\ud835\udc90\ud835\udc93\ud835\udc95\ud835\udc87\ud835\udc90\ud835\udc93\ud835\udc8e": 10, "\ud835\udc8d\ud835\udc90\ud835\udc8f\ud835\udc88\ud835\udc87\ud835\udc90\ud835\udc93\ud835\udc8e": 10, "begin": [10, 34], "lnkd": 10, "etf8qs5w": 10, "acrosort_tex": 10, "old": [10, 23, 34, 37], "pyfiglet": 10, "banner": 10, "introduc": [10, 34], "user": [10, 14, 16, 
21], "font": 10, "ascii_art": 10, "figlet_format": 10, "world": [10, 14], "bubblehead": 10, "bulbhead": 10, "entiti": 10, "recognit": 10, "displaci": 10, "detect": [10, 16, 20, 21, 23], "super": [10, 23], "some": [10, 20, 23, 30, 34, 41], "sentenc": [10, 23], "span": 10, "chelsea": 10, "footbal": [10, 34], "club": 10, "english": 10, "profession": 10, "fulham": 10, "west": 10, "london": [10, 36], "1905": 10, "plai": [10, 34, 41], "home": 10, "game": [10, 41], "stamford": 10, "bridg": 10, "compet": 10, "premier": 10, "leagu": 10, "top": [10, 14, 23, 24], "divis": 10, "won": 10, "first": [10, 23, 34], "major": [10, 23, 24], "honour": 10, "championship": 10, "1955": 10, "nlp": 10, "en_core_web_sm": 10, "render": 10, "style": [10, 19], "ent": 10, "true": [10, 14, 19, 23, 24, 25, 30], "paper": 10, "graphic": 10, "element": [10, 30, 34], "notori": [10, 24], "No": [10, 12, 14], "worri": 10, "figur": [10, 19, 41], "tikzplotlib": 10, "insert": [10, 16], "pyplot": [10, 19, 26, 41], "plt": [10, 19, 26, 41], "numpi": [10, 14, 18, 19, 20, 23, 24, 25, 34], "np": [10, 14, 18, 19, 20, 23, 24, 25, 34], "ggplot": 10, "arang": 10, "sin": 10, "pi": 10, "s2": 10, "co": 10, "o": 10, "lw": 10, "xlabel": [10, 41], "ylabel": [10, 41], "voltag": 10, "mv": 10, "titl": [10, 19], "simpl": [10, 12, 23], "frac": 10, "alpha": [10, 23, 24], "grid": [10, 19], "mytikz": 10, "For": [10, 19, 23, 25, 27, 29], "pattern": [10, 25, 26, 34], "break": [10, 34], "down": 10, "complex": [10, 23, 25, 30, 34], "simpler": 10, "ones": [10, 23, 41], "combin": [10, 23, 24], "end": [10, 29, 34, 41], "either": [10, 30, 34], "ip": [10, 16], "digit": [10, 25], "port": [10, 23], "anylett": 10, "anydigit": 10, "anyfrom": 10, "quantifi": [10, 23], "atleastatmost": 10, "group": 10, "captur": [10, 19], "http_protocol": 10, "alphanum": 10, "domain_nam": 10, "n": [10, 26, 34], "61": [10, 20, 23], "tld": 10, "ip_octet": 10, "at_least_at_most": 10, "port_numb": 10, "sub": 10, "togeth": 10, "effortlessli": [10, 14], "extract": 
[10, 21, 23, 26, 34], "optic": 10, "charact": [10, 34], "built": [10, 26, 30, 36, 41], "pytorch": [10, 18, 26], "80": [10, 23], "latin": 10, "chines": 10, "arab": 10, "cyril": 10, "given": [10, 29, 41], "ps": 10, "recommend": [10, 23, 30], "reader": 10, "image_path": [10, 36], "english_imag": 10, "png": [10, 23], "readtext": 10, "draw": 10, "variou": [10, 19, 23, 24, 25, 26], "node": [10, 23, 34], "cloud": [10, 19], "aw": [10, 23], "azur": 10, "gcp": 10, "architectur": 10, "comput": [10, 14, 18, 34], "ec2": 10, "rd": 10, "network": [10, 21, 23], "elb": 10, "worker": 10, "direct": [10, 23], "tb": 10, "lb": 10, "worker1": 10, "worker2": 10, "worker3": 10, "worker4": 10, "worker5": 10, "event": 10, "program": [10, 29, 36], "fail": [10, 41], "let": [10, 14, 19, 23, 26, 29, 34], "instabl": [10, 24], "internet": 10, "connect": [10, 37], "uncommon": 10, "usual": [10, 23], "mechan": 10, "isn": [10, 21], "behaviour": [10, 34], "condit": [10, 29, 34], "wait": [10, 23, 41], "coroutin": 10, "after": [10, 26, 34], "attempt": 10, "stop_after_attempt": 10, "stop_after_5_attempt": 10, "OR": 10, "stop_after_delai": 10, "stop_after_10_s_or_5_retri": 10, "x": [10, 14, 20, 23, 24, 26, 30, 34, 41], "wait_fix": 10, "wait_2_": 10, "retry_if_exception_typ": 10, "ioerror": 10, "might_io_error": 10, "forev": 10, "interfac": [10, 19, 23], "open": [10, 23], "c": [10, 14, 19, 20, 29, 34, 36], "due": [10, 23, 24, 29], "larger": [10, 27, 29], "research": [10, 16], "plotli": [10, 29], "neat": [10, 36], "tutori": 10, "purpos": [10, 36], "ig": 10, "g": [10, 23, 36], "es": 10, "width": [10, 34], "fig": [10, 19, 23, 29, 41], "ax": [10, 19], "subplot": [10, 19], "target": [10, 23, 25], "layout": [10, 19], "circl": 10, "vertex_color": 10, "steelblu": 10, "vertex_label": 10, "vcount": 10, "edge_width": 10, "edge_color": 10, "666": 10, "edge_background": 10, "white": 10, "bandwidth": [10, 37], "dot": [10, 36], "net": [10, 23], "orient": 10, "pure": 10, "lightweight": [10, 23], "perfect": 10, "hobbi": 10, 
"db": 10, "path": [10, 23, 36, 37, 39, 41], "char": 10, "stai": [10, 23], "sloc": 10, "logic": 10, "lloc": 10, "estim": [10, 20, 23, 26], "cyclomat": 10, "correspond": [10, 19, 21, 25], "decis": 10, "count": [10, 21], "halstead": 10, "deriv": [10, 21], "distinct": 10, "operand": 10, "index": [10, 19, 26, 29], "measur": [10, 20, 41], "mix": 10, "abov": 10, "cc": 10, "httpx": 10, "similar": [10, 29, 32, 34, 36], "advantag": 10, "asynchron": 10, "doesn": [10, 23, 24], "lead": [10, 20, 23, 26], "improv": 10, "deal": 10, "concurr": 10, "yourself": [10, 14, 26], "put": 10, "valu": [10, 20, 23, 25, 26, 29, 36, 41], "delet": [10, 23, 41], "async": [10, 16], "asynccli": 10, "client": [10, 16], "await": 10, "pair": [10, 19, 34], "env": [10, 14], "api_kei": [10, 16], "mysupersecretapikei": 10, "domain": 10, "mydomain": 10, "load_dotenv": 10, "dotenv_valu": 10, "os": [10, 16, 37, 41], "getenv": 10, "dictionari": [10, 23], "did": [10, 23, 29, 34, 37], "interact": [10, 14, 16, 41], "sdk": 10, "item": [10, 19, 34], "page": [10, 12, 21], "notion_cli": 10, "notion_token": 10, "list": [10, 14, 20, 23, 34], "my_pag": 10, "database_id": 10, "897e5a76": 10, "ae52": 10, "4b48": 10, "9fdf": 10, "e71f5945d1af": 10, "filter": [10, 19, 21, 26], "properti": [10, 34], "landmark": 10, "rich_text": 10, "pypika": 10, "nearli": [10, 23], "tabl": 10, "histori": 10, "q": [10, 23, 25, 34], "from_": 10, "join": 10, "customer_id": 10, "select": 10, "star": 10, "get_sql": 10, "ON": 10, "pdoc": 12, "cool": [12, 23, 34], "hierarchi": 12, "configur": [12, 23], "altern": [12, 14, 23, 36], "sphinx": 12, "preprocess": [12, 14, 23], "exactli": 14, "load_ext": 14, "magic": 14, "extens": [14, 25], "lprun": 14, "my_funct": [14, 30], "10000": [14, 29], "400": 14, "1e": 14, "timer": 14, "001": 14, "0160793": 14, "ipython": 14, "input": [14, 19, 23, 29], "18": 14, "790da5f104f0": 14, "hit": [14, 26], "9999": 14, "16": [14, 19, 23], "37": 14, "46": 14, "livelossplot": 14, "ad": [14, 34], "callback": 14, 
"tensorboard": 14, "its": [14, 21, 23, 24, 29, 30, 34, 36], "progress": 14, "kera": 14, "dataset": [14, 19, 20, 23, 24, 25, 26, 29, 30], "mnist": 14, "to_categor": 14, "sequenti": [14, 23], "layer": [14, 23], "flatten": [14, 23, 36], "dens": [14, 23], "activ": [14, 23], "plotlosseskera": 14, "x_train": [14, 20, 23], "y_train": [14, 20, 23, 26], "x_test": [14, 20, 23], "y_test": [14, 20, 23, 26], "load_data": [14, 23], "reshap": 14, "28": [14, 19, 23], "astyp": 14, "float32": 14, "255": 14, "input_shap": [14, 23], "softmax": [14, 23], "rmsprop": 14, "categorical_crossentropi": 14, "accuraci": [14, 23], "plotloss": 14, "fit": [14, 20, 23, 24, 26], "epoch": 14, "validation_data": 14, "verbos": [14, 23, 25], "latexifi": 14, "math": 14, "solv": [14, 16, 19], "sqrt": 14, "diagram": 14, "switch": 14, "back": [14, 34], "sklearn": [14, 20, 24, 25, 26], "make_pipelin": [14, 25], "imput": 14, "simpleimput": [14, 25], "compos": [14, 18, 23, 25], "columntransform": 14, "onehotencod": 14, "robustscal": [14, 25], "ensembl": [14, 26], "randomforestclassifi": [14, 23], "set_config": 14, "numeric_preprocessor": 14, "imputation_mean": 14, "missing_valu": 14, "nan": 14, "strategi": [14, 41], "scale": [14, 23], "categorical_preprocessor": 14, "imputation_const": 14, "fill_valu": 14, "miss": [14, 34, 41], "constant": [14, 23], "one_hot": 14, "handle_unknown": [14, 23], "preprocessor": 14, "categor": [14, 19], "state": [14, 27], "gender": 14, "numer": 14, "ag": [14, 20, 30, 36], "weight": 14, "pipe": [14, 23, 26], "reload": 14, "reimport": 14, "my_function1": 14, "my_function2": 14, "limit": [14, 16], "widespread": 14, "isort": 14, "incompat": 14, "nbqa": 14, "er": 14, "toolchain": 14, "my_notebook": 14, "ipynb": 14, "float": [14, 25], "heavi": 14, "jupyterlab": 14, "scratch": 14, "jupytertempl": 14, "eda": [14, 23, 39], "labextens": 14, "jupyterlab_templ": 14, "enabl": 14, "jupyter_notebook_config": 14, "jupyterlabtempl": 14, "allowed_extens": 14, "template_dir": 14, "include_default": 
14, "include_core_path": 14, "larg": [14, 25, 30, 34], "strip": 14, "size": [14, 19, 23, 25], "risk": 14, "sensit": [14, 16], "genai": 14, "vendor": 14, "openai": [14, 16], "huggingfac": [14, 23], "anthrop": [14, 16], "ask": [14, 41], "provider_api_kei": 14, "your_api_key_her": 14, "jupyter_ai": 14, "chatgpt": 14, "here": [16, 34, 41], "cost": [16, 25], "often": [16, 24], "exceed": 16, "token": [16, 25], "forget": 16, "context": 16, "pai": 16, "unimport": 16, "claim": 16, "achiev": [16, 23], "20x": [16, 26], "minim": [16, 20], "tri": [16, 30], "myself": 16, "notic": [16, 23], "cautiou": 16, "critic": [16, 36], "promptcompressor": 16, "your_prompt": 16, "llm_lingua": 16, "lgaalv": 16, "gpt2": 16, "dolli": 16, "compressed_prompt": 16, "compress_prompt": 16, "instruct": 16, "question": 16, "target_token": 16, "200": [16, 30], "turn": 16, "best": [16, 20, 23, 30], "origin_token": 16, "2430": 16, "compressed_token": 16, "261": 16, "ratio": [16, 20, 23], "gpt": 16, "consist": [16, 19, 29], "stream": [16, 23], "respons": [16, 23, 36], "complet": [16, 19, 34], "openai_api_kei": 16, "anthropic_api_kei": 16, "mistral_api_kei": 16, "role": 16, "turbo": 16, "claud": 16, "instant": 16, "mistral": 16, "tini": 16, "unwant": 16, "behavior": [16, 41], "safe": 16, "between": [16, 19, 20, 21, 23], "inform": [16, 21, 34], "credit": 16, "card": 16, "number": [16, 27, 41], "sanit": 16, "toxic": 16, "inject": 16, "guard": 16, "llm_guard": 16, "scan_output": 16, "scan_prompt": 16, "input_scann": 16, "anonym": [16, 34], "promptinject": 16, "vault": 16, "openaikei": 16, "sql": [16, 19], "555": 16, "123": [16, 25, 36], "4567": 16, "192": 16, "168": 16, "8901": 16, "2345": 16, "6789": 16, "sanitized_prompt": 16, "results_valid": 16, "results_scor": 16, "chat": 16, "assist": 16, "redacted_person_1": 16, "redacted_email_address_1": 16, "redacted_phone_number_1": 16, "redacted_ip_address_1": 16, "redacted_credit_card_re_1": 16, "seamlessli": 18, "tensorflow": 18, "70": [18, 23], "transform": 
[18, 23, 34], "vision": 18, "horizontalflip": 18, "tograi": 18, "griddropout": 18, "verticalflip": 18, "channelshuffl": 18, "augmented_imag": 18, "arrai": [18, 19, 23, 34], "repetit": 19, "inspect": 19, "view": 19, "wide": [19, 25], "varieti": [19, 23], "excel": [19, 23], "bonu": 19, "export": 19, "dtale": 19, "df": [19, 20, 21, 25, 26, 29, 30, 32, 39], "datafram": [19, 20, 23, 25, 26, 32], "dict": [19, 23, 29], "fan": 19, "background": [19, 29], "appropri": [19, 20], "dark_background": 19, "pyqt": 19, "lot": [19, 34, 37], "summari": 19, "statist": [19, 20, 26, 32], "bar": 19, "chart": [19, 23], "pokemon": 19, "nulliti": 19, "understand": [19, 23, 25, 26], "column": [19, 20, 23, 30, 36], "relat": 19, "heatmap": 19, "great": [19, 37], "pick": [19, 30], "relationship": [19, 20], "your_data": 19, "\u03d5k": 19, "beween": 19, "ordin": 19, "interv": 19, "non": [19, 20, 23], "linear": [19, 20, 23], "revert": 19, "pearson": 19, "bivari": 19, "normal": [19, 34], "distribut": [19, 25], "plot_correlation_matrix": 19, "resourc": 19, "fixtur": 19, "fake_insurance_data": 19, "gz": 19, "corr_matrix": 19, "phik_matrix": 19, "x_label": 19, "y_label": 19, "vmin": 19, "vmax": 19, "color_map": 19, "blue": [19, 25], "matrix": 19, "fontsize_factor": 19, "figsiz": 19, "tight_layout": 19, "ugli": [19, 36], "overlap": 19, "unread": 19, "label": [19, 24], "adjust": [19, 23, 34], "date": [19, 21, 36, 41], "mdate": 19, "datetim": [19, 25, 34], "2023": [19, 34, 36], "25": [19, 23, 25, 30, 36], "30": [19, 23, 24, 34], "35": 19, "object": [19, 23, 41], "xaxi": 19, "set_major_formatt": 19, "dateformatt": 19, "geo": 19, "fill": [19, 34], "area": 19, "bubbl": 19, "hexbin": 19, "express": [19, 23, 34], "px": 19, "gapmind": 19, "queri": [19, 23, 29, 36], "2007": 19, "scatter_geo": 19, "iso_alpha": 19, "pop": 19, "subplot_mosa": 19, "arrang": 19, "fashion": 19, "control": [19, 23, 29], "aae": 19, "constrained_layout": 19, "axd": 19, "set_titl": 19, "multicollinear": 20, "phenomenon": 20, "predictor": 
[20, 23, 24], "regress": [20, 23], "correl": [20, 25, 26], "unstabl": 20, "inconsist": 20, "coeffici": 20, "\ud835\udc15\ud835\udc1a\ud835\udc2b\ud835\udc22\ud835\udc1a\ud835\udc27\ud835\udc1c\ud835\udc1e": 20, "\ud835\udc08\ud835\udc27\ud835\udc1f\ud835\udc25\ud835\udc1a\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 20, "\ud835\udc05\ud835\udc1a\ud835\udc1c\ud835\udc2d\ud835\udc28\ud835\udc2b": 20, "indic": [20, 34], "present": 20, "formula": 20, "determin": [20, 23], "repeat": [20, 26], "each": [20, 23, 24, 26, 34, 36, 37], "compar": [20, 41], "contribut": [20, 23], "now": [20, 34, 36, 41], "drop": [20, 23, 30], "remain": 20, "\ud835\udc2c\ud835\udc2d\ud835\udc1a\ud835\udc2d\ud835\udc2c\ud835\udc26\ud835\udc28\ud835\udc1d\ud835\udc1e\ud835\udc25\ud835\udc2c": 20, "load_boston": 20, "statsmodel": [20, 26], "stat": 20, "outliers_influ": 20, "variance_inflation_factor": 20, "boston": 20, "feature_nam": [20, 25], "shape": [20, 23, 24, 29], "crim": 20, "100373": 20, "zn": 20, "844013": 20, "indu": 20, "14": [20, 23], "485758": 20, "cha": 20, "152952": 20, "nox": 20, "73": 20, "894947": 20, "rm": [20, 41], "77": 20, "948283": 20, "21": [20, 34], "386850": 20, "di": 20, "699652": 20, "rad": 20, "167725": 20, "tax": 20, "227274": 20, "ptratio": 20, "85": 20, "029547": 20, "11": [20, 21], "104943": 20, "lstat": 20, "102025": 20, "algorithm": [20, 23, 24, 36], "catboost": [20, 23], "unknown": 20, "mismatch": 20, "beforehand": [20, 34], "categorymismatchtraintest": 20, "tabular": [20, 23], "train_test_valid": 20, "col1": 20, "col2": 20, "col3": 20, "d": [20, 29, 34, 36], "obtain": 20, "randomli": 20, "shuffl": [20, 23], "observ": 20, "comparison": 20, "eas": 20, "show_weight": 20, "hurt": 20, "permutationimport": 20, "svm": [20, 23], "svc": 20, "load_iri": [20, 23, 25], "model_select": [20, 23, 26], "train_test_split": [20, 23, 26], "iri": [20, 23], "target_nam": [20, 23], "perm": 20, "feature_1": [20, 23], "feature_2": 20, "feature_3": [20, 23], "feature_4": 20, 
"score": [20, 23, 24, 26], "pp": 20, "agnost": [20, 23], "ppscore": 20, "c_": [20, 25], "minimum": [20, 36], "redund": 20, "maximum": [20, 24, 34, 36], "relev": [20, 21], "smallest": [20, 30, 34, 41], "subset": [20, 29], "ml": [20, 26], "common": [20, 23, 32], "polar": [20, 30], "spark": [20, 26], "k": [20, 26, 41], "mrmr_select": 20, "make_classif": 20, "mrmr_classif": 20, "n_sampl": [20, 23, 26], "n_featur": [20, 23], "50": [20, 23, 26], "n_inform": 20, "n_redund": 20, "40": [20, 23, 25, 30], "selected_featur": 20, "restrict": 21, "social": [21, 23, 25], "servic": [21, 37], "hashtag": 21, "thread": 21, "platform": [21, 25], "instagram": [21, 37], "facebook": 21, "tweet": 21, "elon": 21, "musk": 21, "januari": 21, "simpli": [21, 26], "jsonl": 21, "max": [21, 23, 34, 36], "01": [21, 23, 24, 36], "elonmusk": 21, "until": [21, 41], "scraper": [21, 37], "playstor": 21, "sort": [21, 23], "rate": [21, 24], "countri": [21, 36], "google_play_scrap": 21, "_": [21, 23, 24, 34], "android": 21, "lang": [21, 25], "newest": 21, "filter_score_with": 21, "app_store_scrap": 21, "podcast": 21, "appl": [21, 34], "side": [21, 29], "appstor": 21, "app_nam": 21, "app_id": 21, "id389801252": 21, "insta": 21, "389801252": 21, "how_mani": 21, "messi": [21, 34], "face": 21, "throw": [21, 34], "dialect": 21, "read_datafram": 21, "imdb": 21, "extractor": [21, 23], "crawl": 21, "download": [21, 37], "metadata": 21, "comment": [21, 23], "websit": [21, 25, 34, 41], "xml": 21, "fetch_url": 21, "adbar": 21, "output_format": 21, "imbal": 23, "higher": 23, "minor": 23, "lower": [23, 25], "loss": [23, 32], "misclassifi": 23, "compute_class_weight": 23, "tf": 23, "class_weight": 23, "uniqu": 23, "enumer": 23, "loop": 23, "backend": [23, 36], "clear_sess": 23, "bias": [23, 26], "\ud835\udc1d\ud835\udc1e\ud835\udc25": 23, "\ud835\udc26\ud835\udc28\ud835\udc1d\ud835\udc1e\ud835\udc25": 23, "clutter": 23, "increas": [23, 32], "create_model": 23, "noisi": 23, "centric": 23, "via": 23, "clf": 23, 
"n_estim": 23, "cl": 23, "classif": 23, "cleanlearn": 23, "label_issu": 23, "find_label_issu": 23, "is_label_issu": 23, "assess": [23, 26], "summar": 23, "precis": 23, "recal": 23, "f1": 23, "y_true": [23, 26], "y_pred": [23, 26], "00": [23, 29, 34, 36], "67": 23, "macro": 23, "avg": 23, "framework": 23, "care": [23, 34], "tupl": 23, "seed": [23, 27, 41], "sampler": 23, "tpesampl": 23, "trial": 23, "42": 23, "studi": 23, "create_studi": 23, "n_trial": 23, "reason": 23, "doubt": 23, "closer": 23, "\ud835\udc0f\ud835\udc2b\ud835\udc28\ud835\udc1b\ud835\udc1a\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "\ud835\udc16\ud835\udc2b\ud835\udc28\ud835\udc27\ud835\udc20\ud835\udc0f\ud835\udc2b\ud835\udc1e\ud835\udc1d\ud835\udc22\ud835\udc1c\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "cannot": 23, "\ud835\udc03\ud835\udc22\ud835\udc2c\ud835\udc1a\ud835\udc20\ud835\udc2b\ud835\udc1e\ud835\udc1e\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "disagre": 23, "\ud835\udc11\ud835\udc1e\ud835\udc25\ud835\udc1a\ud835\udc2d\ud835\udc22\ud835\udc2f\ud835\udc1e\ud835\udc03\ud835\udc22\ud835\udc1f\ud835\udc1f\ud835\udc1e\ud835\udc2b\ud835\udc1e\ud835\udc27\ud835\udc1c\ud835\udc1e\ud835\udc11\ud835\udc1e\ud835\udc1a\ud835\udc2c\ud835\udc28\ud835\udc27": 23, "rel": [23, 25], "doubtensembl": 23, "probareason": 23, "wrongpredictionreason": 23, "linear_model": [23, 26], "logisticregress": 23, "return_x_i": 23, "proba": 23, "wrong_pr": 23, "instanc": [23, 34], "predic": 23, "get_pred": 23, "stare": 23, "screen": [23, 34], "knockknock": 23, "notif": 23, "channel": 23, "slack": 23, "telegram": 23, "discord": 23, "ms": 23, "stick": 23, "email_send": 23, "recipient_email": 23, "coolmail": 23, "2coolmail": 23, "sender_email": 23, "anothercoolmail": 23, "train_model": 23, "torch": 23, "mymodel": 23, "nn": 23, "batch_siz": 23, "input_s": [23, 26], 
"depth": 23, "idx": 23, "param": 23, "conv2d": 23, "batchnorm2d": 23, "relu": 23, "maxpool2d": 23, "148": 23, "970": 23, "174": 23, "trainabl": 23, "mult": 23, "mb": [23, 25, 30], "05": 23, "forward": 23, "backward": 23, "06": 23, "honest": 23, "fastest": 23, "intelex": 23, "favourit": [23, 36], "vector": [23, 30], "regressor": 23, "lasso": 23, "dbscan": 23, "sklearnex": 23, "patch_sklearn": 23, "svr": 23, "make_regress": 23, "100000": 23, "nois": [23, 36], "\ud835\udc17\ud835\udc06\ud835\udc01\ud835\udc28\ud835\udc28\ud835\udc2c\ud835\udc2d": 23, "\ud835\udc05\ud835\udc1e\ud835\udc1a\ud835\udc2d\ud835\udc2e\ud835\udc2b\ud835\udc1e": 23, "\ud835\udc08\ud835\udc27\ud835\udc2d\ud835\udc1e\ud835\udc2b\ud835\udc1a\ud835\udc1c\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 23, "\ud835\udc02\ud835\udc28\ud835\udc27\ud835\udc2c\ud835\udc2d\ud835\udc2b\ud835\udc1a\ud835\udc22\ud835\udc27\ud835\udc2d\ud835\udc2c": 23, "feature_0": 23, "similarli": 23, "feature_5": 23, "feature_9": 23, "mind": 23, "regulatori": 23, "industri": 23, "compani": 23, "xgb": 23, "dmatrix": 23, "reg": 23, "squarederror": 23, "eval_metr": 23, "rmse": 23, "interaction_constraint": 23, "model_with_constraint": 23, "hear": 23, "develop": [23, 30], "remov": [23, 25, 41], "pain": [23, 37], "choos": 23, "lightgbm": [23, 26], "task": 23, "tradit": 23, "focus": 23, "overal": 23, "piec": [23, 34, 41], "food": 23, "staff": 23, "rude": 23, "neg": 23, "That": [23, 30, 36], "toward": 23, "batteri": 23, "camera": 23, "opinion": 23, "feel": 23, "feedback": 23, "review": 23, "media": [23, 25], "monitor": 23, "27": 23, "atepccheckpointmanag": 23, "get_aspect_extractor": 23, "checkpoint": 23, "multilingu": 23, "auto_devic": 23, "were": 23, "stuff": 23, "unfriendli": 23, "extract_aspect": 23, "inference_sourc": 23, "pred_senti": 23, "implement": [23, 26, 30], "xgbrfregressor": 23, "xgbrf": 23, "rand": [23, 27], "deep": [23, 30], "Near": 23, "duplic": 23, "blurri": 23, "odd": 23, "irregularli": 23, "dark": 23, 
"light": 23, "lack": 23, "crazi": 23, "wget": 23, "nc": 23, "public": 23, "s3": 23, "amazonaw": 23, "image_fil": 23, "zip": 23, "unzip": [23, 37], "imagelab": 23, "own": 23, "dataset_path": 23, "data_path": 23, "find_issu": 23, "preval": 23, "issue_summari": 23, "issue_typ": 23, "decreas": 23, "shouldn": 23, "\ud835\udc00\ud835\udc25\ud835\udc29\ud835\udc21\ud835\udc1a\ud835\udc12\ud835\udc1e\ud835\udc25\ud835\udc1e\ud835\udc1c\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 23, "curv": 23, "respond": 23, "lassocv": 23, "load_concret": 23, "alphaselect": 23, "cross": 23, "linspac": 23, "tensorflow_decision_forest": 23, "gbdt": 23, "tfdf": 23, "get_fil": 23, "adult": 23, "yggdrasil": 23, "yggdrasil_decision_forest": 23, "test_data": 23, "dataset_df": 23, "test_indic": 23, "len": [23, 24], "test_ds_pd": 23, "train_ds_pd": 23, "train_d": 23, "pd_dataframe_to_tf_dataset": 23, "incom": 23, "test_d": 23, "gradientboostedtreesmodel": 23, "multimod": 23, "covari": 23, "shift": 23, "quickstart": 23, "tabulardataset": 23, "tabularpredictor": 23, "train_data": 23, "inc": 23, "time_limit": 23, "240": 23, "leaderboard": 23, "maxpooling2d": 23, "64": 23, "pool_siz": 23, "layered_view": 23, "legend": 23, "to_fil": 23, "stratifiedkfold": 23, "fold": [23, 26], "repres": 23, "strata": 23, "case": [23, 26, 41], "stratyf": 23, "multilabelstratifiedkfold": 23, "iterstrat": 23, "ml_stratifi": 23, "mskf": 23, "n_split": [23, 26], "random_st": 23, "train_index": 23, "test_index": 23, "split": [23, 26], "nobodi": 23, "therefor": [23, 29, 34], "crucial": 23, "point": [23, 34], "overcom": 23, "hurdl": 23, "lime": 23, "shap": 23, "category_encod": 23, "ordinalencod": 23, "lgbmregressor": [23, 26], "extratreesregressor": 23, "data_load": 23, "house_df": 23, "house_dict": 23, "house_pric": 23, "y_df": [23, 26], "salepric": 23, "to_fram": 23, "x_df": 23, "categorical_featur": 23, "col": [23, 32, 36], "dtype": [23, 30], "return_df": 23, "xtrain": 23, "xtest": 23, "ytrain": 23, "ytest": 23, 
"train_siz": 23, "75": [23, 25], "smartexplain": 23, "xpl": 23, "features_dict": 23, "y_target": 23, "run_app": 23, "title_stori": 23, "hous": 23, "price": 23, "8020": 23, "Not": 23, "huge": [23, 30], "solut": 23, "suit": 23, "detail": [23, 34, 41], "calcul": [23, 24, 32, 36], "bunch": 23, "drift": 23, "weak": 23, "segment": 23, "full_suit": 23, "iris_df": 23, "data_format": 23, "as_train_test": 23, "label_col": 23, "df_train": 23, "df_test": 23, "rf_clf": 23, "axi": [23, 41], "ds_train": 23, "cat_featur": 23, "ds_test": 23, "train_dataset": 23, "test_dataset": 23, "Its": 23, "plot_rank": 23, "individu": 23, "hover": 23, "dive": 23, "deeper": 23, "analys": 23, "criterion": 23, "gini": 23, "max_depth": 23, "suggest_int": 23, "mdpth": 23, "log": [23, 32, 34], "min_samples_split": 23, "mspl": 23, "min_samples_leaf": 23, "mlf": [23, 26], "min_weight_fraction_leaf": 23, "suggest_float": 23, "mwfr": 23, "max_featur": 23, "mft": 23, "max_leaf_nod": 23, "mnod": 23, "min_impurity_decreas": 23, "mid": 23, "maxim": [23, 24], "get_param_import": 23, "params_sort": 23, "kaggl": 23, "involv": [23, 34], "anomali": 23, "cluster": [23, 26], "categori": [23, 25], "cluster_comb": 23, "clustererensembl": 23, "kmean": 23, "n_cluster": 23, "minibatchkmean": 23, "agglomerativeclust": 23, "aligned_label": 23, "aligned_labels_": 23, "predicted_label": 23, "labels_": [23, 24], "varianc": [23, 25], "residualplot": 23, "exhibit": 23, "along": 23, "horizont": 23, "typic": 23, "suitabl": [23, 36], "wherea": 23, "dispers": 23, "residualsplot": 23, "multi": [23, 26], "hardwar": 23, "hyperopt": 23, "train_breast_canc": 23, "load_breast_canc": 23, "train_x": 23, "test_x": 23, "train_i": 23, "test_i": 23, "test_siz": [23, 26], "train_set": 23, "test_set": 23, "eval": 23, "evals_result": 23, "verbose_ev": 23, "mean_accuraci": 23, "binari": [23, 29, 37], "logist": 23, "logloss": 23, "min_child_weight": 23, "subsampl": 23, "uniform": 23, "tuner": 23, "tune_config": 23, "tuneconfig": 23, "num_sampl": 
23, "param_spac": 23, "get_best_result": 23, "mode": 23, "dl": 23, "why": [23, 24], "level": [23, 26, 36], "compat": 23, "neural": 23, "neuralnetclassifi": 23, "pipelin": [23, 37], "standardscal": 23, "mymodul": 23, "__init__": [23, 34, 41], "self": [23, 24, 34], "num_unit": 23, "nonlin": 23, "dim": [23, 26], "kwarg": 23, "dropout": 23, "max_epoch": 23, "lr": 23, "iterator_train__shuffl": 23, "y_proba": 23, "predict_proba": 23, "fly": 23, "massiv": 23, "continu": 23, "updat": [23, 34, 37], "full": 23, "knn": [23, 24], "phish": 23, "predict_on": 23, "learn_on": 23, "mobilenet": 23, "swin": 23, "convnext": 23, "densenet": 23, "pretrain": 23, "list_model": 23, "densenet121": 23, "randn": 23, "224": 23, "uncertainti": 23, "mapieregressor": 23, "linearregress": [23, 26], "59": [23, 36], "mapie_regressor": 23, "y_pi": 23, "unsupervis": 24, "natur": 24, "suffer": 24, "pyod": 24, "densiti": 24, "averag": 24, "vote": 24, "detector": 24, "inlin": 24, "majority_vot": 24, "highest": 24, "sampl": [24, 26], "abod": 24, "iforest": 24, "generate_data": 24, "train_onli": 24, "n_model": 24, "zero": [24, 25], "conform": 24, "predict": [24, 26, 32], "threshold": [24, 25], "calibr": 24, "alarm": 24, "isolationforest": 24, "deel": 24, "anomaly_detect": 24, "splitcad": 24, "basepredictor": 24, "redefin": 24, "nonconform": 24, "adpredictor": 24, "score_sampl": 24, "wrap": 24, "isol": [24, 41], "forest": 24, "if_predictor": 24, "instanti": 24, "cad": 24, "IF": 24, "if_cad": 24, "z": [24, 34], "fit_ratio": 24, "new_data": 24, "gpl": 25, "cleantext": 25, "talk": 25, "send": [25, 34], "testmail": 25, "outlook": 25, "71112392": 25, "visit": 25, "testurl": 25, "free": 25, "u2018": 25, "u2019": 25, "minut": [25, 36], "fix_unicod": 25, "unicod": 25, "to_ascii": 25, "transliter": 25, "closest": 25, "ascii": 25, "lowercas": 25, "no_url": 25, "replac": [25, 30, 41], "special": [25, 34], "no_email": 25, "no_phone_numb": 25, "no_numb": 25, "no_digit": 25, "no_currency_symbol": 25, "currenc": 25, 
"symbol": 25, "no_punct": 25, "punctuat": 25, "german": 25, "pandas_dq": 25, "focuss": 25, "skew": 25, "dq_report": 25, "fix_dq": 25, "fdq": 25, "data_transform": 25, "fit_transform": 25, "whole": 25, "decim": [25, 36], "percentag": [25, 41], "note": [25, 34], "avail": [25, 34, 41], "spaci": 25, "text_1": 25, "twenti": 25, "five": 25, "dollar": 25, "text_2": 25, "hundr": 25, "fourti": 25, "three": 25, "thousand": 25, "four": 25, "text_3": 25, "nine": 25, "quarter": 25, "num_1": 25, "num_2": 25, "num_3": 25, "243421": 25, "integ": [25, 34, 36, 41], "fraction": 25, "big": [25, 29, 34], "byte": 25, "naturals": 25, "1024000": 25, "equival": 25, "intword": 25, "123500000": 25, "million": [25, 29], "dt": [25, 36], "naturaldelta": 25, "timedelta": 25, "1200": 25, "long": [25, 41], "eleg": [25, 36], "num_pipelin": 25, "knnimput": 25, "cat_pipelin": 25, "most_frequ": 25, "conveni": [25, 29, 30], "make_column_selector": 25, "regex": 25, "afterward": 25, "Will": [25, 34], "columns_with_featur": 25, "num_column": 25, "dtype_includ": 25, "tackl": 25, "dure": 25, "suffici": 25, "meaning": 25, "rarelabelencod": 25, "feature_engin": 25, "red": [25, 29], "green": [25, 29], "yellow": 25, "violet": 25, "rare_encod": 25, "tol": 25, "n_categori": 25, "df_encod": 25, "regularli": 26, "effect": 26, "period": 26, "check_season": 26, "infer": [26, 29], "air": 26, "passeng": 26, "monthli": 26, "frequenc": 26, "airpassengersdataset": 26, "ts": 26, "airpassangersdataset": 26, "is_season": 26, "partit": 26, "rest": 26, "both": [26, 34], "overfit": 26, "scikit": 26, "past": [26, 36], "cross_valid": 26, "gradientboostingregressor": 26, "ts_cv": 26, "cv": 26, "neg_mean_squared_error": 26, "gapleavepout": 26, "gapkfold": 26, "gaprollforward": 26, "min_train_s": 26, "gap_siz": 26, "max_test_s": 26, "nixtla": 26, "remot": 26, "rai": 26, "exogen": 26, "probabilist": 26, "lgb": 26, "lag": 26, "freq": 26, "exist": [26, 29, 34], "pmdarima": 26, "autoarima": 26, "airpassengersdf": 26, "sf": 26, 
"season_length": 26, "h": [26, 36], "95": 26, "lazi": [26, 36], "backtest": 26, "splitter": 26, "llm": 26, "agent": 26, "pl": [26, 32], "mase": 26, "1mo": 26, "24": 26, "fh": 26, "beat": 26, "nbeat": 26, "nhit": 26, "y_train_df": 26, "ds": [26, 32], "1959": 26, "31": 26, "y_test_df": 26, "horizon": 26, "max_step": 26, "nf": 26, "y_hat_df": 26, "reset_index": 26, "tempor": 26, "feed": 26, "xgboost": 26, "singl": [26, 36], "multivari": 26, "flat": 26, "tp": 26, "sale": 26, "from_csv": 26, "sales_per_stor": 26, "add_index": 26, "store": [26, 29, 34], "tick_calendar": 26, "work_dai": 26, "calendar_day_of_week": 26, "daily_revenu": 26, "revenu": [26, 29], "moving_sum": 26, "durat": 26, "off": 26, "approxim": 26, "matplotlib": [26, 29, 41], "rpt": 26, "signal": 26, "sigma": 26, "n_breakpoint": 26, "bkp": 26, "pw_constant": 26, "noise_std": 26, "algo": 26, "pelt": 26, "rbf": 26, "pen": 26, "construct": 27, "global": 27, "affect": [27, 34], "reset": 27, "undesir": 27, "unreproduc": 27, "across": 27, "reli": [27, 41], "subtl": 27, "rng": 27, "1234": 27, "sometim": [29, 41], "boolean": 29, "cython": 29, "under": [29, 41], "hood": 29, "filtered_df": 29, "might": 29, "tell": [29, 41], "datetimeindex": 29, "time_index": 29, "date_rang": 29, "2020": 29, "applymap": 29, "sales_data": 29, "5000": 29, "15000": 29, "sales_df": 29, "val": 29, "els": 29, "set_opt": 29, "2343129": 29, "8956701": 29, "224289": 29, "human": [29, 34, 36], "row": [29, 30], "slow": 29, "On": 29, "0s": 29, "1s": 29, "meant": 29, "compact": 29, "consum": 29, "space": [29, 34], "effici": [29, 30, 34], "100000000": 29, "1m": 29, "58": 29, "to_csv": 29, "8s": 29, "to_parquet": 29, "blindli": 30, "wise": 30, "obviou": 30, "\ud835\udc12\ud835\udc30\ud835\udc22\ud835\udc1f\ud835\udc2d\ud835\udc1e\ud835\udc2b": 30, "parallel": 30, "dask": 30, "swifter": 30, "capabl": 30, "input_valu": 30, "output_valu": 30, "lambda": 30, "drastic": 30, "diet": 30, "optimize_dtyp": 30, "report_on_datafram": 30, "proposed_df": 30, 
"new_df": 30, "origin": 30, "memory_usag": 30, "sum": 30, "1024": 30, "props": 30, "constraint": 30, "pa": 30, "schema": 30, "dataframeschema": 30, "element_wis": 30, "alic": 30, "bob": 30, "charli": 30, "alreadi": [30, 32], "think": 30, "mayb": 30, "gain": [30, 32], "rewrit": 32, "reimplement": 32, "levenshtein": 32, "roc": 32, "r2": 32, "l1": 32, "huber": 32, "polars_d": 32, "group_bi": 32, "dummy_group": 32, "agg": 32, "actual": [32, 34], "num_ext": 32, "l2_loss": 32, "alia": 32, "l2": 32, "bce": 32, "binary_metrics_combo": 32, "combo": 32, "unnest": 32, "underscor": 34, "1_000_000": 34, "consecut": 34, "big_numb": 34, "1_000_000_000_000": 34, "behav": 34, "made": 34, "happi": 34, "mood": 34, "diari": 34, "hl": 34, "gl": 34, "urlpars": 34, "parse_q": 34, "unequ": 34, "length": 34, "shortest": 34, "itertool": 34, "zip_longest": 34, "pad": 34, "shorter": 34, "lose": 34, "aa": 34, "bb": 34, "reusabl": 34, "letter": 34, "num": [34, 36], "citi": [34, 36], "code_1": 34, "lh1234": 34, "bln": 34, "code_2": 34, "lh7672": 34, "muc": 34, "\ud835\udc26\ud835\udc1a\ud835\udc2d\ud835\udc2b\ud835\udc22\ud835\udc31": 34, "\ud835\udc26\ud835\udc2e\ud835\udc25\ud835\udc2d\ud835\udc22\ud835\udc29\ud835\udc25\ud835\udc22\ud835\udc1c\ud835\udc1a\ud835\udc2d\ud835\udc22\ud835\udc28\ud835\udc27": 34, "matmul": 34, "nest": [34, 36], "techniqu": [34, 41], "block": 34, "earli": 34, "invalid": 34, "edg": [34, 41], "calculate_pric": 34, "price_per_unit": 34, "collect": 34, "secret": 34, "getpass": 34, "getus": 34, "overrid": 34, "__call__": 34, "example_inst": 34, "paragraph": 34, "lorem": 34, "ipsum": 34, "dolor": 34, "sit": 34, "amet": 34, "consectetur": 34, "adipisc": 34, "elit": 34, "nec": 34, "tellu": 34, "vita": 34, "turpi": 34, "tempu": 34, "porttitor": 34, "fusc": 34, "cursu": 34, "nisi": 34, "eu": 34, "urna": 34, "pharetra": 34, "congu": 34, "ex": [34, 37], "aliquet": 34, "quisqu": 34, "consequat": 34, "nulla": 34, "bibendum": 34, "risu": 34, "wrapped_text": 34, "lru_cach": 34, 
"maxsiz": 34, "128": 34, "fibonacci": 34, "onc": 34, "myclass": 34, "expensive_oper": 34, "expens": 34, "my_object": 34, "noth": 34, "fruit": 34, "orang": 34, "pear": 34, "banana": 34, "largest": 34, "\ud835\udc21\ud835\udc1e\ud835\udc1a\ud835\udc29\ud835\udc2a": 34, "satisfi": 34, "greater": 34, "equal": 34, "min": [34, 36], "children": 34, "heapq": 34, "nlargest": 34, "nsmallest": 34, "__\ud835\udc2c\ud835\udc2d\ud835\udc2b__": 34, "__\ud835\udc2b\ud835\udc1e\ud835\udc29\ud835\udc2b__": 34, "represent": 34, "intend": 34, "unambigu": 34, "todai": 34, "repr": 34, "07": 34, "02": [34, 36, 41], "771969": 34, "unlik": 34, "unpack": 34, "dict_1": 34, "dict_2": 34, "re": 34, "match_exampl": 34, "assign": 34, "part": [34, 41], "kiwi": 34, "fruit_count": 34, "haven": 34, "been": 34, "yet": 34, "append": 34, "merced": 34, "anim": 34, "regular": 34, "p": 34, "mistak": 34, "among": 34, "insid": 34, "danger": 34, "increment_numb": 34, "dynam": 34, "attribut": 34, "__\ud835\udc2c\ud835\udc25\ud835\udc28\ud835\udc2d\ud835\udc2c__": 34, "prevent": 34, "runtim": 34, "whatev": 34, "sport": 34, "basketbal": 34, "volleybal": 34, "tenni": 34, "handbal": 34, "parametr": 34, "stack": 34, "multiprocess": 36, "processor": 36, "process_imag": 36, "path1": 36, "path2": 36, "n_job": 36, "difficulti": 36, "friendli": 36, "timezon": 36, "daylight": 36, "to_iso8601_str": 36, "08t13": 36, "798316": 36, "now_in_london": 36, "europ": 36, "08t12": 36, "799317": 36, "subtract": 36, "diff_for_human": 36, "ago": 36, "delta": 36, "week": 36, "in_word": 36, "51": 36, "pretti": 36, "logger": 36, "debug": 36, "pseudo": 36, "determinist": [36, 41], "atmospher": 36, "rnd": 36, "sequenc": 36, "groupbi": 36, "Of": 36, "cours": 36, "\ud835\udc29\ud835\udc32\ud835\udc2d\ud835\udc21\ud835\udc28\ud835\udc27": 36, "\ud835\udc1b\ud835\udc1e\ud835\udc27\ud835\udc1e\ud835\udc1d\ud835\udc22\ud835\udc1c\ud835\udc2d": 36, "unstructur": 36, "my_dict": 36, "person": 36, "street": 36, "st": [36, 39, 41], "york": 36, 
"usa": 36, "chromedriv": 37, "driver": 37, "somehow": 37, "browser": 37, "straightforward": 37, "energi": 37, "ci": 37, "cd": 37, "chrome": 37, "webdriver_manag": 37, "chromedrivermanag": 37, "executable_path": 37, "your_vers": 37, "monei": 37, "chrome_opt": 37, "chromeopt": 37, "add_argu": 37, "blink": 37, "imagesen": 37, "frame": 39, "compon": 39, "pandas_profil": 39, "streamlit_pandas_profil": 39, "st_profile_report": 39, "profile_report": 39, "numprocess": 41, "random": 41, "addit": 41, "flag": 41, "cover": 41, "\ud835\udc1c\ud835\udc28\ud835\udc2f": 41, "src": 41, "90": 41, "stmt": 41, "module1": 41, "257": 41, "13": 41, "94": 41, "module2": 41, "359": 41, "97": 41, "nowadai": 41, "everyth": 41, "baselin": 41, "dif": 41, "mark": 41, "mpl_image_compar": 41, "testfil": 41, "test_plotting_lin": 41, "instafail": 41, "failur": 41, "chatti": 41, "tldr": 41, "smarter": 41, "uphold": 41, "uncov": 41, "unexpect": 41, "bug": 41, "encourag": 41, "test_addition_commut": 41, "assert": 41, "essenti": 41, "softwar": 41, "independ": 41, "cheap": 41, "fake": 41, "mimic": 41, "permiss": 41, "disk": 41, "unixf": 41, "staticmethod": 41, "filenam": 41, "test_unix_f": 41, "mocker": 41, "patch": 41, "assert_called_once_with": 41, "freeze_tim": 41, "2015": 41}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"delight": 0, "data": [0, 10, 18, 19, 21, 23, 25, 26, 32, 36], "scienc": [0, 32], "why": 0, "thi": 0, "book": 0, "exist": 0, "small": 0, "snippet": 0, "big": 0, "upgrad": 0, "miscellan": [1, 2], "must": 1, "have": 1, "vscode": 1, "extens": [1, 23], "python": [1, 4, 5, 10, 14, 34, 35, 36, 42], "project": [1, 8], "setup": 1, "from": [1, 10, 14, 21, 34], "templat": [1, 14], "cookiecutt": 1, "scaffold": 1, "smol": 1, "develop": 1, "well": 1, "commit": 1, "commitizen": 1, "autom": 3, "bash": 3, "command": 3, "makefil": 3, "test": [3, 4, 20, 41, 42], "nox": 3, "ci": 4, "cd": 4, "github": 4, "action": 4, "workflow": 4, "local": 4, "act": 4, "cach": [4, 10, 34], "depend": 
[4, 10, 41], "code": [5, 6, 10, 14, 19], "style": [5, 29], "remov": [5, 10, 14], "unus": 5, "line": [5, 30], "autoflak": 5, "ensur": 5, "document": [5, 12, 13], "interrog": 5, "sort": [5, 10], "your": [5, 7, 8, 10, 12, 14, 16, 20, 23, 25, 29, 34, 36, 37, 41], "import": [5, 20], "automat": [5, 10, 14, 26], "isort": 5, "format": [5, 29], "black": 5, "lint": 5, "yaml": 5, "file": [5, 10, 21], "yamllint": 5, "blazingli": 5, "fast": [5, 26], "ruff": 5, "correct": 5, "misspel": 5, "codebas": 5, "codespel": 5, "qualiti": [6, 14, 25], "memori": [7, 30], "optim": [7, 23, 34], "identifi": [7, 14, 23], "bottleneck": [7, 14], "regard": 7, "memory_profil": 7, "secur": 8, "detect": [8, 24, 25, 26], "common": 8, "issu": [8, 25], "bandit": 8, "vulner": 8, "environ": [8, 10], "store": [8, 21], "credenti": 8, "safe": 8, "keyr": 8, "type": [9, 34], "enforc": 9, "typeguard": 9, "static": 9, "check": [9, 10, 20, 26], "mypi": 9, "faster": [9, 29], "pyright": 9, "cool": [10, 11], "tool": [10, 11, 14], "work": [10, 36], "countri": 10, "currenc": 10, "subdivis": 10, "more": [10, 21, 26, 34], "gener": [10, 12, 14, 23, 36], "better": [10, 34], "requir": 10, "pipreq": 10, "packag": 10, "its": [10, 25], "pip": 10, "autoremov": 10, "get": [10, 20, 21, 23, 29, 34, 41], "distanc": 10, "between": [10, 34], "postal": 10, "unit": 10, "pint": 10, "supercharg": 10, "profil": [10, 39], "scalen": 10, "fix": [10, 25], "unicod": 10, "error": [10, 41], "ftfy": 10, "background": 10, "imag": [10, 18, 23, 37], "rembg": 10, "build": 10, "modern": 10, "cli": 10, "app": [10, 21], "typer": 10, "realist": 10, "fake": 10, "faker": 10, "enrich": 10, "progress": 10, "bar": 10, "rich": 10, "set": [10, 20, 23, 29, 34], "descript": 10, "tqdm": 10, "convert": [10, 25], "emoji": 10, "text": [10, 21, 25, 34], "emot": 10, "print": [10, 34], "hardwar": 10, "inform": 10, "version": 10, "number": [10, 25, 34, 36], "request": 10, "unifi": 10, "messi": 10, "column": [10, 25], "unifynam": 10, "broken": 10, "link": 10, "websit": 
10, "matplotlib": [10, 19], "termin": 10, "displai": [10, 14, 19, 29], "tree": 10, "latex": [10, 14], "acronym": 10, "make": [10, 25, 34], "ascii": 10, "art": 10, "ner": 10, "spaci": 10, "creat": [10, 14], "tikz": 10, "pictur": 10, "human": [10, 25], "readabl": [10, 29, 34], "regex": 10, "pregex": 10, "perform": [10, 23, 30], "ocr": 10, "easyocr": 10, "diagram": 10, "power": [10, 19, 21, 23, 36], "retri": 10, "function": [10, 16, 32, 34], "tenac": 10, "graph": 10, "analysi": [10, 23], "igraph": 10, "speedtest": 10, "via": 10, "minimalist": 10, "databas": 10, "tinydb": 10, "calcul": [10, 20], "metric": 10, "radon": 10, "altern": 10, "manag": [10, 37], "configur": 10, "dotenv": 10, "notion": 10, "sql": 10, "queri": [10, 34], "builder": 10, "auto": 12, "api": [12, 23], "jupyt": [14, 15], "notebook": [14, 15], "tip": [14, 15, 27, 28, 29, 31, 32, 35, 37, 38, 39, 40], "trick": [14, 15, 27, 28, 29, 31, 32, 35, 37, 38, 39, 40], "line_profil": 14, "render": 14, "live": 14, "loss": [14, 16], "deep": [14, 26], "learn": [14, 22, 23, 25, 26], "model": [14, 23], "express": 14, "scikit": [14, 23, 25], "pipelin": [14, 25], "html": 14, "autoreload": 14, "modul": [14, 41], "appli": [14, 30], "reus": 14, "juptyer": 14, "output": [14, 41], "cell": 14, "nbstripout": 14, "bring": 14, "llm": [14, 16, 17], "Into": 14, "ai": 14, "compress": 16, "prompt": 16, "With": [16, 30], "No": [16, 19], "llmlingua": 16, "One": [16, 30], "call": 16, "ani": 16, "litellm": 16, "safeguard": 16, "llmguard": 16, "augment": 18, "albument": 18, "eda": 19, "analyz": 19, "visual": [19, 23], "interact": [19, 23], "d": 19, "tale": 19, "us": [19, 23, 34], "dark": 19, "mode": 19, "pandasgui": 19, "miss": 19, "valu": [19, 34], "missingno": 19, "correl": 19, "phik": 19, "x": 19, "axi": 19, "time": [19, 26, 29], "seri": [19, 26, 29], "plot": [19, 23, 29, 41], "correctli": 19, "autofmt_xd": 19, "beauti": 19, "map": 19, "plotli": 19, "mosaic": 19, "featur": [20, 23, 25, 26], "select": [20, 23, 25], "varianc": 20, 
"inflat": 20, "factor": 20, "vif": 20, "new": 20, "categori": 20, "deepcheck": [20, 23], "permut": 20, "eli5": 20, "find": [20, 23], "most": 20, "predict": [20, 23], "variabl": [20, 34], "target": 20, "scale": 20, "mrmr": 20, "scrape": [21, 37], "twitter": 21, "youtub": 21, "snscrape": 21, "googl": 21, "plai": 21, "review": 21, "read": 21, "csv": 21, "without": 21, "problem": 21, "clevercsv": 21, "web": 21, "gather": 21, "trafilatura": 21, "machin": [22, 26], "train": 23, "comput": 23, "class": [23, 34], "weight": 23, "reset": 23, "tensorflow": 23, "kera": 23, "global": 23, "state": 23, "dirti": 23, "label": [23, 25], "cleanlab": 23, "evalu": 23, "classifi": 23, "sklearn": 23, "s": [23, 41], "classification_report": 23, "obtain": 23, "reproduc": [23, 27], "result": 23, "optuna": 23, "bad": 23, "doubtlab": 23, "notifi": 23, "when": 23, "finish": 23, "summari": 23, "pytorch": 23, "torchinfo": 23, "boost": [23, 30], "intel": 23, "incorport": 23, "domain": 23, "knowledg": 23, "xgboost": 23, "constraint": 23, "automl": 23, "flaml": 23, "aspect": 23, "base": [23, 41], "seniment": 23, "pyabsa": 23, "random": [23, 27, 36], "forest": 23, "problemat": 23, "cleanvis": 23, "regular": 23, "paramet": [23, 34], "decis": 23, "autogluon": 23, "visualkera": 23, "multilabel": 23, "stratifi": 23, "kfold": 23, "iter": [23, 34], "stratif": 23, "interpret": 23, "shapash": 23, "valid": [23, 26, 30], "high": 23, "ensembl": [23, 24], "combo": 23, "residu": 23, "yellowbrick": 23, "distribut": 23, "hyperparamet": 23, "rai": 23, "tune": 23, "skorch": 23, "onlin": 23, "ml": 23, "river": 23, "sota": 23, "vision": 23, "timm": 23, "guarante": 23, "interv": 23, "mapi": 23, "outlier": 24, "robust": 24, "puncc": 24, "preprocess": [25, 26], "clean": 25, "natur": 25, "languag": 25, "numer": 25, "represent": 25, "date": 25, "friendli": 25, "cleaner": 25, "definit": 25, "easili": [25, 36], "rare": 25, "encod": 25, "engin": [25, 26], "season": 26, "dart": 26, "cross": 26, "timeseriessplit": 26, "tscv": 
26, "forecast": 26, "mlforecast": 26, "lightn": 26, "statsforecast": 26, "polar": [26, 32, 33], "backend": [26, 29], "functim": 26, "neuralforecast": 26, "effici": 26, "temporian": 26, "chang": [26, 29], "point": 26, "ruptur": 26, "numpi": [27, 28], "achiev": 27, "np": 27, "randomst": 27, "panda": [29, 30, 31, 39], "filter": 29, "frequenc": 29, "pd": 29, "infer_freq": 29, "datafram": [29, 30], "precis": 29, "float": 29, "i": 29, "o": 29, "parquet": 29, "util": [30, 36], "librari": [30, 34], "speed": [30, 36, 37], "up": [30, 36, 37], "reduc": 30, "dtype_diet": 30, "pandera": 30, "modin": 30, "plugin": 32, "pure": 34, "built": 34, "urllib": 34, "pars": 34, "zip": 34, "longest": 34, "improv": 34, "name": 34, "slice": 34, "wai": 34, "matrix": 34, "multipl": 34, "guard": 34, "claus": 34, "If": 34, "statement": 34, "hide": 34, "password": 34, "input": 34, "user": 34, "turn": 34, "callabl": 34, "wrap": 34, "textwrap": 34, "add": 34, "lru": 34, "method": 34, "functool": 34, "cached_properti": 34, "For": [34, 36, 41], "els": 34, "loop": [34, 36], "heap": 34, "differ": 34, "__str__": 34, "__repr__": 34, "neat": 34, "merg": 34, "dictionari": [34, 36], "switch": 34, "case": 34, "walru": 34, "oper": 34, "count": 34, "occurr": 34, "an": 34, "counter": 34, "default": 34, "defaultdict": 34, "structur": [34, 36], "tupl": 34, "namedtupl": 34, "mutabl": 34, "argument": 34, "object": 34, "__slots__": 34, "modifi": 34, "3": 34, "12": 34, "joblib": 36, "parallel": [36, 41], "datetim": [36, 41], "pendulum": 36, "prettifi": 36, "pprint": 36, "easi": 36, "log": 36, "loguru": 36, "truli": 36, "benedict": 36, "selenium": [37, 38], "webdriv": 37, "disabl": 37, "load": 37, "streamlit": [39, 40], "emb": 39, "pytest": 41, "steroid": 41, "xdist": 41, "shuffl": 41, "order": 41, "randomli": 41, "coverag": 41, "cov": 41, "mpl": 41, "instantli": 41, "show": 41, "suit": 41, "limit": 41, "minimum": 41, "properti": 41, "hypothesi": 41, "mock": 41, "freez": 41, "freezegun": 41}, "envversion": 
{"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinxcontrib.bibtex": 9, "sphinx": 56}})
\ No newline at end of file