Welcome to the Future of Data Preprocessing!
Diving into the world of machine learning and data science, we often find ourselves tangled in the preprocessing jungle. Worry no more! Introducing a state-of-the-art data preprocessing model based on TensorFlow Keras and the innovative use of Keras preprocessing layers.
Say goodbye to tedious data preparation tasks and hello to streamlined, efficient, and scalable data pipelines. Whether you're a seasoned data scientist or just starting out, this tool is designed to supercharge your ML workflows, making them more robust and faster than ever!
"},{"location":"#key-features","title":"\ud83d\udd11 Key Features:","text":"\ud83d\udee0 Automated Feature Engineering: Automatically detects and applies the most suitable preprocessing steps for each feature type in your dataset, ensuring optimal data preparation with minimal manual intervention.
\ud83c\udfa8 Customizable Preprocessing Pipelines: Tailor your preprocessing steps with ease. Choose from a comprehensive range of options for numeric, categorical, text data, and even complex feature crosses, allowing for precise and effective data handling.
\ud83d\udcca Scalability and Efficiency: Engineered for high performance, this tool handles large datasets effortlessly, leveraging TensorFlow's robust computational capabilities.
\ud83e\udde0 Enhanced with Transformer Blocks: Incorporate transformer blocks into your preprocessing model to boost feature interaction analysis and uncover complex patterns, enhancing predictive model accuracy.
\u2699\ufe0f Easy Integration: Designed to seamlessly integrate as the first layers in your TensorFlow Keras models, facilitating a smooth transition from raw data to trained model, accelerating your workflow significantly.
We use Poetry for handling dependencies, so you will need to install it first. Then you can install the project dependencies by running:
poetry install
or to enter a dedicated env directly:
poetry shell
Then you can simply configure your preprocessor:
"},{"location":"#building-preprocessor","title":"\ud83d\udee0\ufe0f Building Preprocessor:","text":"The simplest application of ths preprocessing model is as follows:
from kdp import PreprocessingModel
from kdp import FeatureType

# DEFINING FEATURES PROCESSORS
features_specs = {
    # ======= NUMERICAL Features =========================
    "feat1": FeatureType.FLOAT_NORMALIZED,
    "feat2": FeatureType.FLOAT_RESCALED,
    # ======= CATEGORICAL Features ========================
    "feat3": FeatureType.STRING_CATEGORICAL,
    "feat4": FeatureType.INTEGER_CATEGORICAL,
    # ======= TEXT Features ========================
    "feat5": FeatureType.TEXT,
}

# INSTANTIATE THE PREPROCESSING MODEL with your data
ppr = PreprocessingModel(
    path_data="data/my_data.csv",
    features_specs=features_specs,
)
# construct the preprocessing pipelines
ppr.build_preprocessor()
This will output:
{
  'model': <Functional name=preprocessor, built=True>,
  'inputs': {
    'feat1': <KerasTensor shape=(None, 1), dtype=float32, sparse=None, name=feat1>,
    'feat2': <KerasTensor shape=(None, 1), dtype=float32, sparse=None, name=feat2>,
    'feat3': <KerasTensor shape=(None, 1), dtype=string, sparse=None, name=feat3>,
    'feat4': <KerasTensor shape=(None, 1), dtype=int32, sparse=None, name=feat4>,
    'feat5': <KerasTensor shape=(None, 1), dtype=string, sparse=None, name=feat5>
  },
  'signature': {
    'feat1': TensorSpec(shape=(None, 1), dtype=tf.float32, name='feat1'),
    'feat2': TensorSpec(shape=(None, 1), dtype=tf.float32, name='feat2'),
    'feat3': TensorSpec(shape=(None, 1), dtype=tf.string, name='feat3'),
    'feat4': TensorSpec(shape=(None, 1), dtype=tf.int32, name='feat4'),
    'feat5': TensorSpec(shape=(None, 1), dtype=tf.string, name='feat5')
  },
  'output_dims': 45
}
This will result in the following preprocessing steps:
Success
You can define the preprocessing model with the features_specs
dictionary, where the keys are the feature names and the values are the feature types. The model will automatically apply the appropriate preprocessing steps based on the feature type.
You have access to several layers of customization per feature type, such as normalization, rescaling, or even definition of custom preprocessing steps.
See \ud83d\udc40 Defining Features for more details.
Info
You can use the preprocessing model independently to preprocess your data or integrate it into your Keras model as the first layer, see \ud83d\udc40 Integrations
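For illustration, here is a minimal sketch of calling the built preprocessor directly on one batch of raw data. This assumes `ppr.model` accepts a dict of batched tensors keyed by feature name, as the `inputs`/`signature` output above suggests:

```python
import tensorflow as tf

# One batch of two raw examples; shapes and dtypes follow the signature above.
raw_batch = {
    "feat1": tf.constant([[0.1], [0.7]], dtype=tf.float32),
    "feat2": tf.constant([[10.0], [250.0]], dtype=tf.float32),
    "feat3": tf.constant([["red"], ["blue"]]),
    "feat4": tf.constant([[1], [3]], dtype=tf.int32),
    "feat5": tf.constant([["short text"], ["another example"]]),
}

# The preprocessor is a regular Keras model, so it can be called directly.
preprocessed = ppr.model(raw_batch)
print(preprocessed.shape)  # (2, output_dims), e.g. (2, 45) for the spec above
```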
"},{"location":"#advanced-configuration-options","title":"Advanced Configuration Options","text":""},{"location":"#transformer-blocks-configuration","title":"Transformer Blocks Configuration","text":"Enhance your preprocessing model with transformer blocks to capture complex patterns and interactions between features, see \ud83d\udc40 Transformer Blocks. You can configure the transformer blocks as follows:
transfo_placement: apply the transformer blocks either only to categorical features (CATEGORICAL) or to all features (ALL_FEATURES).
Example configuration:
transfo_config = {
    'transfo_nr_blocks': 3,
    'transfo_nr_heads': 4,
    'transfo_ff_units': 64,
    'transfo_dropout_rate': 0.1,
    'transfo_placement': 'ALL_FEATURES'
}

ppr = PreprocessingModel(
    path_data="data/my_data.csv",
    features_specs=features_specs,
    **transfo_config
)
"},{"location":"#custom-preprocessors","title":"Custom Preprocessors","text":"Tailor your preprocessing steps with custom preprocessors for each feature type. Define specific preprocessing logic that fits your data characteristics or domain-specific requirements, see \ud83d\udc40 Custom Preprocessors.
Example of adding a custom preprocessor:
from kdp.custom_preprocessors import MyCustomScaler

features_specs = {
    "feat1": {
        'feature_type': FeatureType.FLOAT_NORMALIZED,
        'preprocessors': [MyCustomScaler()]
    }
}

ppr = PreprocessingModel(
    path_data="data/my_data.csv",
    features_specs=features_specs
)
"},{"location":"#feature-crosses","title":"Feature Crosses","text":"Create complex feature interactions by crossing features. This method combines features into a single feature, which can be particularly useful for models that benefit from understanding interactions between specific features, see \ud83d\udc40 Feature Crosses.
Example of defining feature crosses:
feature_crosses = [
    ("feat1", "feat2", 10),
    ("feat3", "feat4", 5)
]

ppr = PreprocessingModel(
    path_data="data/my_data.csv",
    features_specs=features_specs,
    feature_crosses=feature_crosses
)
These advanced configurations allow for greater flexibility and power in your preprocessing pipelines, enabling more sophisticated data transformations and feature engineering.
"},{"location":"contributing/","title":"\ud83d\udcbb Contributing: Join the Preprocessing Revolution! \ud83d\udee0\ufe0f","text":"Eager to contribute? Great! We're excited to welcome new contributors to our project. Here's how you can get involved:
"},{"location":"contributing/#new-ideas-features-requests","title":"\ud83d\udca1 New Ideas / Features Requests","text":"If you wan't to request a new feature or you have detected an issue, please use the following link: ISSUES
"},{"location":"contributing/#getting-started","title":"\ud83d\ude80 Getting Started:","text":"Fork the Repository: Visit our GitHub page, fork the repository, and clone it to your local machine.
Set Up Your Environment: Make sure you have TensorFlow, Loguru, and all necessary dependencies installed.
Make sure you have installed the pre-commit hook locally
??? installation-guide Before using the pre-commit hook, you need to install it in your Python environment.
```bash
conda install -c conda-forge pre-commit
```

Then go to the root folder of this repository, activate your venv, and use the following command:

```bash
pre-commit install
```
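Once installed, you can optionally run all hooks against the entire codebase to verify your setup:

```bash
pre-commit run --all-files
```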
Create a new branch to package your code
Use a standardized commit message:
{LABEL}(KDP): {message}
This is very important for the automatic releases (semantic release) and to have clean history on the master branch.
??? Labels-types
| Label    | Usage |
| -------- | ----- |
| break    | `break` is used to identify changes related to old compatibility or functionality that breaks the current usage (major) |
| feat     | `feat` is used to identify changes related to new backward-compatible abilities or functionality (minor) |
| init     | `init` is used to identify the start of the project (minor) |
| enh      | `enh` is used to identify changes related to improvements of existing abilities or functionality (patch) |
| build    | `build` (also known as `chore`) is used to identify **development** changes related to the build system (involving scripts, configurations, or tools) and package dependencies (patch) |
| ci       | `ci` is used to identify **development** changes related to the continuous integration and deployment system - involving scripts, configurations, or tools (minor) |
| docs     | `docs` is used to identify documentation changes related to the project; whether intended externally for the end-users or internally for the developers (patch) |
| perf     | `perf` is used to identify changes related to backward-compatible **performance improvements** (patch) |
| refactor | `refactor` is used to identify changes related to modifying the codebase, which neither adds a feature nor fixes a bug - such as removing redundant code, simplifying the code, renaming variables, etc.<br />i.e. handy for your wip ; ) (patch) |
| style    | `style` is used to identify **development** changes related to styling the codebase, regardless of the meaning - such as indentations, semi-colons, quotes, trailing commas, and so on (patch) |
| test     | `test` is used to identify **development** changes related to tests - such as refactoring existing tests or adding new tests (minor) |
| fix      | `fix` is used to identify changes related to backward-compatible bug fixes (patch) |
| ops      | `ops` is used to identify changes related to deployment files like `values.yml`, `gateway.yml`, or `Jenkinsfile` in the **ops** directory (minor) |
| hotfix   | `hotfix` is used to identify **production** changes related to backward-compatible bug fixes (patch) |
| revert   | `revert` is used to identify reverted changes (patch) |
| maint    | `maint` is used to identify **maintenance** changes related to the project (patch) |
Merge requests drive the semantic-release storytelling, so use them wisely! The automatically generated changelog report is based on your commits merged into the main branch and should cover all the things you did for the project. As an example, with the
`feat` label, think about what part of the feature you are working on in your messages, e.g.:
- `initializing base pre-processing code`
- `init repo structure`
- `adding pre-processing unit-tests`
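Putting the label and message together, a full commit could look like this (illustrative example):

```bash
git commit -m "feat(KDP): adding pre-processing unit-tests"
```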
The name of your MR should follow the same exact convention as your commits (we have a dedicated check for this in the CI):
`{LABEL}(KDP): {message}`
Keep Merge Requests small (< 400 lines) and submit them more often, rather than one huge MR for the whole project; this makes reviews quicker and simpler!
Ask for a Code Review!
Once your MR is approved, resolve all open conversations and pass all the CI checks before merging.
All the Tests for your code should pass -> REMEMBER NO TESTS = NO MERGE \ud83d\udea8
Customize the preprocessing pipeline by setting up a dictionary that maps feature names to their respective types, tailored to your specific requirements.
"},{"location":"features/#numeric-features","title":"\ud83d\udcaf Numeric Features","text":"Explore various methods to define numerical features tailored to your needs:
\u2139\ufe0f Simple Declaration / \ud83d\udd27 Using FeatureType / \ud83d\udcaa Custom NumericalFeature

features_specs = {
    "feat1": "float",
    "feat2": "FLOAT",
    "feat3": "FLOAT_NORMALIZED",
    "feat4": "FLOAT_RESCALED",
    ...
}
Utilize predefined preprocessing configurations with FeatureType
.
from kdp.features import FeatureType

features_specs = {
    "feat1": FeatureType.FLOAT_NORMALIZED,
    "feat2": FeatureType.FLOAT_RESCALED,
    ...
}
Available FeatureType
options include (as used throughout this documentation): FLOAT, FLOAT_NORMALIZED, FLOAT_RESCALED, FLOAT_DISCRETIZED.
Customize preprocessing by passing specific parameters to NumericalFeature
.
from kdp.features import NumericalFeature

features_specs = {
    "feat3": NumericalFeature(
        name="feat3",
        feature_type=FeatureType.FLOAT_DISCRETIZED,
        bin_boundaries=[(1, 10)],
    ),
    "feat4": NumericalFeature(
        name="feat4",
        feature_type=FeatureType.FLOAT,
    ),
    ...
}
Here's how the numeric preprocessing pipeline looks:
"},{"location":"features/#categorical-features","title":"\ud83d\udc08\u200d\u2b1b Categorical Features","text":"Define categorical features flexibly:
\u2139\ufe0f Simple Declaration / \ud83d\udd27 Using FeatureType / \ud83d\udcaa Custom CategoricalFeature

features_specs = {
    "feat1": "INTEGER_CATEGORICAL",
    "feat2": "STRING_CATEGORICAL",
    "feat3": "string_categorical",
    ...
}
Leverage default configurations with FeatureType
.
from kdp.features import FeatureType

features_specs = {
    "feat1": FeatureType.INTEGER_CATEGORICAL,
    "feat2": FeatureType.STRING_CATEGORICAL,
    ...
}
Available FeatureType
options include (as used throughout this documentation): INTEGER_CATEGORICAL, STRING_CATEGORICAL.
Tailor feature processing by specifying properties in CategoricalFeature
.
from kdp.features import CategoricalFeature

features_specs = {
    "feat1": CategoricalFeature(
        name="feat1",
        feature_type=FeatureType.INTEGER_CATEGORICAL,
        embedding_size=100,
    ),
    "feat2": CategoricalFeature(
        name="feat2",
        feature_type=FeatureType.STRING_CATEGORICAL,
    ),
    ...
}
See how the categorical preprocessing pipeline appears:
"},{"location":"features/#text-features","title":"\ud83d\udcdd Text Features","text":"Customize text features in multiple ways to fit your project's demands:
\u2139\ufe0f Simple Declaration / \ud83d\udd27 Using FeatureType / \ud83d\udcaa Custom TextFeature

features_specs = {
    "feat1": "text",
    "feat2": "TEXT",
    ...
}
Use FeatureType
for automatic default preprocessing setups.
from kdp.features import FeatureType

features_specs = {
    "feat1": FeatureType.TEXT,
    "feat2": FeatureType.TEXT,
    ...
}
Available FeatureType
options include: TEXT.
Customize text preprocessing by passing specific arguments to TextFeature
.
from kdp.features import TextFeature

features_specs = {
    "feat1": TextFeature(
        name="feat1",
        feature_type=FeatureType.TEXT,
        max_tokens=100,
        stop_words=["stop", "next"],
    ),
    "feat2": TextFeature(
        name="feat2",
        feature_type=FeatureType.TEXT,
    ),
    ...
}
Here's how the text feature preprocessing pipeline looks:
"},{"location":"features/#cross-features","title":"\u274c Cross Features","text":"To implement cross features, specify a list of feature tuples in the PreprocessingModel
like so:
from kdp.processor import PreprocessingModel

ppr = PreprocessingModel(
    path_data="data/data.csv",
    features_specs={
        "feat6": FeatureType.STRING_CATEGORICAL,
        "feat7": FeatureType.INTEGER_CATEGORICAL,
    },
    feature_crosses=[("feat6", "feat7", 5)],
)
Example cross feature between INTEGER_CATEGORICAL and STRING_CATEGORICAL:
"},{"location":"features/#date-features","title":"\ud83d\udcc6 Date Features","text":"You can even process string encoded date features (format: 'YYYY-MM-DD'):
\ud83d\udd27 Using FeatureType / \ud83d\udcaa Custom DateFeature
Use FeatureType
for automatic default preprocessing setups.
from kdp.processor import PreprocessingModel

ppr = PreprocessingModel(
    path_data="data/data.csv",
    features_specs={
        "feat1": FeatureType.FLOAT,
        "feat2": FeatureType.DATE,
    },
)
Customize date preprocessing by passing specific arguments to `DateFeature`.
from kdp.features import DateFeature

features_specs = {
    "feat1": DateFeature(
        name="feat1",
        feature_type=FeatureType.DATE,
    ),
    "feat2": DateFeature(
        name="feat2",
        feature_type=FeatureType.DATE,
        # additional option to add season layer:
        add_season=True,  # adds one-hot season indicator (summer, winter, etc.); defaults to False
    ),
    ...
}
Example date and numeric processing pipeline:
"},{"location":"features/#custom-preprocessing-steps","title":"\ud83d\ude80 Custom Preprocessing Steps","text":"If you require even more customization, you can define custom preprocessing steps using the Feature
class, using preprocessors
attribute.
The preprocessors
attribute accepts a list of methods defined in PreprocessorLayerFactory
.
import tensorflow as tf
from kdp.features import Feature

features_specs = {
    "feat1": FeatureType.FLOAT_NORMALIZED,
    "feat2": Feature(
        name="custom_feature_pipeline",
        feature_type=FeatureType.FLOAT_NORMALIZED,
        preprocessors=[
            tf.keras.layers.Rescaling,
            tf.keras.layers.Normalization,
        ],
        # layers' required kwargs
        scale=1,
    )
}
Here's how the custom preprocessing pipeline looks:
The full list of available layers can be found in the Preprocessing Layers Factory.
"},{"location":"integrations/","title":"\ud83d\udd17 Integrating Preprocessing Model with other Keras Model:","text":"You can then easily ingetrate this model into your keras model as the first layer:
"},{"location":"integrations/#example-1-using-the-preprocessing-model-as-the-first-layer-of-a-sequential-model","title":"Example 1: Using the Preprocessing Model as the first layer of a Sequential Model","text":"class FunctionalModelWithPreprocessing(tf.keras.Model):\n def __init__(self, preprocessing_model: tf.keras.Model) -> None:\n \"\"\"Initialize the user model.\n\n Args:\n preprocessing_model (tf.keras.Model): The preprocessing model.\n \"\"\"\n super().__init__()\n self.preprocessing_model = preprocessing_model\n\n # Dynamically create inputs based on the preprocessing model's input shape\n inputs = {\n name: tf.keras.Input(shape=shape[1:], name=name)\n for name, shape in self.preprocessing_model.input_shape.items()\n }\n\n # You can use the preprocessing model directly in the functional API.\n x = self.preprocessing_model(inputs)\n\n # Define the dense layer as part of the model architecture\n output = tf.keras.layers.Dense(\n units=128,\n activation=\"relu\",\n )(x)\n\n # Use the Model's functional API to define inputs and outputs\n self.model = tf.keras.Model(inputs=inputs, outputs=output)\n\n def call(self, inputs: dict[str, tf.Tensor]) -> tf.Tensor:\n \"\"\"Call the item model with the given inputs.\"\"\"\n return self.model(inputs)\n\n# Defining this model is not easy with builtin preprocessing layers:\n\nfrom kdp import PreprocessingModel\nfrom kdp import FeatureType\n\n# DEFINING FEATURES PROCESSORS\nfeatures_specs = {\n # ======= NUMERICAL Features =========================\n \"feat1\": FeatureType.FLOAT_NORMALIZED,\n \"feat2\": FeatureType.FLOAT_RESCALED,\n # ======= CATEGORICAL Features ========================\n \"feat3\": FeatureType.STRING_CATEGORICAL,\n \"feat4\": FeatureType.INTEGER_CATEGORICAL,\n # ======= TEXT Features ========================\n \"feat5\": FeatureType.TEXT,\n}\n\n# INSTANTIATE THE PREPROCESSING MODEL with your data\nppr = PreprocessingModel(\n path_data=\"data/my_data.csv\",\n features_specs=features_spec,\n)\n# construct the preprocessing pipelines\nppr.build_preprocessor()\n\n# building a production / deployment ready model\nfull_model = FunctionalModelWithPreprocessing(\n preprocessing_model=ppr.model,\n)\n
"},{"location":"layers_factory/","title":"\ud83c\udfed Preprocessing Layers Factory","text":"You can find all available layers in the PreprocessorLayerFactory
class:
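normalization_layer = PreprocessorLayerFactory.create_layer(
    "Normalization",
    axis=-1,
    mean=None,
    variance=None
)

Available layers: In addition to Keras layers, the PreprocessorLayerFactory includes several custom layers specific to the KDP framework. Here's a list of available custom layers: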
cast_to_float32_layer(name='cast_to_float32', **kwargs)
staticmethod
","text":"Create a CastToFloat32Layer layer.
Parameters:

| Name | Type | Description | Default |
| ---------- | ------ | -------------------------------------------------------------- | -------------------- |
| `name` | `str` | The name of the layer. | `'cast_to_float32'` |
| `**kwargs` | `dict` | Additional keyword arguments to pass to the layer constructor. | `{}` |

Returns:

| Type | Description |
| ------- | -------------------------------------------- |
| `Layer` | An instance of the CastToFloat32Layer layer. |
"},{"location":"layers_factory/#kdp.layers_factory.PreprocessorLayerFactory.create_layer","title":"create_layer(layer_class, name=None, **kwargs)
staticmethod
","text":"Create a layer using the layer class name, automatically filtering kwargs based on the layer class.
Parameters:

| Name | Type | Description | Default |
| ------------- | --------------------- | ----------------------------------------------------------------------------------------------------------- | -------- |
| `layer_class` | `str \| Class Object` | The name of the layer class to be created (e.g., 'Normalization', 'Rescaling') or the class object itself. | required |
| `name` | `str` | The name of the layer. Optional. | `None` |
| `**kwargs` | | Additional keyword arguments to pass to the layer constructor. | `{}` |

Returns:

| Type | Description |
| ------- | --------------------------------------------- |
| `Layer` | An instance of the specified layer class. |
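As a quick illustration of create_layer with a class object rather than a string name, here is a minimal sketch (the import path `kdp.layers_factory` follows the module path shown in this section; the layer name and scale value are arbitrary):

```python
import tensorflow as tf
from kdp.layers_factory import PreprocessorLayerFactory

# Pass the layer class itself; kwargs are filtered to match its constructor.
rescaling_layer = PreprocessorLayerFactory.create_layer(
    tf.keras.layers.Rescaling,
    name="my_rescaling",
    scale=1.0 / 255.0,
)
```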
"},{"location":"layers_factory/#kdp.layers_factory.PreprocessorLayerFactory.date_encoding_layer","title":"date_encoding_layer(name='date_encoding_layer', **kwargs)
staticmethod
","text":"Create a DateEncodingLayer layer.
Parameters:

| Name | Type | Description | Default |
| ---------- | ------ | -------------------------------------------------------------- | ----------------------- |
| `name` | `str` | The name of the layer. | `'date_encoding_layer'` |
| `**kwargs` | `dict` | Additional keyword arguments to pass to the layer constructor. | `{}` |

Returns:

| Type | Description |
| ------- | ------------------------------------------- |
| `Layer` | An instance of the DateEncodingLayer layer. |
"},{"location":"layers_factory/#kdp.layers_factory.PreprocessorLayerFactory.date_parsing_layer","title":"date_parsing_layer(name='date_parsing_layer', **kwargs)
staticmethod
","text":"Create a DateParsingLayer layer.
Parameters:

| Name | Type | Description | Default |
| ---------- | ------ | -------------------------------------------------------------- | ---------------------- |
| `name` | `str` | The name of the layer. | `'date_parsing_layer'` |
| `**kwargs` | `dict` | Additional keyword arguments to pass to the layer constructor. | `{}` |

Returns:

| Type | Description |
| ------- | ------------------------------------------ |
| `Layer` | An instance of the DateParsingLayer layer. |
"},{"location":"layers_factory/#kdp.layers_factory.PreprocessorLayerFactory.date_season_layer","title":"date_season_layer(name='date_season_layer', **kwargs)
staticmethod
","text":"Create a SeasonLayer layer.
Parameters:

| Name | Type | Description | Default |
| ---------- | ------ | -------------------------------------------------------------- | --------------------- |
| `name` | `str` | The name of the layer. | `'date_season_layer'` |
| `**kwargs` | `dict` | Additional keyword arguments to pass to the layer constructor. | `{}` |

Returns:

| Type | Description |
| ------- | -------------------------------------- |
| `Layer` | An instance of the SeasonLayer layer. |
"},{"location":"layers_factory/#kdp.layers_factory.PreprocessorLayerFactory.text_preprocessing_layer","title":"text_preprocessing_layer(name='text_preprocessing', **kwargs)
staticmethod
","text":"Create a TextPreprocessingLayer layer.
Parameters:

| Name | Type | Description | Default |
| ---------- | ------ | -------------------------------------------------------------- | --------------------- |
| `name` | `str` | The name of the layer. | `'text_preprocessing'` |
| `**kwargs` | `dict` | Additional keyword arguments to pass to the layer constructor. | `{}` |

Returns:

| Type | Description |
| ------- | ------------------------------------------------- |
| `Layer` | An instance of the TextPreprocessingLayer layer. |
"},{"location":"layers_factory/#kdp.layers_factory.PreprocessorLayerFactory.transformer_block_layer","title":"transformer_block_layer(name='transformer', **kwargs)
staticmethod
","text":"Create a TransformerBlock layer.
Parameters:

| Name | Type | Description | Default |
| ---------- | ------ | -------------------------------------------------------------- | --------------- |
| `name` | `str` | The name of the layer. | `'transformer'` |
| `**kwargs` | `dict` | Additional keyword arguments to pass to the layer constructor. | `{}` |

Returns:

| Type | Description |
| ------- | ------------------------------------------- |
| `Layer` | An instance of the TransformerBlock layer. |
"},{"location":"motivation/","title":"\ud83c\udf66 The Motivation Behind Keras Data Processor","text":"The burning question now is \u2753:
Why create a new preprocessing pipeline or model when we already have an excellent tool like Keras FeatureSpace?
While Keras FeatureSpace
has been a cornerstone in many of my projects, delivering great results, I encountered significant challenges in a high-volume data project. The tool required multiple data passes (proportional to the number of features), executing .adapt
for each feature. This led to exceedingly long preprocessing times and frequent out-of-memory errors.
This experience prompted a deep dive into the internal workings of Keras FeatureSpace and motivated me to develop a new preprocessing pipeline that could handle data more efficiently, both in terms of speed and memory usage. Thus, the journey began to craft a solution that would:
Process data in a single pass, utilizing an iterative approach to avoid loading the entire dataset into memory, managed by a batch_size parameter (see the sketch after this list).
Introduce custom predefined preprocessing steps tailored to the feature type, controlled by a feature_type parameter.
Offer greater flexibility for custom preprocessing steps and a more Pythonic internal implementation.
Align closely with the API of Keras FeatureSpace (proposing something similar), with the hope that it might eventually be integrated into the KFS ecosystem.
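To make the first point concrete, here is a hypothetical sketch; the exact `batch_size` argument name and placement on `PreprocessingModel` are assumptions based on the description above, and `features_specs` is the dictionary from the earlier examples:

```python
# Hypothetical: statistics are accumulated in one streaming pass over the CSV,
# so only a single batch is ever held in memory.
ppr = PreprocessingModel(
    path_data="data/my_data.csv",
    features_specs=features_specs,
    batch_size=50_000,  # assumed parameter controlling the streaming batch size
)
ppr.build_preprocessor()
```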
To demonstrate the effectiveness of our new preprocessing pipeline, we conducted a benchmark comparing it with the traditional Keras FeatureSpace (this will give you a glimpse of what was described earlier for the big-data cases). Here\u2019s how we did it:
Benchmarking Steps:
Setup: We configure the benchmark by specifying a set number of features in a loop. Each feature's specification (either a normalized float or a categorical string) is defined in a dictionary.
Data Generation: For each set number of data points determined in another loop, we generate mock data based on the feature specifications and data points, which is then saved to a CSV file.
Memory Management: We use garbage collection to free up memory before and after each benchmarking run, coupled with a 10-second cooldown period to ensure all operations complete fully.
Performance Measurement: For both the Keras Data Processor (KDP) and Keras Feature Space (FS), we measure and record CPU and memory usage before and after their respective functions run, noting the time taken.
Results Compilation: We collect and log results including the number of features, data points, execution time, memory, and CPU usage for each function in a structured format.
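For concreteness, here is a simplified, hypothetical sketch of that benchmarking loop; the helpers `make_feature_specs`, `generate_mock_csv`, `run_kdp`, `run_fs`, and `log_result` are illustrative placeholders, not the actual benchmark code:

```python
import gc
import time

for n_features in (10, 50, 100):
    specs = make_feature_specs(n_features)               # placeholder helper
    for n_points in (1_000, 100_000, 1_000_000):
        generate_mock_csv(specs, n_points, "bench.csv")  # placeholder helper
        for runner in (run_kdp, run_fs):                 # placeholder targets
            gc.collect()                                 # free memory between runs
            time.sleep(10)                               # cooldown period
            start = time.perf_counter()
            runner("bench.csv", specs)
            elapsed = time.perf_counter() - start
            log_result(runner.__name__, n_features, n_points, elapsed)
```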
The results clearly illustrate the benefits, especially as the complexity of the data increases:
The graph shows a steep rise in processing time with an increase in data points for both KDP
and FS
. However, KDP consistently outperforms FS
, with the gap widening as the number of data points grows.
This graph depicts the processing time increase with more features. Again, KDP
outpaces FS
, demonstrating substantial efficiency improvements.
The combined effect of the number of features and data points leads to significant performance gains on the KDP side, while the time- and memory-hungry FS struggles with the bigger and more complex datasets. This project was born from the need for better efficiency, and it\u2019s my hope to continue refining this tool with community support, pushing the boundaries of what we can achieve in data preprocessing (and maybe one day integrating it directly into Keras \u2764\ufe0f)!
There is much to be done and many features to be added, but I am excited to see where this journey takes us. Let\u2019s build something great together! \ud83d\ude80\ud83d\udd27
"},{"location":"transformer_blocks/","title":"\ud83e\udd16 TransformerBlocks \ud83c\udf1f","text":"You can add transformer blocks to your preprocessing model by simply defining required configuration when initializing the Preprocessor
class:
with the following arguments:
transfo_nr_blocks
(int): The number of transformer blocks in sequence (default=None, meaning transformer blocks are disabled).
transfo_nr_heads
(int): The number of heads for the transformer block (default=3).
transfo_ff_units
(int): The number of feed forward units for the transformer (default=16).
transfo_dropout_rate
(float): The dropout rate for the transformer block (default=0.25).
transfo_placement
(str): The placement of the transformer block, with the following options:
CATEGORICAL -> only after categorical and text variables
ALL_FEATURES -> after all concatenated features.
This uses a dedicated TransformerBlockLayer to handle the transformer block logic.
"},{"location":"transformer_blocks/#code-examples","title":"\ud83d\udcbb Code Examples:","text":"from kdp.processor import PreprocessingModel, OutputModeOptions, TransformerBlockPlacementOptions\n\nppr = PreprocessingModel(\n path_data=\"data/test_data.csv\",\n features_specs=features_specs,\n features_stats_path=\"stats_data.json\",\n output_mode=OutputModeOptions.CONCAT,\n # TRANSFORMERS BLOCK CONTROLL\n transfo_nr_blocks=3, # if 0, transformer block is disabled\n transfo_nr_heads=3,\n transfo_ff_units=16,\n transfo_dropout_rate=0.25,\n transfo_placement=TransformerBlockPlacementOptions.ALL_FEATURES,\n
There are two options for the transfo_placement argument, controlled using the TransformerBlockPlacementOptions class:
CATEGORICAL: The transformer block is applied only to the categorical + text features (TransformerBlockPlacementOptions.CATEGORICAL).
The corresponding architecture may thus look like this:
ALL_FEATURES: The transformer block is applied to all features (TransformerBlockPlacementOptions.ALL_FEATURES).
The corresponding architecture may thus look like this: