diff --git a/Week_00/00_Overview.html b/Week_00/00_Overview.html index f32c6c4..32f5f78 100644 --- a/Week_00/00_Overview.html +++ b/Week_00/00_Overview.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_00/00a_DailyChallenge.html b/Week_00/00a_DailyChallenge.html index 0569420..28a4370 100644 --- a/Week_00/00a_DailyChallenge.html +++ b/Week_00/00a_DailyChallenge.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_00/00b_DailyResources.html b/Week_00/00b_DailyResources.html index fb10a30..7ab0785 100644 --- a/Week_00/00b_DailyResources.html +++ b/Week_00/00b_DailyResources.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_00/01_Errata.html b/Week_00/01_Errata.html index ba80109..0c625b8 100644 --- a/Week_00/01_Errata.html +++ b/Week_00/01_Errata.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_01/001_Overview.html b/Week_01/001_Overview.html index a02665a..10c38a0 100644 --- a/Week_01/001_Overview.html +++ b/Week_01/001_Overview.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_01/Lesson_01.html b/Week_01/Lesson_01.html index 10c8f08..2f606a3 100644 --- a/Week_01/Lesson_01.html +++ b/Week_01/Lesson_01.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_01/Lesson_02.html b/Week_01/Lesson_02.html index e987c1c..d11db79 100644 --- a/Week_01/Lesson_02.html +++ b/Week_01/Lesson_02.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_01/Lesson_03.html b/Week_01/Lesson_03.html index f5524d4..f42ef04 100644 --- a/Week_01/Lesson_03.html +++ b/Week_01/Lesson_03.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_01/Lesson_04.html b/Week_01/Lesson_04.html index 0a32004..613f4af 100644 --- a/Week_01/Lesson_04.html +++ b/Week_01/Lesson_04.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_01/Lesson_05.html b/Week_01/Lesson_05.html index d3e83c0..bc03947 100644 --- a/Week_01/Lesson_05.html +++ b/Week_01/Lesson_05.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -778,7 +779,7 @@

    Standard Library Highlights -
    0.6508227309087278
    +
    0.11290791626756647
     
    @@ -844,7 +845,7 @@

    Standard Library Highlights -
    2024-01-30 09:22:01.276254
    +
    2024-01-31 08:52:49.083772
     
    @@ -1167,8 +1168,8 @@

    Basic Quiz Game
    What is the capital of France?
    -a. London
    -b. Paris
    +a. Paris
    +b. London
     c. Rome
     
    @@ -1208,9 +1209,9 @@

    Basic Quiz Game
    What is the capital of France?
    -a. Rome
    -b. Paris
    -c. London
    +a. London
    +b. Rome
    +c. Paris
     
    ---------------------------------------------------------------------------
    @@ -1249,9 +1250,9 @@ 

    Basic Quiz Game
    What is the capital of France?
    -a. Paris
    -b. London
    -c. Rome
    +a. London
    +b. Rome
    +c. Paris
     
    ---------------------------------------------------------------------------
    @@ -1291,8 +1292,8 @@ 

    Basic Quiz Game
    What is the capital of France?
     a. Rome
    -b. Paris
    -c. London
    +b. London
    +c. Paris
     
    ---------------------------------------------------------------------------
    diff --git a/Week_02/002_Overview.html b/Week_02/002_Overview.html
    index 3613209..1c7b0e7 100644
    --- a/Week_02/002_Overview.html
    +++ b/Week_02/002_Overview.html
    @@ -259,6 +259,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_02/Lesson_06.html b/Week_02/Lesson_06.html index e6cc40b..ae7d1be 100644 --- a/Week_02/Lesson_06.html +++ b/Week_02/Lesson_06.html @@ -261,6 +261,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_02/Lesson_07.html b/Week_02/Lesson_07.html index 154c1f9..f75a03d 100644 --- a/Week_02/Lesson_07.html +++ b/Week_02/Lesson_07.html @@ -261,6 +261,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -741,15 +742,15 @@

    Matrix Dot Product (Element-wise Product):Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_02/Lesson_09.html b/Week_02/Lesson_09.html index ff91e91..568f967 100644 --- a/Week_02/Lesson_09.html +++ b/Week_02/Lesson_09.html @@ -261,6 +261,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_02/Lesson_10.html b/Week_02/Lesson_10.html index c1ab9e8..57eafa7 100644 --- a/Week_02/Lesson_10.html +++ b/Week_02/Lesson_10.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -595,7 +596,7 @@

    Step 1: Import Necessary Libraries -

    Poisson Distribution Example

    @@ -702,7 +703,7 @@

    Step 3: Understanding Distributions -../_images/f471f48523b4b750801da5035d60e32b3d9fa7f967a86460fac3a817493a2910.png +../_images/8c3a0d5ed06805763b5404ef2a3b932553e09a5d3a21332e387e2d8401ad344f.png

    diff --git a/Week_03/003_Overview.html b/Week_03/003_Overview.html index d40ecf5..ab0a82e 100644 --- a/Week_03/003_Overview.html +++ b/Week_03/003_Overview.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_03/Lesson_11.html b/Week_03/Lesson_11.html index cbab5d9..d5f4122 100644 --- a/Week_03/Lesson_11.html +++ b/Week_03/Lesson_11.html @@ -261,6 +261,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -598,7 +599,7 @@

    Setup for Activities

    -
    /tmp/ipykernel_237615/2223182689.py:3: DeprecationWarning: 
    +
    /tmp/ipykernel_288486/2223182689.py:3: DeprecationWarning: 
     Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0),
     (to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries)
     but was not found to be installed on your system.
    diff --git a/Week_03/Lesson_12.html b/Week_03/Lesson_12.html
    index e043166..d8257d6 100644
    --- a/Week_03/Lesson_12.html
    +++ b/Week_03/Lesson_12.html
    @@ -261,6 +261,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_03/Lesson_12solution.html b/Week_03/Lesson_12solution.html index e4a845c..b5c1723 100644 --- a/Week_03/Lesson_12solution.html +++ b/Week_03/Lesson_12solution.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -603,7 +604,7 @@

    Objective -
    /tmp/ipykernel_237648/2223182689.py:3: DeprecationWarning: 
    +
    /tmp/ipykernel_288519/2223182689.py:3: DeprecationWarning: 
     Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0),
     (to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries)
     but was not found to be installed on your system.
    diff --git a/Week_03/Lesson_13.html b/Week_03/Lesson_13.html
    index 0f49dd0..935bdd9 100644
    --- a/Week_03/Lesson_13.html
    +++ b/Week_03/Lesson_13.html
    @@ -259,6 +259,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -649,7 +650,7 @@

    Step 1: Load and Explore the Dataset
    /tmp/ipykernel_237687/245541981.py:1: DeprecationWarning: 
    +
    -
    /tmp/ipykernel_237687/684399944.py:1: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.
    +
    /tmp/ipykernel_288555/684399944.py:1: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.
     The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.
     
     For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.
     
     
       titanic_data['Age'].fillna(titanic_data['Age'].median(), inplace=True)
    -/tmp/ipykernel_237687/684399944.py:3: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.
    +/tmp/ipykernel_288555/684399944.py:3: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.
     The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.
     
     For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.
    diff --git a/Week_03/Lesson_14.html b/Week_03/Lesson_14.html
    index 796e91c..9113cd1 100644
    --- a/Week_03/Lesson_14.html
    +++ b/Week_03/Lesson_14.html
    @@ -261,6 +261,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -871,7 +872,7 @@

    Best Practices and Considerations
    /tmp/ipykernel_237713/2131166956.py:1: DeprecationWarning: 
    +
    /tmp/ipykernel_288580/2131166956.py:1: DeprecationWarning: 
     Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0),
     (to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries)
     but was not found to be installed on your system.
    @@ -1127,7 +1128,7 @@ 

    Step 8: Statistical Summary Comparison -
    /tmp/ipykernel_237713/1279951594.py:6: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.
    +
    /tmp/ipykernel_288580/1279951594.py:6: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.
     The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.
     
     For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.
    diff --git a/Week_03/Lesson_15.html b/Week_03/Lesson_15.html
    index bd48b9a..bd76991 100644
    --- a/Week_03/Lesson_15.html
    +++ b/Week_03/Lesson_15.html
    @@ -259,6 +259,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -751,7 +752,7 @@

    Step 1: Load the necessary libraries -
    /tmp/ipykernel_237751/3916798240.py:2: DeprecationWarning: 
    +
    /tmp/ipykernel_288616/3916798240.py:2: DeprecationWarning: 
     Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0),
     (to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries)
     but was not found to be installed on your system.
    diff --git a/Week_04/004_Overview.html b/Week_04/004_Overview.html
    index 2095142..f512db4 100644
    --- a/Week_04/004_Overview.html
    +++ b/Week_04/004_Overview.html
    @@ -259,6 +259,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_04/Lesson_16.html b/Week_04/Lesson_16.html index a4f3666..7ce5fa3 100644 --- a/Week_04/Lesson_16.html +++ b/Week_04/Lesson_16.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -581,7 +582,7 @@

    Prerequisites -
    /tmp/ipykernel_237786/955872667.py:2: DeprecationWarning: 
    +
    /tmp/ipykernel_288649/955872667.py:2: DeprecationWarning: 
     Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0),
     (to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries)
     but was not found to be installed on your system.
    diff --git a/Week_04/Lesson_17.html b/Week_04/Lesson_17.html
    index 0c5b0cf..14b57bc 100644
    --- a/Week_04/Lesson_17.html
    +++ b/Week_04/Lesson_17.html
    @@ -261,6 +261,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -583,7 +584,7 @@

    Prerequisites -
    /tmp/ipykernel_237837/955872667.py:2: DeprecationWarning: 
    +
    /tmp/ipykernel_288689/955872667.py:2: DeprecationWarning: 
     Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0),
     (to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries)
     but was not found to be installed on your system.
    diff --git a/Week_04/Lesson_18.html b/Week_04/Lesson_18.html
    index c7f2ab6..a96f880 100644
    --- a/Week_04/Lesson_18.html
    +++ b/Week_04/Lesson_18.html
    @@ -259,6 +259,7 @@
     
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_04/Lesson_19.html b/Week_04/Lesson_19.html index 9befee1..9719ec4 100644 --- a/Week_04/Lesson_19.html +++ b/Week_04/Lesson_19.html @@ -261,6 +261,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_04/Lesson_20.html b/Week_04/Lesson_20.html index 14449a6..7b2fd47 100644 --- a/Week_04/Lesson_20.html +++ b/Week_04/Lesson_20.html @@ -261,6 +261,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_05/005_Overview.html b/Week_05/005_Overview.html index c3b93de..abf1f8a 100644 --- a/Week_05/005_Overview.html +++ b/Week_05/005_Overview.html @@ -259,6 +259,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/Week_05/005_Overview_.html b/Week_05/005_Overview_.html deleted file mode 100644 index 69b761d..0000000 --- a/Week_05/005_Overview_.html +++ /dev/null @@ -1,645 +0,0 @@ - - - - - - - - - - - - Course Structure — 100 Days of Machine Learning - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
    - - - - - - - - - - - -
    -
    -
    -
    -
    - - - -
    -
    - -
    - - - - - - - - - - - - - -
    - -
    - - - -
    - -
    -
    - -
    -
    - -
    - -
    - -
    - - -
    - -
    - -
    - - - - - - - - - - - - - - - - - - - - - - - - - - -
    - -
    - -
    -
    - - - - - - - - -
    - -
    -

    Course Structure#

    -
    -
    -

    Module 3: Supervised Learning - Regression and Classification#

    -
    -

    Weeks 5-6#

    -
      -
    • Focus: Key concepts and algorithms in supervised learning.

    • -
    • Topics include regression, classification algorithms, decision trees, SVM, and ensemble methods.

    • -
    -
    -

    Week 5: Supervised Learning - Regression#

    -
      -
    • Day 21: Introduction to Regression Analysis in Python

      -
        -
      • Basics of regression analysis and simple linear regression.

      • -
      • Math Focus: Linear equation fundamentals and fitting models to data.

      • -
      -
    • -
    • Day 22: Implementing Multiple Linear Regression in Python

      -
        -
      • Understand and implement multiple linear regression.

      • -
      • Math Focus: Multivariate calculus and regression coefficients interpretation.

      • -
      -
    • -
    • Day 23: Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression

      -
        -
      • Explore advanced regression techniques and their applications.

      • -
      • Math Focus: Polynomial functions, Lasso and Ridge regularization techniques.

      • -
      -
    • -
    • Day 24: Regression Model Evaluation Metrics in Python

      -
        -
      • Key metrics for evaluating regression models.

      • -
      • Math Focus: Mean Squared Error (MSE), Root Mean Squared Error (RMSE), and R-squared.

      • -
      -
    • -
    • Day 25: Addressing Overfitting and Underfitting in Regression Models

      -
        -
      • Strategies to combat overfitting and underfitting in regression.

      • -
      • Math Focus: Bias-variance tradeoff and regularization methods.

      • -
      -
    • -
    -
    -
    -
    - - - - -
    - - - - - - - - -
    - - - - - - -
    -
    - - -
    - - -
    -
    -
    - - - - - -
    -
    - - \ No newline at end of file diff --git a/Week_05/Lesson_21.html b/Week_05/Lesson_21.html index f40f37c..6b68de5 100644 --- a/Week_05/Lesson_21.html +++ b/Week_05/Lesson_21.html @@ -261,6 +261,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • @@ -848,7 +849,7 @@

    Import and Analyze a Housing Dataset
    /tmp/ipykernel_237871/737031205.py:1: DeprecationWarning: 
    +
     
    @@ -685,8 +687,8 @@ 

    Understanding Model Evaluation Metrics -
    MSE: 732.3551245668029
    -R-squared: -0.027105564211052702
    +
    MSE: 3183.330047035957
    +R-squared: 0.13751568541102366
     
    @@ -710,8 +712,8 @@

    Understanding Model Evaluation Metrics -../_images/1d0563321f6a2b86ded4cb8e6c1035aab0234f07e9db2f827b7c6ea403da2913.png - diff --git a/Week_05/Lesson_23.html b/Week_05/Lesson_23.html index c0e5c7c..4cd5a10 100644 --- a/Week_05/Lesson_23.html +++ b/Week_05/Lesson_23.html @@ -9,7 +9,7 @@ - Outline Only - Lesson 23: Advanced Regression Techniques — 100 Days of Machine Learning + Day 23: Advanced Regression Techniques — 100 Days of Machine Learning @@ -62,13 +62,14 @@ const thebe_selector_output = ".output, .cell_output" + + - - + @@ -238,11 +239,6 @@ - -

    Week 5 - Data Preprocessing

    -

    Week 4 - Data Preprocessing

    -

    Course Overview

    -

    @@ -483,7 +484,9 @@ `); - +

    @@ -494,11 +497,27 @@
    -

    Outline Only - Lesson 23: Advanced Regression Techniques

    +

    Day 23: Advanced Regression Techniques

    @@ -508,35 +527,1398 @@

    Outline Only - Lesson 23: Advanced Regression Techniques

    -
    -

    Outline Only - Lesson 23: Advanced Regression Techniques#

    -

    Polynomial, Lasso, and Ridge Regression - Explore advanced regression techniques and their applications. - Math Focus: Polynomial functions, Lasso and Ridge regularization techniques.

    +
    +

    Day 23: Advanced Regression Techniques#

    +
    +

    Introduction#

    +

    Astute readers may have noticed during the Day 22 lesson that some of the customer_data.csv plots were not great fits across the entire domain of the data. This is because there was a non-linear element (an \(x^2\) term) in the function I used to build that dataset out of random numbers. Most data we’ll encounter is not perfectly linear, but we can still use regression. A higher-order function may describe the relationships between our independent variables and the dependent variable. We are not limited to \(y = mx + c\), or even \(y = \beta_0 + \beta_1x_1 + \beta_2x_2 + \ldots + \beta_nx_n + \epsilon\) – we can include \(x_n^2, x_n^3, \ldots\) as if they were new independent variables, and give our regression line the freedom to match any polynomial function.

    +

    We’ll just need to steer clear of overfitting: given enough terms, it is always possible to draw a polynomial that passes through every training data point perfectly. Such a fit is unlikely to translate into predictive power outside of training, though. Lasso and Ridge are specific forms of regularization designed to address overfitting by penalizing the size of the coefficients. Keep an eye out for the penalty term (\(\lambda\)), which sets the strength of that penalty and thereby controls the complexity of the model.

    +

    A general polynomial regression model can be represented as:

    +

    \( y = \beta_0 + \beta_1x_1 + \beta_2x_1^2 + \ldots + \beta_nx_1^n + \epsilon \)

    +

    Where:

      -
    • Theoretical Concepts:

      -
        -
      • Overview of polynomial regression and its applications.

      • -
      • Introduction to regularization techniques: Lasso and Ridge regression.

      • +
      • \(y\) is the dependent variable.

      • +
      • \(x_1, x_1^2, \ldots, x_1^n\) are the predictor variable and its polynomial terms up to degree \(n\).

      • +
      • \(\beta_0, \beta_1, \ldots, \beta_n\) are the coefficients.

      • +
      • \(\epsilon\) represents the model error.

      -
    • -
    • Mathematical Foundation:

      -
        -
      • Polynomial functions and their role in regression.

      • -
      • Lasso (L1 regularization) and Ridge (L2 regularization) concepts.

      • +

        To get acquainted with the topic, let’s take a peek at what adding additional degrees to the polynomial can do:

        +
        +
        +
        # overview plot
        +import numpy as np
        +import matplotlib.pyplot as plt
        +from sklearn.linear_model import LinearRegression
        +from sklearn.preprocessing import PolynomialFeatures
        +from sklearn.metrics import r2_score
        +
        +# Generating demo data
        +np.random.seed(42)
        +x = np.random.normal(0, 1, 20)
        +
        +# This is the actual equation, so we could check exactly what coefficients our regression found.
        +y= -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)
        +
        +# Reshape x for sklearn
        +x = x[:, np.newaxis]
        +y = y[:, np.newaxis]
        +
        +# Simple linear regression
        +linear_regressor = LinearRegression()
        +linear_regressor.fit(x, y)
        +y_pred_linear = linear_regressor.predict(x)
        +
        +# Polynomial regression (underfit)
        +poly_features2 = PolynomialFeatures(degree=2)
        +x_poly2 = poly_features2.fit_transform(x)
        +poly_regressor2 = LinearRegression()
        +poly_regressor2.fit(x_poly2, y)
        +y_pred_poly2 = poly_regressor2.predict(x_poly2)
        +
        +# Polynomial regression (well-fit)
        +poly_features3 = PolynomialFeatures(degree=3)
        +x_poly3 = poly_features3.fit_transform(x)
        +poly_regressor3 = LinearRegression()
        +poly_regressor3.fit(x_poly3, y)
        +y_pred_poly3 = poly_regressor3.predict(x_poly3)
        +
        +# Polynomial regression (overfit)
        +poly_features5 = PolynomialFeatures(degree=5)
        +x_poly5 = poly_features5.fit_transform(x)
        +poly_regressor5 = LinearRegression()
        +poly_regressor5.fit(x_poly5, y)
        +y_pred_poly5 = poly_regressor5.predict(x_poly5)
        +
        +# R^2 Scores
        +r2_linear = r2_score(y, y_pred_linear)
        +r2_poly2 = r2_score(y, y_pred_poly2)
        +r2_poly3 = r2_score(y, y_pred_poly3)
        +r2_poly5 = r2_score(y, y_pred_poly5)
        +
        +# Plotting
        +plt.figure(figsize=(12, 10))
        +
        +# Plot simple linear regression
        +plt.subplot(2, 2, 1)
        +plt.scatter(x, y, color='blue', label='Actual response, yi')
        +plt.plot(x, y_pred_linear, color='red', label='Estimated regression line, f(x)')
        +plt.title(f'Degree: 1, R^2 = {r2_linear:.2f}')
        +plt.legend()
        +
        +# Plot underfit polynomial regression
        +plt.subplot(2, 2, 2)
        +plt.scatter(x, y, color='blue', label='Actual response, yi')
        +sorted_axis = np.argsort(x[:, 0])
        +plt.plot(x[sorted_axis], y_pred_poly2[sorted_axis], color='red', label='Estimated regression line, f(x)')
        +plt.title(f'Degree: 2, R^2 = {r2_poly2:.2f}')
        +plt.legend()
        +
        +# Plot well-fit polynomial regression
        +plt.subplot(2, 2, 3)
        +plt.scatter(x, y, color='blue', label='Actual response, yi')
        +sorted_axis = np.argsort(x[:, 0])
        +plt.plot(x[sorted_axis], y_pred_poly3[sorted_axis], color='red', label='Estimated regression line, f(x)')
        +plt.title(f'Degree: 3, R^2 = {r2_poly3:.2f}')
        +plt.legend()
        +
        +# Plot overfit polynomial regression
        +plt.subplot(2, 2, 4)
        +plt.scatter(x, y, color='blue', label='Actual response, yi')
        +sorted_axis = np.argsort(x[:, 0])
        +plt.plot(x[sorted_axis], y_pred_poly5[sorted_axis], color='red', label='Estimated regression line, f(x)')
        +plt.title(f'Degree: 5, R^2 = {r2_poly5:.2f}')
        +plt.legend()
        +
        +# Show the plots
        +plt.tight_layout()
        +plt.show()
        +
        +
        +
        +
        +../_images/5a3b207bfabe58ccdfda75f84946a10cdf87d302d66c3b6d1746e2c56a800111.png +
        +
        +
    +
    +

    Polynomial Regression#

    +

    In terms of execution, we can use sklearn’s sklearn.preprocessing.PolynomialFeatures transformer to generate the higher-degree terms and then fit an ordinary linear regression on them. This is exactly what was used in the overview plot above, but I wanted to isolate the code for easier comparison to Lasso and Ridge regression below.

    +

    Some additional things to keep in mind:

    +
      +
    1. Choice of Polynomial Degree: Determining the appropriate degree of the polynomial is critical. A higher-degree polynomial can fit the training data very well but might perform poorly on unseen data due to overfitting. Various model selection techniques, such as cross-validation, can be used to choose a polynomial degree that balances bias and variance.

    2. +
    3. Feature Scaling: Polynomial terms can have very different scales, especially for higher degrees, which can make the regression model sensitive to the scale of the input features. Normalizing or standardizing the features before applying polynomial regression can help with model convergence and interpretation.

    4. +
    3. Multivariate Polynomial Regression: While this introduction focuses on polynomial regression with a single independent variable (\(x_1\)), polynomial regression can be extended to multiple independent variables, allowing for interaction terms between different variables (e.g., \(x_1x_2\), \(x_1^2x_2\), etc.). This introduces complexity in model interpretation but can capture interactions between predictors that are not apparent in single-variable analyses.

    6. +
    7. Computational Complexity: As the degree of the polynomial and the number of independent variables increase, the computational complexity of fitting the regression model also increases. This is due to the larger number of terms and interactions that need to be calculated and optimized. It’s important to balance the model’s complexity with computational constraints.

    8. +
    9. Analyzing Residuals: When using polynomial regression, it becomes even more important to analyze residuals to ensure that the assumptions of linear regression are still met. This includes checking for homoscedasticity, normality of residuals, and absence of autocorrelation. If these assumptions are violated, the results of the regression, including any inference drawn from the coefficients, may not be valid.

    10. +
    +
    +

    On make_pipeline#

    +

    make_pipeline from sklearn.pipeline is a utility function that simplifies the process of creating a pipeline of transformations with a final estimator. In machine learning workflows, it’s often necessary to chain together multiple steps such as preprocessing (like scaling features or applying polynomial expansions) and then applying a model (like LinearRegression, Lasso, or Ridge). A pipeline bundles these steps into a single object that behaves like a compound estimator.

    +

    When you use make_pipeline, you can pass it a series of transformations followed by an estimator, and it automatically names each step based on its class. The steps are executed in sequence: each step’s fit_transform() method is called on the input data (except for the last step, where only fit() is called), transforming the data along the way, until it finally fits the model on the transformed data. This streamlines the code, making it cleaner and easier to read, and reduces the risk of mistakes (like applying transformations to the training data but forgetting to do so on the test data).

    +

    The intro plot above does not use a pipeline, but Lasso and Ridge specifically benefit from it. In this next example, we will pipeline from PolynomialFeatures (a preprocessor) to LinearRegression (a model).

    +

    This allows us to convert this block of code:

    +
    # Polynomial regression (well-fit)
    +poly_features3 = PolynomialFeatures(degree=3)
    +x_poly3 = poly_features3.fit_transform(x)
    +poly_regressor3 = LinearRegression()
    +poly_regressor3.fit(x_poly3, y)
    +y_pred_poly3 = poly_regressor3.predict(x_poly3)
    +
    +
    +

    into this:

    +
    poly = make_pipeline(PolynomialFeatures(degree), LinearRegression())
    +poly.fit(X, y)
    +
    +
    +

    You can imagine that as you add additional steps to transform your data, the first style of code will grow from 6 lines, to 9, to 12… while the second example simply adds more “machinery” to the sequence described in make_pipeline(...).

    +

    For instance, when used with LinearRegression, Lasso, or Ridge in the context of polynomial regression, you would typically create a pipeline that first expands your features into a polynomial feature space (using PolynomialFeatures) and then scales them (using StandardScaler, which is omitted from these basic examples but is common practice), before finally applying the regression model. This ensures that the feature expansion and scaling are part of the model fitting process, which is particularly important for cross-validation and deploying the model for predictions on new data.

    +

    To get the coefficients and intercept out of a pipeline that ends in linear regression, you’ll have to reach inside the pipeline via the name it generates for its different steps. poly_regressor3.coef_ becomes poly['linearregression'].coef_, where the string 'linearregression' is the lowercased class name of the LinearRegression object that was passed into the pipeline.

    +
    +
    +
    import numpy as np
    +import matplotlib.pyplot as plt
    +from sklearn.linear_model import Lasso
    +from sklearn.preprocessing import PolynomialFeatures
    +from sklearn.linear_model import LinearRegression
    +from sklearn.pipeline import make_pipeline
    +# Generating demo data
    +np.random.seed(42)
    +x = np.random.normal(0, 1, 20)
    +X = x[:, np.newaxis]
    +
    +# This is the actual equation, so we could check exactly what coefficients our regression found.
    +y = -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)
    +
    +# Reshape x for sklearn
    +x = x[:, np.newaxis]
    +y = y[:, np.newaxis]
    +
    +degree = 4  # choosing the same degree as the true model
    +poly = make_pipeline(PolynomialFeatures(degree), LinearRegression())
    +poly.fit(X, y)
    +
    +# Generating points for plotting the regression line
    +x_plot = np.linspace(min(X), max(X), 100)
    +y_plot = poly.predict(x_plot)
    +
    +plt.scatter(x, y, label='Data points')
    +sorted_axis = np.argsort(x[:, 0])
    +plt.plot(x_plot, y_plot, label='Polynomial regression line', color='red')
    +plt.legend()
    +plt.xlabel('x')
    +plt.ylabel('y')
    +plt.title('Polynomial (degree = 4) regression')
    +plt.show()
    +
    +
    +
    +
    +../_images/efe2803e3c407dd4463ca9959dfcf6bfa2b0b72cc864062d127916b2c28a2c0e.png +
    +
    +
    +
    +
    poly
    +
    +
    +
    +
    +
    Pipeline(steps=[('polynomialfeatures', PolynomialFeatures(degree=4)),
    +                ('linearregression', LinearRegression())])
    In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
    On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
    +
    +
    +
    +
    poly['linearregression'].coef_
    +
    +
    +
    +
    +
    array([[ 0.        , -2.00193104,  7.3848762 ,  3.00349368, -4.16571691]])
    +
    +
    +
    +
    +
    +
    +
    poly['linearregression'].intercept_
    +
    +
    +
    +
    +
    array([-0.32345315])
    +
    +
    +
    +
    +
    +
    +
    +

    Lasso Regression#

    +

    Lasso regression adds a penalty equal to the absolute value of the magnitude of coefficients. This can lead not only to small coefficients but can actually shrink some of them to zero, effectively performing variable selection. Using that feature of Lasso regression, you don’t have to interpret the usefulness of a variable - if it’s not important to the model, then its coefficients will drop to zero. However, to achieve this result, you’ll have to tune your lambda (\(\lambda\)) value. If \(\lambda\) is too small, the penalty effect might be negligible, leading to little improvement over ordinary least squares regression. If \(\lambda\) is too large, too many variables might be eliminated, resulting in underfitting. Techniques such as cross-validation can be used to select an optimal \(\lambda\).

    +

    The objective function for Lasso regression is:

    +

    \( \text{Minimize: } \frac{1}{2N} \sum_{i=1}^{N} (y_i - \sum_{j=1}^{n} \beta_j x_{ij})^2 + \lambda \sum_{j=1}^{n} |\beta_j| \)

    +

    Where:

    +
      +
    • \(N\) is the number of observations.

    • +
    • \(\lambda\) is the regularization parameter controlling the strength of the penalty.

    • +
    • The first term is half the Mean Squared Error (the \(\frac{1}{2}\) is only a scaling convention), and the second term is the L1 penalty.

    - -
  • Python Implementation:

    -
      -
    • Implementing polynomial regression with numpy and scikit-learn.

    • -
    • Demonstrating Lasso and Ridge regression using scikit-learn.

    • -
    • Comparing models using visualizations in matplotlib.

    • +

      Other things to keep in mind:

      +
        +
      • Lasso regression is sensitive to the scale of the input variables, so standardizing the data (to have 0 mean and unit variance) before applying Lasso regression is a common practice.

      • +
      • While Lasso can lead to sparse solutions, Ridge regression is preferred when multicollinearity is present among the features.

      - -
    • Example Dataset:

      -
        -
      • Dataset requiring a non-linear fit (e.g., environmental data).

      • +

        The introduction plot used sklearn.linear_model.LinearRegression to perform regression with different degrees of polynomials. Lasso is itself a linear model, so it cannot capture a polynomial relationship unless polynomial features are explicitly included; the code below therefore pipelines PolynomialFeatures into Lasso to illustrate the process:

        +
        +
        +
        import numpy as np
        +import matplotlib.pyplot as plt
        +from sklearn.linear_model import Lasso
        +from sklearn.preprocessing import PolynomialFeatures
        +from sklearn.pipeline import make_pipeline
        +
        +# Generating demo data
        +np.random.seed(42)
        +x = np.random.normal(0, 1, 20)
        +y = -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)
        +X = x[:, np.newaxis]
        +
        +degree = 4  # choosing the same degree as the true model
        +lasso_poly = make_pipeline(PolynomialFeatures(degree), Lasso(alpha=0.1, max_iter=10000))
        +lasso_poly.fit(X, y)
        +
        +# Generating points for plotting the regression line
        +x_plot = np.linspace(min(x), max(x), 100)
        +X_plot = x_plot[:, np.newaxis]
        +y_plot = lasso_poly.predict(X_plot)
        +
        +# Plotting the data points and the regression line
        +plt.scatter(x, y, label='Data points')
        +plt.plot(x_plot, y_plot, label='Lasso Regression Line', color='red')
        +plt.legend()
        +plt.xlabel('x')
        +plt.ylabel('y')
        +plt.title('Lasso Regression with Polynomial Features')
        +plt.show()
        +
        +
        +
        +
        +../_images/cf2893ef3bdd7bf0354019761a0360b80dbe08cc759e847d38b3cd7a4c87129a.png +
        +
        +
        +
        +
        lasso_poly['lasso'].coef_
        +
        +
        +
        +
        +
        array([ 0.        , -1.55260439,  5.72240286,  2.90811749, -3.66350745])
        +
        +
        +
        +
        +
        +
        +
        lasso_poly['lasso'].intercept_
        +
        +
        +
        +
        +
        0.19943027115730638
        +
        +
        +
        +
        +
          +
        • Choosing Degree and \(\lambda\): The choice of degree=4 for the polynomial features and alpha=0.1 for the Lasso regression penalty (\(\lambda\)) is somewhat arbitrary here and might need adjustment based on cross-validation to find the optimal model complexity and regularization strength.

        • +
        • Max Iterations: Increasing max_iter in Lasso() might be necessary for the algorithm to converge, especially for higher polynomial degrees or smaller values of alpha (\(\lambda\)).

        - +
  • +
    +

    Ridge Regression#

    +

    Ridge regression adds a penalty equal to the square of the magnitude of coefficients. All coefficients are shrunk toward zero, but, unlike Lasso, none are eliminated (set exactly to zero).

    +

    The objective function for Ridge regression is:

    +

    \( \text{Minimize: } \frac{1}{2N} \sum_{i=1}^{N} (y_i - \sum_{j=1}^{n} \beta_j x_{ij})^2 + \lambda \sum_{j=1}^{n} \beta_j^2 \)

    +
      +
    • Similarly, \(N\) and \(\lambda\) have the same definitions as in Lasso.

    • +
    • The first term again represents half the Mean Squared Error (the \(\frac{1}{2}\) is only a scaling convention), and the second term is the L2 penalty.

    +
      +
    1. Effect of the Penalty: Ridge regression is particularly useful when dealing with multicollinearity or when you have more predictors than observations.

    2. +
    3. Scaling Importance: standardizing the features in Ridge regression is important due to the square of the coefficients being included in the penalty term. Features on larger scales can have disproportionately large effects on the formulation.

    4. +
    5. Choosing \(\lambda\) for the bias-variance trade-off: A higher \(\lambda\) increases bias but reduces variance, whereas a lower \(\lambda\) does the opposite. The optimal \(\lambda\) minimizes the mean squared error of predictions.

    6. +
    7. Computational Aspects: Ridge regression tends to be computationally more efficient than Lasso for a large number of features, mainly because the solution is obtained through matrix operations that have computationally efficient implementations.

    8. +
    +
    +
    +
    import numpy as np
    +import matplotlib.pyplot as plt
    +from sklearn.linear_model import Ridge
    +from sklearn.preprocessing import PolynomialFeatures
    +from sklearn.pipeline import make_pipeline
    +
    +# Generating demo data using the same snippet
    +np.random.seed(42)
    +x = np.random.normal(0, 1, 20)
    +y = -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)
    +X = x[:, np.newaxis]
    +
    +# Using polynomial features again since our relationship is non-linear
    +degree = 4
    +ridge_poly = make_pipeline(PolynomialFeatures(degree), Ridge(alpha=0.1))
    +ridge_poly.fit(X, y)
    +
    +# Generating points for plotting
    +x_plot = np.linspace(min(x), max(x), 100)
    +X_plot = x_plot[:, np.newaxis]
    +y_plot = ridge_poly.predict(X_plot)
    +
    +# Plotting
    +plt.scatter(x, y, label='Data points')
    +plt.plot(x_plot, y_plot, color='red', label='Ridge Regression Line')
    +plt.legend()
    +plt.xlabel('x')
    +plt.ylabel('y')
    +plt.title('Ridge Regression with Polynomial Features')
    +plt.show()
    +
    +
    +
    +
    +../_images/0db9f24dd130ecb95bde386604ac8a3a2c4540ea1d11b2edf145ecd048c39112.png +
    +
    +
    +
    +
    ridge_poly['ridge'].coef_
    +
    +
    +
    +
    +
    array([ 0.        , -2.05626925,  6.75667935,  3.06069885, -3.96459941])
    +
    +
    +
    +
    +
    +
    +
    ridge_poly['ridge'].intercept_
    +
    +
    +
    +
    +
    -0.14654769263455236
    +
    +
    +
    +
    +
    +
    +

    Exercise For The Reader#

    +

    Lasso and Ridge regression could be applied to sklearn’s included California housing data set.

    +
      +
    • Don’t forget to do a train/test split.

    • +
    • It’s probably best to use a scaler.

    • +
    • Selecting variables is important, but can be thought of as part science and part art. Try a few and see what helps.

    • +
    +
    +
    +
    # starter code
    +from sklearn.datasets import fetch_california_housing
    +from sklearn.model_selection import train_test_split
    +fetched = fetch_california_housing(as_frame=True)
    +X = fetched['data']
    +Y = fetched['target']
    +
    +# Splitting dataset
    +X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.2, random_state=42)
    +
    +
    +
    +
    +
    +
    +
    X.head()
    +
    +
    +
    +
    +
    + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
    MedIncHouseAgeAveRoomsAveBedrmsPopulationAveOccupLatitudeLongitude
    08.325241.06.9841271.023810322.02.55555637.88-122.23
    18.301421.06.2381370.9718802401.02.10984237.86-122.22
    27.257452.08.2881361.073446496.02.80226037.85-122.24
    35.643152.05.8173521.073059558.02.54794537.85-122.25
    43.846252.06.2818531.081081565.02.18146737.85-122.25
    +
    +
    +
    +
    +
    # model configuration
    +from sklearn.preprocessing import StandardScaler
    +
    +degrees = 8
    +ridge_poly = make_pipeline(PolynomialFeatures(degrees), StandardScaler(), Ridge(alpha=0.1))
    +ridge_poly.fit(X_train, Y_train)
    +
    +
    +
    +
    +
    Pipeline(steps=[('polynomialfeatures', PolynomialFeatures(degree=8)),
    +                ('standardscaler', StandardScaler()),
    +                ('ridge', Ridge(alpha=0.1))])
    In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
    On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
    +
    +
    +
    +
    from sklearn.metrics import mean_squared_error, r2_score
    +
    +# Making predictions
    +predictions = ridge_poly.predict(X_test)
    +
    +# Evaluation
    +mse = mean_squared_error(Y_test, predictions)
    +r2 = r2_score(Y_test, predictions)
    +
    +print(f'MSE: {mse}')
    +print(f'R-squared: {r2}')
    +
    +
    +
    +
    +
    MSE: 620.2980353830641
    +R-squared: -472.3621683634644
    +
    +
    +
    +
    +
    +
    +
    # examine the concrete results of the model - prediction vs test data's label
    +# the dataset provides home values in fractions of $100,000, so we convert the prediction to real dollars.
    +print(f"""Input data:
    +{X_test[:1]}
    +
    +Median house value: ${Y_test.iloc[0] * 100:.2f}k
    +Predicted value: ${predictions[0] * 100:.2f}k""")
    +
    +
    +
    +
    +
    Input data:
    +       MedInc  HouseAge  AveRooms  AveBedrms  Population  AveOccup  Latitude  \
    +20046  1.6812      25.0  4.192201   1.022284      1392.0  3.877437     36.06   
    +
    +       Longitude  
    +20046    -119.01  
    +
    +Median house value: $47.70k
    +Predicted value: $70.53k
    +
    +
    +
    +
    +

    Can you improve it with data preprocessing or altering the model parameters?

    +

    Have fun!

    +
    +
    +

    Additional Resources#

    + +
    - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
    - - - - - - - - - - - -
    -
    -
    -
    -
    - - - -
    -
    - -
    - - - - - - - - - - - - - -
    - -
    - - - -
    - -
    -
    - -
    -
    - -
    - -
    - -
    - - -
    - -
    - -
    - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
    - -
    - -
    -
    - - - -
    -

    Outline Only - Lesson 24: Regression Model Evaluation Metrics in Python - Key metrics for evaluating regression models.

    - -
    -
    - -
    -
    -
    - - - - -
    - -
    -

    Outline Only - Lesson 24: Regression Model Evaluation Metrics in Python - Key metrics for evaluating regression models.#

    -

    Math Focus: Mean Squared Error (MSE), Root Mean Squared Error (RMSE), and R-squared.

    -
      -
    • Theoretical Concepts:

      -
        -
      • Importance of model evaluation in regression analysis.

      • -
      • Overview of key metrics: MSE, RMSE, and R-squared.

      • -
      -
    • -
    • Mathematical Foundation:

      -
        -
      • Formulas and interpretation of MSE, RMSE, and R-squared.

      • -
      • Understanding the significance of these metrics in model performance.

      • -
      -
    • -
    • Python Implementation:

      -
        -
      • Calculating MSE, RMSE, and R-squared using scikit-learn.

      • -
      • Visualizing residuals to understand model performance.

      • -
      -
    • -
    • Example Dataset:

      -
        -
      • Use datasets from previous lessons for consistency in evaluation.

      • -
      -
    • -
    -
    - - - - -
    - - - - - - - - -
    - - - - -
    -
    - - -
    - - -
    -
    -
    - - - - - -
    -
    - - \ No newline at end of file diff --git a/Week_05/Lesson_25.html b/Week_05/Lesson_25.html deleted file mode 100644 index cf40263..0000000 --- a/Week_05/Lesson_25.html +++ /dev/null @@ -1,646 +0,0 @@ - - - - - - - - - - - - Outline Only - Lesson 25: Addressing Overfitting and Underfitting in Regression Models — 100 Days of Machine Learning - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
    - - - - - - - - - - - -
    -
    -
    -
    -
    - - - -
    -
    - -
    - - - - - - - - - - - - - -
    - -
    - - - -
    - -
    -
    - -
    -
    - -
    - -
    - -
    - - -
    - -
    - -
    - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
    - -
    - -
    -
    - - - -
    -

    Outline Only - Lesson 25: Addressing Overfitting and Underfitting in Regression Models

    - -
    -
    - -
    -
    -
    - - - - -
    - -
    -

    Outline Only - Lesson 25: Addressing Overfitting and Underfitting in Regression Models#

    -

    Strategies to combat overfitting and underfitting in regression. - Math Focus: Bias-variance tradeoff and regularization methods.

    -
      -
    • Theoretical Concepts:

      -
        -
      • Identifying symptoms of overfitting and underfitting in regression models.

      • -
      • Strategies to combat overfitting and underfitting.

      • -
      -
    • -
    • Mathematical Foundation:

      -
        -
      • Bias-variance tradeoff.

      • -
      • Regularization methods and their mathematical basis.

      • -
      -
    • -
    • Python Implementation:

      -
        -
      • Demonstrating overfitting and underfitting using matplotlib.

      • -
      • Implementing regularization techniques in Python.

      • -
      • Using validation curves and learning curves for model diagnostics.

      • -
      -
    • -
    • Example Dataset:

      -
        -
      • A dataset with a clear overfitting/underfitting tendency (e.g., high-dimensional data).

      • -
      -
    • -
    -
    - - - - -
    - - - - - - - - -
    - - - - -
    -
    - - -
    - - -
    -
    -
    - - - - - -
    -
    - - \ No newline at end of file diff --git a/_images/0db9f24dd130ecb95bde386604ac8a3a2c4540ea1d11b2edf145ecd048c39112.png b/_images/0db9f24dd130ecb95bde386604ac8a3a2c4540ea1d11b2edf145ecd048c39112.png new file mode 100644 index 0000000..524a124 Binary files /dev/null and b/_images/0db9f24dd130ecb95bde386604ac8a3a2c4540ea1d11b2edf145ecd048c39112.png differ diff --git a/_images/1960b324add5d46958aae8ded16b7d272ca3d7a00e62af7e627201cecc10a22d.png b/_images/1960b324add5d46958aae8ded16b7d272ca3d7a00e62af7e627201cecc10a22d.png deleted file mode 100644 index a73bc8a..0000000 Binary files a/_images/1960b324add5d46958aae8ded16b7d272ca3d7a00e62af7e627201cecc10a22d.png and /dev/null differ diff --git a/_images/1d0563321f6a2b86ded4cb8e6c1035aab0234f07e9db2f827b7c6ea403da2913.png b/_images/1d0563321f6a2b86ded4cb8e6c1035aab0234f07e9db2f827b7c6ea403da2913.png deleted file mode 100644 index 0fadd59..0000000 Binary files a/_images/1d0563321f6a2b86ded4cb8e6c1035aab0234f07e9db2f827b7c6ea403da2913.png and /dev/null differ diff --git a/_images/4d7b3afa51f748619d6d68f394d8d582710de819323ec9056508688058da6b39.png b/_images/4d7b3afa51f748619d6d68f394d8d582710de819323ec9056508688058da6b39.png deleted file mode 100644 index 81b91a0..0000000 Binary files a/_images/4d7b3afa51f748619d6d68f394d8d582710de819323ec9056508688058da6b39.png and /dev/null differ diff --git a/_images/4e87df33e5462df633db2b7b3ed7111f3e20a8646e86a404e369b3186da83e8e.png b/_images/4e87df33e5462df633db2b7b3ed7111f3e20a8646e86a404e369b3186da83e8e.png deleted file mode 100644 index 822bb71..0000000 Binary files a/_images/4e87df33e5462df633db2b7b3ed7111f3e20a8646e86a404e369b3186da83e8e.png and /dev/null differ diff --git a/_images/596a853ea8f36fbbdd24acadc5c2d5007c23779e63fc1516ee16885d91138718.png b/_images/596a853ea8f36fbbdd24acadc5c2d5007c23779e63fc1516ee16885d91138718.png new file mode 100644 index 0000000..81eaec4 Binary files /dev/null and 
b/_images/596a853ea8f36fbbdd24acadc5c2d5007c23779e63fc1516ee16885d91138718.png differ diff --git a/_images/5a3b207bfabe58ccdfda75f84946a10cdf87d302d66c3b6d1746e2c56a800111.png b/_images/5a3b207bfabe58ccdfda75f84946a10cdf87d302d66c3b6d1746e2c56a800111.png new file mode 100644 index 0000000..cf34f5c Binary files /dev/null and b/_images/5a3b207bfabe58ccdfda75f84946a10cdf87d302d66c3b6d1746e2c56a800111.png differ diff --git a/_images/81ecec8704faf2c1f7ee87b3c690f8d8de124c1b0f37f2a7180b2dffce389c9e.png b/_images/81ecec8704faf2c1f7ee87b3c690f8d8de124c1b0f37f2a7180b2dffce389c9e.png deleted file mode 100644 index 144895b..0000000 Binary files a/_images/81ecec8704faf2c1f7ee87b3c690f8d8de124c1b0f37f2a7180b2dffce389c9e.png and /dev/null differ diff --git a/_images/8a4fc5eafbe1194d2af18ad1cce90114b7a63486611fb0e29814773b4d4eced0.png b/_images/8a4fc5eafbe1194d2af18ad1cce90114b7a63486611fb0e29814773b4d4eced0.png deleted file mode 100644 index ebbab64..0000000 Binary files a/_images/8a4fc5eafbe1194d2af18ad1cce90114b7a63486611fb0e29814773b4d4eced0.png and /dev/null differ diff --git a/_images/8c3a0d5ed06805763b5404ef2a3b932553e09a5d3a21332e387e2d8401ad344f.png b/_images/8c3a0d5ed06805763b5404ef2a3b932553e09a5d3a21332e387e2d8401ad344f.png new file mode 100644 index 0000000..fd444e9 Binary files /dev/null and b/_images/8c3a0d5ed06805763b5404ef2a3b932553e09a5d3a21332e387e2d8401ad344f.png differ diff --git a/_images/9239cf149dff59ff38d351ff926223010fb8551c6f5fa5166e60f27a8a9386e7.png b/_images/9239cf149dff59ff38d351ff926223010fb8551c6f5fa5166e60f27a8a9386e7.png deleted file mode 100644 index ad61b4b..0000000 Binary files a/_images/9239cf149dff59ff38d351ff926223010fb8551c6f5fa5166e60f27a8a9386e7.png and /dev/null differ diff --git a/_images/92ac3250e6513c3b8472e0b18e967da18927d77722af5d165c07f194e84d7801.png b/_images/92ac3250e6513c3b8472e0b18e967da18927d77722af5d165c07f194e84d7801.png deleted file mode 100644 index cca0a3b..0000000 Binary files 
a/_images/92ac3250e6513c3b8472e0b18e967da18927d77722af5d165c07f194e84d7801.png and /dev/null differ diff --git a/_images/95c79f53523d1b9783ae4165a7fd293f44bf5c1ec13b96e0683169676e70c07c.png b/_images/95c79f53523d1b9783ae4165a7fd293f44bf5c1ec13b96e0683169676e70c07c.png deleted file mode 100644 index 506e45e..0000000 Binary files a/_images/95c79f53523d1b9783ae4165a7fd293f44bf5c1ec13b96e0683169676e70c07c.png and /dev/null differ diff --git a/_images/973c05605e4407d03117eb8668d22802aba5e50872ff991cd2a522591d987fbf.png b/_images/973c05605e4407d03117eb8668d22802aba5e50872ff991cd2a522591d987fbf.png deleted file mode 100644 index aebbca1..0000000 Binary files a/_images/973c05605e4407d03117eb8668d22802aba5e50872ff991cd2a522591d987fbf.png and /dev/null differ diff --git a/_images/9bd1031423bef1a2f61f1d89256148d1b71e943953636677f033cd71d2a243d2.png b/_images/9bd1031423bef1a2f61f1d89256148d1b71e943953636677f033cd71d2a243d2.png new file mode 100644 index 0000000..ee4229c Binary files /dev/null and b/_images/9bd1031423bef1a2f61f1d89256148d1b71e943953636677f033cd71d2a243d2.png differ diff --git a/_images/a298648d33b481f372b4498a7f50d6080ac2ff6cb7286d57d3c8a7e488319dab.png b/_images/a298648d33b481f372b4498a7f50d6080ac2ff6cb7286d57d3c8a7e488319dab.png new file mode 100644 index 0000000..bb63d80 Binary files /dev/null and b/_images/a298648d33b481f372b4498a7f50d6080ac2ff6cb7286d57d3c8a7e488319dab.png differ diff --git a/_images/ac8ca84aa071dd742f96fd53ca0d5b1485f5b3b640b6d84c2fbd9c99fcab7c9f.png b/_images/ac8ca84aa071dd742f96fd53ca0d5b1485f5b3b640b6d84c2fbd9c99fcab7c9f.png deleted file mode 100644 index 7079024..0000000 Binary files a/_images/ac8ca84aa071dd742f96fd53ca0d5b1485f5b3b640b6d84c2fbd9c99fcab7c9f.png and /dev/null differ diff --git a/_images/b63ac6f1c346a37d4c9b5f6b2beb867291b424fff549f41528576a8ebe98007f.png b/_images/b63ac6f1c346a37d4c9b5f6b2beb867291b424fff549f41528576a8ebe98007f.png deleted file mode 100644 index 8780ec2..0000000 Binary files 
a/_images/b63ac6f1c346a37d4c9b5f6b2beb867291b424fff549f41528576a8ebe98007f.png and /dev/null differ diff --git a/_images/bb0d0c6c15e5ffac9ec2fbb8b1013187538a784f2b9216a086c4291db4962b35.png b/_images/bb0d0c6c15e5ffac9ec2fbb8b1013187538a784f2b9216a086c4291db4962b35.png new file mode 100644 index 0000000..6e28942 Binary files /dev/null and b/_images/bb0d0c6c15e5ffac9ec2fbb8b1013187538a784f2b9216a086c4291db4962b35.png differ diff --git a/_images/c78a8b5d5f1a20faf246b3282e3a95f3146ddc2009886cf542dbe0434f1a1346.png b/_images/c78a8b5d5f1a20faf246b3282e3a95f3146ddc2009886cf542dbe0434f1a1346.png deleted file mode 100644 index c41d07f..0000000 Binary files a/_images/c78a8b5d5f1a20faf246b3282e3a95f3146ddc2009886cf542dbe0434f1a1346.png and /dev/null differ diff --git a/_images/cf2893ef3bdd7bf0354019761a0360b80dbe08cc759e847d38b3cd7a4c87129a.png b/_images/cf2893ef3bdd7bf0354019761a0360b80dbe08cc759e847d38b3cd7a4c87129a.png new file mode 100644 index 0000000..baaaaa9 Binary files /dev/null and b/_images/cf2893ef3bdd7bf0354019761a0360b80dbe08cc759e847d38b3cd7a4c87129a.png differ diff --git a/_images/dec1a5268a9ed8954bf44f8e724342a06ccc2e679de0814a106db7960fd97390.png b/_images/dec1a5268a9ed8954bf44f8e724342a06ccc2e679de0814a106db7960fd97390.png deleted file mode 100644 index 488d2d7..0000000 Binary files a/_images/dec1a5268a9ed8954bf44f8e724342a06ccc2e679de0814a106db7960fd97390.png and /dev/null differ diff --git a/_images/efe2803e3c407dd4463ca9959dfcf6bfa2b0b72cc864062d127916b2c28a2c0e.png b/_images/efe2803e3c407dd4463ca9959dfcf6bfa2b0b72cc864062d127916b2c28a2c0e.png new file mode 100644 index 0000000..c86f470 Binary files /dev/null and b/_images/efe2803e3c407dd4463ca9959dfcf6bfa2b0b72cc864062d127916b2c28a2c0e.png differ diff --git a/_images/f471f48523b4b750801da5035d60e32b3d9fa7f967a86460fac3a817493a2910.png b/_images/f471f48523b4b750801da5035d60e32b3d9fa7f967a86460fac3a817493a2910.png deleted file mode 100644 index 0089d74..0000000 Binary files 
a/_images/f471f48523b4b750801da5035d60e32b3d9fa7f967a86460fac3a817493a2910.png and /dev/null differ diff --git a/_sources/Week_05/005_Overview_.md b/_sources/Week_05/005_Overview_.md deleted file mode 100644 index eb841cb..0000000 --- a/_sources/Week_05/005_Overview_.md +++ /dev/null @@ -1,27 +0,0 @@ - # Course Structure - - # Module 3: Supervised Learning - Regression and Classification - ## Weeks 5-6 -- Focus: Key concepts and algorithms in supervised learning. -- Topics include regression, classification algorithms, decision trees, SVM, and ensemble methods. - -### Week 5: Supervised Learning - Regression -- **Day 21:** Introduction to Regression Analysis in Python - - Basics of regression analysis and simple linear regression. - - Math Focus: Linear equation fundamentals and fitting models to data. - -- **Day 22:** Implementing Multiple Linear Regression in Python - - Understand and implement multiple linear regression. - - Math Focus: Multivariate calculus and regression coefficients interpretation. - -- **Day 23:** Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression - - Explore advanced regression techniques and their applications. - - Math Focus: Polynomial functions, Lasso and Ridge regularization techniques. - -- **Day 24:** Regression Model Evaluation Metrics in Python - - Key metrics for evaluating regression models. - - Math Focus: Mean Squared Error (MSE), Root Mean Squared Error (RMSE), and R-squared. - -- **Day 25:** Addressing Overfitting and Underfitting in Regression Models - - Strategies to combat overfitting and underfitting in regression. - - Math Focus: Bias-variance tradeoff and regularization methods. 
\ No newline at end of file diff --git a/_sources/Week_05/Lesson_22.ipynb b/_sources/Week_05/Lesson_22.ipynb index ac1a21f..fa12c56 100644 --- a/_sources/Week_05/Lesson_22.ipynb +++ b/_sources/Week_05/Lesson_22.ipynb @@ -76,7 +76,7 @@ "import matplotlib.pyplot as plt\n", "import pandas as pd\n", "\n", - "df = pd.read_csv(\"customer_data2.csv\")\n", + "df = pd.read_csv(\"customer_data.csv\")\n", "g = sns.pairplot(df, x_vars=['Age','Income'], y_vars='Spending_Score', height=7, aspect=0.7, kind='reg')\n", "g.fig.suptitle(\"Regression Lines: Age and Income versus Spending Score\", y=1.02)\n", "plt.show()" @@ -511,6 +511,9 @@ "source": [ "# Additional Resources\n", "\n", + "- **Resource 1:** [Multiple Linear Regression in Python](https://www.nickmccullum.com/multiple-linear-regression-python/) (Detailed guide on multiple linear regression, including data preparation and model building)\n", + "- **Resource 2:** [Multivariate Linear Regression Tutorial with Real Python](https://realpython.com/linear-regression-in-python/#multiple-linear-regression) (Explanation of multiple linear regression with an example using Python)\n", + "\n", "https://www.statology.org/multiple-linear-regression-assumptions/" ] }, diff --git a/_sources/Week_05/Lesson_23.ipynb b/_sources/Week_05/Lesson_23.ipynb index 0b93193..e2831ad 100644 --- a/_sources/Week_05/Lesson_23.ipynb +++ b/_sources/Week_05/Lesson_23.ipynb @@ -5,26 +5,1647 @@ "id": "210315fa-bf4a-4892-9e66-e42ee9b5d804", "metadata": {}, "source": [ - "# Outline Only - **Lesson 23:** Advanced Regression Techniques\n", - "Polynomial, Lasso, and Ridge Regression - Explore advanced regression techniques and their applications. 
- Math Focus: Polynomial functions, Lasso and Ridge regularization techniques.\n", - "- **Theoretical Concepts:**\n", - " - Overview of polynomial regression and its applications.\n", - " - Introduction to regularization techniques: Lasso and Ridge regression.\n", - "- **Mathematical Foundation:**\n", - " - Polynomial functions and their role in regression.\n", - " - Lasso (L1 regularization) and Ridge (L2 regularization) concepts.\n", - "- **Python Implementation:**\n", - " - Implementing polynomial regression with numpy and scikit-learn.\n", - " - Demonstrating Lasso and Ridge regression using scikit-learn.\n", - " - Comparing models using visualizations in matplotlib.\n", - "- **Example Dataset:**\n", - " - Dataset requiring a non-linear fit (e.g., environmental data)." + "# Day 23: Advanced Regression Techniques" + ] + }, + { + "cell_type": "markdown", + "id": "242f5383-181e-459b-895d-aebad6bf0aa6", + "metadata": {}, + "source": [ + "## Introduction\n", + "\n", + "Astute readers may have noticed during the Day 22 lesson that some of the `customer_data.csv` plots were not great fits across the entire domain of the data. This is because there was a non-linear element (an $x^2$ term) in the function I used to build that dataset out of random numbers. Most data we'll encounter is not perfectly linear, but we can still use regression. A higher order function may describe the relationships between our independent variables and the dependent variable. We are not limited to $y = mx + c$, or even $y = \\beta_0 + \\beta_1x_1 + \\beta_2x_2 + ... + \\beta_nx_n + \\epsilon$ -- we can include $x_n^2, x_n^3, ...$ as if they were new independent variables, and give our regression line the freedom to match any polynomial function.\n", + "\n", + "We'll just need to steer clear of overfitting: with unlimited terms, it's arbitrarily simple to draw a polynomial function that passes through *every* data point perfectly. 
This is unlikely to translate into predictive power outside of training, though. Lasso and Ridge are specific forms of regularization designed to address overfitting by penalizing the size of the coefficients. Keep an eye out for the regularization parameter ($\\lambda$), which sets the strength of the penalty and thereby controls the complexity of the model.\n", + "\n", + "A general polynomial regression model can be represented as:\n", + "\n", + "$ y = \\beta_0 + \\beta_1x_1 + \\beta_2x_1^2 + \\ldots + \\beta_nx_1^n + \\epsilon $\n", + "\n", + "Where:\n", + "- $y$ is the dependent variable.\n", + "- $x_1, x_1^2, \\ldots, x_1^n$ are the predictor variables and their polynomial terms up to degree $n$.\n", + "- $\\beta_0, \\beta_1, \\ldots, \\beta_n$ are the coefficients.\n", + "- $\\epsilon$ represents the model error.\n", + "\n", + "To get acquainted with the topic, let's take a peek at what adding additional degrees to the polynomial can do:" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "19e3f075-176d-4dff-89a0-88b71613af31", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
    " + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# overview plot\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from sklearn.linear_model import LinearRegression\n", + "from sklearn.preprocessing import PolynomialFeatures\n", + "from sklearn.metrics import r2_score\n", + "\n", + "# Generating demo data\n", + "np.random.seed(42)\n", + "x = np.random.normal(0, 1, 20)\n", + "\n", + "# This is the actual equation, so we could check exactly what coefficients our regression found.\n", + "y= -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)\n", + "\n", + "# Reshape x for sklearn\n", + "x = x[:, np.newaxis]\n", + "y = y[:, np.newaxis]\n", + "\n", + "# Simple linear regression\n", + "linear_regressor = LinearRegression()\n", + "linear_regressor.fit(x, y)\n", + "y_pred_linear = linear_regressor.predict(x)\n", + "\n", + "# Polynomial regression (underfit)\n", + "poly_features2 = PolynomialFeatures(degree=2)\n", + "x_poly2 = poly_features2.fit_transform(x)\n", + "poly_regressor2 = LinearRegression()\n", + "poly_regressor2.fit(x_poly2, y)\n", + "y_pred_poly2 = poly_regressor2.predict(x_poly2)\n", + "\n", + "# Polynomial regression (well-fit)\n", + "poly_features3 = PolynomialFeatures(degree=3)\n", + "x_poly3 = poly_features3.fit_transform(x)\n", + "poly_regressor3 = LinearRegression()\n", + "poly_regressor3.fit(x_poly3, y)\n", + "y_pred_poly3 = poly_regressor3.predict(x_poly3)\n", + "\n", + "# Polynomial regression (overfit)\n", + "poly_features5 = PolynomialFeatures(degree=5)\n", + "x_poly5 = poly_features5.fit_transform(x)\n", + "poly_regressor5 = LinearRegression()\n", + "poly_regressor5.fit(x_poly5, y)\n", + "y_pred_poly5 = poly_regressor5.predict(x_poly5)\n", + "\n", + "# R^2 Scores\n", + "r2_linear = r2_score(y, y_pred_linear)\n", + "r2_poly2 = r2_score(y, y_pred_poly2)\n", + "r2_poly3 = r2_score(y, y_pred_poly3)\n", + "r2_poly5 = r2_score(y, y_pred_poly5)\n", + "\n", + "# 
Plotting\n", + "plt.figure(figsize=(12, 10))\n", + "\n", + "# Plot simple linear regression\n", + "plt.subplot(2, 2, 1)\n", + "plt.scatter(x, y, color='blue', label='Actual response, yi')\n", + "plt.plot(x, y_pred_linear, color='red', label='Estimated regression line, f(x)')\n", + "plt.title(f'Degree: 1, R^2 = {r2_linear:.2f}')\n", + "plt.legend()\n", + "\n", + "# Plot underfit polynomial regression\n", + "plt.subplot(2, 2, 2)\n", + "plt.scatter(x, y, color='blue', label='Actual response, yi')\n", + "sorted_axis = np.argsort(x[:, 0])\n", + "plt.plot(x[sorted_axis], y_pred_poly2[sorted_axis], color='red', label='Estimated regression line, f(x)')\n", + "plt.title(f'Degree: 2, R^2 = {r2_poly2:.2f}')\n", + "plt.legend()\n", + "\n", + "# Plot well-fit polynomial regression\n", + "plt.subplot(2, 2, 3)\n", + "plt.scatter(x, y, color='blue', label='Actual response, yi')\n", + "sorted_axis = np.argsort(x[:, 0])\n", + "plt.plot(x[sorted_axis], y_pred_poly3[sorted_axis], color='red', label='Estimated regression line, f(x)')\n", + "plt.title(f'Degree: 3, R^2 = {r2_poly3:.2f}')\n", + "plt.legend()\n", + "\n", + "# Plot overfit polynomial regression\n", + "plt.subplot(2, 2, 4)\n", + "plt.scatter(x, y, color='blue', label='Actual response, yi')\n", + "sorted_axis = np.argsort(x[:, 0])\n", + "plt.plot(x[sorted_axis], y_pred_poly5[sorted_axis], color='red', label='Estimated regression line, f(x)')\n", + "plt.title(f'Degree: 5, R^2 = {r2_poly5:.2f}')\n", + "plt.legend()\n", + "\n", + "# Show the plots\n", + "plt.tight_layout()\n", + "plt.show()\n" + ] + }, + { + "cell_type": "markdown", + "id": "51bb7f38-423d-468b-bac5-052d1aa0d6b1", + "metadata": {}, + "source": [ + "## Polynomial Regression\n", + "\n", + "In terms of execution, we can use `sklearn`'s `sklearn.preprocessing.PolynomialFeatures` functionality to perform linear regression with a higher degree. 
This is exactly what was used in the overview plot above, but I wanted to isolate the code for easier comparison to Lasso and Ridge regression below.\n", + "\n", + "Some additional things to keep in mind:\n", + "\n", + "1. **Choice of Polynomial Degree**: Determining the appropriate degree of the polynomial is critical. A higher-degree polynomial can fit the training data very well but might perform poorly on unseen data due to overfitting. Various model selection techniques, such as cross-validation, can be used to choose a polynomial degree that balances bias and variance.\n", + "\n", + "2. **Feature Scaling**: Polynomial terms can have very different scales, especially for higher degrees, which can make the regression model sensitive to the scale of the input features. Normalizing or standardizing the features before applying polynomial regression can help with model convergence and interpretation.\n", + "\n", + "3. **Multivariate Polynomial Regression**: While the introduction above focuses on polynomial regression with a single independent variable ($x_1$), it's important to note that polynomial regression can be extended to multiple independent variables, allowing for interaction terms between different variables (e.g., $x_1x_2$, $x_1^2x_2$, etc.). This introduces complexity in model interpretation but can capture interactions between predictors that are not apparent in single-variable analyses.\n", + "\n", + "4. **Computational Complexity**: As the degree of the polynomial and the number of independent variables increase, the computational complexity of fitting the regression model also increases. This is due to the larger number of terms and interactions that need to be calculated and optimized. It's important to balance the model's complexity with computational constraints.\n", + "\n", + "5. 
**Analyzing Residuals**: When using polynomial regression, it becomes even more important to analyze residuals to ensure that the assumptions of linear regression are still met. This includes checking for homoscedasticity, normality of residuals, and absence of autocorrelation. If these assumptions are violated, the results of the regression, including any inference drawn from the coefficients, may not be valid.\n", + "\n", + "### On `make_pipeline`\n", + "\n", + "`make_pipeline` from `sklearn.pipeline` is a utility function that simplifies the process of creating a pipeline of transformations with a final estimator. In machine learning workflows, it's often necessary to chain together multiple steps such as preprocessing (like scaling features or applying polynomial expansions) and then applying a model (like LinearRegression, Lasso, or Ridge). A pipeline bundles these steps into a single object that behaves like a compound estimator. \n", + "\n", + "When you use `make_pipeline`, you can pass it a series of transformations followed by an estimator, and it automatically names each step based on its class. The steps are executed in sequence: each step's `fit_transform()` method is called on the input data (except for the last step, where only `fit()` is called), transforming the data along the way, until it finally fits the model on the transformed data. This streamlines the code, making it cleaner and easier to read, and reduces the risk of mistakes (like applying transformations to the training data but forgetting to do so on the test data).\n", + "\n", + "The intro plot above does not use a pipeline, but Lasso and Ridge specifically benefit from it. 
In this next example, we will pipeline from [PolynomialFeatures](https://scikit-learn.org/stable/modules/generated/sklearn.preprocessing.PolynomialFeatures.html) (a preprocessor) to [LinearRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LinearRegression.html) (a model).\n", + "\n", + "This allows us to convert this block of code:\n", + "\n", + "```python\n", + "# Polynomial regression (well-fit)\n", + "poly_features3 = PolynomialFeatures(degree=3)\n", + "x_poly3 = poly_features3.fit_transform(x)\n", + "poly_regressor3 = LinearRegression()\n", + "poly_regressor3.fit(x_poly3, y)\n", + "y_pred_poly3 = poly_regressor3.predict(x_poly3)\n", + "```\n", + "\n", + "into this:\n", + "\n", + "```python\n", + "poly = make_pipeline(PolynomialFeatures(degree), LinearRegression())\n", + "poly.fit(X, y)\n", + "```\n", + "\n", + "You can imagine that as you add additional steps to transform your data, the first style of code will grow from 6 lines, to 9, to 12... while the second example simply adds more \"machinery\" to the sequence described in `make_pipeline(...)`.\n", + "\n", + "For instance, when used with `LinearRegression`, `Lasso`, or `Ridge` in the context of polynomial regression, you would typically create a pipeline that first expands your features into a polynomial feature space (using `PolynomialFeatures`) and then scales them (using `StandardScaler`, although not in these basic examples, it's a common practice), before finally applying the regression model. This ensures that the feature expansion and scaling are part of the model fitting process, which is particularly important for cross-validation and deploying the model for predictions on new data.\n", + "\n", + "To get the coefficients and intercept out of a pipeline that ends in linear regression, you'll have to reach inside the pipeline via the name it generates for its different steps. 
`poly_regressor3.coef_` becomes `poly['linearregression'].coef_`, where the string `'linearregression'` is generated from the `LinearRegression` object that was passed into the pipeline." + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "0ff250a3-56ab-49aa-a03b-2e13b64922b0", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
    " + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from sklearn.linear_model import Lasso\n", + "from sklearn.preprocessing import PolynomialFeatures\n", + "from sklearn.linear_model import LinearRegression\n", + "from sklearn.pipeline import make_pipeline\n", + "# Generating demo data\n", + "np.random.seed(42)\n", + "x = np.random.normal(0, 1, 20)\n", + "X = x[:, np.newaxis]\n", + "\n", + "# This is the actual equation, so we could check exactly what coefficients our regression found.\n", + "y = -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)\n", + "\n", + "# Reshape x for sklearn\n", + "x = x[:, np.newaxis]\n", + "y = y[:, np.newaxis]\n", + "\n", + "degree = 4 # choosing the same degree as the true model\n", + "poly = make_pipeline(PolynomialFeatures(degree), LinearRegression())\n", + "poly.fit(X, y)\n", + "\n", + "# Generating points for plotting the regression line\n", + "x_plot = np.linspace(min(X), max(X), 100)\n", + "y_plot = poly.predict(x_plot)\n", + "\n", + "plt.scatter(x, y, label='Data points')\n", + "sorted_axis = np.argsort(x[:, 0])\n", + "plt.plot(x_plot, y_plot, label='Polynomial regression line', color='red')\n", + "plt.legend()\n", + "plt.xlabel('x')\n", + "plt.ylabel('y')\n", + "plt.title('Polynomial (degree = 4) regression')\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "75134492-a181-4364-bca2-f25babb8fb71", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
    Pipeline(steps=[('polynomialfeatures', PolynomialFeatures(degree=4)),\n",
    +       "                ('linearregression', LinearRegression())])
    In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
    On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
    " + ], + "text/plain": [ + "Pipeline(steps=[('polynomialfeatures', PolynomialFeatures(degree=4)),\n", + " ('linearregression', LinearRegression())])" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "poly" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "82785ac3-c1ab-4411-84eb-7ac688452ece", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([[ 0. , -2.00193104, 7.3848762 , 3.00349368, -4.16571691]])" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "poly['linearregression'].coef_" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "3cee9f6f-2317-43f4-9e32-99d9433266bc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([-0.32345315])" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "poly['linearregression'].intercept_" + ] + }, + { + "cell_type": "markdown", + "id": "f413714d-8027-48cc-8abc-1abb98e4a4bd", + "metadata": {}, + "source": [ + "## Lasso Regression\n", + "\n", + "Lasso regression adds a penalty equal to the absolute value of the magnitude of coefficients. This can lead not only to small coefficients but can actually shrink some of them to zero, effectively performing variable selection. Using that feature of Lasso regression, you don't have to interpret the usefulness of a variable - if it's not important to the model, then its coefficients will drop to zero. However, to achieve this result, you'll have to tune your lambda ($\\lambda$) value. If $\\lambda$ is too small, the penalty effect might be negligible, leading to little improvement over ordinary least squares regression. If $\\lambda$ is too large, too many variables might be eliminated, resulting in underfitting. 
Techniques such as cross-validation can be used to select an optimal $\\lambda$.\n", + "\n", + "The objective function for Lasso regression is:\n", + "\n", + "$ \\text{Minimize: } \\frac{1}{2N} \\sum_{i=1}^{N} (y_i - \\sum_{j=1}^{n} \\beta_j x_{ij})^2 + \\lambda \\sum_{j=1}^{n} |\\beta_j| $\n", + "\n", + "Where:\n", + "- $N$ is the number of observations.\n", + "- $\\lambda$ is the regularization parameter controlling the strength of the penalty.\n", + "- The first term is the Mean Squared Error, and the second term is the L1 penalty.\n", + "\n", + "\n", + "\n", + "Other things to keep in mind:\n", + "\n", + "- Lasso regression is sensitive to the scale of the input variables, so standardizing the data (to have 0 mean and unit variance) before applying Lasso regression is a common practice.\n", + "- While Lasso can lead to sparse solutions, Ridge regression is preferred when multicollinearity is present among the features.\n", + "\n", + "The introduction plot used `sklearn.linear_model.LinearRegression` to perform regression with different degrees of polynomials. Although Lasso might not perfectly capture the relationship in polynomial terms without specifically including polynomial features, this code will illustrate the process:\n" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "c57477e2-507e-438e-82ee-28ffbc7eac3d", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
    " + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from sklearn.linear_model import Lasso\n", + "from sklearn.preprocessing import PolynomialFeatures\n", + "from sklearn.pipeline import make_pipeline\n", + "\n", + "# Generating demo data\n", + "np.random.seed(42)\n", + "x = np.random.normal(0, 1, 20)\n", + "y = -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)\n", + "X = x[:, np.newaxis]\n", + "\n", + "degree = 4 # choosing the same degree as the true model\n", + "lasso_poly = make_pipeline(PolynomialFeatures(degree), Lasso(alpha=0.1, max_iter=10000))\n", + "lasso_poly.fit(X, y)\n", + "\n", + "# Generating points for plotting the regression line\n", + "x_plot = np.linspace(min(x), max(x), 100)\n", + "X_plot = x_plot[:, np.newaxis]\n", + "y_plot = lasso_poly.predict(X_plot)\n", + "\n", + "# Plotting the data points and the regression line\n", + "plt.scatter(x, y, label='Data points')\n", + "plt.plot(x_plot, y_plot, label='Lasso Regression Line', color='red')\n", + "plt.legend()\n", + "plt.xlabel('x')\n", + "plt.ylabel('y')\n", + "plt.title('Lasso Regression with Polynomial Features')\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "e7fa142d-4ff9-42e6-9858-8e8156852e49", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([ 0. 
, -1.55260439, 5.72240286, 2.90811749, -3.66350745])" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "lasso_poly['lasso'].coef_" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "80726256-28a9-4326-8d9d-520162c999a1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.19943027115730638" + ] + }, + "execution_count": 13, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "lasso_poly['lasso'].intercept_" + ] + }, + { + "cell_type": "markdown", + "id": "afcf86f0-ac8c-42f8-9842-ee4e9471c888", + "metadata": {}, + "source": [ + "- **Choosing Degree and $\\lambda$**: The choice of `degree=4` for the polynomial features and `alpha=0.1` for the Lasso regression penalty ($\\lambda$) is somewhat arbitrary here and might need adjustment based on cross-validation to find the optimal model complexity and regularization strength.\n", + "- **Max Iterations**: Increasing `max_iter` in `Lasso()` might be necessary for the algorithm to converge, especially for higher degrees of polynomials or smaller values of `alpha` ($\\lambda$)." + ] + }, + { + "cell_type": "markdown", + "id": "ddf35035-e970-4a46-969a-74eebeda569e", + "metadata": {}, + "source": [ + "## Ridge Regression\n", + "\n", + "Ridge regression adds a penalty equal to the square of the magnitude of coefficients. Coefficients are shrunk toward zero, but unlike Lasso none are set exactly to zero.\n", + "\n", + "The objective function for Ridge regression is:\n", + "\n", + "$ \\text{Minimize: } \\frac{1}{2N} \\sum_{i=1}^{N} (y_i - \\sum_{j=1}^{n} \\beta_j x_{ij})^2 + \\lambda \\sum_{j=1}^{n} \\beta_j^2 $\n", + "\n", + "- Similarly, $N$ and $\\lambda$ have the same definitions as in Lasso.\n", + "- The first term again represents the Mean Squared Error, and the second term is the L2 penalty.\n", + "\n", + "1. 
**Effect of the Penalty**: Ridge regression is particularly useful when dealing with multicollinearity or when you have more predictors than observations.\n", + "\n", + "2. **Scaling Importance**: standardizing the features in Ridge regression is important due to the square of the coefficients being included in the penalty term. Features on larger scales can have disproportionately large effects on the formulation.\n", + "\n", + "3. **Choosing $\\lambda$ for the bias-variance trade-off**: A higher $\\lambda$ increases bias but reduces variance, whereas a lower $\\lambda$ does the opposite. The optimal $\\lambda$ minimizes the mean squared error of predictions.\n", + "\n", + "4. **Computational Aspects**: Ridge regression tends to be computationally more efficient than Lasso for a large number of features, mainly because the solution is obtained through matrix operations that have computationally efficient implementations.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "5c103fb1-7d95-4441-b00a-51035ea53e27", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
    " + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from sklearn.linear_model import Ridge\n", + "from sklearn.preprocessing import PolynomialFeatures\n", + "from sklearn.pipeline import make_pipeline\n", + "\n", + "# Generating demo data using the same snippet\n", + "np.random.seed(42)\n", + "x = np.random.normal(0, 1, 20)\n", + "y = -3.8 * x**4 + 3.4 * x**3 + 6.6 * x**2 - 2.5 * x + np.random.normal(0, 1, 20)\n", + "X = x[:, np.newaxis]\n", + "\n", + "# Using polynomial features again since our relationship is non-linear\n", + "degree = 4\n", + "ridge_poly = make_pipeline(PolynomialFeatures(degree), Ridge(alpha=0.1))\n", + "ridge_poly.fit(X, y)\n", + "\n", + "# Generating points for plotting\n", + "x_plot = np.linspace(min(x), max(x), 100)\n", + "X_plot = x_plot[:, np.newaxis]\n", + "y_plot = ridge_poly.predict(X_plot)\n", + "\n", + "# Plotting\n", + "plt.scatter(x, y, label='Data points')\n", + "plt.plot(x_plot, y_plot, color='red', label='Ridge Regression Line')\n", + "plt.legend()\n", + "plt.xlabel('x')\n", + "plt.ylabel('y')\n", + "plt.title('Ridge Regression with Polynomial Features')\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "ec10b1ed-2cd4-4e2f-856b-dc95c093b7eb", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([ 0. 
, -2.05626925, 6.75667935, 3.06069885, -3.96459941])" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ridge_poly['ridge'].coef_" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "950a5b0b-afeb-4899-8c0a-74bc989e464a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "-0.14654769263455236" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ridge_poly['ridge'].intercept_" + ] + }, + { + "cell_type": "markdown", + "id": "6605fd80-9410-46d4-b054-b06fcd85f4d3", + "metadata": {}, + "source": [ + "## Exercise For The Reader\n", + "\n", + "Lasso and Ridge regression could be applied to sklearn's included [California housing data set](https://scikit-learn.org/stable/datasets/real_world.html#california-housing-dataset).\n", + "\n", + "\n", + "\n", + "* Don't forget to do a test train split.\n", + "* It's probably best to use a scaler.\n", + "* selecting variables is important, but can be thought of as part science and part art. Try a few and see what helps." + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "id": "0a63bf90-e251-4807-9ca6-0952a43d26c4", + "metadata": {}, + "outputs": [], + "source": [ + "# starter code\n", + "from sklearn.datasets import fetch_california_housing\n", + "from sklearn.model_selection import train_test_split\n", + "fetched = fetch_california_housing(as_frame=True)\n", + "X = fetched['data']\n", + "Y = fetched['target']\n", + "\n", + "# Splitting dataset\n", + "X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.2, random_state=42)" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "id": "0fd6514b-3031-41a2-b2da-9aef3cb508ea", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
    \n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    MedIncHouseAgeAveRoomsAveBedrmsPopulationAveOccupLatitudeLongitude
    08.325241.06.9841271.023810322.02.55555637.88-122.23
    18.301421.06.2381370.9718802401.02.10984237.86-122.22
    27.257452.08.2881361.073446496.02.80226037.85-122.24
    35.643152.05.8173521.073059558.02.54794537.85-122.25
    43.846252.06.2818531.081081565.02.18146737.85-122.25
    \n", + "
    " + ], + "text/plain": [ + " MedInc HouseAge AveRooms AveBedrms Population AveOccup Latitude \\\n", + "0 8.3252 41.0 6.984127 1.023810 322.0 2.555556 37.88 \n", + "1 8.3014 21.0 6.238137 0.971880 2401.0 2.109842 37.86 \n", + "2 7.2574 52.0 8.288136 1.073446 496.0 2.802260 37.85 \n", + "3 5.6431 52.0 5.817352 1.073059 558.0 2.547945 37.85 \n", + "4 3.8462 52.0 6.281853 1.081081 565.0 2.181467 37.85 \n", + "\n", + " Longitude \n", + "0 -122.23 \n", + "1 -122.22 \n", + "2 -122.24 \n", + "3 -122.25 \n", + "4 -122.25 " + ] + }, + "execution_count": 29, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "X.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "id": "52b11cb7-455a-4a6d-935b-33d801df9ad0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
    Pipeline(steps=[('polynomialfeatures', PolynomialFeatures(degree=8)),\n",
    +       "                ('standardscaler', StandardScaler()),\n",
    +       "                ('ridge', Ridge(alpha=0.1))])
    In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
    On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
    " + ], + "text/plain": [ + "Pipeline(steps=[('polynomialfeatures', PolynomialFeatures(degree=8)),\n", + " ('standardscaler', StandardScaler()),\n", + " ('ridge', Ridge(alpha=0.1))])" + ] + }, + "execution_count": 58, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# model configuration\n", + "from sklearn.preprocessing import StandardScaler\n", + "\n", + "degrees = 8\n", + "ridge_poly = make_pipeline(PolynomialFeatures(degrees), StandardScaler(), Ridge(alpha=0.1))\n", + "ridge_poly.fit(X_train, Y_train)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "id": "4d97f8a1-f718-40f6-90b8-c1ab3a477662", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "MSE: 620.2980353830641\n", + "R-squared: -472.3621683634644\n" + ] + } + ], + "source": [ + "from sklearn.metrics import mean_squared_error, r2_score\n", + "\n", + "# Making predictions\n", + "predictions = ridge_poly.predict(X_test)\n", + "\n", + "# Evaluation\n", + "mse = mean_squared_error(Y_test, predictions)\n", + "r2 = r2_score(Y_test, predictions)\n", + "\n", + "print(f'MSE: {mse}')\n", + "print(f'R-squared: {r2}')" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "id": "e4df6f54-b6a6-40ff-8849-f5a9ca2ff290", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Input data:\n", + " MedInc HouseAge AveRooms AveBedrms Population AveOccup Latitude \\\n", + "20046 1.6812 25.0 4.192201 1.022284 1392.0 3.877437 36.06 \n", + "\n", + " Longitude \n", + "20046 -119.01 \n", + "\n", + "Median house value: $47.70k\n", + "Predicted value: $70.53k\n" + ] + } + ], + "source": [ + "# examine the concrete results of the model - prediction vs test data's label\n", + "# the dataset provides home values in fractions of $100,000, so we convert the prediction to real dollars.\n", + "print(f\"\"\"Input data:\n", + "{X_test[:1]}\n", + "\n", + "Median house value: ${Y_test.iloc[0] * 
100:.2f}k\n", + "Predicted value: ${predictions[0] * 100:.2f}k\"\"\")" + ] + }, + { + "cell_type": "markdown", + "id": "65e80f87-06a3-4416-83e0-cd06078c6703", + "metadata": {}, + "source": [ + "Can you improve it with data preprocessing or altering the model parameters?\n", + "\n", + "Have fun!" + ] + }, + { + "cell_type": "markdown", + "id": "27de40d2-56fd-482f-bc79-6c31ab056d3c", + "metadata": {}, + "source": [ + "## Additional Resources\n", + "\n", + "- **Resource 1:** [Advanced Linear Regression With Python](https://realpython.com/linear-regression-in-python/#polynomial-regression) (Guide on polynomial regression, Lasso, and Ridge regression in Python)\n", + "- **Resource 2:** [Machine Learning: Polynomial Regression with Python](https://towardsdatascience.com/machine-learning-polynomial-regression-with-python-5328e4e8a386) (Tutorial on polynomial regression and its application in Python)" ] }, { "cell_type": "code", "execution_count": null, - "id": "780f47fd-0028-4f64-8cd3-cef867bcb2b2", + "id": "6328b773-d5f0-4c16-88e5-201cdf8068e4", "metadata": {}, "outputs": [], "source": [] diff --git a/_sources/Week_05/Lesson_24.ipynb b/_sources/Week_05/Lesson_24.ipynb deleted file mode 100644 index 56cf18e..0000000 --- a/_sources/Week_05/Lesson_24.ipynb +++ /dev/null @@ -1,53 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "d042b09f-5dbb-4492-b635-efaf72f2430a", - "metadata": {}, - "source": [ - "# Outline Only - **Lesson 24:** Regression Model Evaluation Metrics in Python - Key metrics for evaluating regression models.\n", - "Math Focus: Mean Squared Error (MSE), Root Mean Squared Error (RMSE), and R-squared.\n", - "- **Theoretical Concepts:**\n", - " - Importance of model evaluation in regression analysis.\n", - " - Overview of key metrics: MSE, RMSE, and R-squared.\n", - "- **Mathematical Foundation:**\n", - " - Formulas and interpretation of MSE, RMSE, and R-squared.\n", - " - Understanding the significance of these metrics in model performance.\n", - 
"- **Python Implementation:**\n", - " - Calculating MSE, RMSE, and R-squared using scikit-learn.\n", - " - Visualizing residuals to understand model performance.\n", - "- **Example Dataset:**\n", - " - Use datasets from previous lessons for consistency in evaluation." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "b1004f48-41e2-48b4-9803-6b5d575d639b", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.11.6" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/_sources/Week_05/Lesson_25.ipynb b/_sources/Week_05/Lesson_25.ipynb deleted file mode 100644 index 8d4973d..0000000 --- a/_sources/Week_05/Lesson_25.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "3f3fb1e7-ba4e-4da8-b4ec-d8a9688f1ae3", - "metadata": {}, - "source": [ - "# Outline Only - **Lesson 25:** Addressing Overfitting and Underfitting in Regression Models \n", - "Strategies to combat overfitting and underfitting in regression. 
- Math Focus: Bias-variance tradeoff and regularization methods.\n", - "- **Theoretical Concepts:**\n", - " - Identifying symptoms of overfitting and underfitting in regression models.\n", - " - Strategies to combat overfitting and underfitting.\n", - "- **Mathematical Foundation:**\n", - " - Bias-variance tradeoff.\n", - " - Regularization methods and their mathematical basis.\n", - "- **Python Implementation:**\n", - " - Demonstrating overfitting and underfitting using matplotlib.\n", - " - Implementing regularization techniques in Python.\n", - " - Using validation curves and learning curves for model diagnostics.\n", - "- **Example Dataset:**\n", - " - A dataset with a clear overfitting/underfitting tendency (e.g., high-dimensional data)." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "fd7b23be-578e-456b-a1ad-0cd8f56cceef", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.11.6" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/genindex.html b/genindex.html index a26bae6..db4e119 100644 --- a/genindex.html +++ b/genindex.html @@ -256,6 +256,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/index.html b/index.html index b8e7e1e..bedc41d 100644 --- a/index.html +++ b/index.html @@ -258,6 +258,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/objects.inv b/objects.inv index f79226f..71c03a9 100644 Binary files a/objects.inv and b/objects.inv differ diff --git a/search.html b/search.html index 9e1e5c4..1b6aedb 100644 --- a/search.html +++ b/search.html @@ -258,6 +258,7 @@
  • Day 21 - Introduction to Regression Analysis in Python
  • Day 22: Implementing Multiple Linear Regression in Python
  • +
  • Day 23 - Advanced Regression Techniques - Polynomial, Lasso, and Ridge Regression
  • diff --git a/searchindex.js b/searchindex.js index a8bba31..e976b77 100644 --- a/searchindex.js +++ b/searchindex.js @@ -1 +1 @@ -Search.setIndex({"docnames": ["Week_00/00_Overview", "Week_00/00a_DailyChallenge", "Week_00/00b_DailyResources", "Week_00/01_Errata", "Week_01/001_Overview", "Week_01/Lesson_01", "Week_01/Lesson_02", "Week_01/Lesson_03", "Week_01/Lesson_04", "Week_01/Lesson_05", "Week_02/002_Overview", "Week_02/Lesson_06", "Week_02/Lesson_07", "Week_02/Lesson_08", "Week_02/Lesson_09", "Week_02/Lesson_10", "Week_03/003_Overview", "Week_03/Lesson_11", "Week_03/Lesson_12", "Week_03/Lesson_12solution", "Week_03/Lesson_13", "Week_03/Lesson_14", "Week_03/Lesson_15", "Week_04/004_Overview", "Week_04/Lesson_16", "Week_04/Lesson_17", "Week_04/Lesson_18", "Week_04/Lesson_19", "Week_04/Lesson_20", "Week_05/005_Overview", "Week_05/Lesson_21", "Week_05/Lesson_22", "index"], "filenames": ["Week_00/00_Overview.md", "Week_00/00a_DailyChallenge.md", "Week_00/00b_DailyResources.md", "Week_00/01_Errata.md", "Week_01/001_Overview.md", "Week_01/Lesson_01.ipynb", "Week_01/Lesson_02.ipynb", "Week_01/Lesson_03.ipynb", "Week_01/Lesson_04.ipynb", "Week_01/Lesson_05.ipynb", "Week_02/002_Overview.md", "Week_02/Lesson_06.ipynb", "Week_02/Lesson_07.ipynb", "Week_02/Lesson_08.ipynb", "Week_02/Lesson_09.ipynb", "Week_02/Lesson_10.ipynb", "Week_03/003_Overview.md", "Week_03/Lesson_11.ipynb", "Week_03/Lesson_12.ipynb", "Week_03/Lesson_12solution.ipynb", "Week_03/Lesson_13.ipynb", "Week_03/Lesson_14.ipynb", "Week_03/Lesson_15.ipynb", "Week_04/004_Overview.md", "Week_04/Lesson_16.ipynb", "Week_04/Lesson_17.ipynb", "Week_04/Lesson_18.ipynb", "Week_04/Lesson_19.ipynb", "Week_04/Lesson_20.ipynb", "Week_05/005_Overview.md", "Week_05/Lesson_21.ipynb", "Week_05/Lesson_22.ipynb", "index.rst"], "titles": ["100 Days of Machine Learning Challenge", "Daily Challenge Curriculum", "Daily Curriculum Resources", "Errata", "Course Structure", "Day 1: Python Basics - Syntax, Variables", "Day 2: Python 
Data Types", "Day 3: Control Structures - Loops", "Day 4: Control Structures - Conditionals", "Day 5: Functions and Modules", "Course Structure", "Day 6: Linear Algebra - Vector Operations in Python", "Day 7: Linear Algebra - Matrices and Matrix Operations", "Day 8: Calculus - Derivatives, Concept and Applications", "Day 9: Calculus - Integrals, Fundamental Theorems, and Applications in Machine Learning", "Day 10: Probability and Statistics - Basic Concepts, Relevant Distributions - Expanded", "Course Structure", "Day 11: Introduction to Data Preprocessing in Python", "Day 12: In-Depth Exploration of Data Splitting Techniques in Python with Cross-Validation", "Day 12: In-Depth Exploration of Data Splitting Techniques - Solution", "Day 13: Advanced Techniques for Handling Missing Data in Python", "Day 14: Data Normalization and Scaling using Python", "Day 15: Encoding Categorical Data in Python - Expanded with Mathematical Implications", "Course Structure", "Day 16: Comprehensive EDA and Data Visualization in Python", "Day 17: In-Depth EDA and Central Tendency in Python", "Day 18: In-Depth Analysis of Histograms and Box Plots in Python", "Day 19: Correlation Analysis using Python", "Day 20: Advanced Feature Selection and Importance in Python - With Iris Dataset", "Course Structure", "Day 21 - Introduction to Regression Analysis in Python", "Day 22: Implementing Multiple Linear Regression in Python", "100 Days of Machine Learning Challenge"], "terms": {"welcom": [0, 6, 32], "comprehens": [0, 1, 2, 12, 18, 19, 27, 28, 30, 31, 32], "journei": [0, 5, 6, 13, 28, 32], "world": [0, 1, 2, 6, 9, 14, 20, 30, 32], "tailor": [0, 2, 32], "divers": [0, 2, 6, 9, 12, 19, 32], "audienc": [0, 32], "includ": [0, 1, 2, 5, 9, 11, 12, 13, 14, 15, 18, 20, 21, 22, 24, 26, 28, 29, 30, 31, 32], "aspir": [0, 32], "scientist": [0, 30], "profession": [0, 32], "relat": [0, 1, 2, 9, 12, 19, 20, 27, 32], "field": [0, 2, 12, 13, 15, 30, 31, 32], "enthusiast": [0, 32], "thi": [0, 2, 5, 6, 7, 9, 11, 
12, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "program": [0, 1, 2, 4, 5, 6, 8, 10, 11, 13, 14, 15, 18, 32], "design": [0, 9, 11, 13, 17, 28, 32], "individu": [0, 2, 5, 26, 27, 32], "high": [0, 1, 2, 9, 17, 19, 26, 27, 28, 31, 32], "colleg": [0, 2, 32], "level": [0, 9, 15, 17, 19, 22, 24, 26, 27, 32], "algebra": [0, 1, 4, 10, 13, 14, 15, 21, 24, 25, 32], "knowledg": [0, 1, 2, 11, 13, 14, 18, 20, 22, 24, 27, 28, 32], "It": [0, 2, 5, 6, 7, 8, 9, 11, 12, 13, 15, 18, 19, 20, 21, 25, 27, 28, 30, 31, 32], "offer": [0, 2, 12, 15, 32], "well": [0, 2, 11, 18, 19, 26, 27, 28, 30, 32], "round": [0, 2, 9, 19, 20, 32], "educ": [0, 1, 22, 32], "experi": [0, 1, 5, 15, 28, 32], "through": [0, 1, 2, 4, 5, 6, 7, 8, 13, 20, 21, 22, 25, 26, 30, 32], "video": [0, 2, 12, 32], "lectur": [0, 12, 32], "question": [0, 7, 9, 17, 32], "hand": [0, 1, 2, 9, 28, 30, 32], "tutori": [0, 2, 5, 18, 26, 32], "focu": [0, 1, 2, 4, 5, 10, 16, 23, 24, 26, 29, 30, 32], "topic": [0, 4, 10, 16, 23, 29, 32], "syntax": [0, 1, 4, 6, 8, 10, 11, 32], "linear": [0, 1, 4, 9, 10, 19, 20, 21, 24, 25, 27, 28, 29, 32], "calculu": [0, 1, 4, 10, 29, 32], "statist": [0, 1, 4, 10, 14, 16, 18, 23, 25, 27, 28, 30, 31, 32], "method": [0, 7, 9, 13, 15, 16, 17, 18, 21, 23, 24, 26, 27, 29, 31, 32], "visual": [0, 1, 13, 14, 15, 16, 17, 23, 26, 28, 32], "descript": [0, 1, 12, 16, 19, 23, 25, 32], "algorithm": [0, 1, 7, 11, 12, 13, 14, 18, 21, 28, 29, 30, 31, 32], "decis": [0, 1, 6, 8, 13, 15, 17, 20, 26, 29, 32], "tree": [0, 1, 13, 28, 29, 31, 32], "svm": [0, 1, 13, 29, 32], "techniqu": [0, 1, 14, 15, 16, 23, 29, 30, 31, 32], "reduc": [0, 1, 2, 18, 22, 28, 30, 32], "complex": [0, 1, 2, 5, 7, 8, 9, 11, 18, 20, 24, 28, 31, 32], "cluster": [0, 1, 11, 19, 25, 32], "gaussian": [0, 1, 15, 21, 32], "mixtur": [0, 1, 32], "model": [0, 1, 5, 9, 11, 13, 14, 15, 21, 22, 27, 28, 29, 32], "pca": [0, 1, 32], "t": [0, 1, 5, 6, 9, 12, 13, 15, 19, 20, 22, 24, 26, 27, 28, 30, 31, 32], "sne": [0, 1, 32], "core": [0, 1, 2, 15, 
17, 19, 28, 32], "concept": [0, 5, 6, 8, 11, 12, 16, 18, 21, 22, 24, 25, 29, 32], "architectur": [0, 1, 32], "neural": [0, 11, 13, 14, 21, 31, 32], "network": [0, 11, 13, 14, 21, 31, 32], "cnn": [0, 32], "rnn": [0, 32], "imag": [0, 1, 11, 12, 32], "sequenc": [0, 1, 4, 5, 7, 32], "process": [0, 7, 9, 11, 12, 17, 18, 19, 20, 22, 28, 30, 32], "emerg": [0, 1, 32], "reinforc": [0, 7, 32], "transfer": [0, 1, 32], "gan": [0, 1, 32], "attent": [0, 1, 32], "mechan": [0, 1, 11, 12, 20, 32], "operation": [0, 1, 2, 32], "understand": [0, 1, 4, 5, 6, 8, 10, 11, 14, 16, 18, 19, 23, 24, 25, 29, 30, 32], "transform": [0, 11, 12, 18, 19, 21, 22, 26, 28, 31, 32], "mlop": [0, 32], "etl": [0, 32], "applic": [0, 6, 10, 12, 15, 17, 18, 20, 24, 26, 28, 29, 32], "variou": [0, 1, 2, 11, 12, 13, 14, 15, 17, 19, 20, 22, 23, 28, 30, 32], "industri": [0, 32], "healthcar": [0, 1, 31, 32], "financ": [0, 1, 17, 31, 32], "retail": [0, 1, 32], "manufactur": [0, 1, 32], "build": [0, 1, 5, 7, 9, 11, 19, 20, 28, 32], "evalu": [0, 1, 5, 6, 8, 9, 13, 14, 19, 21, 22, 25, 27, 28, 29, 32], "connect": [0, 1, 2, 14], "learner": 0, "expert": [0, 20], "share": [0, 9], "your": [0, 2, 6, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 30, 31], "insight": [0, 1, 2, 17, 19, 20, 22, 24, 25, 26, 27, 31], "particip": 0, "discuss": [0, 2, 24, 26, 27, 30], "collabor": 0, "start": [0, 2, 5, 7, 9, 12, 24, 30], "date": [0, 5, 9, 17], "januari": 0, "1st": [0, 22], "2024": [0, 9], "twitter": [0, 32], "100daysml": [0, 32], "reddit": [0, 32], "r": [0, 1, 2, 9, 11, 15, 27, 28, 29, 30, 31, 32], "discord": [0, 32], "us": [0, 1, 4, 5, 6, 7, 8, 9, 10, 11, 12, 15, 16, 18, 19, 22, 23, 24, 25, 26, 31, 32], "websit": [0, 2, 32], "http": [0, 2, 5, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "www": [0, 2, 5, 15, 17, 18, 20, 21, 22, 25, 26, 27, 28, 31, 32], "100daysofml": [0, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 32], "com": [0, 2, 5, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 32], "we": [0, 5, 
6, 9, 11, 12, 13, 15, 20, 21, 25, 26, 27, 28, 30, 31], "ar": [0, 2, 5, 6, 7, 8, 9, 11, 12, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "excit": 0, "embark": [0, 20, 21, 27, 28], "explor": [0, 1, 2, 4, 6, 10, 13, 14, 15, 16, 22, 23, 25, 26, 27, 29, 30, 31], "discoveri": 0, "you": [0, 2, 5, 6, 7, 9, 11, 12, 13, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "let": [0, 5, 9, 11, 12, 13, 14, 15, 20, 26, 28, 30, 31], "s": [0, 2, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 21, 22, 24, 25, 26, 30, 31], "grow": 0, "togeth": [0, 12], "skill": [1, 6, 8, 13, 15, 20, 21, 22, 24, 25, 26, 28, 30], "type": [1, 4, 5, 9, 12, 15, 16, 19, 23, 24, 25, 26, 28, 30], "control": [1, 4, 6, 12], "structur": [1, 5, 11, 12, 20, 22, 24, 26], "dai": [1, 4, 10, 16, 23, 29], "variabl": [1, 4, 6, 7, 9, 12, 17, 18, 19, 21, 22, 24, 26, 27, 28, 30, 31], "assign": [1, 2, 4, 5, 8, 9, 12, 21, 28], "math": [1, 2, 4, 7, 9, 10, 15, 16, 18, 23, 29], "arithmet": [1, 2, 4, 6, 17], "differ": [1, 4, 5, 6, 7, 8, 9, 11, 12, 15, 19, 20, 22, 24, 25, 26, 27, 28, 31], "logic": [1, 2, 4, 5, 8, 22], "calcul": [1, 2, 4, 7, 9, 10, 11, 14, 17, 18, 24, 25, 27, 28, 30], "loop": [1, 4, 5, 6, 8, 9, 25, 30], "construct": [1, 4, 26, 28, 30], "while": [1, 2, 4, 5, 9, 11, 13, 17, 19, 20, 22, 24, 27, 28, 30], "condit": [1, 4, 5, 6, 7, 9, 11, 13, 30], "statement": [1, 4, 5, 6, 12], "elif": [1, 2, 4, 7, 8, 9], "els": [1, 2, 4, 8, 9, 15, 28], "flow": [1, 4], "implement": [1, 4, 10, 16, 18, 19, 23, 24, 25, 29], "function": [1, 4, 5, 6, 7, 14, 17, 20, 21, 27, 28, 29, 30], "defin": [1, 2, 4, 5, 7, 8, 9, 12, 14, 20, 22, 24, 28], "write": [1, 4, 5, 6, 7, 8, 12, 24, 25, 27], "formula": [1, 4, 11, 12, 17, 18, 21, 22, 25, 27, 30], "vector": [1, 10, 12, 13, 31], "work": [1, 2, 5, 7, 10, 12, 13, 20, 21], "perform": [1, 6, 9, 10, 11, 12, 14, 15, 17, 18, 21, 22, 24, 25, 26, 27, 28, 30, 31], "matric": [1, 10, 11, 22, 24], "matrix": [1, 9, 10, 18, 24], "deriv": [1, 10, 14, 31], "integr": [1, 10], "fundament": [1, 6, 7, 8, 10, 
11, 12, 13, 15, 26, 28, 29, 30], "theorem": [1, 10, 18], "simpl": [1, 2, 7, 10, 11, 18, 21, 24, 29, 31], "probabl": [1, 5, 10, 14, 18, 25, 28], "relev": [1, 9, 10, 11, 17, 19], "distribut": [1, 10, 11, 12, 14, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 31], "prepar": [1, 2, 17, 20, 21, 22, 28], "import": [1, 5, 7, 12, 14, 16, 18, 19, 20, 22, 23, 24, 25, 26, 27, 31], "scale": [1, 11, 16, 18, 19, 20, 28, 31], "split": [1, 12, 13, 16, 28, 31], "train": [1, 11, 13, 16, 17, 19, 22, 28, 31], "test": [1, 5, 6, 7, 8, 15, 16, 19, 22, 27, 31], "set": [1, 7, 15, 16, 17, 18, 19, 22, 25, 27, 28, 30, 31], "random": [1, 7, 9, 12, 15, 16, 18, 30], "sampl": [1, 2, 9, 15, 16, 17, 18, 19, 26, 27, 28, 30], "stratifi": [1, 2, 16, 30], "principl": [1, 2, 14, 16, 20, 21, 24], "handl": [1, 8, 9, 11, 12, 16, 17, 18, 19, 21, 28, 30, 31], "miss": [1, 16, 17, 18, 19, 21, 24, 28, 31], "detect": [1, 16, 17, 18, 21, 28, 31], "imput": [1, 2, 16, 17], "rational": [1, 2, 16, 20, 21, 22], "normal": [1, 11, 15, 16, 17, 18, 19, 20, 24, 27, 28, 31], "about": [1, 2, 7, 9, 13, 15, 16, 18, 19, 20, 21, 22, 24, 26, 27, 28, 30, 31], "featur": [1, 5, 6, 9, 11, 13, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 30, 31], "z": [1, 2, 9, 11, 12, 16, 17, 30], "score": [1, 2, 9, 16, 17, 18, 26, 28, 31], "min": [1, 2, 16, 17, 19, 22, 28], "max": [1, 2, 16, 17, 19, 22], "encod": [1, 16, 18, 19, 21, 31], "categor": [1, 8, 16, 17, 18, 19, 20, 21, 25, 28, 30, 31], "binari": [1, 2, 9, 16, 18], "one": [1, 2, 6, 7, 8, 9, 11, 16, 17, 18, 19, 22, 26, 27, 28, 30, 31], "hot": [1, 2, 8, 16, 31], "label": [1, 2, 13, 14, 16, 18, 20, 21, 24, 26, 28, 30, 31], "implic": [1, 2, 16, 21, 24, 25, 26], "graphic": [1, 17, 23, 30], "represent": [1, 2, 12, 14, 18, 19, 21, 22, 23, 24, 26], "measur": [1, 2, 9, 11, 13, 15, 17, 18, 19, 23, 24, 27, 28, 30, 31], "central": [1, 2, 15, 18, 20, 21, 23, 26], "tendenc": [1, 2, 15, 20, 21, 23, 24, 26], "dispers": [1, 2, 15, 17, 19, 23, 26], "creat": [1, 2, 5, 6, 7, 8, 9, 17, 19, 20, 22, 23, 24, 25, 30], 
"plot": [1, 2, 5, 13, 14, 15, 17, 18, 19, 21, 22, 23, 27, 28, 30, 31], "histogram": [1, 2, 21, 22, 23, 31], "box": [1, 2, 17, 21, 23, 25], "correl": [1, 21, 22, 23, 24, 25, 28, 31], "its": [1, 2, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 23, 24, 28, 30, 31], "coeffici": [1, 2, 9, 23, 28, 29, 30, 31], "interpret": [1, 2, 5, 8, 13, 15, 21, 22, 23, 24, 25, 27, 29, 30, 31], "select": [1, 9, 13, 18, 20, 21, 23, 24, 27, 30], "inform": [1, 2, 9, 13, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26], "gain": [1, 2, 19, 23, 24, 25, 26, 27], "gini": [1, 2, 23], "impur": [1, 2, 23], "metric": [1, 18, 19, 20, 22, 23, 28, 29], "kei": [1, 2, 5, 7, 8, 12, 17, 18, 19, 20, 21, 25, 26, 28, 29, 30], "equat": [1, 2, 9, 11, 12, 29], "fit": [1, 2, 18, 19, 20, 21, 22, 28, 29, 31], "22": [1, 7, 8, 9, 12, 17, 20, 21, 22, 29], "multipl": [1, 5, 7, 8, 9, 13, 20, 28, 29], "multivari": [1, 2, 29], "23": [1, 8, 9, 17, 29], "polynomi": [1, 29], "lasso": [1, 29], "ridg": [1, 20, 29], "regular": [1, 2, 11, 14, 29, 31], "24": [1, 7, 8, 9, 12, 17, 29], "mean": [1, 6, 7, 9, 11, 12, 13, 15, 17, 18, 19, 20, 21, 22, 26, 27, 28, 29, 30, 31], "squar": [1, 2, 9, 12, 19, 24, 28, 29, 31], "error": [1, 2, 5, 6, 7, 9, 17, 18, 19, 24, 28, 29, 30, 31], "mse": [1, 2, 9, 29, 31], "root": [1, 2, 29, 31], "rmse": [1, 2, 29, 31], "25": [1, 5, 6, 7, 8, 9, 12, 13, 15, 17, 19, 21, 22, 29, 30, 31], "address": [1, 9, 29, 31], "overfit": [1, 14, 20, 22, 28, 29], "underfit": [1, 29], "strategi": [1, 2, 28, 29, 31], "combat": [1, 2, 29], "bia": [1, 18, 20, 29], "varianc": [1, 2, 15, 18, 20, 21, 22, 25, 26, 28, 29, 30, 31], "tradeoff": [1, 2, 29], "26": [1, 8, 9, 14, 17, 19], "logist": [1, 20, 21, 30], "27": [1, 8, 17, 20, 21, 22], "k": [1, 11, 12, 13, 18, 20, 21, 28], "nearest": [1, 20, 21], "neighbor": [1, 20, 21], "nn": 1, "distanc": [1, 2, 11, 13, 20, 30], "euclidean": [1, 2, 20], "manhattan": [1, 2], "28": [1, 8, 17, 19], "support": [1, 7, 9, 19, 24, 31], "nonlinear": 1, "both": [1, 2, 6, 7, 8, 9, 11, 13, 17, 18, 19, 
24, 27, 28, 30, 31], "nonlinearli": 1, "separ": [1, 2, 5, 9, 12, 19, 28, 31], "hyperplan": [1, 2], "margin": [1, 2, 13, 28], "maxim": [1, 24], "kernel": [1, 2, 7, 9, 24], "trick": 1, "29": [1, 7, 8, 17, 19], "rule": [1, 6, 11, 26], "base": [1, 5, 7, 8, 9, 11, 12, 15, 18, 24, 25, 28, 30, 31], "entropi": [1, 2], "30": [1, 6, 8, 9, 12, 15, 17, 21], "naiv": [1, 21], "bay": [1, 21], "classifi": [1, 19, 20, 22, 28], "context": [1, 2, 17, 19, 20, 25, 27, 28, 31], "31": [1, 8, 9, 12, 17, 21, 25], "overview": [1, 24], "combin": [1, 2, 5, 6, 19, 20, 22, 24, 26, 28, 31], "weight": [1, 2, 13, 19, 22, 30], "averag": [1, 2, 9, 13, 15, 17, 19, 20, 30, 31], "32": [1, 8, 12, 17, 19, 21], "bag": 1, "forest": 1, "bootstrap": [1, 2], "role": [1, 2, 7, 11, 12, 13, 14, 17, 20], "33": [1, 9, 12, 17], "boost": 1, "adaboost": 1, "updat": [1, 2, 9, 13, 18, 19], "34": [1, 8, 9, 17, 19, 20, 21, 22], "gradient": [1, 11, 13, 14], "gbm": 1, "xgboost": 1, "descent": [1, 2, 11, 13], "35": [1, 9, 17, 21], "Their": [1, 9, 11, 13], "stack": [1, 2], "blend": [1, 2, 24], "36": [1, 12, 17, 21], "37": [1, 8, 9, 17], "dataset": [1, 2, 7, 17, 24, 25, 31], "centroid": [1, 2], "converg": [1, 2, 11, 21, 31], "criteria": [1, 2, 6, 28], "38": [1, 8, 12, 17, 19], "hierarch": 1, "dendrogram": [1, 2], "linkag": [1, 2], "39": [1, 17, 19, 21], "densiti": [1, 15, 19, 21, 24, 25, 26], "dbscan": 1, "40": [1, 8, 17, 19, 24], "gmm": 1, "expect": [1, 14, 30], "41": [1, 8, 17], "princip": [1, 2], "compon": [1, 2, 11, 30], "covari": [1, 2], "eigenvalu": [1, 2, 11, 12], "eigenvector": [1, 2, 11], "42": [1, 8, 9, 17, 18, 19, 21, 28, 30, 31], "step": [1, 2, 5, 7, 9, 14, 27, 31], "involv": [1, 2, 13, 19, 20, 28, 30], "comput": [1, 2, 5, 9, 12, 13, 14, 17, 19, 20, 28, 30], "43": [1, 8, 12, 17], "singular": 1, "valu": [1, 5, 6, 7, 8, 11, 13, 14, 15, 17, 18, 20, 21, 22, 24, 26, 27, 28, 30, 31], "decomposit": 1, "svd": 1, "Its": 1, "44": [1, 8, 9, 17, 19], "stochast": [1, 2, 11], "embed": [1, 2], "45": [1, 12, 17, 19, 24], "other": 
[1, 5, 6, 7, 9, 11, 12, 13, 15, 17, 19, 20, 21, 22, 24, 25, 27, 28, 30, 31], "addit": [1, 2, 5, 6, 7, 9, 13, 19], "like": [1, 2, 5, 6, 7, 9, 11, 12, 13, 15, 17, 18, 19, 20, 22, 24, 26, 27, 28, 30, 31], "lda": [1, 2], "autoencod": 1, "behind": [1, 2, 9, 18, 20], "case": [1, 8, 9, 12, 13, 17, 19, 20, 21, 22, 25, 30], "46": [1, 8, 9, 17], "perceptron": 1, "activ": [1, 8, 14, 18, 20], "47": [1, 8, 9, 17, 20, 21, 22, 28], "feedforward": 1, "layer": [1, 25], "neuron": [1, 2], "48": [1, 12, 17, 31], "backpropag": [1, 13, 14], "dive": [1, 2, 15], "The": [1, 2, 5, 6, 8, 9, 11, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30], "chain": [1, 2, 6, 20, 21], "49": [1, 8, 17], "loss": [1, 9, 14], "optim": [1, 6, 11, 13, 14, 30], "focus": [1, 2, 5, 12, 18, 19, 20, 22, 26], "50": [1, 6, 8, 9, 12, 17, 19, 21, 22, 26], "tune": [1, 19, 28], "improv": [1, 2, 8, 9, 17, 19, 21, 24, 28], "hyperparamet": [1, 2, 28], "avoid": [1, 2, 6, 7, 9, 11, 18, 19, 20, 21, 22, 24, 27], "51": [1, 17, 19], "map": [1, 2], "gener": [1, 7, 9, 13, 14, 15, 18, 19, 28, 30, 31], "52": [1, 8, 12, 17, 19], "pool": 1, "spatial": [1, 2], "effect": [1, 2, 7, 9, 11, 12, 13, 18, 20, 24, 25, 26, 28, 30, 31], "53": [1, 8, 12, 17], "task": [1, 2, 5, 8, 11, 12, 18, 20, 21, 25, 27, 30], "filter": [1, 2], "54": [1, 12, 17, 19], "enhanc": [1, 2, 8, 11, 13, 17, 18, 19, 21, 26, 28], "dropout": [1, 2], "batch": [1, 2], "basi": [1, 2, 17, 30], "55": [1, 17, 21], "fine": [1, 2, 28], "extract": [1, 15, 26], "56": [1, 8, 17, 19], "uniqu": [1, 2, 5, 22, 28], "57": [1, 6, 12, 17, 19], "long": [1, 5, 7, 11, 17], "short": [1, 6, 8], "term": [1, 6, 13, 14, 22, 27, 31], "memori": [1, 17, 19], "lstm": 1, "cell": [1, 2, 5, 7, 9, 19, 22, 24], "depend": [1, 2, 5, 7, 8, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30, 31], "58": [1, 8, 12, 17, 19, 21], "time": [1, 7, 9, 12, 13, 15, 17, 18, 20, 24, 30], "59": [1, 8, 12, 17], "seri": [1, 5, 7, 9, 18, 20, 21, 24, 28, 30, 31], "forecast": [1, 2, 30], "60": [1, 6, 8, 12, 17, 19], "util": [1, 9, 11, 13, 
20, 24, 30, 31], "natur": [1, 5, 7, 11, 15, 20, 22, 27, 30, 31], "languag": [1, 5, 7, 9, 11], "nlp": [1, 11], "word": [1, 2, 6, 9, 11], "space": [1, 2, 5, 11, 15, 22, 30], "61": [1, 8, 17], "framework": [1, 2, 15], "reward": [1, 2], "make": [1, 5, 6, 7, 8, 9, 11, 12, 13, 15, 17, 20, 22, 24, 25, 26, 30, 31], "62": [1, 8, 17, 20, 21, 22], "markov": 1, "mdp": [1, 2], "rl": 1, "transit": [1, 2], "state": [1, 2, 6, 12, 13, 22, 24], "63": [1, 17], "q": [1, 20, 21, 22], "bellman": [1, 2], "estim": [1, 2, 17, 19, 20, 24, 28, 30, 31], "64": [1, 8, 17], "dqn": 1, "environ": [1, 2, 18, 19, 20], "65": [1, 6, 12, 17, 19], "polici": [1, 18], "ascent": [1, 2], "66": [1, 17], "depth": [1, 27, 28], "67": [1, 8, 17, 19], "adversari": 1, "minimax": [1, 2], "game": [1, 2, 11], "theori": [1, 2, 12, 18, 28], "68": [1, 8, 12, 19], "self": [1, 7, 9], "69": [1, 17], "more": [1, 2, 5, 7, 8, 9, 11, 12, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 30, 31], "reconstruct": [1, 2], "latent": [1, 2], "70": [1, 6, 19], "research": 1, "ml": [1, 13, 14, 18, 32], "aih": 1, "latest": [1, 2, 5], "artifici": [1, 2, 11, 20, 22], "intellig": [1, 2, 11], "technolog": 1, "71": [1, 8, 19], "lifecycl": 1, "72": [1, 12, 19], "version": [1, 5], "track": [1, 9, 20], "73": [1, 8], "ci": 1, "cd": 1, "continu": [1, 2, 5, 9, 12, 13, 14, 17, 20, 22, 27, 28, 30, 31], "deliveri": 1, "autom": [1, 2, 7, 11], "valid": [1, 2, 9, 13, 21, 28, 31], "74": [1, 8], "monitor": 1, "mainten": 1, "maintain": [1, 5, 7, 20], "product": [1, 2], "anomali": [1, 2, 20], "drift": [1, 2], "behavior": [1, 2, 6, 9, 13, 20, 21], "75": [1, 17, 19, 21, 22, 31], "tool": [1, 5, 11, 13, 17, 24, 25, 26, 27, 30, 31], "platform": [1, 5], "scalabl": [1, 2], "effici": [1, 2, 7, 8, 9, 11, 13, 17, 18, 22, 28], "76": [1, 8, 12, 19, 21, 22], "load": [1, 9, 11, 17, 19, 24, 25, 26, 27, 28, 31], "queri": [1, 2], "77": [1, 8, 12], "approach": [1, 2, 6, 19, 28, 31], "78": [1, 12, 19], "databas": 1, "manag": [1, 9, 22], "phase": 1, "balanc": [1, 2, 18, 19, 
28], "79": [1, 8], "an": [1, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "pipelin": [1, 28], "workflow": [1, 2], "80": 1, "81": 1, "82": [1, 8, 19], "posit": [1, 5, 7, 9, 11, 13, 17, 18, 19, 26, 27, 30], "83": [1, 8, 12, 17], "84": 1, "e": [1, 2, 5, 9, 11, 12, 15, 17, 20, 21, 22, 24, 28], "g": [1, 2, 9, 11, 13, 17, 20, 21, 22, 24, 28, 31], "bert": [1, 2], "gpt": [1, 2], "geometri": [1, 2], "contextu": [1, 2, 19, 20], "85": 1, "domain": [1, 13, 20, 28], "beyond": [1, 2, 26, 28, 30], "vision": [1, 2], "adapt": [1, 2], "issu": [1, 2, 15, 17, 19, 20, 21, 22, 24, 25, 26, 30], "86": [1, 8, 20, 21], "fair": 1, "quantit": [1, 2, 17, 27], "87": [1, 12], "privaci": 1, "secur": 1, "system": [1, 11, 12, 13, 15, 17, 19, 20, 21, 22, 24, 25, 30], "cryptographi": [1, 2, 9], "protect": [1, 2], "88": [1, 8, 19], "explain": [1, 5], "transpar": [1, 20], "need": [1, 2, 6, 7, 9, 12, 17, 19, 20, 21, 22, 28], "explan": [1, 2, 18], "89": [1, 8, 12], "regul": 1, "complianc": [1, 18], "affect": [1, 2, 6, 13, 20, 21, 25, 26, 28], "gdpr": [1, 2], "risk": [1, 2, 18], "assess": [1, 2, 8, 18, 19, 20, 22, 26, 27, 31], "90": 1, "develop": [1, 7, 11, 20, 24], "91": [1, 8, 22], "diagnost": [1, 2], "treatment": [1, 2], "plan": [1, 18], "predict": [1, 2, 9, 11, 13, 15, 18, 19, 20, 24, 27, 28, 31], "health": [1, 2], "92": [1, 8], "fraud": [1, 2], "financi": [1, 2], "93": [1, 19], "custom": [1, 2, 6, 9], "suppli": [1, 2], "demand": [1, 2], "94": [1, 8], "qualiti": [1, 2, 17, 18, 20, 24], "reliabl": [1, 2, 19, 28], "95": [1, 6, 12], "transport": 1, "etc": [1, 11, 30], "broad": [1, 2], "specif": [1, 2, 5, 6, 9, 11, 13, 18, 20, 21, 28], "A": [1, 2, 5, 7, 9, 11, 12, 15, 19, 20, 21, 24, 27, 31], "encompass": 1, "96": [1, 19], "protocol": [1, 2], "encrypt": [1, 2], "97": [1, 8, 9, 19], "identifi": [1, 9, 11, 17, 19, 20, 22, 26, 27, 30], "threat": 1, "vulner": 1, "potenti": [1, 2, 18, 19, 22, 24, 25, 26, 27, 28, 31], "98": [1, 8, 19], "prevent": [1, 14, 18, 20, 21, 
22, 30], "pattern": [1, 2, 9, 11, 19, 20, 24, 25, 26, 30], "recognit": [1, 2, 11], "99": [1, 19], "best": [1, 2, 5, 19, 31], "100": [1, 5, 6, 8, 9, 13, 14, 19, 30], "studi": [1, 12, 31], "incid": 1, "real": [1, 2, 14, 20, 28, 30], "forens": [1, 2], "post": [1, 2, 20, 28], "101": [1, 8], "guidanc": [1, 2], "scope": [1, 2, 8, 9], "definit": [1, 2, 9, 12, 14, 19], "feasibl": [1, 2], "102": 1, "104": 1, "throughout": [1, 5, 9], "cours": [1, 2, 11, 12, 17], "problem": [1, 2, 7, 9, 11, 12, 14, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30], "solv": [1, 2, 6, 7, 9, 11, 12, 30], "105": 1, "final": [1, 6, 8, 9], "present": [1, 7, 9, 15, 22, 24, 25, 26, 28], "result": [1, 2, 5, 6, 8, 9, 11, 12, 19, 20, 21, 22, 24, 25, 26, 27, 31], "googl": [2, 5], "edu": 2, "interact": [2, 5, 9, 11, 12, 28, 30, 31], "cover": [2, 12], "realpython": [2, 26, 27], "demonstr": [2, 9, 19, 22, 28, 30], "code": [2, 5, 6, 7, 9, 17, 18, 21, 22, 24, 25, 27, 30], "execut": [2, 5, 7, 8, 9], "comment": [2, 5], "express": [2, 5, 6, 8, 11, 12, 13, 31], "exampl": [2, 5, 6, 9, 15, 21, 31], "numpi": [2, 5, 11, 12, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 27, 28, 30], "np": [2, 9, 11, 12, 13, 14, 15, 17, 19, 20, 21, 28, 30], "number": [2, 5, 6, 8, 11, 12, 13, 15, 17, 18, 19, 20, 22, 24, 25, 26, 27, 28, 30], "arrai": [2, 9, 11, 12, 15, 17, 30], "w3school": 2, "python_datatyp": 2, "asp": 2, "document": [2, 9, 11, 19, 20, 26, 27, 28], "tutorialspoint": 2, "python_data_structur": 2, "index": [2, 7, 9, 11, 21, 27, 28], "htm": 2, "string": [2, 5, 6, 7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30], "list": [2, 6, 7, 8, 9, 11, 15, 25, 26, 28], "dictionari": [2, 7, 25], "python_oper": 2, "detail": [2, 9, 15, 19, 22, 27], "comparison": [2, 17, 20], "usag": [2, 7, 17, 18, 19, 20, 27, 28, 31], "check": [2, 6, 7, 8, 9, 13, 17, 19, 20, 21, 24, 27, 28, 31], "practic": [2, 9, 11, 12, 15, 19, 23, 30, 32], "convers": 2, "int": [2, 5, 7, 9], "float_vari": 2, "compar": [2, 5, 6, 18, 20, 21, 22, 24, 26, 28, 30, 31], "dataquest": 2, "io": [2, 17, 
18, 20, 21, 22, 24, 25, 26, 27, 28], "python_while_loop": 2, "break": [2, 9, 20, 28], "gloss_python_for_nest": 2, "nest": 2, "iter": [2, 7, 8, 20, 28], "over": [2, 6, 7, 8, 9, 11, 12, 13, 14, 15, 19, 28, 31], "sum": [2, 5, 11, 12, 14, 20, 21, 22, 26, 27, 28, 30, 31], "multi": [2, 17, 19], "counter": 2, "gloss_python_els": 2, "gloss_python_elif": 2, "programiz": 2, "pariti": 2, "modifi": [2, 5, 7, 9, 21], "within": [2, 5, 9, 12, 18, 19, 22, 26, 27, 28, 30], "doc": [2, 31], "org": [2, 5, 13, 15, 17, 19, 25, 27, 28, 31], "es": 2, "html": [2, 19, 25, 26, 27, 28, 31], "offici": 2, "creation": 2, "call": [2, 7, 9, 11, 12, 22, 24], "refer": [2, 5, 6, 8, 11, 12, 30, 31], "guid": [2, 18, 24, 25], "python_modul": 2, "packag": [2, 7, 9, 17, 28, 30], "access": [2, 5, 9, 12, 17, 24], "area": [2, 13, 14, 18, 26], "input": [2, 6, 7, 9, 12, 13, 21, 28, 30], "sqrt": [2, 11, 15, 17, 27], "panda": [2, 5, 9, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "m": [2, 6, 12, 30], "youtub": [2, 15], "watch": [2, 15], "v": [2, 11, 13, 15, 27], "fnk_zzamoss": 2, "khanacademi": [2, 15], "free": [2, 5, 7, 9, 12, 19], "onlin": [2, 30], "exercis": [2, 7, 12, 24, 28, 30], "bvanderlei": 2, "librari": [2, 5, 14, 17, 18, 19, 20, 24, 25, 26, 30], "subtract": [2, 5, 7, 13, 21, 30], "scalar": [2, 12], "dot": [2, 9, 25], "magnitud": [2, 12], "matplotlib": [2, 9, 11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 31], "kyb8iza5au": 2, "mathsisfun": 2, "geeksforgeek": [2, 17, 25, 27, 28], "manipul": [2, 6, 7, 11], "transpos": 2, "invers": 2, "determin": [2, 6, 8, 11, 12, 13, 17, 28, 30], "differenti": [2, 14], "dc": 2, "diff": [2, 13], "intro": 2, "askpython": 2, "sympi": [2, 13, 14], "symbol": [2, 5, 12, 13, 14], "wuvtyaankzm": 2, "composit": 2, "tangent": 2, "line": [2, 5, 7, 8, 9, 12, 17, 19, 22, 24, 25, 26, 31], "ic": 2, "2i44y9hfq4q": 2, "integrand": 2, "simpson": 2, "find": [2, 9, 11, 12, 13, 14, 17, 18, 20, 24, 26, 27, 28, 30], "volum": [2, 11, 13], "done": [2, 7, 9, 18, 31], "lwq1zw": 2, 
"xhbe": 2, "scipi": [2, 15, 17, 19, 24, 25, 27], "stat": [2, 15, 17, 19, 24, 25], "from": [2, 5, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "median": [2, 15, 17, 19, 21, 26, 31], "standard": [2, 6, 15, 18, 20, 22, 25, 26, 28, 31], "deviat": [2, 15, 21, 22, 25, 26, 28], "boxplot": [2, 21, 26], "hypothesi": [2, 15, 27], "scienc": [2, 5, 9, 12, 14, 18, 24, 26, 28, 30], "mode": [2, 15, 20, 21, 26, 31], "outlier": [2, 17, 19, 20, 21, 24, 25, 26, 27, 31], "determinist": 2, "analyz": [2, 11, 13, 15, 17, 19, 20, 22, 25, 26, 27, 28], "impact": [2, 7, 9, 18, 19, 21, 22, 24, 28], "scikit": [2, 5, 9, 18, 20, 21, 22, 24, 25, 31], "vs": [2, 9, 20, 21, 26, 31], "each": [2, 5, 7, 8, 9, 12, 15, 18, 19, 20, 22, 25, 26, 27, 28, 30, 31], "kaggl": [2, 17, 18, 19, 20, 21, 24], "engin": [2, 12, 13, 14, 17, 18], "One": [2, 13], "between": [2, 6, 7, 8, 9, 11, 12, 13, 14, 18, 19, 20, 21, 22, 24, 27, 28, 31], "cross": [2, 28], "In": [2, 5, 6, 7, 8, 9, 11, 12, 13, 14, 20, 22, 24, 27, 28, 30, 31], "aspect": [2, 5, 8, 28, 31, 32], "rang": [2, 6, 8, 9, 11, 15, 21, 24, 25, 26, 28, 30], "skew": [2, 17, 19, 20, 25, 26, 27], "galleri": 2, "showcas": 2, "overal": [2, 18, 20, 28], "pearson": [2, 28], "spearman": 2, "heatmap": [2, 19], "wrangl": 2, "hous": 2, "seaborn": [2, 19, 21, 22, 24, 25, 26, 27, 31], "pairplot": [2, 24, 25, 31], "price": [2, 6, 9, 13], "than": [2, 5, 6, 7, 8, 9, 11, 12, 17, 25, 26, 28, 30, 31], "independ": [2, 12, 13, 15, 18, 22, 28, 30, 31], "how": [2, 5, 6, 7, 9, 11, 13, 14, 15, 18, 19, 21, 22, 24, 25, 26, 27, 28, 30, 31], "influenc": [2, 18, 19, 20, 22, 25, 27, 31], "With": [2, 5, 9], "relationship": [2, 11, 13, 19, 20, 21, 22, 24, 25, 27, 28, 30, 31], "foundat": [2, 4, 6, 10, 11, 14, 15, 16, 17, 18, 25, 32], "accuraci": [2, 18, 21, 22, 25], "efficaci": 2, "limit": [2, 9, 13, 18], "appropri": [2, 18, 20, 21, 24, 25, 30, 31], "deal": [2, 5, 7, 18, 20, 28, 30, 31], "abil": [2, 19], "titan": [2, 20, 21], "outcom": [2, 9, 15, 30, 31], 
"confus": [2, 9, 18, 19], "datacamp": 2, "provid": [2, 5, 6, 7, 9, 11, 12, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 30, 31], "theoret": [2, 24, 28], "path": [2, 18, 19, 22], "assumpt": [2, 20, 24, 27, 28, 31], "conceptu": 2, "masteri": [2, 15], "delv": [2, 6, 22, 25, 26, 27, 28], "underpin": [2, 25, 27], "github": [2, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30], "repositori": 2, "investig": [2, 17, 19, 24, 30], "analyt": [2, 22, 31], "vidhya": 2, "articl": [2, 5, 20, 21], "choos": [2, 9, 14, 18, 20, 21, 24, 25, 26, 27, 28], "nick": 2, "mccullum": 2, "minim": [2, 18, 30], "sse": [2, 30], "built": [2, 5, 28], "beginn": [2, 9], "iri": 2, "also": [2, 5, 6, 8, 9, 11, 14, 18, 19, 20, 24, 25, 26, 28], "group": [2, 6, 17, 18, 19, 26, 28], "point": [2, 5, 7, 9, 11, 13, 14, 15, 18, 19, 20, 24, 25, 26, 27, 30], "recalcul": 2, "format": [2, 9, 17, 30, 31], "abus": 2, "agglom": 2, "divis": [2, 5, 6, 13], "form": [2, 7, 8, 9, 11, 13, 30], "repres": [2, 5, 6, 9, 12, 13, 14, 17, 18, 19, 20, 22, 24, 25, 26, 28, 30, 31], "paramet": [2, 15, 18, 20, 24, 28, 30], "epsilon": [2, 30, 31], "ep": 2, "minpt": 2, "anoth": [2, 5, 9, 11, 27, 28], "found": [2, 5, 7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30], "renesh": 2, "bedr": 2, "blog": [2, 17, 18, 20, 21, 22, 24, 25, 28], "which": [2, 5, 6, 7, 8, 9, 11, 13, 17, 19, 20, 21, 22, 26, 27, 30, 31], "\u03b5": 2, "vari": [2, 7, 9, 13, 18, 19, 28], "For": [2, 5, 8, 9, 11, 12, 13, 14, 18, 19, 20, 21, 22, 24, 26, 30], "thorough": [2, 13, 15, 24, 27], "excel": [2, 14, 19], "plu": 2, "breast": 2, "cancer": 2, "cifar": 2, "scratch": 2, "necessari": [2, 7, 9, 12, 13, 14, 17, 18, 20, 24, 25, 26, 30, 31], "kindson": 2, "geniu": 2, "particularli": [2, 5, 6, 7, 11, 14, 18, 19, 20, 28, 30, 31], "underli": [2, 19, 21, 24, 28, 31], "benefici": [2, 5, 19, 20, 25, 31], "those": [2, 12, 19, 20, 21, 30, 31], "look": [2, 6, 19, 20, 22, 25, 26, 28, 30, 31], "can": [2, 5, 6, 7, 8, 9, 11, 12, 13, 17, 18, 19, 20, 22, 24, 25, 26, 27, 28, 30, 31], "decompos": 
2, "constitu": 2, "u": [2, 11, 13], "sigma": [2, 15, 17, 18, 30], "\u03c3": [2, 15, 17, 21], "compress": [2, 9, 12], "nois": [2, 20, 26], "To": [2, 9, 11, 12, 13, 19, 20, 21, 30], "recommend": [2, 9, 19, 20], "where": [2, 5, 6, 8, 9, 11, 12, 13, 14, 15, 18, 19, 20, 21, 22, 27, 28, 30, 31], "ll": [2, 5, 6, 9, 12, 13, 17, 22, 26, 27, 28], "lower": [2, 9, 18, 19, 26, 28, 30], "precursor": 2, "avail": [2, 9, 30], "toward": [2, 19, 30], "often": [2, 5, 6, 7, 8, 9, 11, 12, 13, 17, 20, 26, 28, 30], "have": [2, 5, 6, 9, 11, 12, 13, 19, 20, 21, 22, 28, 30, 31], "discrimin": [2, 21], "class": [2, 7, 17, 18, 22, 28, 31], "bias": [2, 18, 19], "bryn": 2, "mawr": 2, "artificial_neural_network": 2, "ipynb": 2, "relu": 2, "walk": 2, "tensorflow": 2, "kera": [2, 9], "first": [2, 5, 6, 11, 14, 17, 19, 21, 24, 26, 30], "adjust": [2, 11, 21, 28, 30, 31], "relianc": 2, "choic": [2, 5, 7, 9, 20, 27, 28], "crucial": [2, 5, 6, 7, 11, 12, 13, 14, 15, 18, 19, 20, 22, 26, 27, 28, 30, 31], "opendatasci": 2, "emphas": [2, 21], "consid": [2, 8, 9, 13, 14, 17, 19, 20, 21, 25, 26, 27, 30, 31], "size": [2, 9, 11, 12, 18, 19, 24, 28, 30], "varieti": [2, 18], "when": [2, 5, 6, 7, 8, 9, 11, 12, 17, 18, 19, 20, 21, 22, 26, 27, 30, 31], "instanc": [2, 5, 11, 14, 19, 20, 31], "might": [2, 5, 7, 19, 20, 22, 25, 28, 30, 31], "ideal": [2, 13, 18, 20, 21, 22, 27], "larger": [2, 20, 21, 30, 31], "same": [2, 5, 7, 9, 11, 12, 18, 20, 27, 31], "suggest": [2, 19, 25, 27], "most": [2, 7, 8, 9, 17, 19, 20, 22, 24, 27, 28, 30], "target": [2, 7, 19, 20, 21, 27, 28, 30, 31], "output": [2, 6, 9, 12, 13, 22, 24, 28, 30], "larg": [2, 7, 11, 18, 20, 22, 24, 28, 31], "spread": [2, 17, 19, 20, 21, 22, 24, 25, 26], "logarithm": [2, 28], "msle": 2, "mai": [2, 6, 9, 11, 12, 22, 27, 28, 30], "suitabl": [2, 12, 17, 22, 30, 31], "initi": [2, 5, 18, 24, 25, 31], "ad": [2, 9, 11, 12, 25, 28, 30], "rectifi": 2, "unit": [2, 11, 21, 28, 30, 31], "hidden": [2, 21], "quantiti": [2, 9, 11, 12, 14], "especi": [2, 5, 6, 7, 8, 9, 17, 19, 
20, 28, 30], "characterist": [2, 18, 19, 20, 22], "learnopencv": 2, "rate": [2, 11, 18, 19, 22, 26], "critic": [2, 24, 26, 28], "signific": [2, 11, 13, 15, 17, 18, 19, 24, 28, 31], "pivot": [2, 11, 13, 14], "pytorch": [2, 9], "immens": 2, "help": [2, 7, 11, 13, 14, 15, 17, 19, 20, 21, 24, 28], "These": [2, 5, 6, 7, 11, 12, 13, 19, 20], "thei": [2, 5, 6, 7, 9, 11, 12, 13, 14, 15, 19, 21, 22, 25, 26, 27, 28, 31], "contribut": [2, 14, 21, 28], "dimens": [2, 12, 13], "produc": [2, 5, 24, 25], "chan": 2, "leverag": [2, 28], "pre": [2, 13, 14, 17], "new": [2, 5, 7, 11, 12, 17, 19, 28, 30, 31], "touch": 2, "exist": [2, 9, 12, 13, 17, 20, 22], "them": [2, 7, 9, 11, 12, 14, 17, 26, 28, 30, 31], "follow": [2, 5, 6, 8, 9, 11, 15, 21, 25, 26, 28, 31], "special": [2, 5, 6, 9, 12], "kind": [2, 12, 22, 31], "complet": [2, 9, 19, 20, 21, 30], "intuit": [2, 6], "ultim": 2, "freecodecamp": 2, "variat": [2, 19], "gate": 2, "challeng": [2, 5, 22, 31], "sequenti": [2, 9], "show": [2, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "extend": [2, 26, 30], "easi": [2, 6, 17, 24, 25], "Into": 2, "friendli": [2, 9], "less": [2, 6, 7, 8, 9, 19, 20, 21, 28, 30, 31], "intimid": 2, "newcom": 2, "agent": 2, "goal": [2, 7, 20, 24, 28], "openai": 2, "gym": [2, 6], "learndatasci": 2, "previous": [2, 5, 28, 30], "mention": 2, "lai": [2, 15], "groundwork": [2, 15, 30], "tradit": [2, 28], "deeper": [2, 6, 28], "mani": [2, 9, 12, 15, 20, 22, 24, 25, 28, 30, 31], "accompani": [2, 9], "instruct": [2, 5], "common": [2, 9, 19, 20, 25, 31], "repurpos": 2, "get": [2, 5, 6, 11, 19, 28, 30, 31], "thing": [2, 7, 9, 11], "two": [2, 5, 7, 9, 11, 12, 13, 17, 21, 22, 25, 26, 27, 31], "simultan": [2, 31], "competit": 2, "respons": [2, 20, 24], "snippet": [2, 28, 30], "translat": 2, "grasp": [2, 6, 13, 19, 27], "text": [2, 5, 11, 18, 28, 30], "denois": 2, "give": [2, 7, 9, 13, 14, 22, 25, 28, 30, 31], "clear": [2, 7, 22, 24, 25], "along": [2, 11, 13, 19, 30], "back": [2, 6, 9, 31], "arxiv": 
2, "essenti": [2, 5, 6, 7, 11, 12, 13, 14, 17, 18, 19, 21, 22, 24, 27, 28, 30, 31], "keep": [2, 9, 20, 21, 24, 28], "up": [2, 9, 14], "paper": 2, "vast": [2, 30], "collect": [2, 6, 11, 15], "preprint": 2, "mit": [2, 12], "review": 2, "breakthrough": 2, "written": [2, 8, 9], "novel": 2, "paradigm": 2, "projectpro": 2, "across": [2, 11, 12, 13, 18, 19, 20, 21, 28], "deploy": 2, "container": 2, "kubernet": 2, "ensur": [2, 5, 7, 11, 13, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 31], "robust": [2, 13, 17, 19, 20, 24], "top": [2, 12, 22, 28], "neptun": [2, 28], "landscap": 2, "2023": [2, 21, 28], "cater": 2, "consider": [2, 19, 28, 32], "cloud": [2, 5, 30], "microsoft": 2, "commun": [2, 5, 18, 26, 28], "hub": 2, "host": 2, "codespac": 2, "csv": [2, 9, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "json": [2, 9], "xml": 2, "sourc": [2, 9], "convert": [2, 17, 22, 28, 31], "off": [2, 19], "file": [2, 7, 9, 30], "azur": 2, "cosmo": 2, "db": 2, "storag": 2, "retriev": [2, 5, 7, 9], "log": [2, 9, 26, 28], "streamlin": 2, "sql": 2, "power": [2, 5, 7, 11, 15, 22, 24, 27, 28, 30, 31], "bi": 2, "uva": 2, "dl": 2, "head": [2, 17, 19, 20, 21, 22, 30, 31], "harvard": 2, "llm": 2, "similar": [2, 6, 7, 11, 12, 20, 25, 30, 31], "decod": 2, "examin": [2, 19, 20, 21, 26, 30], "hug": 2, "face": 2, "enabl": [2, 7, 8, 9, 11, 14, 20, 26, 30, 31], "audio": 2, "upon": [2, 9], "broader": [2, 15, 28], "signal": 2, "modif": [2, 9, 18], "outsid": [2, 6, 9, 25, 26], "foster": 2, "opencoursewar": [2, 12], "full": 2, "classroom": 2, "pluralsight": 2, "mitig": 2, "kdnugget": [2, 28], "user": [2, 7, 9], "close": [2, 19, 20, 27, 30], "pertain": 2, "regulatori": 2, "adher": 2, "coursera": [2, 12], "care": [2, 18, 20], "benefit": [2, 11, 31], "stanford": 2, "patient": 2, "visit": 2, "lab": 2, "procedur": [2, 9, 30], "univers": 2, "innov": 2, "extrapol": 2, "though": [2, 9], "capabl": [2, 8, 9, 19], "person": [2, 6], "centric": 2, "modern": 2, "reshap": [2, 30], "cryptograph": 2, "recogn": [2, 13], 
"ibm": 2, "forb": 2, "driven": [2, 15, 20], "mckinsei": 2, "highlight": [2, 13, 26, 30], "infosecur": 2, "magazin": 2, "report": [2, 18, 20, 27], "probabilist": 2, "viabil": 2, "realist": 2, "edx": 2, "advic": 2, "idea": [2, 9, 13, 31], "engag": [2, 27], "inde": 2, "tip": [2, 5], "sciencedirect": 2, "summar": [2, 9, 15, 24, 25, 26, 30], "synthesi": 2, "wai": [2, 6, 7, 8, 9, 11, 12, 13, 20, 28], "clearli": [2, 24, 26], "data": [4, 5, 8, 9, 12, 14, 25, 26, 27, 29, 31, 32], "3": [4, 5, 6, 8, 9, 12, 14, 19, 30, 31, 32], "4": [4, 5, 7, 9, 12, 14, 17, 30, 31, 32], "5": [4, 5, 6, 7, 8, 12, 14, 15, 17, 25, 26, 28, 30, 32], "what": [5, 6, 7, 8, 9, 19, 22, 25, 28, 30, 31], "machin": [5, 6, 9, 12, 13, 17, 18, 20, 21, 28, 30, 31], "learn": [5, 6, 9, 12, 13, 15, 16, 17, 18, 20, 21, 22, 24, 25, 27, 28, 31], "our": [5, 6, 7, 9, 13, 25, 27, 30], "go": [5, 6, 9, 30], "wide": [5, 11, 19, 26, 28, 30], "due": [5, 11, 19, 22, 25, 28], "readabl": [5, 7, 8, 9], "simplic": [5, 11], "rich": 5, "ecosystem": 5, "invalu": [5, 20], "preprocess": [5, 19, 22, 28, 32], "analysi": [5, 6, 11, 12, 13, 14, 15, 17, 18, 20, 29, 31, 32], "colab": 5, "account": [5, 9, 20], "jupyt": [5, 9, 19, 20], "notebook": [5, 9, 19, 31], "allow": [5, 6, 7, 8, 9, 12, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 27, 28, 30, 31], "browser": 5, "without": [5, 9, 11, 17, 21, 22, 25, 28, 30], "ani": [5, 6, 9, 11, 12, 13, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 31], "setup": 5, "requir": [5, 7, 8, 9, 11, 15, 17, 19, 20, 21, 22, 24, 25, 30, 31], "gpu": 5, "some": [5, 7, 9, 12, 13, 19, 20, 28, 30, 31], "computation": [5, 20, 28], "heavi": 5, "local": [5, 9], "option": [5, 6, 9], "don": [5, 9, 24, 25, 26, 27, 30, 31], "cpu": 5, "want": [5, 7, 13, 30], "acquaint": [5, 27, 30], "anywai": 5, "later": [5, 30], "consist": [5, 18, 19, 20, 21, 28], "contain": [5, 9, 17, 26, 28, 31], "either": [5, 6, 9, 12, 17], "markdown": 5, "rememb": [5, 7, 22, 24, 27, 28], "should": [5, 6, 7, 9, 18, 20, 21, 25, 28, 30, 31], "run": [5, 8, 9, 18, 28], 
"order": [5, 6, 7, 11, 12, 22, 28], "sinc": [5, 9, 12, 19, 30], "earlier": 5, "howev": [5, 9, 12, 18, 22, 28], "re": [5, 6, 9, 17, 20, 28, 30, 31], "debug": 5, "rerun": [5, 19], "alwai": [5, 6, 7, 9, 13, 19, 20, 21, 28, 30, 31], "appear": [5, 14, 17, 19, 25, 26], "If": [5, 6, 9, 13, 14, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30, 31], "encount": [5, 6, 13], "unexpect": 5, "troubleshoot": 5, "all": [5, 6, 9, 12, 15, 17, 19, 21, 22, 25, 26, 28, 30, 31], "begin": [5, 11, 12, 13], "invalid": [5, 9], "incorrect": [5, 7], "occur": [5, 15, 17, 20, 31], "chang": [5, 7, 9, 11, 20, 21, 22, 27, 30, 31], "haven": 5, "been": [5, 6, 9], "propag": 5, "By": [5, 6, 11, 20, 21, 28], "runtim": 5, "menu": [5, 9], "reflect": [5, 19, 20, 22, 24], "save": [5, 9], "regularli": 5, "autosav": 5, "drive": [5, 13], "good": [5, 19, 30], "habit": 5, "manual": 5, "flexibl": [5, 7, 9], "easili": 5, "perfect": [5, 19, 22], "oper": [5, 7, 9, 10, 18, 20, 21], "print": [5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "after": [5, 6, 7, 9, 12, 18, 20, 21, 22, 28, 31], "next": [5, 7, 15, 17, 19, 20, 21, 22, 24, 25, 30], "block": [5, 7, 9], "whitespac": [5, 8, 9], "indent": [5, 8, 9], "brace": 5, "end": [5, 6, 7, 9, 11, 12, 17], "unind": 5, "amount": [5, 6, 19, 28], "must": [5, 6, 12, 27], "commonli": [5, 6, 8, 12, 13, 17, 20, 24, 27, 28], "x": [5, 6, 8, 9, 12, 13, 14, 17, 18, 19, 21, 24, 25, 27, 28, 30, 31], "0": [5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "here": [5, 6, 7, 9, 13, 19, 22, 27, 30], "true": [5, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 21, 24, 26, 27, 31], "meaning": [5, 9, 24, 26, 27, 30, 31], "apart": [5, 9], "tab": 5, "element": [5, 6, 7, 11, 17, 19, 28, 30], "excess": [5, 19], "ignor": [5, 15, 24, 26, 27, 28], "henc": 5, "b": [5, 6, 8, 9, 11, 12, 14, 28, 30], "harder": 5, "read": [5, 6, 8, 25, 31], "lack": [5, 19, 27], "parenthes": [5, 6, 9], "bracket": 5, "lengthi": 5, "total": [5, 6, 9, 14, 17, 18, 
19, 26, 28], "c": [5, 8, 9, 11, 12, 13], "d": [5, 13], "f": [5, 6, 7, 8, 9, 13, 14, 15, 21, 22, 24, 25, 26, 30, 31], "backslash": 5, "indic": [5, 9, 11, 13, 18, 19, 21, 26, 27, 28, 30, 31], "describ": [5, 9, 11, 12, 13, 15, 17, 19, 21, 22, 24, 26, 27, 30], "note": [5, 9, 12, 25, 27, 28, 30, 31], "futur": [5, 30], "carri": 5, "out": [5, 6, 9, 19, 20, 26, 30], "primari": [5, 20, 24], "add": [5, 9, 11, 12], "operand": [5, 6], "equal": [5, 6, 9, 12, 15, 17, 21, 22, 26, 28, 30, 31], "8": [5, 7, 8, 9, 10, 11, 12, 15, 17, 20, 22, 24, 30, 31, 32], "right": [5, 6, 9, 11, 12, 13, 18, 20, 21, 24, 26, 28, 30, 31], "left": [5, 6, 12, 13, 26, 28, 30], "2": [5, 8, 9, 12, 14, 19, 30, 31, 32], "multipli": [5, 11, 12], "15": [5, 8, 12, 16, 17, 19, 24, 25, 30, 32], "divid": [5, 17, 18, 19, 21, 26, 30], "return": [5, 6, 7, 12, 17, 28, 31], "float": [5, 9], "floor": 5, "largest": [5, 8], "whole": 5, "smaller": [5, 19, 20, 21], "modulu": 5, "remaind": 5, "exponenti": 5, "rais": [5, 7, 9], "try": [5, 6, 9, 19, 20, 21, 28, 30], "someth": [5, 9], "yourself": [5, 7, 27, 30], "name": [5, 7, 9, 12, 20, 21, 22, 24, 31], "10": [5, 7, 8, 9, 10, 11, 12, 13, 14, 17, 19, 20, 24, 25, 26, 27, 28, 30, 32], "overwrit": 5, "whatev": [5, 9], "held": 5, "shorthand": [5, 6], "increment": 5, "decrement": 5, "equival": [5, 27, 30], "wa": [5, 7, 9, 12, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30], "would": [5, 9, 15, 19, 20, 21, 22, 24, 25, 28, 30, 31], "now": [5, 6, 9, 30, 31], "becom": [5, 7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30], "6": [5, 7, 9, 10, 12, 13, 14, 15, 17, 22, 27, 30, 32], "13": [5, 8, 12, 16, 17, 19, 24, 32], "store": [5, 6, 7, 9, 25], "todai": [5, 6, 13, 31], "three": [5, 6, 7, 11, 25, 28, 30], "integ": [5, 9, 12, 22], "decim": 5, "14": [5, 7, 8, 11, 12, 16, 17, 22, 24, 32], "001": 5, "charact": [5, 11], "str": [5, 7, 9], "enclos": [5, 9], "quot": 5, "hello": [5, 9], "my_integ": 5, "my_float": 5, "my_str": 5, "displai": [5, 9, 12, 19, 21, 25, 31], "ask": [5, 7], "current": [5, 7, 9, 32], "There": 
[5, 8, 9, 18, 30], "restrict": 5, "certain": [5, 7, 8, 12, 19, 24], "ha": [5, 6, 7, 9, 11, 12, 13, 15, 17, 19, 20, 22, 26, 28, 30, 31], "guess": [5, 31], "y": [5, 9, 11, 12, 18, 19, 21, 24, 26, 27, 28, 31], "hi": 5, "constant": [5, 31], "possibl": [5, 9, 15, 20, 24, 28, 30], "down": [5, 9, 20, 28], "convinc": [5, 7], "fill": [5, 12, 21, 31], "behav": [5, 20, 21], "concaten": 5, "academi": [5, 11, 12], "introduct": [5, 16, 23, 26, 29, 32], "codecademi": 5, "introduc": [5, 6, 9, 20, 22, 26, 30], "en": [5, 15, 27], "wikipedia": 5, "wiki": 5, "python_syntax_and_semant": 5, "previou": [6, 9], "session": 6, "laid": 6, "basic": [6, 8, 14, 16, 19, 21, 22, 23, 24, 25, 27, 29, 32], "onli": [6, 7, 9, 11, 12, 17, 18, 21, 22, 24, 25, 27, 28, 31], "lesson": [6, 13, 15, 18, 24, 25, 26, 27, 28, 30], "stronger": 6, "appli": [6, 11, 12, 14, 18, 20, 22, 25, 27, 28, 31, 32], "reason": [6, 17, 18, 20, 25, 27, 30], "boolean": 6, "bool": [6, 7], "truth": [6, 8], "fals": [6, 7, 8, 9, 18, 19, 25], "is_rain": 6, "is_sunni": 6, "none": [6, 9, 22], "signifi": 6, "noth": 6, "absenc": 6, "default": [6, 9, 28], "least": [6, 9], "rainbow": 6, "inequ": 6, "numer": [6, 21, 22, 26, 28, 31], "greater": [6, 7], "object": [6, 9, 11, 17], "ident": [6, 12], "membership": 6, "temperatur": [6, 13, 17], "warm": 6, "cat": 6, "letter": [6, 9, 12], "compound": 6, "concis": [6, 7, 8, 11, 26], "n": [6, 9, 11, 12, 13, 15, 17, 18, 19, 22, 24, 25, 27, 30], "cleaner": [6, 7], "part": [6, 7, 9, 12, 17, 30], "mathemat": [6, 9, 11, 12, 16, 25, 32], "preced": 6, "insid": [6, 9, 25, 26], "circuit": [6, 12], "stop": [6, 7], "soon": [6, 8], "think": [6, 7, 9, 12, 13], "why": [6, 11, 18, 25, 27, 30], "doesn": [6, 13, 19, 22, 27, 28], "matter": [6, 11, 12], "similarli": [6, 13], "doe": [6, 7, 9, 12, 15, 19, 27, 28], "second": [6, 9, 14, 17, 26, 30], "known": [6, 7, 8, 11, 30], "even": [6, 7, 17, 18, 22, 25, 30, 31], "becaus": [6, 7, 9, 13, 17, 20, 21, 28, 30], "alreadi": [6, 9], "satisfi": [6, 22, 30, 31], "whether": [6, 7, 
11, 13, 22, 28], "scenario": [6, 8, 9, 11, 13, 14, 20], "fallback": 6, "zero": [6, 11, 13, 17, 21, 24, 30, 31], "elig": 6, "discount": 6, "senior": 6, "citizen": 6, "ag": [6, 7, 21, 22, 30, 31], "older": 6, "student": [6, 24, 25], "purchas": 6, "tuesdai": 6, "everyon": 6, "take": [6, 7, 9, 12, 31], "statu": [6, 9], "def": [6, 7, 9, 28, 31], "calculate_discount": 6, "is_stud": 6, "total_purchas": 6, "is_tuesdai": 6, "discount_elig": 6, "final_pric": 6, "2f": [6, 9, 18, 30], "00": [6, 19, 21], "upgrad": 6, "member": 6, "year": 6, "attend": 6, "friend": 6, "automat": [6, 9], "regardless": [6, 7, 31], "four": [6, 17, 28], "repeatedli": 7, "under": [7, 11, 13, 14], "repetit": 7, "backbon": 7, "script": [7, 9], "shorter": 7, "valuabl": [7, 19, 26], "repeat": [7, 9, 18, 20, 30], "lead": [7, 9, 19, 20, 22, 28], "organ": [7, 9, 15], "python": [7, 9, 16, 19, 23, 29, 32], "item": [7, 9, 25], "mutabl": 7, "my_list": 7, "unord": [7, 22], "pair": [7, 9, 22, 30], "my_dict": 7, "alic": 7, "len": [7, 9, 21, 28, 30], "specifi": [7, 9, 11], "beforehand": 7, "count": [7, 8, 9, 15, 17, 19, 21, 22], "warn": [7, 9], "infinit": 7, "Be": [7, 18, 20, 24, 28], "cautiou": [7, 20, 24, 28], "never": [7, 20, 21], "difficulti": 7, "straightforward": [7, 11, 13, 18, 30], "inher": [7, 22], "extern": 7, "backward": [7, 28], "tupl": [7, 9], "prefer": [7, 12, 28], "prone": [7, 30], "argument": 7, "i": [7, 8, 9, 11, 12, 17, 21, 24, 25, 27, 30], "nuanc": [7, 19, 22, 25], "purpos": [7, 20, 26], "exit": 7, "prematur": 7, "met": [7, 8], "serv": 7, "itself": [7, 9, 11, 17, 20], "skip": 7, "move": [7, 13, 24, 28], "onto": [7, 11], "bypass": 7, "bodi": [7, 11], "odd": 7, "9": [7, 8, 9, 10, 11, 12, 15, 17, 19, 20, 21, 22, 24, 25, 32], "finish": 7, "termin": 7, "search": [7, 9], "trigger": 7, "remind": [7, 12], "content": [7, 9, 19, 24], "search_for": 7, "enumer": [7, 9, 21], "entir": [7, 9, 13, 28, 31], "java": 7, "plai": [7, 11, 12, 14, 20], "emploi": [7, 12], "accomplish": 7, "divisor": 7, "is_prim": 7, 
"num": 7, "answer": [7, 9, 31], "correct": [7, 9, 17, 19, 22, 25, 28, 30], "immedi": [7, 9], "feedback": [7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30], "num_quest": 7, "num1": 7, "randint": [7, 9, 12], "num2": 7, "correct_answ": 7, "user_answ": [7, 9], "stdinnotimplementederror": [7, 9], "traceback": [7, 9, 22, 24], "recent": [7, 9, 22, 24], "last": [7, 9, 17, 19, 21, 22, 24], "16": [7, 8, 9, 12, 17, 19, 21, 23], "19": [7, 8, 9, 17, 23, 32], "21": [7, 8, 11, 12, 17, 21, 29, 32], "book_100daysml": [7, 9], "venv": [7, 9], "lib": [7, 9], "python3": [7, 9], "11": [7, 8, 9, 11, 12, 16, 19, 21, 24], "site": [7, 9], "ipykernel": [7, 9], "kernelbas": [7, 9], "py": [7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 27, 30], "1260": [7, 9], "raw_input": [7, 9], "prompt": 7, "1258": [7, 9], "_allow_stdin": [7, 9], "1259": [7, 9], "msg": [7, 9], "frontend": [7, 9], "request": [7, 9], "1261": [7, 9], "_input_request": [7, 9], "1262": [7, 9], "1263": [7, 9], "_parent_id": [7, 9], "shell": [7, 9], "1264": [7, 9], "get_par": [7, 9], "1265": [7, 9], "password": [7, 9], "1266": [7, 9], "quizz": 7, "feel": [7, 9], "action": [8, 9, 25], "branch": 8, "therebi": 8, "increas": [8, 19, 22, 30], "do_someth": 8, "voila": 8, "conjunct": 8, "do_something_els": 8, "Not": [8, 11, 12, 21], "mutual": [8, 22], "exclus": [8, 22, 28], "condition1": 8, "condition2": 8, "neither": 8, "nor": 8, "do_another_th": 8, "liken": 8, "style": 8, "switch": 8, "correspond": [8, 12], "taken": [8, 12], "medium": [8, 18, 21, 22, 24, 28], "compact": 8, "ternari": 8, "quick": [8, 13, 31], "singl": [8, 9, 11, 12, 17, 30, 31], "vertic": 8, "align": [8, 18, 20, 28], "classic": 8, "job": [8, 30], "interview": 8, "1": [8, 12, 14, 30, 31, 32], "fizz": 8, "instead": [8, 17, 20, 21], "buzz": 8, "7": [8, 9, 10, 11, 15, 17, 20, 22, 24, 26, 31, 32], "17": [8, 9, 12, 17, 19, 21, 23, 32], "entri": [8, 12, 17, 19], "celsiu": [8, 17], "below": [8, 9, 17, 19, 30], "freez": 8, "inclus": [8, 25, 28], "cold": 8, "moder": [8, 19], "abov": [8, 19], 
"categori": [8, 17, 20, 22, 24], "predefin": [8, 11], "temp": 8, "000": [8, 17], "sedentari": 8, "499": 8, "lightli": 8, "500": 8, "999": 8, "veri": [8, 9, 13, 19, 31], "distinct": [9, 28, 30], "situat": [9, 22], "reusabl": 9, "better": [9, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30, 31], "modular": 9, "degre": [9, 17, 19, 28], "reus": 9, "keyword": 9, "colon": 9, "ey": 9, "peel": 9, "resum": 9, "some_funct": 9, "pass": 9, "do_math": 9, "chosen": [9, 28, 31], "my_funct": 9, "empti": 9, "convent": 9, "lowercas": 9, "underscor": 9, "match": [9, 12], "familiar": [9, 18, 22, 31], "directli": [9, 20, 30], "mere": [9, 28], "being": [9, 19, 30, 31], "won": 9, "until": [9, 30], "declar": [9, 12], "proper": 9, "john": 9, "mandatori": 9, "overridden": 9, "reorder": 9, "shuffl": [9, 18], "global": 9, "confin": 9, "shadow": 9, "do": [9, 17, 19, 20, 21, 24, 25, 26, 27, 30, 31], "who": 9, "struggl": [9, 19], "explicitli": 9, "regard": 9, "bad": 9, "anti": 9, "just": [9, 11, 12, 13, 14, 28, 30], "see": [9, 28, 30], "didn": 9, "h": [9, 13], "stuff": [9, 31], "append": [9, 11, 28], "ones": 9, "caus": [9, 15, 17, 19, 20, 21, 22, 24, 25, 27, 30], "typeerror": 9, "send": 9, "caller": 9, "unpack": 9, "usual": [9, 12, 31], "section": [9, 26], "ran": 9, "bring": [9, 28], "sometim": 9, "batteri": 9, "web": 9, "goe": [9, 30], "heard": 9, "slow": [9, 11, 13], "circumst": 9, "popular": [9, 30], "few": [9, 18, 19, 21, 24, 25, 30, 31], "constraint": 9, "rust": 9, "speed": [9, 11, 13, 21], "highli": [9, 22, 26, 27, 30, 31], "compil": [9, 24], "glue": 9, "namespac": 9, "home": [9, 30], "linux": 9, "x86_64": 9, "cpython": 9, "311": 9, "gnu": 9, "so": [9, 13, 17, 20, 21, 27, 30, 31], "fact": 9, "directori": 9, "pi": [9, 15], "141592653589793": 9, "pow": 9, "forc": [9, 11], "simpli": [9, 13, 30, 31], "frequent": [9, 13, 17, 20], "pyplot": [9, 11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "plt": [9, 11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "dozen": 9, 
"exhaust": 9, "given": [9, 11, 13, 15, 19, 30, 31], "alia": 9, "leav": [9, 30], "rest": [9, 22, 31], "sole": [9, 26, 28], "sparingli": 9, "difficult": 9, "trace": 9, "come": [9, 15], "own": [9, 15], "encapsul": [9, 13, 22], "occasion": 9, "ok": 9, "greatli": 9, "star": 9, "great": 9, "caution": 9, "could": [9, 19, 25], "adequ": [9, 20], "As": [9, 28], "homework": [9, 28], "perus": 9, "handi": 9, "lot": 9, "dice_rol": 9, "6692318444660496": [], "servic": 9, "txt": 9, "dump": 9, "elaps": 9, "deliber": [9, 30], "sleep": 9, "datetim": 9, "calendar": 9, "timestamp": 9, "timezon": 9, "durat": [9, 11], "01": [9, 21], "06": [17, 20, 25, 28], "344280": [], "regress": [9, 15, 21, 27, 32], "far": [9, 19], "actual": [9, 11, 17, 19, 30, 31], "suppos": 9, "ax": [9, 11, 24, 26, 30, 31], "column": [9, 12, 19, 20, 21, 22, 28, 30, 31], "intercept": [9, 30, 31], "x_data": 9, "x1": [9, 11, 12], "x2": [9, 12], "xn": 9, "y_data": 9, "y1": [9, 11, 12], "y2": [9, 12], "yn": 9, "y_pred": 9, "quantifi": [9, 15, 27, 28], "replac": [9, 20, 22], "synthes": 9, "everyth": 9, "ve": [9, 30], "correctli": [9, 19, 22, 28, 31], "too": [9, 24, 25, 28], "low": [9, 17, 19, 26, 27, 30], "attempt": 9, "made": 9, "onc": [9, 31], "successfulli": [9, 19], "messag": 9, "user_input": 9, "enter": 9, "except": 9, "valueerror": 9, "pleas": [9, 15, 17, 19, 20, 21, 22, 24, 25, 30], "calculate_scor": 9, "range_s": 9, "fewer": [9, 19, 22], "worst": 9, "log2": 9, "worst_case_binary_search": 9, "interpol": 9, "extrem": [9, 17, 19, 20, 24], "guessing_gam": 9, "min_valu": 9, "max_valu": 9, "configur": [9, 18, 31], "number_to_guess": 9, "user_guess": 9, "congratul": 9, "again": 9, "desir": [9, 19], "20": [9, 11, 12, 17, 19, 20, 23, 24, 26, 32], "record": 9, "got": [9, 30], "wrong": 9, "my": 9, "solut": [9, 11, 13, 30], "disk": 9, "bonu": 9, "quickli": 9, "around": [9, 13, 19, 21, 24, 26], "example_quiz": 9, "filenam": 9, "sample_quiz": 9, "capit": [9, 12, 25], "franc": 9, "pari": 9, "wrong_answ": 9, "rome": 9, "london": 
9, "open": 9, "w": 9, "load_quiz": 9, "uncom": 9, "quiz_gam": 9, "total_scor": 9, "all_answ": 9, "chr": 9, "start_tim": 9, "strip": 9, "end_tim": 9, "time_taken": 9, "correct_answer_index": 9, "assum": [9, 17, 18, 19, 20, 21, 27, 28, 30, 31], "1f": 9, "18": [9, 12, 17, 23, 32], "pick": [9, 30], "inspir": 9, "edit": 9, "delet": 9, "phone": 9, "email": 9, "interfac": 9, "command": 9, "view": [9, 18, 26], "confirm": [9, 13], "success": [9, 15], "gracefulli": 9, "inventori": 9, "remov": [9, 17, 28, 31], "id": [9, 19, 21, 28], "stock": [9, 13], "cost": [9, 13, 20, 28], "tax": 9, "mathbf": 11, "bmatrix": [11, 12], "v_1": 11, "v_2": 11, "vdot": [11, 12], "v_n": 11, "possess": 11, "length": [11, 13, 21, 28], "denot": [11, 12, 13, 14, 15, 28], "non": [11, 19, 20, 28, 31], "neg": [11, 19, 26, 27, 30, 31], "orient": 11, "rel": [11, 19, 28], "frame": [11, 17, 19], "angl": [11, 30], "coordin": [11, 12], "fulli": 11, "car": [11, 13], "travel": [11, 13], "60kph": 11, "ne": 11, "paramount": 11, "scientif": 11, "disciplin": [11, 12, 15], "versatil": 11, "veloc": [11, 13], "acceler": [11, 13], "displac": 11, "motion": 11, "civil": 11, "electr": [11, 12], "indispens": [11, 15], "classif": [11, 18, 28, 30, 32], "phenomena": [11, 15], "tackl": 11, "place": [11, 18], "background": 11, "color": [11, 13, 14, 15, 18, 20, 21, 22, 24, 26, 28, 30, 31], "easier": [11, 31], "handwritten": 11, "digit": [11, 22], "optic": 11, "ocr": 11, "shape": [11, 12, 17, 19, 26, 27], "commut": [11, 12], "associ": [11, 12, 28], "therefor": [11, 13], "yield": 11, "OR": [11, 12], "x_add": 11, "sgd": 11, "dynam": 11, "progress": 11, "overshoot": 11, "ab": 11, "bx": 11, "mulitpl": 11, "ay": 11, "xa": 11, "ya": 11, "x_scalar_mult": 11, "navig": 11, "robot": 11, "linalg": [11, 12], "arctan2": 11, "radian": 11, "9272952180016122": 11, "sentiment": 11, "mathbb": 11, "dimension": [11, 22, 28, 30, 32], "cdot": [11, 12, 13], "sum_": [11, 12, 17, 25, 30], "x_i": [11, 17, 27, 30], "y_i": [11, 27, 30], "respect": [11, 13, 
21, 27, 28, 31], "co": 11, "theta": 11, "bilinear": 11, "orthogon": 11, "perpendicular": 11, "quad": 11, "dot_product": 11, "x1_3d": 11, "y1_3d": 11, "3d": [11, 30], "surfac": 11, "light": 11, "render": [11, 19], "torqu": 11, "rotat": [11, 24, 30], "origin": [11, 12, 14, 20, 21, 30, 31], "mathbi": 11, "vmatrix": 11, "j": [11, 12], "x_1": [11, 30, 31], "x_2": [11, 30, 31], "x_3": 11, "y_1": 11, "y_2": 11, "y_3": 11, "a_1": 11, "a_2": 11, "a_3": 11, "b_1": 11, "b_2": 11, "b_3": 11, "sin": 11, "plane": [11, 30], "neq": 11, "exert": 11, "simplifi": [11, 28], "cross_product": 11, "l2": 11, "_2": 11, "ldot": 11, "vector_v": 11, "l2_norm": 11, "new_posit": 11, "aerospac": 11, "safeti": 11, "stabil": [11, 19, 21], "bridg": 11, "accur": [11, 24, 27, 30, 31], "analys": [11, 17, 19, 20, 24, 25, 30], "big": 11, "quicker": 11, "precis": [11, 13, 18, 19, 21, 22], "abstract": 11, "infrastructur": 11, "quantum": [11, 12], "stem": 11, "approxim": [11, 19, 28], "minut": 11, "linspac": [11, 13, 14], "meshgrid": 11, "circular": 11, "quiver": 11, "xlim": [11, 30], "ylim": [11, 30], "titl": [11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "xlabel": [11, 13, 14, 18, 20, 21, 22, 24, 25, 26, 28, 30, 31], "axi": [11, 18, 19, 22, 28, 30, 31], "ylabel": [11, 13, 14, 18, 20, 21, 22, 24, 25, 26, 28, 30, 31], "v1": 11, "v2": 11, "v_add": 11, "v_sub": 11, "v_scalar_mult": 11, "xy": [11, 12], "scale_unit": 11, "green": [11, 20, 21, 30], "red": [11, 13, 21, 22, 27, 30, 31], "blue": [11, 14, 20, 21, 22, 30, 31], "khan": [11, 12], "rectangular": 12, "arrang": 12, "row": [12, 17, 21, 22, 24, 31], "x_": [12, 25], "12": [12, 16, 17, 20, 21, 22, 24, 26, 27, 30, 31, 32], "1n": 12, "2n": 12, "ddot": 12, "m1": 12, "m2": 12, "mn": 12, "physic": [12, 13, 14], "moment": [12, 13], "inertia": 12, "tensor": 12, "graph": [12, 13, 14], "among": [12, 27, 28, 30], "kickoff": 12, "fantast": 12, "coupl": 12, "grid": [12, 13, 14, 25], "nonumb": 12, "z1": 12, "subscript": 12, "isn": [12, 30], "nice": 12, 
"notic": 12, "verifi": 12, "_": 12, "ij": 12, "x1_": 12, "y1_": 12, "m_add": 12, "m_sub": 12, "rather": [12, 30], "l": 12, "obtain": [12, 25, 28], "th": [12, 30], "compat": 12, "inner": 12, "circ": 12, "m_sca": 12, "m_mul": 12, "4x4": 12, "communit": 12, "m_mul1": 12, "m_mul2": 12, "113": 12, "141": 31, "114": [], "129": [], "166": [], "103": 12, "158": [], "rrr": 12, "hspace": 12, "1cm": 12, "twice": 12, "notat": 12, "transposit": 12, "x_t": 12, "det": 12, "nonzero": 12, "x_inv": 12, "inv": 12, "81474977e": 12, "62949953e": 12, "12589991e": 12, "mat_x": 12, "mat_i": 12, "mat_": 12, "mat_xi": 12, "mat_xy_t": 12, "mat_xy_t2": 12, "2nd": [12, 22], "mat_xy_inv": 12, "118": 12, "194": 12, "322": 12, "264": 12, "405": 12, "690": 12, "668": 12, "895": [12, 20, 21, 22], "1610": 12, "81926058e": 12, "93203101e": 12, "79964834e": 12, "97348241e": 12, "05242171e": 12, "95975384e": 12, "further": [12, 17, 19, 25], "resourc": 12, "link": 12, "materi": 12, "interest": [12, 13, 15, 20, 26, 27, 30], "essenc": [13, 20], "ai": [13, 14, 28, 32], "curios": 13, "willing": 13, "akin": [13, 14], "lim_": 13, "frac": [13, 17, 18, 25, 27, 30], "instantan": 13, "curv": [13, 14, 18], "imagin": 13, "know": [13, 14, 30], "fast": [13, 30], "growth": 13, "popul": [13, 15, 17, 18, 19, 24], "particular": [13, 19], "df": [13, 18, 20, 21, 31], "dx": [13, 14], "2x": 13, "3x": 13, "4x": 13, "expon": [13, 30], "impli": [13, 19, 27, 28], "concern": [13, 28], "sp": [13, 14], "s_t": 13, "s_prime_t": 13, "remain": [13, 20], "fix": [13, 15, 19, 26, 30], "locat": [13, 17, 30], "t_x": 13, "livrari": 13, "t_prime_x": 13, "conveni": 13, "straight": [13, 30], "road": 13, "p": [13, 15, 24, 28], "2t": 13, "3t": 13, "4t": 13, "p_t": 13, "p_prime_t": 13, "rectangl": 13, "width": [13, 21, 26, 28], "a_x": 13, "a_prime_x": 13, "speedomet": 13, "econom": [13, 31], "revenu": 13, "busi": 13, "safe": 13, "sensit": [13, 20, 21, 24, 28, 31], "aid": [13, 27], "formul": 13, "assist": 13, "node": [13, 28], "abc": [13, 14], 
"sai": [13, 30], "value_at_x": 13, "rate_of_chang": 13, "sub": 13, "lambda": [13, 14], "func_lambda": [13, 14], "lambdifi": [13, 14], "deriv_lambda": 13, "x_val": [13, 14], "y_val": [13, 14], "tangent_lin": 13, "figur": [13, 14, 18, 19, 21, 22, 25, 26, 27, 28, 30], "figsiz": [13, 14, 19, 21, 22, 25, 26, 27, 30, 31], "linestyl": [13, 18, 30], "dash": [13, 30], "scatter": [13, 21, 27, 30, 31], "tangenc": 13, "legend": [13, 14, 18, 20, 21, 24, 28, 30, 31], "distinguish": 13, "interv": [13, 14, 15, 17], "impart": 13, "mark": 13, "stride": 13, "machinelearningmasteri": [13, 18, 20, 21, 22, 27, 28], "gentl": 13, "partial": 13, "openstax": 13, "book": 13, "page": [13, 19], "towardsai": 13, "net": 13, "master": [13, 22, 27], "towardsdatasci": [13, 18, 21, 22, 24], "peopl": [13, 18], "3cd913c5cf33": 13, "deepen": [14, 15, 20, 22, 25, 28], "profound": 14, "profici": [14, 15, 24], "eager": 14, "accumul": 14, "infinitesim": 14, "small": [14, 19], "piec": 14, "much": [14, 28, 30], "a_b": 14, "indefinit": 14, "antideriv": 14, "famili": 14, "whose": [14, 30], "assert": 14, "a_bf": 14, "dxf": 14, "extens": [14, 31], "roc": [14, 18, 19], "deep": [14, 15, 24, 26, 32], "indefinite_integr": 14, "definite_integr": 14, "integral_lambda": 14, "fill_between": 14, "grai": [14, 30], "alpha": [14, 15, 20, 21, 26, 28, 30], "equip": [15, 27], "keen": 15, "interrel": 15, "sens": [15, 19, 22, 28, 30], "event": 15, "infer": [15, 24, 30, 31], "cannot": [15, 30], "certainti": 15, "subset": [15, 18, 19, 28], "imposs": 15, "likelihood": [15, 20], "occurr": [15, 19], "confid": [15, 28], "uniform": 15, "simplest": [15, 30], "everi": [15, 19], "chanc": 15, "character": 15, "\u03bc": [15, 21], "binomi": 15, "bernoulli": 15, "trial": 15, "poisson": 15, "pd": [15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "tmp": [15, 17, 19, 20, 21, 22, 24, 25, 30], "ipykernel_145386": [], "584559657": 15, "deprecationwarn": [15, 17, 19, 20, 21, 22, 24, 25, 30], "pyarrow": [15, 17, 19, 20, 21, 22, 24, 25, 30], 
"major": [15, 17, 19, 20, 21, 22, 24, 25, 30], "releas": [15, 17, 19, 20, 21, 22, 24, 25, 30], "arrow": [15, 17, 19, 20, 21, 22, 24, 25, 30], "interoper": [15, 17, 19, 20, 21, 22, 24, 25, 30], "instal": [15, 17, 19, 21, 22, 24, 25, 30, 31], "dev": [15, 17, 19, 20, 21, 22, 24, 25, 30], "54466": [15, 17, 19, 20, 21, 22, 24, 25, 30], "range_": 15, "ptp": 15, "var": [15, 17, 19, 24, 25, 26], "std_dev": [15, 25], "std": [15, 17, 19, 21, 22, 24, 25], "8722813232690143": 15, "mu": [15, 18], "1000": 15, "bin": [15, 20, 24, 25, 26, 28], "hist": [15, 20, 24, 25, 26, 31], "exp": 15, "linewidth": [15, 19], "lambda_": 15, "null": [15, 17, 19, 24], "\u03bc_0": 15, "altern": [15, 22, 24], "mu_0": 15, "05": [15, 28], "t_statist": [15, 24], "p_valu": [15, 24, 28], "ttest_1samp": [15, 24], "reject": 15, "fail": [15, 28], "5222329678670935": 15, "614117254808394": 15, "rigor": 15, "probabilitycours": 15, "prefac": 15, "php": 15, "vfu": 15, "bg": 15, "bertsekas_tsitsiklis_introduction_to_prob": 15, "pdf": 15, "1uw3qmfa9ho": 15, "plul4u3cngp60hi9atjsfglzpbnj7myag6": 15, "morningsid": 15, "libguid": 15, "raw": 17, "clean": 17, "duplic": 17, "discret": [17, 28], "qualit": 17, "nomin": 17, "blood": 17, "ordin": 17, "ratio": 17, "height": [17, 26, 31], "covid": 17, "ipykernel_145430": [], "2223182689": [17, 19], "datafram": [17, 18, 19, 20, 21, 22, 28, 31], "covid_data": 17, "read_csv": [17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "inspect": [17, 19], "five": [17, 18, 19, 21], "iso_cod": 17, "contin": 17, "total_cas": 17, "new_cas": 17, "new_cases_smooth": 17, "total_death": 17, "new_death": 17, "new_deaths_smooth": 17, "female_smok": 17, "male_smok": 17, "handwashing_facil": 17, "hospital_beds_per_thousand": 17, "life_expect": 17, "human_development_index": 17, "excess_mortality_cumulative_absolut": 17, "excess_mortality_cumul": 17, "excess_mort": 17, "excess_mortality_cumulative_per_million": 17, "afg": 17, "asia": 17, "afghanistan": 17, "02": [17, 21, 31], "2020": [17, 21, 22, 
28], "nan": [17, 20, 21, 22], "746": 17, "511": 17, "tail": [17, 19, 26], "5813": 17, "nga": 17, "africa": 17, "nigeria": 17, "2022": 17, "265741": 17, "236": 17, "286": 17, "3155": 17, "949": 17, "539": 17, "5814": 17, "07": [17, 18], "5815": 17, "08": [17, 19, 22], "265816": 17, "5816": 17, "09": [9, 17], "5817": 17, "info": [17, 19], "rangeindex": [17, 19], "5818": 17, "dtype": [17, 19, 20, 21, 22, 28, 31], "int64": [17, 19, 20, 21], "5788": 17, "float64": [17, 19, 20, 22, 31], "5638": 17, "5627": 17, "5596": 17, "total_cases_per_million": 17, "new_cases_per_million": 17, "new_cases_smoothed_per_million": 17, "total_deaths_per_million": 17, "new_deaths_per_million": 17, "new_deaths_smoothed_per_million": 17, "reproduction_r": 17, "5566": 17, "icu_pati": 17, "2610": 17, "icu_patients_per_million": 17, "hosp_pati": 17, "hosp_patients_per_million": 17, "weekly_icu_admiss": 17, "weekly_icu_admissions_per_million": 17, "weekly_hosp_admiss": 17, "934": 17, "weekly_hosp_admissions_per_million": 17, "total_test": 17, "3174": 17, "new_test": 17, "2948": 17, "total_tests_per_thousand": 17, "new_tests_per_thousand": 17, "new_tests_smooth": 17, "4114": 17, "new_tests_smoothed_per_thousand": 17, "positive_r": 17, "3440": 17, "tests_per_cas": 17, "tests_unit": 17, "4156": 17, "total_vaccin": 17, "2104": 17, "people_vaccin": 17, "2051": 17, "people_fully_vaccin": 17, "2004": 17, "total_boost": 17, "1170": 17, "new_vaccin": 17, "1827": 17, "new_vaccinations_smooth": 17, "3658": 17, "total_vaccinations_per_hundr": 17, "people_vaccinated_per_hundr": 17, "people_fully_vaccinated_per_hundr": 17, "total_boosters_per_hundr": 17, "new_vaccinations_smoothed_per_million": 17, "new_people_vaccinated_smooth": 17, "new_people_vaccinated_smoothed_per_hundr": 17, "stringency_index": 17, "5699": 17, "population_dens": 17, "median_ag": 17, "aged_65_old": 17, "aged_70_old": 17, "gdp_per_capita": 17, "extreme_poverti": 17, "2922": 17, "cardiovasc_death_r": 17, "diabetes_preval": 17, "4860": 17, 
"1913": 17, "4863": 17, "421": 17, "mb": 17, "covid_datanew": 17, "bar": [17, 18, 22, 25, 26, 27, 28, 30], "newcase_mean": 17, "8814": 17, "365761430045": 17, "middl": [17, 19, 26], "sort": [17, 25], "newcase_median": 17, "261": 17, "moderesult": 17, "modal": [17, 26], "thu": [17, 19], "newcase_mod": 17, "805": 17, "\u03c3\u00b2": [17, 21], "newcase_vari": 17, "451321915": 17, "9280954": 17, "451399502": 17, "6421969": 17, "ddof": [17, 19], "newcase_stdev": 17, "stdev": [17, 19], "21246": 17, "164421895": 17, "freedom": [17, 28], "unbias": [17, 18], "mle": 17, "stackoverflow": 17, "62938495": 17, "stand": [17, 28], "alon": 17, "mislead": [17, 22, 24], "covid_newcases_max": 17, "covid_newcases_min": 17, "287149": 17, "iqr": [17, 25, 26], "sever": [17, 19, 20, 31], "fall": [17, 19, 26], "q1": [17, 19, 26], "q3": [17, 19, 26], "parametr": [17, 28], "segment": 17, "sale": 17, "depict": [17, 26], "quantil": [17, 19], "25th": [17, 19], "percentil": [17, 19], "75th": [17, 19], "3666": 17, "3642": 17, "nehalbirla": 17, "vehicl": 17, "cardekho": 17, "quantinsti": 17, "experfi": 17, "clt": 18, "sim": 18, "unknown": 18, "observ": [18, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "homogen": [18, 19, 28], "subgroup": 18, "proport": [18, 19, 22, 26, 28, 31], "strata": 18, "stratum": 18, "sklearn": [18, 19, 20, 21, 22, 28, 30, 31], "model_select": [18, 19, 21, 28, 30, 31], "train_test_split": [18, 19, 21, 28, 30, 31], "train_set": 18, "test_set": 18, "test_siz": [18, 19, 21, 28, 30, 31], "random_st": [18, 19, 20, 21, 28, 30, 31], "pseudo": 18, "reproduc": 18, "softwar": 18, "talk": 18, "intern": 18, "imbalanc": [18, 19], "stratifiedshufflesplit": 18, "n_split": 18, "train_index": 18, "test_index": 18, "stratum_column": 18, "strat_train_set": 18, "loc": [18, 26, 30], "strat_test_set": 18, "fold": [18, 19], "kfold": 18, "cross_val_scor": [18, 19], "ensembl": [18, 19, 29], "randomforestclassifi": [18, 19], "kf": 18, "df_featur": 18, "df_target": 18, "cv": [18, 19], "stratifiedkfold": 
18, "skf": 18, "x_train": [18, 19, 21, 28, 30, 31], "x_test": [18, 19, 21, 28, 30, 31], "y_train": [18, 19, 21, 28, 30, 31], "y_test": [18, 19, 21, 28, 30, 31], "subject": 18, "suit": [18, 30], "download": [18, 19], "wine": [18, 24], "100daysofml_notebook": [18, 21, 22], "accord": [18, 19, 28], "wine_data": [18, 19, 24, 25, 26, 27], "winequ": 18, "standardscal": [18, 19, 21, 28, 31], "labelencod": [18, 19, 22, 28], "fillna": [18, 19, 20, 21, 31], "inplac": [18, 19, 20, 21, 31], "categorical_column": [18, 19], "fit_transform": [18, 19, 20, 21, 22, 28, 31], "scaler": [18, 19, 21, 31], "wine_data_sc": [18, 19], "drop": [18, 19, 22, 28, 31], "accuracy_scor": [18, 19, 28], "confusion_matrix": [18, 19], "recal": [18, 19, 21, 22], "f1": [18, 19], "classification_report": [18, 19], "roc_curv": 18, "auc": [18, 19], "predict_proba": 18, "fpr": 18, "tpr": 18, "threshold": [18, 28], "roc_auc": 18, "darkorang": 18, "lw": 18, "navi": 18, "receiv": 18, "outlin": 18, "confidenti": 18, "conduct": [18, 19, 24, 26, 28, 31], "befor": [18, 20, 21, 22, 24, 27, 28], "unseen": [18, 19, 28, 31], "generaliz": 18, "leak": [18, 31], "vigil": 18, "augment": 18, "datasciencewizard": 18, "49a959c95fa1": 18, "8ef4e3a97562": 18, "analyticsvidhya": [18, 20, 21, 22, 25, 28], "2021": [18, 20, 25], "jfrog": 18, "ipykernel_145464": [], "wine_qu": [19, 24, 25, 26, 27], "acid": [19, 26], "volatil": 19, "citric": 19, "residu": [19, 25, 26, 30], "sugar": [19, 25, 26], "chlorid": 19, "sulfur": [19, 26], "dioxid": [19, 26], "ph": [19, 25, 26], "sulphat": 19, "alcohol": [19, 24, 25, 26], "076": 19, "9978": 19, "098": 19, "9968": 19, "04": [19, 21], "092": 19, "9970": 19, "075": 19, "9980": 19, "1138": 19, "510": 19, "99574": 19, "1592": 19, "1139": 19, "620": 19, "068": 19, "99651": 19, "1593": 19, "1140": 19, "600": 19, "090": 19, "99490": 19, "1594": 19, "1141": 19, "550": 19, "062": 19, "99512": 19, "1595": 19, "1142": 19, "645": 19, "99547": 19, "1597": 19, "1143": 19, "116": 19, "kb": 19, "copi": [19, 
20, 21], "wine_datanew": 19, "winequality_mean": 19, "657": 19, "winequality_median": 19, "winequality_var": 19, "6488": 19, "extent": 19, "somewhat": 19, "heterogen": 19, "alongsid": 19, "holist": 19, "winequality_stdev": 19, "8058": 19, "tend": [19, 26], "wider": 19, "typic": [19, 25], "pronounc": 19, "pictur": 19, "winequality_max": 19, "winequality_min": 19, "maximum": [19, 21, 26], "minimum": [19, 21, 26], "highest": [19, 30], "lowest": [19, 30], "presenc": [19, 21, 22, 25, 26], "exploratori": [19, 25, 26, 28, 32], "reveal": 19, "factor": [19, 27, 28, 31], "upper": [19, 26, 30], "third": [19, 26], "closer": [19, 30, 31], "half": 19, "narrow": [19, 26], "higher": [19, 28, 31], "sn": [19, 21, 22, 24, 25, 26, 27, 31], "correlation_matrix": [19, 24], "corr": [19, 21, 24, 27], "annot": [19, 24, 27], "cmap": [19, 24, 27], "coolwarm": 19, "attribut": [19, 28], "decreas": 19, "6731": 19, "6815": 19, "6852": 19, "4074": 19, "5442": 19, "4947": 19, "5463": 19, "2577": 19, "4849": 19, "chemic": 19, "properti": [19, 28], "trust": 19, "On": [19, 30], "unabl": 19, "nbviewer": 19, "nbsp": 19, "randomforestclassifierifittedrandomforestclassifi": 19, "9782": 19, "strong": [19, 24, 27], "significantli": [19, 20, 22, 26, 27, 28], "outnumb": 19, "tell": [19, 30], "categorical_featur": 19, "x_train_scal": [19, 31], "x_test_scal": [19, 31], "diagon": 19, "No": [19, 20, 22], "misclassif": 19, "misclassifi": 19, "failur": 19, "imbal": 19, "zero_divis": 19, "229": 19, "macro": 19, "avg": 19, "breakdown": 19, "identif": 19, "poor": 19, "were": 19, "resampl": 19, "underrepres": 19, "cross_val_scores_round": 19, "9825": 19, "9737": 19, "9345": 19, "9476": 19, "9605": 19, "9649": 19, "slight": 19, "fairli": 19, "stabl": [19, 31], "overli": [19, 30], "advis": 19, "intermedi": [20, 21, 22, 24, 25], "mar": 20, "missing": 20, "unobserv": 20, "titanic_data": [20, 21, 22], "isnul": [20, 21, 31], "passengerid": [20, 21, 22], "pclass": [20, 21], "sex": [20, 21, 22, 31], "892": [20, 21, 22], 
"kelli": [20, 21, 22], "mr": [20, 21, 22], "jame": [20, 21, 22], "male": [20, 21, 22], "893": [20, 21, 22], "wilk": [20, 21, 22, 28], "ellen": [20, 21, 22], "femal": [20, 21, 22], "894": [20, 21, 22], "myle": [20, 21, 22], "thoma": [20, 21, 22], "franci": [20, 21, 22], "wirz": [20, 21, 22], "albert": [20, 21, 22], "896": [20, 21, 22], "hirvonen": [20, 21, 22], "alexand": [20, 21, 22], "helga": [20, 21, 22], "lindqvist": [20, 21, 22], "sibsp": [20, 21, 22], "parch": [20, 21, 22], "ticket": [20, 21, 22], "fare": [20, 21, 22], "cabin": [20, 21], "surviv": [20, 21, 22], "330911": [20, 21, 22], "8292": [20, 21, 22], "363272": [20, 21, 22], "0000": [20, 21, 22], "240276": [20, 21, 22], "6875": [20, 21, 22], "315154": [20, 21, 22], "6625": [20, 21, 22], "3101298": [20, 21, 22], "2875": [20, 21, 22], "327": [20, 21], "ipykernel_145506": [], "245541981": 20, "unduli": 20, "preserv": [20, 21, 22], "embarked_mod": 20, "retain": 20, "distort": [20, 31], "unaffect": 20, "conclus": [20, 24, 26], "684399944": 20, "futurewarn": [20, 21], "col": [20, 21, 22], "knnimput": 20, "n_neighbor": 20, "numeric_column": 20, "select_dtyp": [20, 22], "closest": 20, "exhibit": [20, 30], "captur": [20, 28], "smooth": [20, 26], "inaccur": 20, "expens": 20, "predictor": [20, 27, 30, 31], "poorli": 20, "sophist": [20, 28], "intertwin": 20, "experiment": [20, 28], "enable_iterative_imput": 20, "iterativeimput": 20, "linear_model": [20, 30, 31], "bayesianridg": 20, "iterative_imput": 20, "missing_valu": 20, "max_it": 20, "titanic_data_imput": 20, "bayesian": 20, "incorpor": 20, "prior": 20, "belief": 20, "uncertainti": [20, 28], "posterior": 20, "robin": 20, "fashion": 20, "gaug": 20, "frequenc": [20, 22, 24, 25, 26, 28], "titanic_data_origin": 20, "dropna": 20, "hasn": 20, "alter": [20, 21], "lookout": 20, "unusu": [20, 24, 26], "spike": 20, "weren": 20, "robject": 20, "importr": 20, "pandas2ri": 20, "globalenv": 20, "choosecranmirror": 20, "ind": 20, "magic": 20, "load_ext": 20, "ipython": 20, 
"install_packag": 20, "remot": 20, "install_github": 20, "njtiernei": 20, "naniar": 20, "r_df": 20, "mcar_test": 20, "consult": 20, "simplilearn": [20, 21], "theanalysisfactor": 20, "seven": 20, "dataaspir": 20, "\u03c3z": 21, "xx": 21, "\u03bc\u03bc": 21, "\u03c3\u03c3": 21, "center": [21, 24, 28], "pro": 21, "con": 21, "bound": [21, 28], "rescal": 21, "xnorm": 21, "xmin": 21, "xmax": 21, "xminxmin": 21, "xmaxxmax": 21, "overpow": 21, "knn": 21, "minmaxscal": 21, "load_iri": 21, "iris_data": [21, 28], "feature_nam": [21, 25], "iris_standard": 21, "min_max_scal": 21, "iris_min_max_sc": 21, "inter": 21, "comprehend": 21, "readi": 21, "iloc": [21, 26], "minmaxscalermin_max_scal": 21, "sepallengthcm": [21, 28], "subplot": [21, 22, 26, 30, 31], "histplot": [21, 26], "kde": [21, 26], "accordingli": 21, "sepalwidthcm": 21, "sepal": [21, 28], "snoop": 21, "petallengthcm": [21, 28], "petalwidthcm": [21, 28], "speci": [21, 28], "setosa": [21, 28], "ipykernel_145532": [], "2131166956": 21, "dancerworld60": 21, "4bb910900ab7": 21, "awar": [21, 24, 28, 31], "e44df654f185": 21, "nsummari": 21, "nmiss": 21, "418": [21, 22], "000000": [21, 22, 28], "332": 21, "1100": [21, 30], "500000": 21, "265550": [21, 22], "272590": 21, "447368": 21, "392344": 21, "120": 21, "810458": 21, "841838": [21, 22], "181209": 21, "896760": 21, "981429": 21, "170000": 21, "996": 21, "250000": 21, "1204": 21, "750000": 21, "1309": 21, "417": 21, "627188": 21, "385167": 21, "907576": 21, "487218": 21, "895800": 21, "454200": 21, "512": 21, "329200": 21, "1279951594": 21, "x_train_standard": 21, "x_test_standard": 21, "x_train_min_max": 21, "x_test_min_max": 21, "tight_layout": [21, 22, 26, 30, 31], "scalingprint": 21, "nstatist": [21, 22], "334": 21, "262": 21, "333": 21, "269461": 21, "115763": 21, "470060": 21, "404192": 21, "909135": 21, "844961": 21, "655775": 21, "944719": 21, "937113": 21, "054690": 21, "330000": 21, "887500": 21, "340000e": 21, "620000e": 21, "330000e": 21, "233742e": 21, 
"711995e": 21, "127373e": 21, "722904e": 21, "267524e": 21, "001500e": 21, "001914e": 21, "001505e": 21, "504644e": 21, "036246e": 21, "983123e": 21, "319630e": 21, "367217e": 21, "231816e": 21, "006539e": 21, "658800e": 21, "130032e": 21, "873714e": 21, "073537e": 21, "617915e": 21, "606225e": 21, "136788e": 21, "982518e": 21, "186412e": 21, "201500e": 21, "634731": 21, "393627": 21, "058757": 21, "044910": 21, "072042": 21, "422481": 21, "193680": 21, "118090": 21, "104124": 21, "113315": 21, "273160": 21, "015395": 21, "352451": 21, "028213": 21, "511035": 21, "125000": 21, "063436": 21, "alexisbcook": 21, "primarili": 22, "intrins": 22, "gender": 22, "rank": 22, "school": 22, "bachelor": 22, "satisfact": 22, "unsatisfi": 22, "neutral": 22, "pose": 22, "cherbourg": 22, "queenstown": 22, "southampton": 22, "3rd": 22, "c85": 22, "c123": 22, "e46": 22, "curs": [22, 28], "elimin": [22, 28], "treat": 22, "linearli": 22, "spars": 22, "category_encod": 22, "ce": 22, "binaryencod": 22, "titanic_binary_encod": 22, "onehotencod": 22, "titanic_one_hot_encod": 22, "titanic_one_hot_encoded_df": 22, "toarrai": 22, "get_feature_names_out": 22, "pclass_encod": 22, "hierarchi": 22, "leakag": 22, "dummi": 22, "trap": 22, "multicollinear": [22, 27, 31], "mind": [22, 24, 30], "fictiti": 22, "pairwis": [22, 24, 25], "mostli": 22, "preval": 22, "1s": 22, "mix": 22, "passeng": 22, "sink": 22, "ipykernel_145572": [], "3916798240": 22, "modulenotfounderror": 22, "modul": [22, 32], "ndata": 22, "nuniqu": 22, "363": 22, "nbinari": 22, "value_count": 22, "nameerror": [22, 24], "embarked_c": 22, "embarked_q": 22, "embarked_": 22, "nlabel": 22, "b57": 22, "b59": 22, "b63": 22, "b66": 22, "freq": 22, "270": 22, "244019": 22, "110048": 22, "645933": 22, "430019": 22, "313324": 22, "478803": 22, "aiskunk": 22, "d6296697a40f": 22, "547707acf4e5": 22, "305f3361fd02": 22, "uncov": 24, "trend": [24, 25, 32], "draw": [24, 26, 30], "adopt": 24, "ethic": [24, 32], "ipykernel_145606": [], "955872667": 
[24, 25], "spot": 24, "mistak": 24, "erron": 24, "summari": [24, 25, 30], "ts": [24, 25, 27], "wise": [24, 26, 31], "preliminari": 24, "carefulli": 24, "overplot": 24, "violinplot": [24, 25], "diverg": 24, "scheme": 24, "hard": 24, "vmin": 24, "vmax": 24, "diverging_palett": 24, "220": 24, "200": 24, "set_xticklabel": 24, "get_xticklabel": 24, "horizontalalign": 24, "657042869641295": 24, "6493527188260838": 24, "8058242481000952": 24, "asymmetri": [24, 26], "tailed": 24, "2867917004538591": 24, "3146639385893346": 24, "nearli": 24, "enough": 24, "claim": 24, "hypothes": [24, 25, 27], "ii": 24, "popmean": 24, "811761283140333": 24, "0619222323076622e": 24, "compel": 24, "manner": 24, "coincid": 24, "spuriou": 24, "briefli": [24, 26], "main": 24, "seller": 24, "appendix": [24, 26], "visualis": 24, "8151e63ce8f0": 24, "boadziedaniel": 24, "890dc0e79799": 24, "datasciencedojo": 24, "ipykernel_145665": [], "heavili": 25, "mean_valu": 25, "median_valu": 25, "mode_valu": 25, "oversimplifi": 25, "realiti": [25, 30], "complic": 25, "stori": 25, "symmetri": [25, 26], "interquartil": [25, 26], "whisker": [25, 26], "brief": 25, "clariti": 25, "sure": 25, "narr": 25, "meaningless": 25, "analysis_result": 25, "variance_valu": 25, "std_dev_valu": 25, "nstat": 25, "stat_nam": 25, "stat_valu": 25, "442111402741325": 25, "1711473380358497": 25, "0821956098764445": 25, "3110148731408575": 25, "02454362762448039": 25, "15666405977275194": 25, "5321522309711284": 25, "8385121764551762": 25, "3559174666826799": 25, "market": 25, "hcbravo": 25, "introdatasci": 25, "bookdown": 25, "econometricstutor": 25, "expand": 26, "deepli": 26, "chart": 26, "symmetr": 26, "evenli": 26, "longer": 26, "peak": 26, "unimod": 26, "bimod": 26, "multimod": 26, "spiki": 26, "hide": 26, "value1": 26, "value2": 26, "valuen": 26, "skyblu": 26, "freedman": 26, "diaconi": 26, "disregard": 26, "quartil": 26, "span": 26, "q2": 26, "side": [26, 31], "reli": [26, 28, 30], "descriptive_stat": 26, "methodolog": 26, 
"plotli": 26, "machinelearningplu": 26, "oreilli": 26, "9781491912126": 26, "ch04": 26, "interconnected": 27, "strength": 27, "direct": 27, "wherea": 27, "monoton": 27, "rho": 27, "d_i": 27, "r_": 27, "rg": 27, "rg_x": 27, "rg_y": 27, "pinpoint": 27, "pearson_corr": 27, "spearman_corr": 27, "cm": 27, "causat": 27, "meet": [27, 28], "corr_matrix": 27, "surpris": 27, "thereof": 27, "deliver": 27, "stage": [27, 30], "thoughtfulli": 27, "geo": 27, "fu": 27, "berlin": 27, "de": 27, "soga": 27, "inferenti": 27, "sound": 28, "heart": 28, "elev": 28, "summat": 28, "unpredict": 28, "ss": 28, "aa": 28, "randomli": 28, "incorrectli": 28, "faster": [28, 31], "intens": 28, "jump": 28, "150": 28, "virginica": 28, "versicolor": 28, "petal": 28, "disord": 28, "decid": 28, "criterion": 28, "puriti": 28, "decisiontreeclassifi": 28, "clf_entropi": 28, "y_pred_entropi": 28, "clf_gini": 28, "y_pred_gini": 28, "importances_entropi": 28, "feature_importances_": 28, "importances_gini": 28, "9777777777777777": 28, "agre": 28, "worth": 28, "redund": 28, "tweak": 28, "prune": 28, "joint": 28, "properli": 28, "tricki": 28, "invari": 28, "suffer": 28, "causal": [28, 30], "misinterpret": 28, "feature_select": 28, "mutual_info_classif": 28, "x_normal": 28, "mi": 28, "08486414": 28, "49537028": 28, "24562179": 28, "9858617": 28, "99351315": 28, "df1": 28, "df2": 28, "shapiro": 28, "leven": 28, "bartlett": 28, "hoc": 28, "factori": 28, "selectkbest": 28, "f_classif": 28, "k_best_featur": 28, "score_func": 28, "pvalues_": 28, "scores_": 28, "6f": 28, "588": 28, "235294": 28, "119": 28, "264502": 28, "364461": 28, "1179": 28, "034328": 28, "959": 28, "324406": 28, "systemat": 28, "forward": 28, "justifi": 28, "statsmodel": 28, "api": 28, "sm": 28, "label_encod": 28, "forward_select": 28, "significance_level": 28, "initial_featur": 28, "tolist": 28, "best_featur": 28, "remaining_featur": 28, "new_pval": 28, "new_column": 28, "ol": 28, "add_const": 28, "pvalu": 28, "min_p_valu": 28, "idxmin": 28, 
"selected_featur": 28, "pure": 28, "accuracy_entropi": 28, "accuracy_gini": 28, "deem": 28, "argsort": 28, "barh": 28, "ytick": 28, "features_to_keep_entropi": 28, "features_to_keep_gini": 28, "refin": 28, "technic": 28, "realm": [28, 30], "clf_entropy_deep": 28, "max_depth": 28, "y_pred_entropy_deep": 28, "clf_gini_deep": 28, "y_pred_gini_deep": 28, "victorzh": 28, "mlearn": 28, "82c2123bd548": 28, "codex": 28, "cd9f99a26e0d": 28, "advanc": [29, 30, 32], "pip": [30, 31], "cornerston": 30, "importantli": 30, "contrast": 30, "counterpart": 30, "upcom": 30, "reserv": 30, "entail": 30, "establish": 30, "slope": 30, "indpend": 30, "hat": 30, "beta": 30, "_1": 30, "_0": 30, "isol": 30, "still": 30, "consequ": 30, "foot": 30, "_i": 30, "2_i": 30, "wors": 30, "linearregress": [30, 31], "intercept_": 30, "coef_": [30, 31], "marker": 30, "o": 30, "vline": 30, "ymin": 30, "ymax": 30, "nsse": 30, "fontsiz": 30, "bbox": 30, "dict": 30, "facecolor": 30, "yellow": 30, "inferior": 30, "inferior_slop": 30, "inferior_intercept": 30, "inferior_predict": 30, "inferior_ss": 30, "purpl": 30, "shown": 30, "scatterplot": 30, "yet": 30, "dimenion": 30, "clinic": 30, "subspac": 30, "ambient": 30, "human": 30, "meaningfulli": 30, "teach": 30, "bend": 30, "cancel": 30, "penal": 30, "2r": 30, "farther": 30, "pm": 30, "thank": 30, "strictli": [30, 31], "inclin": 30, "mine": 30, "static": 30, "anim": 30, "confabul": [30, 31], "against": 30, "publicli": 30, "toi": 30, "housing_data": 30, "squarefeet": 30, "bedroom": 30, "bathroom": 30, "850": 30, "200000": 30, "suburban": 30, "900": 30, "205000": 30, "urban": 30, "1200": 30, "210000": 30, "rural": 30, "950": 30, "215000": 30, "220000": 30, "ipykernel_145702": [], "737031205": 30, "aim": 30, "wasn": 30, "memor": 30, "2d": 30, "suffici": 30, "footag": 30, "sq": 30, "ft": 30, "107": 30, "6641786": 30, "103044": 30, "81439951799": 30, "datapoint": 30, "\u03b20": [], "\u03b21x1": [], "\u03b22x2": [], "\u03b2nxny": [], "\u03b21": [], "\u03b22": [], 
"\u03b2n": [], "estat": [], "l1": [], "environment": 31, "symptom": [], "scientiast": 32, "week": 32, "supervis": 32, "unsupervis": 32, "reduct": 32, "capston": 32, "project": 32, "join": 32, "invit": 32, "v4dsssc5": 32, "028972567226124957": [], "380253": [], "108": [], "110": [], "ipykernel_148464": [], "ipykernel_148499": [], "ipykernel_148533": [], "ipykernel_148570": [], "ipykernel_148597": [], "ipykernel_148635": [], "ipykernel_148671": [], "ipykernel_148721": [], "ipykernel_148756": [], "unlabel": 30, "y_intercept": 30, "ipykernel_150564": [], "5113710410031654": [], "647975": [], "145": [], "111": [], "165": [], "115": [], "137": [], "144": [], "121": 12, "146": [], "143": [], "179": [], "ipykernel_208140": [], "ipykernel_208178": [], "ipykernel_208211": [], "ipykernel_208253": [], "ipykernel_208280": [], "ipykernel_208323": [], "ipykernel_208363": [], "ipykernel_208425": [], "ipykernel_208460": [], "x_n": 31, "practition": 31, "beta_0": 31, "beta_1x_1": 31, "beta_2x_2": 31, "beta_nx_n": 31, "beta_1": 31, "beta_2": 31, "beta_n": 31, "hold": 31, "homoscedast": 31, "inflat": 31, "vif": 31, "peek": 31, "hope": 31, "achiev": 31, "incom": 31, "spending_scor": 31, "hopefulli": 31, "ye": 31, "customer_data2": 31, "x_var": 31, "y_var": 31, "reg": 31, "gap": [], "load_csv": [], "illustr": [], "mpl_toolkit": [], "mplot3d": [], "axes3d": [], "rand": [], "fig": 31, "add_subplot": [], "set_xlabel": [], "set_ylabel": [], "set_zlabel": [], "real_est": [], "mean_squared_error": 31, "r2_score": 31, "r2": 31, "reader": [], "154": [], "54000": [], "rows2": [], "age_coeff": [], "income_coeff": [], "14400000000": [], "30000": [], "120000": [], "15000": [], "1625": [], "36562500000000003": [], "015625": [], "4625000000000001": [], "990625": [], "rows3": [], "051576000000004": [], "62000": [], "942021555555556": [], "wb": [], "writer": [], "stdin": [], "listcomp": [], "attributeerror": [], "_csv": [], "writerow": [], "byte": [], "newlin": [], "6508227309087278": 9, "276254": 9, 
"132": 12, "109": 12, "ipykernel_237581": 15, "ipykernel_237615": 17, "ipykernel_237648": 19, "ipykernel_237687": 20, "ipykernel_237713": 21, "ipykernel_237751": 22, "ipykernel_237786": 24, "ipykernel_237837": 25, "ipykernel_237871": 30, "suptitl": 31, "versu": 31, "spend": 31, "eventu": 31, "customer_data": 31, "rare": 31, "x_test_scaled_df": 31, "set_titl": 31, "explanatori": 31, "disproportion": 31, "penalti": 31, "undesir": 31, "punish": 31, "732": 31, "3551245668029": 31, "027105564211052702": 31, "24544393": 31, "72516579": 31, "put": 31, "predict_original_scale_datafram": 31, "input_df": 31, "input_sc": 31, "50000": 31, "crunch": 31, "57488877753046": 31, "diabet": 31, "toy_dataset": 31, "abl": 31, "load_diabet": 31, "as_fram": 31, "bmi": 31, "bp": 31, "s1": 31, "s2": 31, "s3": 31, "s4": 31, "s5": 31, "s6": 31, "038076": 31, "050680": 31, "061696": 31, "021872": 31, "044223": 31, "034821": 31, "043401": 31, "002592": 31, "019907": 31, "017646": 31, "001882": 31, "044642": 31, "051474": 31, "026328": 31, "008449": 31, "019163": 31, "074412": 31, "039493": 31, "068332": 31, "092204": 31, "085299": 31, "044451": 31, "005670": 31, "045599": 31, "034194": 31, "032356": 31, "002861": 31, "025930": 31, "089063": 31, "011595": 31, "036656": 31, "012191": 31, "024991": 31, "036038": 31, "034309": 31, "022688": 31, "009362": 31, "005383": 31, "036385": 31, "003935": 31, "015596": 31, "008142": 31, "031988": 31, "046641": 31, "151": 31, "206": 31, "135": 31, "fun": 31, "statolog": 31}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"100": [0, 2, 32], "dai": [0, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "machin": [0, 1, 2, 11, 14, 32], "learn": [0, 1, 2, 11, 14, 29, 30, 32], "challeng": [0, 1, 8, 32], "overview": [0, 2, 17, 22, 30, 32], "cours": [0, 4, 10, 16, 23, 29, 32], "structur": [0, 2, 4, 7, 8, 9, 10, 16, 23, 29, 32], "modul": [0, 1, 2, 4, 9, 10, 16, 23, 29], "1": [0, 1, 2, 4, 5, 7, 9, 10, 11, 13, 
15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28], "introduct": [0, 1, 2, 4, 10, 11, 12, 13, 14, 15, 17, 21, 22, 24, 25, 28, 30, 31], "python": [0, 1, 2, 4, 5, 6, 8, 10, 11, 12, 13, 14, 15, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "basic": [0, 1, 2, 4, 5, 7, 9, 10, 11, 12, 13, 15, 17, 20, 30], "mathemat": [0, 1, 2, 4, 10, 13, 14, 15, 18, 21, 22, 27, 30], "week": [0, 1, 2, 4, 9, 10, 16, 23, 29], "2": [0, 1, 2, 4, 6, 7, 10, 11, 13, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28], "data": [0, 1, 2, 6, 7, 11, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 30], "preprocess": [0, 1, 2, 16, 17, 18, 21, 23, 31], "exploratori": [0, 1, 2, 16, 23, 24], "analysi": [0, 1, 2, 16, 19, 21, 22, 23, 24, 25, 26, 27, 28, 30], "3": [0, 1, 2, 7, 11, 13, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29], "4": [0, 1, 2, 8, 11, 13, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28], "supervis": [0, 1, 2, 29, 30], "regress": [0, 1, 2, 20, 28, 29, 30, 31], "classif": [0, 1, 2, 19, 29], "5": [0, 1, 2, 9, 11, 13, 18, 19, 20, 21, 22, 24, 29], "6": [0, 1, 2, 11, 19, 20, 21, 24, 29], "unsupervis": [0, 1, 2, 30], "dimension": [0, 1, 2], "reduct": [0, 1, 2], "7": [0, 1, 2, 12, 19, 21], "9": [0, 1, 2, 14], "deep": [0, 1, 2, 22, 25], "foundat": [0, 1, 21, 30], "10": [0, 1, 2, 15], "12": [0, 1, 2, 18, 19], "advanc": [0, 1, 2, 11, 18, 20, 24, 26, 28], "current": [0, 1, 2], "trend": [0, 1, 2], "13": [0, 1, 2, 20], "14": [0, 1, 2, 21], "practic": [0, 1, 6, 13, 18, 20, 21, 22, 24, 25, 26, 27, 28], "aspect": [0, 1], "15": [0, 1, 2, 22], "17": [0, 1, 2, 25], "8": [0, 1, 2, 13, 19, 21], "appli": [0, 1, 2, 13, 21, 24], "ai": [0, 1, 2, 9], "ethic": [0, 1, 2], "consider": [0, 1, 18, 20, 21, 22], "18": [0, 1, 2, 26], "19": [0, 1, 2, 27], "capston": [0, 1, 2], "project": [0, 1, 2, 5, 6, 7, 8, 9, 11], "20": [0, 1, 2, 28], "21": [0, 1, 2, 30], "join": 0, "our": 0, "commun": 0, "social": [0, 32], "media": [0, 32], "contact": [0, 9, 32], "daili": [1, 2, 8], "curriculum": [1, 2], "numer": [1, 2, 4, 17], 
"oper": [1, 2, 4, 6, 11, 12], "concept": [1, 2, 10, 13, 14, 15, 28, 30, 31], "eda": [1, 2, 23, 24, 25], "ensembl": [1, 2], "method": [1, 2, 20, 28, 30], "neural": [1, 2], "network": [1, 2], "11": [1, 2, 17], "convolut": [1, 2], "cnn": [1, 2], "recurr": [1, 2], "rnn": [1, 2], "reinforc": [1, 2], "topic": [1, 2, 11], "mlop": [1, 2], "16": [1, 2, 24], "etl": [1, 2], "process": [1, 2], "transform": [1, 2], "industri": [1, 2], "sector": [1, 2], "applic": [1, 2, 9, 11, 13, 14], "cybersecur": [1, 2], "resourc": [2, 5, 6, 7, 8, 11, 13, 15, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 31], "jupyt": 2, "notebook": 2, "lesson": [2, 8], "syntax": [2, 5, 9], "variabl": [2, 5, 13, 20, 25], "type": [2, 6, 7, 17, 20, 21, 22], "control": [2, 7, 8], "loop": [2, 7], "condit": [2, 8], "statement": [2, 7, 8, 9], "function": [2, 9, 13], "linear": [2, 11, 12, 30, 31], "algebra": [2, 11, 12], "vector": [2, 11], "matric": [2, 12], "matrix": [2, 12, 19, 27], "calculu": [2, 13, 14], "deriv": [2, 13], "integr": [2, 14, 20], "fundament": [2, 14], "theorem": [2, 14, 24], "probabl": [2, 15], "statist": [2, 15, 17, 19, 20, 21, 22, 24, 26], "relev": [2, 15], "distribut": [2, 15, 24, 26], "handl": [2, 20], "miss": [2, 20], "normal": [2, 21], "scale": [2, 17, 21], "us": [2, 13, 14, 17, 20, 21, 27, 28, 30], "encod": [2, 22], "categor": [2, 22], "split": [2, 18, 19, 20, 21, 30], "train": [2, 18, 20, 21, 30], "test": [2, 9, 18, 20, 21, 24, 28, 30], "set": [2, 5, 20, 21], "visual": [2, 11, 20, 21, 22, 24, 25, 27, 30], "implement": [2, 11, 13, 14, 15, 20, 21, 22, 26, 28, 30, 31], "descript": [2, 13, 15, 24, 26], "techniqu": [2, 18, 19, 20, 21, 22, 24, 25, 28], "correl": [2, 19, 27], "featur": [2, 22, 28], "select": [2, 28], "import": [2, 9, 11, 13, 15, 17, 21, 28, 30], "22": [2, 31], "multipl": [2, 11, 12, 31], "23": 2, "polynomi": 2, "lasso": 2, "ridg": 2, "24": 2, "model": [2, 18, 19, 20, 30, 31], "evalu": [2, 18, 20, 31], "metric": [2, 31], "25": 2, "address": 2, "overfit": 2, "underfit": 2, "26": 2, 
"logist": 2, "27": 2, "k": 2, "nearest": 2, "neighbor": 2, "nn": 2, "algorithm": 2, "28": 2, "support": 2, "svm": 2, "nonlinear": 2, "29": 2, "decis": [2, 28], "tree": 2, "rule": [2, 12, 13], "base": [2, 20], "30": [2, 28], "naiv": 2, "bay": 2, "classifi": 2, "31": 2, "32": 2, "bag": 2, "random": [2, 20, 28], "forest": [2, 28], "33": 2, "boost": 2, "adaboost": 2, "34": 2, "gradient": 2, "gbm": 2, "xgboost": 2, "35": 2, "Their": 2, "36": 2, "cluster": 2, "37": 2, "mean": [2, 24, 25], "differ": [2, 13, 17, 30], "38": 2, "hierarch": 2, "39": 2, "densiti": 2, "dbscan": 2, "40": 2, "gaussian": 2, "mixtur": 2, "gmm": 2, "expect": 2, "maxim": 2, "41": 2, "pca": 2, "42": 2, "43": 2, "singular": 2, "valu": [2, 9, 19, 25], "decomposit": 2, "svd": 2, "Its": 2, "44": 2, "t": 2, "sne": 2, "45": 2, "other": 2, "46": 2, "understand": [2, 7, 9, 13, 15, 17, 20, 21, 22, 26, 27, 28, 31], "perceptron": 2, "47": 2, "feedforward": 2, "activ": [2, 11, 12, 13, 17, 21, 22, 24, 25, 26, 27, 28], "48": 2, "backpropag": 2, "49": 2, "loss": 2, "optim": 2, "50": 2, "tune": 2, "perform": [2, 19, 20], "51": 2, "layer": 2, "52": 2, "pool": 2, "architectur": 2, "53": 2, "imag": 2, "54": 2, "55": 2, "transfer": 2, "56": 2, "57": 2, "long": 2, "short": 2, "term": 2, "memori": 2, "lstm": 2, "58": 2, "build": [2, 30], "sequenc": 2, "59": 2, "time": 2, "seri": 2, "60": 2, "util": 2, "natur": [2, 28], "languag": 2, "nlp": 2, "61": 2, "62": 2, "markov": 2, "63": 2, "q": 2, "64": 2, "dqn": 2, "65": 2, "polici": 2, "66": 2, "depth": [2, 18, 19, 25, 26], "67": 2, "gener": [2, 20], "adversari": 2, "gan": 2, "68": 2, "attent": 2, "mechan": 2, "69": 2, "autoencod": 2, "70": 2, "research": 2, "emerg": 2, "ml": [2, 9], "71": 2, "lifecycl": 2, "72": 2, "version": [2, 8], "experi": 2, "track": 2, "73": 2, "ci": 2, "cd": 2, "74": 2, "monitor": 2, "mainten": 2, "75": 2, "tool": 2, "platform": 2, "76": 2, "extract": 2, "77": 2, "78": 2, "load": [2, 18, 20, 21, 22], "databas": 2, "manag": 2, "79": 2, "an": 2, "pipelin": 
2, "80": 2, "technolog": 2, "81": 2, "82": 2, "self": 2, "posit": 2, "83": 2, "84": 2, "85": 2, "domain": 2, "86": 2, "bia": 2, "fair": 2, "87": 2, "privaci": 2, "secur": 2, "system": [2, 9], "88": 2, "explain": 2, "transpar": 2, "89": 2, "regul": 2, "complianc": 2, "90": 2, "make": [2, 28], "91": 2, "healthcar": 2, "92": 2, "financ": 2, "93": 2, "retail": 2, "94": 2, "manufactur": 2, "95": 2, "transport": 2, "educ": 2, "etc": 2, "96": 2, "97": 2, "identifi": 2, "threat": 2, "vulner": 2, "98": 2, "detect": 2, "prevent": 2, "99": 2, "case": 2, "studi": 2, "incid": 2, "101": 2, "plan": 2, "102": 2, "104": 2, "develop": [2, 9], "105": 2, "final": [2, 18], "present": 2, "errata": 3, "up": [5, 20], "your": [5, 7, 8, 9, 28], "environ": 5, "hand": [5, 6, 11, 17, 21, 24, 25, 26, 27], "On": [5, 6, 11, 17, 21, 24, 31], "arithmet": [5, 7, 25], "further": [5, 6, 7, 8, 11, 13, 15, 28], "more": 6, "about": 6, "logic": [6, 7], "comparison": [6, 21], "calcul": [6, 12, 13, 19, 26], "solut": [6, 7, 8, 19, 25, 26], "problem": [6, 8, 13], "why": [7, 17, 20], "collect": 7, "The": [7, 12, 13, 15, 31], "while": 7, "rang": [7, 17, 19], "object": [7, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28], "break": 7, "continu": 7, "els": 7, "claus": 7, "combin": 7, "boolean": 7, "exampl": [7, 11, 13, 17, 20, 22, 28, 30], "program": [7, 9], "prime": 7, "number": [7, 9], "checker": 7, "quiz": [7, 9], "task": [7, 24, 26], "If": 8, "thi": 8, "Then": 8, "That": 8, "otherwis": 8, "do": [8, 28], "code": [8, 11, 20, 26, 28], "block": [8, 18], "last": 8, "resort": 8, "save": 8, "word": 8, "succinct": 8, "fizzbuzz": 8, "similar": 8, "altern": 8, "temperatur": 8, "analyz": [8, 21, 30], "step": [8, 11, 12, 13, 15, 18, 20, 21, 22, 26, 28], "counter": 8, "write": 9, "first": 9, "paramet": 9, "argument": 9, "arg": 9, "return": 9, "get": 9, "new": 9, "fast": 9, "via": 9, "standard": [9, 17, 19, 21, 24], "librari": [9, 11, 13, 15, 21, 22], "highlight": 9, "everi": 9, "must": 9, "know": 9, "numpi": [9, 17], 
"mini": 9, "guess": 9, "game": 9, "prompt": 9, "simpl": [9, 30], "book": 9, "warehous": 9, "order": [9, 17], "food": 9, "shop": 9, "cash": 9, "regist": 9, "what": [11, 12, 13], "represent": 11, "repres": 11, "addit": [11, 12, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 31], "subtract": [11, 12], "scalar": 11, "One": [11, 22], "x": 11, "magnitud": 11, "direct": 11, "dot": [11, 12], "product": [11, 12, 13], "definit": [11, 30], "geometr": 11, "interpret": [11, 19, 26, 28], "properti": [11, 12], "cross": [11, 18, 19], "norm": 11, "real": [11, 13], "world": [11, 13], "comput": [11, 27], "graphic": [11, 13], "simul": 11, "2d": 11, "movement": 11, "physic": 11, "engin": 11, "scienc": [11, 15], "summari": [11, 17, 19, 21, 22], "conclud": 11, "thought": 11, "field": 11, "beginn": 11, "necessari": [11, 15, 21, 22], "creat": [11, 12, 26], "grid": 11, "defin": [11, 13], "plot": [11, 20, 24, 25, 26], "format": 11, "displai": [11, 13, 17], "master": [12, 24, 26], "core": 12, "complex": 12, "element": 12, "wise": [12, 19], "transpos": 12, "invers": 12, "flip": 12, "revers": 12, "instruct": [12, 24], "prerequisit": [13, 14, 15, 18, 20, 21, 22, 24, 25], "ar": [13, 17], "rate": 13, "chang": 13, "slope": 13, "tangent": 13, "line": [13, 30], "notat": 13, "formula": [13, 20, 28], "power": 13, "result": [13, 28], "constant": 13, "sum": 13, "quotient": 13, "A": [13, 22, 28], "view": 13, "best": [13, 18, 20, 21, 22, 24, 25, 26, 27, 28, 30], "conclus": [13, 15, 19, 25], "expand": [15, 22], "uncertainti": 15, "inferenti": [15, 24], "goal": 17, "workflow": 17, "setup": 17, "In": [17, 18, 19, 25, 26], "abov": [17, 30], "we": 17, "column": 17, "mode": [17, 24, 25], "could": 17, "you": 17, "non": 17, "would": 17, "varianc": [17, 19, 24], "deviat": [17, 19, 24], "between": [17, 30], "panda": 17, "quartil": [17, 19], "interquartil": [17, 19], "explor": [18, 19, 20, 21, 28], "valid": [18, 19], "theoret": [18, 30], "background": 18, "principl": [18, 27], "stratifi": 18, "roll": 18, "homework": [18, 
19, 20, 24, 25, 26, 27], "assign": [18, 19, 20, 24, 25, 26, 27], "access": 18, "dataset": [18, 19, 20, 21, 22, 26, 27, 28, 30], "note": 18, "leakag": [18, 20, 21], "qualiti": [19, 25, 26, 27], "wine": [19, 25, 26, 27], "iqr": 19, "notabl": 19, "accuraci": [19, 28], "review": 19, "follow": 19, "overal": 19, "observ": 19, "report": [19, 24, 25, 26], "class": 19, "score": [19, 21], "imput": 20, "fill": 20, "ag": 20, "median": [20, 24, 25], "how": 20, "knn": 20, "mnar": 20, "Not": 20, "approach": 20, "augment": 20, "impact": 20, "histogram": [20, 24, 25, 26], "scatter": 20, "two": [20, 30], "littl": 20, "s": [20, 27, 28], "mcar": 20, "rpy2": 20, "instal": 20, "r": 20, "packag": 20, "tip": 20, "discern": 20, "comprehens": [21, 24, 26], "z": 21, "min": 21, "max": 21, "iri": [21, 28], "post": [21, 22], "analyt": [21, 28], "assess": [21, 28], "effect": 21, "implic": 22, "binari": 22, "high": 22, "cardin": 22, "hot": 22, "nomin": 22, "label": 22, "ordin": 22, "context": 22, "cabin": 22, "embark": 22, "pclass": 22, "dive": [22, 25], "titan": 22, "identif": 22, "b": 22, "c": [22, 30], "boxplot": [24, 25], "violin": [24, 25], "pair": [24, 25], "heatmap": [24, 27], "skew": 24, "kurtosi": 24, "sampl": 24, "central": [24, 25], "limit": 24, "hypothesi": 24, "tendenc": 25, "averag": 25, "middl": 25, "most": 25, "frequent": 25, "compar": 25, "measur": 25, "templat": 25, "dispers": 25, "find": 25, "discuss": 25, "box": 26, "detail": [26, 28], "requir": [26, 28], "compil": 26, "signific": 27, "pearson": 27, "spearman": 27, "coeffici": 27, "rank": 27, "common": 27, "pitfal": 27, "With": 28, "part": 28, "entropi": 28, "sum_": 28, "i": 28, "n": 28, "p_i": 28, "log_2": 28, "inform": 28, "gain": 28, "informationgain": 28, "v": 28, "frac": 28, "s_v": 28, "gini": 28, "impur": 28, "vs": 28, "when": 28, "which": 28, "conceptu": 28, "think": 28, "minut": 28, "filter": 28, "mutual": 28, "don": 28, "ts": 28, "carefulli": 28, "consid": 28, "anova": 28, "f": 28, "wrapper": 28, "stepwis": 28, 
"pseudo": 28, "embed": 28, "purpos": 30, "explan": 30, "equat": [30, 31], "y": 30, "mx": 30, "hyperplan": 30, "relat": 30, "dimens": 30, "fit": 30, "least": 30, "squar": 30, "scikit": 30, "matplotlib": 30, "hous": 30, "predict": 30, "price": 30, "excercis": 30, "reader": [30, 31], "outlin": [], "onli": [], "kei": 31, "intro": [], "draft": [], "starter": [], "overviewdemo": [], "concept1": [], "demo1": [], "concept2": [], "demo2": [], "exercis": 31, "customer_data": [], "csv": [], "look": [], "like": [], "static": [], "let": [], "give": [], "some": [], "shape": [], "For": 31}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinx": 56}}) \ No newline at end of file +Search.setIndex({"docnames": ["Week_00/00_Overview", "Week_00/00a_DailyChallenge", "Week_00/00b_DailyResources", "Week_00/01_Errata", "Week_01/001_Overview", "Week_01/Lesson_01", "Week_01/Lesson_02", "Week_01/Lesson_03", "Week_01/Lesson_04", "Week_01/Lesson_05", "Week_02/002_Overview", "Week_02/Lesson_06", "Week_02/Lesson_07", "Week_02/Lesson_08", "Week_02/Lesson_09", "Week_02/Lesson_10", "Week_03/003_Overview", "Week_03/Lesson_11", "Week_03/Lesson_12", "Week_03/Lesson_12solution", "Week_03/Lesson_13", "Week_03/Lesson_14", "Week_03/Lesson_15", "Week_04/004_Overview", "Week_04/Lesson_16", "Week_04/Lesson_17", "Week_04/Lesson_18", "Week_04/Lesson_19", "Week_04/Lesson_20", "Week_05/005_Overview", "Week_05/Lesson_21", "Week_05/Lesson_22", "Week_05/Lesson_23", "index"], "filenames": ["Week_00/00_Overview.md", "Week_00/00a_DailyChallenge.md", "Week_00/00b_DailyResources.md", "Week_00/01_Errata.md", "Week_01/001_Overview.md", "Week_01/Lesson_01.ipynb", "Week_01/Lesson_02.ipynb", "Week_01/Lesson_03.ipynb", "Week_01/Lesson_04.ipynb", 
"Week_01/Lesson_05.ipynb", "Week_02/002_Overview.md", "Week_02/Lesson_06.ipynb", "Week_02/Lesson_07.ipynb", "Week_02/Lesson_08.ipynb", "Week_02/Lesson_09.ipynb", "Week_02/Lesson_10.ipynb", "Week_03/003_Overview.md", "Week_03/Lesson_11.ipynb", "Week_03/Lesson_12.ipynb", "Week_03/Lesson_12solution.ipynb", "Week_03/Lesson_13.ipynb", "Week_03/Lesson_14.ipynb", "Week_03/Lesson_15.ipynb", "Week_04/004_Overview.md", "Week_04/Lesson_16.ipynb", "Week_04/Lesson_17.ipynb", "Week_04/Lesson_18.ipynb", "Week_04/Lesson_19.ipynb", "Week_04/Lesson_20.ipynb", "Week_05/005_Overview.md", "Week_05/Lesson_21.ipynb", "Week_05/Lesson_22.ipynb", "Week_05/Lesson_23.ipynb", "index.rst"], "titles": ["100 Days of Machine Learning Challenge", "Daily Challenge Curriculum", "Daily Curriculum Resources", "Errata", "Course Structure", "Day 1: Python Basics - Syntax, Variables", "Day 2: Python Data Types", "Day 3: Control Structures - Loops", "Day 4: Control Structures - Conditionals", "Day 5: Functions and Modules", "Course Structure", "Day 6: Linear Algebra - Vector Operations in Python", "Day 7: Linear Algebra - Matrices and Matrix Operations", "Day 8: Calculus - Derivatives, Concept and Applications", "Day 9: Calculus - Integrals, Fundamental Theorems, and Applications in Machine Learning", "Day 10: Probability and Statistics - Basic Concepts, Relevant Distributions - Expanded", "Course Structure", "Day 11: Introduction to Data Preprocessing in Python", "Day 12: In-Depth Exploration of Data Splitting Techniques in Python with Cross-Validation", "Day 12: In-Depth Exploration of Data Splitting Techniques - Solution", "Day 13: Advanced Techniques for Handling Missing Data in Python", "Day 14: Data Normalization and Scaling using Python", "Day 15: Encoding Categorical Data in Python - Expanded with Mathematical Implications", "Course Structure", "Day 16: Comprehensive EDA and Data Visualization in Python", "Day 17: In-Depth EDA and Central Tendency in Python", "Day 18: In-Depth Analysis of 
Histograms and Box Plots in Python", "Day 19: Correlation Analysis using Python", "Day 20: Advanced Feature Selection and Importance in Python - With Iris Dataset", "Course Structure", "Day 21 - Introduction to Regression Analysis in Python", "Day 22: Implementing Multiple Linear Regression in Python", "Day 23: Advanced Regression Techniques", "100 Days of Machine Learning Challenge"], "terms": {"welcom": [0, 6, 33], "comprehens": [0, 1, 2, 12, 18, 19, 27, 28, 30, 31, 33], "journei": [0, 5, 6, 13, 28, 33], "world": [0, 1, 2, 6, 9, 14, 20, 30, 33], "tailor": [0, 2, 33], "divers": [0, 2, 6, 9, 12, 19, 33], "audienc": [0, 33], "includ": [0, 1, 2, 5, 9, 11, 12, 13, 14, 15, 18, 20, 21, 22, 24, 26, 28, 29, 30, 31, 32, 33], "aspir": [0, 33], "scientist": [0, 30], "profession": [0, 33], "relat": [0, 1, 2, 9, 12, 19, 20, 27, 33], "field": [0, 2, 12, 13, 15, 30, 31, 33], "enthusiast": [0, 33], "thi": [0, 2, 5, 6, 7, 9, 11, 12, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32, 33], "program": [0, 1, 2, 4, 5, 6, 8, 10, 11, 13, 14, 15, 18, 33], "design": [0, 9, 11, 13, 17, 28, 32, 33], "individu": [0, 2, 5, 26, 27, 33], "high": [0, 1, 2, 9, 17, 19, 26, 27, 28, 31, 33], "colleg": [0, 2, 33], "level": [0, 9, 15, 17, 19, 22, 24, 26, 27, 33], "algebra": [0, 1, 4, 10, 13, 14, 15, 21, 24, 25, 33], "knowledg": [0, 1, 2, 11, 13, 14, 18, 20, 22, 24, 27, 28, 33], "It": [0, 2, 5, 6, 7, 8, 9, 11, 12, 13, 15, 18, 19, 20, 21, 25, 27, 28, 30, 31, 32, 33], "offer": [0, 2, 12, 15, 33], "well": [0, 2, 11, 18, 19, 26, 27, 28, 30, 32, 33], "round": [0, 2, 9, 19, 20, 33], "educ": [0, 1, 22, 33], "experi": [0, 1, 5, 15, 28, 33], "through": [0, 1, 2, 4, 5, 6, 7, 8, 13, 20, 21, 22, 25, 26, 30, 32, 33], "video": [0, 2, 12, 33], "lectur": [0, 12, 33], "question": [0, 7, 9, 17, 33], "hand": [0, 1, 2, 9, 28, 30, 33], "tutori": [0, 2, 5, 18, 26, 31, 32, 33], "focu": [0, 1, 2, 4, 5, 10, 16, 23, 24, 26, 29, 30, 33], "topic": [0, 4, 10, 16, 23, 29, 32, 33], "syntax": [0, 1, 4, 6, 8, 10, 11, 33], 
"linear": [0, 1, 4, 9, 10, 19, 20, 21, 24, 25, 27, 28, 29, 32, 33], "calculu": [0, 1, 4, 10, 29, 33], "statist": [0, 1, 4, 10, 14, 16, 18, 23, 25, 27, 28, 30, 31, 33], "method": [0, 7, 9, 13, 15, 16, 17, 18, 21, 23, 24, 26, 27, 29, 31, 32, 33], "visual": [0, 1, 13, 14, 15, 16, 17, 23, 26, 28, 33], "descript": [0, 1, 12, 16, 19, 23, 25, 33], "algorithm": [0, 1, 7, 11, 12, 13, 14, 18, 21, 28, 29, 30, 31, 32, 33], "decis": [0, 1, 6, 8, 13, 15, 17, 20, 26, 29, 33], "tree": [0, 1, 13, 28, 29, 31, 33], "svm": [0, 1, 13, 29, 33], "techniqu": [0, 1, 14, 15, 16, 23, 29, 30, 31, 33], "reduc": [0, 1, 2, 18, 22, 28, 30, 32, 33], "complex": [0, 1, 2, 5, 7, 8, 9, 11, 18, 20, 24, 28, 31, 32, 33], "cluster": [0, 1, 11, 19, 25, 33], "gaussian": [0, 1, 15, 21, 33], "mixtur": [0, 1, 33], "model": [0, 1, 5, 9, 11, 13, 14, 15, 21, 22, 27, 28, 29, 32, 33], "pca": [0, 1, 33], "t": [0, 1, 5, 6, 9, 12, 13, 15, 19, 20, 22, 24, 26, 27, 28, 30, 31, 32, 33], "sne": [0, 1, 33], "core": [0, 1, 2, 15, 17, 19, 28, 33], "concept": [0, 5, 6, 8, 11, 12, 16, 18, 21, 22, 24, 25, 29, 33], "architectur": [0, 1, 33], "neural": [0, 11, 13, 14, 21, 31, 33], "network": [0, 11, 13, 14, 21, 31, 33], "cnn": [0, 33], "rnn": [0, 33], "imag": [0, 1, 11, 12, 33], "sequenc": [0, 1, 4, 5, 7, 32, 33], "process": [0, 7, 9, 11, 12, 17, 18, 19, 20, 22, 28, 30, 32, 33], "emerg": [0, 1, 33], "reinforc": [0, 7, 33], "transfer": [0, 1, 33], "gan": [0, 1, 33], "attent": [0, 1, 33], "mechan": [0, 1, 11, 12, 20, 33], "operation": [0, 1, 2, 33], "understand": [0, 1, 4, 5, 6, 8, 10, 11, 14, 16, 18, 19, 23, 24, 25, 29, 30, 33], "transform": [0, 11, 12, 18, 19, 21, 22, 26, 28, 31, 32, 33], "mlop": [0, 33], "etl": [0, 33], "applic": [0, 6, 10, 12, 15, 17, 18, 20, 24, 26, 28, 29, 32, 33], "variou": [0, 1, 2, 11, 12, 13, 14, 15, 17, 19, 20, 22, 23, 28, 30, 32, 33], "industri": [0, 33], "healthcar": [0, 1, 31, 33], "financ": [0, 1, 17, 31, 33], "retail": [0, 1, 33], "manufactur": [0, 1, 33], "build": [0, 1, 5, 7, 9, 11, 19, 20, 28, 31, 
32, 33], "evalu": [0, 1, 5, 6, 8, 9, 13, 14, 19, 21, 22, 25, 27, 28, 29, 32, 33], "connect": [0, 1, 2, 14], "learner": 0, "expert": [0, 20], "share": [0, 9], "your": [0, 2, 6, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 30, 31, 32], "insight": [0, 1, 2, 17, 19, 20, 22, 24, 25, 26, 27, 31], "particip": 0, "discuss": [0, 2, 24, 26, 27, 30], "collabor": 0, "start": [0, 2, 5, 7, 9, 12, 24, 30], "date": [0, 5, 9, 17], "januari": 0, "1st": [0, 22], "2024": [0, 9], "twitter": [0, 33], "100daysml": [0, 33], "reddit": [0, 33], "r": [0, 1, 2, 9, 11, 15, 27, 28, 29, 30, 31, 32, 33], "discord": [0, 33], "us": [0, 1, 4, 5, 6, 7, 8, 9, 10, 11, 12, 15, 16, 18, 19, 22, 23, 24, 25, 26, 31, 32, 33], "websit": [0, 2, 33], "http": [0, 2, 5, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 33], "www": [0, 2, 5, 15, 17, 18, 20, 21, 22, 25, 26, 27, 28, 31, 33], "100daysofml": [0, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 33], "com": [0, 2, 5, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 33], "we": [0, 5, 6, 9, 11, 12, 13, 15, 20, 21, 25, 26, 27, 28, 30, 31, 32], "ar": [0, 2, 5, 6, 7, 8, 9, 11, 12, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "excit": 0, "embark": [0, 20, 21, 27, 28], "explor": [0, 1, 2, 4, 6, 10, 13, 14, 15, 16, 22, 23, 25, 26, 27, 29, 30, 31], "discoveri": 0, "you": [0, 2, 5, 6, 7, 9, 11, 12, 13, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "let": [0, 5, 9, 11, 12, 13, 14, 15, 20, 26, 28, 30, 31, 32], "s": [0, 2, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 21, 22, 24, 25, 26, 30, 31, 32], "grow": [0, 32], "togeth": [0, 12, 32], "skill": [1, 6, 8, 13, 15, 20, 21, 22, 24, 25, 26, 28, 30], "type": [1, 4, 5, 9, 12, 15, 16, 19, 23, 24, 25, 26, 28, 30], "control": [1, 4, 6, 12, 32], "structur": [1, 5, 11, 12, 20, 22, 24, 26], "dai": [1, 4, 10, 16, 23, 29], "variabl": [1, 4, 6, 7, 9, 12, 17, 18, 19, 21, 22, 24, 26, 27, 28, 30, 31, 32], "assign": [1, 2, 4, 5, 8, 9, 12, 21, 28], "math": [1, 2, 4, 7, 9, 10, 15, 16, 
18, 23, 29], "arithmet": [1, 2, 4, 6, 17], "differ": [1, 4, 5, 6, 7, 8, 9, 11, 12, 15, 19, 20, 22, 24, 25, 26, 27, 28, 31, 32], "logic": [1, 2, 4, 5, 8, 22], "calcul": [1, 2, 4, 7, 9, 10, 11, 14, 17, 18, 24, 25, 27, 28, 30, 32], "loop": [1, 4, 5, 6, 8, 9, 25, 30], "construct": [1, 4, 26, 28, 30], "while": [1, 2, 4, 5, 9, 11, 13, 17, 19, 20, 22, 24, 27, 28, 30, 32], "condit": [1, 4, 5, 6, 7, 9, 11, 13, 30], "statement": [1, 4, 5, 6, 12], "elif": [1, 2, 4, 7, 8, 9], "els": [1, 2, 4, 8, 9, 15, 28], "flow": [1, 4], "implement": [1, 4, 10, 16, 18, 19, 23, 24, 25, 29, 32], "function": [1, 4, 5, 6, 7, 14, 17, 20, 21, 27, 28, 29, 30, 32], "defin": [1, 2, 4, 5, 7, 8, 9, 12, 14, 20, 22, 24, 28], "write": [1, 4, 5, 6, 7, 8, 12, 24, 25, 27], "formula": [1, 4, 11, 12, 17, 18, 21, 22, 25, 27, 30], "vector": [1, 10, 12, 13, 31], "work": [1, 2, 5, 7, 10, 12, 13, 20, 21], "perform": [1, 6, 9, 10, 11, 12, 14, 15, 17, 18, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "matric": [1, 10, 11, 22, 24], "matrix": [1, 9, 10, 18, 24, 32], "deriv": [1, 10, 14, 31], "integr": [1, 10], "fundament": [1, 6, 7, 8, 10, 11, 12, 13, 15, 26, 28, 29, 30], "theorem": [1, 10, 18], "simpl": [1, 2, 7, 10, 11, 18, 21, 24, 29, 31, 32], "probabl": [1, 5, 10, 14, 18, 25, 28, 32], "relev": [1, 9, 10, 11, 17, 19], "distribut": [1, 10, 11, 12, 14, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 31], "prepar": [1, 2, 17, 20, 21, 22, 28, 31], "import": [1, 5, 7, 12, 14, 16, 18, 19, 20, 22, 23, 24, 25, 26, 27, 31, 32], "scale": [1, 11, 16, 18, 19, 20, 28, 31, 32], "split": [1, 12, 13, 16, 28, 31, 32], "train": [1, 11, 13, 16, 17, 19, 22, 28, 31, 32], "test": [1, 5, 6, 7, 8, 15, 16, 19, 22, 27, 31, 32], "set": [1, 7, 15, 16, 17, 18, 19, 22, 25, 27, 28, 30, 31, 32], "random": [1, 7, 9, 12, 15, 16, 18, 30, 32], "sampl": [1, 2, 9, 15, 16, 17, 18, 19, 26, 27, 28, 30], "stratifi": [1, 2, 16, 30], "principl": [1, 2, 14, 16, 20, 21, 24], "handl": [1, 8, 9, 11, 12, 16, 17, 18, 19, 21, 28, 30, 31], "miss": [1, 16, 17, 18, 19, 21, 24, 28, 
31], "detect": [1, 16, 17, 18, 21, 28, 31], "imput": [1, 2, 16, 17], "rational": [1, 2, 16, 20, 21, 22], "normal": [1, 11, 15, 16, 17, 18, 19, 20, 24, 27, 28, 31, 32], "about": [1, 2, 7, 9, 13, 15, 16, 18, 19, 20, 21, 22, 24, 26, 27, 28, 30, 31], "featur": [1, 5, 6, 9, 11, 13, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 30, 31, 32], "z": [1, 2, 9, 11, 12, 16, 17, 30], "score": [1, 2, 9, 16, 17, 18, 26, 28, 31, 32], "min": [1, 2, 16, 17, 19, 22, 28, 32], "max": [1, 2, 16, 17, 19, 22, 32], "encod": [1, 16, 18, 19, 21, 31], "categor": [1, 8, 16, 17, 18, 19, 20, 21, 25, 28, 30, 31], "binari": [1, 2, 9, 16, 18], "one": [1, 2, 6, 7, 8, 9, 11, 16, 17, 18, 19, 22, 26, 27, 28, 30, 31], "hot": [1, 2, 8, 16, 31], "label": [1, 2, 13, 14, 16, 18, 20, 21, 24, 26, 28, 30, 31, 32], "implic": [1, 2, 16, 21, 24, 25, 26], "graphic": [1, 17, 23, 30], "represent": [1, 2, 12, 14, 18, 19, 21, 22, 23, 24, 26, 32], "measur": [1, 2, 9, 11, 13, 15, 17, 18, 19, 23, 24, 27, 28, 30, 31], "central": [1, 2, 15, 18, 20, 21, 23, 26], "tendenc": [1, 2, 15, 20, 21, 23, 24, 26], "dispers": [1, 2, 15, 17, 19, 23, 26], "creat": [1, 2, 5, 6, 7, 8, 9, 17, 19, 20, 22, 23, 24, 25, 30, 32], "plot": [1, 2, 5, 13, 14, 15, 17, 18, 19, 21, 22, 23, 27, 28, 30, 31, 32], "histogram": [1, 2, 21, 22, 23, 31], "box": [1, 2, 17, 21, 23, 25], "correl": [1, 21, 22, 23, 24, 25, 28, 31], "its": [1, 2, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 23, 24, 28, 30, 31, 32], "coeffici": [1, 2, 9, 23, 28, 29, 30, 31, 32], "interpret": [1, 2, 5, 8, 13, 15, 21, 22, 23, 24, 25, 27, 29, 30, 31, 32], "select": [1, 9, 13, 18, 20, 21, 23, 24, 27, 30, 32], "inform": [1, 2, 9, 13, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26], "gain": [1, 2, 19, 23, 24, 25, 26, 27], "gini": [1, 2, 23], "impur": [1, 2, 23], "metric": [1, 18, 19, 20, 22, 23, 28, 29, 32], "kei": [1, 2, 5, 7, 8, 12, 17, 18, 19, 20, 21, 25, 26, 28, 29, 30], "equat": [1, 2, 9, 11, 12, 29, 32], "fit": [1, 2, 18, 19, 20, 21, 22, 28, 29, 31, 32], "22": [1, 7, 8, 9, 12, 17, 
20, 21, 22, 29, 32], "multipl": [1, 5, 7, 8, 9, 13, 20, 28, 29, 32], "multivari": [1, 2, 29, 31, 32], "23": [1, 8, 9, 17, 29], "polynomi": [1, 29], "lasso": [1, 29], "ridg": [1, 20, 29], "regular": [1, 2, 11, 14, 29, 31, 32], "24": [1, 7, 8, 9, 12, 17, 29, 32], "mean": [1, 6, 7, 9, 11, 12, 13, 15, 17, 18, 19, 20, 21, 22, 26, 27, 28, 29, 30, 31, 32], "squar": [1, 2, 9, 12, 19, 24, 28, 29, 31, 32], "error": [1, 2, 5, 6, 7, 9, 17, 18, 19, 24, 28, 29, 30, 31, 32], "mse": [1, 2, 9, 29, 31, 32], "root": [1, 2, 29, 31], "rmse": [1, 2, 29, 31], "25": [1, 5, 6, 7, 8, 9, 12, 13, 15, 17, 19, 21, 22, 29, 30, 31, 32], "address": [1, 9, 29, 31, 32], "overfit": [1, 14, 20, 22, 28, 29, 32], "underfit": [1, 29, 32], "strategi": [1, 2, 28, 29, 31], "combat": [1, 2, 29], "bia": [1, 18, 20, 29, 32], "varianc": [1, 2, 15, 18, 20, 21, 22, 25, 26, 28, 29, 30, 31, 32], "tradeoff": [1, 2, 29], "26": [1, 8, 9, 14, 17, 19], "logist": [1, 20, 21, 30], "27": [1, 8, 12, 17, 20, 21, 22], "k": [1, 11, 12, 13, 18, 20, 21, 28, 32], "nearest": [1, 20, 21], "neighbor": [1, 20, 21], "nn": 1, "distanc": [1, 2, 11, 13, 20, 30], "euclidean": [1, 2, 20], "manhattan": [1, 2], "28": [1, 8, 17, 19], "support": [1, 7, 9, 19, 24, 31], "nonlinear": 1, "both": [1, 2, 6, 7, 8, 9, 11, 13, 17, 18, 19, 24, 27, 28, 30, 31], "nonlinearli": 1, "separ": [1, 2, 5, 9, 12, 19, 28, 31], "hyperplan": [1, 2], "margin": [1, 2, 13, 28], "maxim": [1, 24], "kernel": [1, 2, 7, 9, 24], "trick": 1, "29": [1, 7, 8, 17, 19], "rule": [1, 6, 11, 26], "base": [1, 5, 7, 8, 9, 11, 12, 15, 18, 24, 25, 28, 30, 31, 32], "entropi": [1, 2], "30": [1, 6, 8, 12, 15, 17, 21], "naiv": [1, 21], "bay": [1, 21], "classifi": [1, 19, 20, 22, 28], "context": [1, 2, 17, 19, 20, 25, 27, 28, 31, 32], "31": [1, 8, 9, 17, 21, 25], "overview": [1, 24, 32], "combin": [1, 2, 5, 6, 19, 20, 22, 24, 26, 28, 31], "weight": [1, 2, 13, 19, 22, 30], "averag": [1, 2, 9, 13, 15, 17, 19, 20, 30, 31], "32": [1, 8, 12, 17, 19, 21], "bag": 1, "forest": 1, "bootstrap": [1, 
2], "role": [1, 2, 7, 11, 12, 13, 14, 17, 20], "33": [1, 9, 17], "boost": 1, "adaboost": 1, "updat": [1, 2, 9, 13, 18, 19], "34": [1, 8, 9, 17, 19, 20, 21, 22, 31], "gradient": [1, 11, 13, 14], "gbm": 1, "xgboost": 1, "descent": [1, 2, 11, 13], "35": [1, 9, 17, 21], "Their": [1, 9, 11, 13], "stack": [1, 2], "blend": [1, 2, 24], "36": [1, 17, 21, 32], "37": [1, 8, 9, 17, 32], "dataset": [1, 2, 7, 17, 24, 25, 31, 32], "centroid": [1, 2], "converg": [1, 2, 11, 21, 31, 32], "criteria": [1, 2, 6, 28], "38": [1, 8, 12, 17, 19], "hierarch": 1, "dendrogram": [1, 2], "linkag": [1, 2], "39": [1, 17, 19, 21], "densiti": [1, 15, 19, 21, 24, 25, 26], "dbscan": 1, "40": [1, 8, 12, 17, 19, 24], "gmm": 1, "expect": [1, 14, 30], "41": [1, 8, 17, 32], "princip": [1, 2], "compon": [1, 2, 11, 30], "covari": [1, 2], "eigenvalu": [1, 2, 11, 12], "eigenvector": [1, 2, 11], "42": [1, 8, 9, 17, 18, 19, 21, 28, 30, 31, 32], "step": [1, 2, 5, 7, 9, 14, 27, 31, 32], "involv": [1, 2, 13, 19, 20, 28, 30], "comput": [1, 2, 5, 9, 12, 13, 14, 17, 19, 20, 28, 30, 32], "43": [1, 8, 17], "singular": 1, "valu": [1, 5, 6, 7, 8, 11, 13, 14, 15, 17, 18, 20, 21, 22, 24, 26, 27, 28, 30, 31, 32], "decomposit": 1, "svd": 1, "Its": 1, "44": [1, 8, 9, 17, 19], "stochast": [1, 2, 11], "embed": [1, 2], "45": [1, 12, 17, 19, 24], "other": [1, 5, 6, 7, 9, 11, 12, 13, 15, 17, 19, 20, 21, 22, 24, 25, 27, 28, 30, 31, 32], "addit": [1, 2, 5, 6, 7, 9, 13, 19], "like": [1, 2, 5, 6, 7, 9, 11, 12, 13, 15, 17, 18, 19, 20, 22, 24, 26, 27, 28, 30, 31, 32], "lda": [1, 2], "autoencod": 1, "behind": [1, 2, 9, 18, 20], "case": [1, 8, 9, 12, 13, 17, 19, 20, 21, 22, 25, 30], "46": [1, 8, 9, 12, 17], "perceptron": 1, "activ": [1, 8, 14, 18, 20], "47": [1, 8, 9, 12, 17, 20, 21, 22, 28, 32], "feedforward": 1, "layer": [1, 25], "neuron": [1, 2], "48": [1, 17], "backpropag": [1, 13, 14], "dive": [1, 2, 15], "The": [1, 2, 5, 6, 8, 9, 11, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30], "chain": [1, 2, 6, 20, 21, 32], "49": [1, 8, 9, 
17], "loss": [1, 9, 14], "optim": [1, 6, 11, 13, 14, 30, 32], "focus": [1, 2, 5, 12, 18, 19, 20, 22, 26, 32], "50": [1, 6, 8, 9, 12, 17, 19, 21, 22, 26], "tune": [1, 19, 28, 32], "improv": [1, 2, 8, 9, 17, 19, 21, 24, 28, 32], "hyperparamet": [1, 2, 28], "avoid": [1, 2, 6, 7, 9, 11, 18, 19, 20, 21, 22, 24, 27], "51": [1, 17, 19], "map": [1, 2], "gener": [1, 7, 9, 13, 14, 15, 18, 19, 28, 30, 31, 32], "52": [1, 8, 9, 17, 19, 32], "pool": 1, "spatial": [1, 2], "effect": [1, 2, 7, 9, 11, 12, 13, 18, 20, 24, 25, 26, 28, 30, 31, 32], "53": [1, 8, 17], "task": [1, 2, 5, 8, 11, 12, 18, 20, 21, 25, 27, 30], "filter": [1, 2], "54": [1, 12, 17, 19], "enhanc": [1, 2, 8, 11, 13, 17, 18, 19, 21, 26, 28], "dropout": [1, 2], "batch": [1, 2], "basi": [1, 2, 17, 30], "55": [1, 17, 21, 31], "fine": [1, 2, 28], "extract": [1, 15, 26], "56": [1, 8, 17, 19], "uniqu": [1, 2, 5, 22, 28], "57": [1, 6, 17, 19], "long": [1, 5, 7, 11, 17], "short": [1, 6, 8], "term": [1, 6, 13, 14, 22, 27, 31, 32], "memori": [1, 17, 19], "lstm": 1, "cell": [1, 2, 5, 7, 9, 19, 22, 24, 32], "depend": [1, 2, 5, 7, 8, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30, 31, 32], "58": [1, 8, 17, 19, 21], "time": [1, 7, 9, 12, 13, 15, 17, 18, 20, 24, 30], "59": [1, 8, 17], "seri": [1, 5, 7, 9, 18, 20, 21, 24, 28, 30, 31, 32], "forecast": [1, 2, 30], "60": [1, 6, 8, 12, 17, 19], "util": [1, 9, 11, 13, 20, 24, 30, 31, 32], "natur": [1, 5, 7, 11, 15, 20, 22, 27, 30, 31], "languag": [1, 5, 7, 9, 11], "nlp": [1, 11], "word": [1, 2, 6, 9, 11], "space": [1, 2, 5, 11, 15, 22, 30, 32], "61": [1, 8, 17], "framework": [1, 2, 15], "reward": [1, 2], "make": [1, 5, 6, 7, 8, 9, 11, 12, 13, 15, 17, 20, 22, 24, 25, 26, 30, 31, 32], "62": [1, 8, 17, 20, 21, 22], "markov": 1, "mdp": [1, 2], "rl": 1, "transit": [1, 2], "state": [1, 2, 6, 12, 13, 22, 24], "63": [1, 17], "q": [1, 20, 21, 22], "bellman": [1, 2], "estim": [1, 2, 17, 19, 20, 24, 28, 30, 31, 32], "64": [1, 8, 17], "dqn": 1, "environ": [1, 2, 18, 19, 20, 32], "65": [1, 6, 17, 19], 
"polici": [1, 18], "ascent": [1, 2], "66": [1, 17], "depth": [1, 27, 28], "67": [1, 8, 17, 19], "adversari": 1, "minimax": [1, 2], "game": [1, 2, 11], "theori": [1, 2, 12, 18, 28], "68": [1, 8, 19], "self": [1, 7, 9], "69": [1, 17], "more": [1, 2, 5, 7, 8, 9, 11, 12, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 30, 31, 32], "reconstruct": [1, 2], "latent": [1, 2], "70": [1, 6, 19, 32], "research": 1, "ml": [1, 13, 14, 18, 33], "aih": 1, "latest": [1, 2, 5], "artifici": [1, 2, 11, 20, 22], "intellig": [1, 2, 11], "technolog": 1, "71": [1, 8, 19], "lifecycl": 1, "72": [1, 19], "version": [1, 5], "track": [1, 9, 20], "73": [1, 8], "ci": 1, "cd": 1, "continu": [1, 2, 5, 9, 12, 13, 14, 17, 20, 22, 27, 28, 30, 31], "deliveri": 1, "autom": [1, 2, 7, 11], "valid": [1, 2, 9, 13, 21, 28, 31, 32], "74": [1, 8, 12], "monitor": 1, "mainten": 1, "maintain": [1, 5, 7, 20], "product": [1, 2], "anomali": [1, 2, 20], "drift": [1, 2], "behavior": [1, 2, 6, 9, 13, 20, 21], "75": [1, 12, 17, 19, 21, 22, 31], "tool": [1, 5, 11, 13, 17, 24, 25, 26, 27, 30, 31], "platform": [1, 5], "scalabl": [1, 2], "effici": [1, 2, 7, 8, 9, 11, 13, 17, 18, 22, 28, 32], "76": [1, 8, 12, 19, 21, 22], "load": [1, 9, 11, 17, 19, 24, 25, 26, 27, 28, 31, 32], "queri": [1, 2], "77": [1, 8], "approach": [1, 2, 6, 19, 28, 31], "78": [1, 19], "databas": 1, "manag": [1, 9, 22], "phase": 1, "balanc": [1, 2, 18, 19, 28, 32], "79": [1, 8], "an": [1, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "pipelin": [1, 28, 32], "workflow": [1, 2, 32], "80": [1, 12], "81": 1, "82": [1, 8, 19], "posit": [1, 5, 7, 9, 11, 13, 17, 18, 19, 26, 27, 30], "83": [1, 8, 12, 17], "84": [1, 12], "e": [1, 2, 5, 9, 11, 12, 15, 17, 20, 21, 22, 24, 28, 32], "g": [1, 2, 9, 11, 13, 17, 20, 21, 22, 24, 28, 31, 32], "bert": [1, 2], "gpt": [1, 2], "geometri": [1, 2], "contextu": [1, 2, 19, 20], "85": [1, 32], "domain": [1, 13, 20, 28, 32], "beyond": [1, 2, 26, 28, 30], "vision": [1, 2], "adapt": [1, 
2], "issu": [1, 2, 15, 17, 19, 20, 21, 22, 24, 25, 26, 30], "86": [1, 8, 20, 21, 32], "fair": 1, "quantit": [1, 2, 17, 27], "87": 1, "privaci": 1, "secur": 1, "system": [1, 11, 12, 13, 15, 17, 19, 20, 21, 22, 24, 25, 30], "cryptographi": [1, 2, 9], "protect": [1, 2], "88": [1, 8, 19, 32], "explain": [1, 5], "transpar": [1, 20], "need": [1, 2, 6, 7, 9, 12, 17, 19, 20, 21, 22, 28, 32], "explan": [1, 2, 18, 31], "89": [1, 8, 12], "regul": 1, "complianc": [1, 18], "affect": [1, 2, 6, 13, 20, 21, 25, 26, 28], "gdpr": [1, 2], "risk": [1, 2, 18, 32], "assess": [1, 2, 8, 18, 19, 20, 22, 26, 27, 31], "90": 1, "develop": [1, 7, 11, 20, 24], "91": [1, 8, 22], "diagnost": [1, 2], "treatment": [1, 2], "plan": [1, 18], "predict": [1, 2, 9, 11, 13, 15, 18, 19, 20, 24, 27, 28, 31, 32], "health": [1, 2], "92": [1, 8], "fraud": [1, 2], "financi": [1, 2], "93": [1, 12, 19], "custom": [1, 2, 6, 9], "suppli": [1, 2], "demand": [1, 2], "94": [1, 8], "qualiti": [1, 2, 17, 18, 20, 24], "reliabl": [1, 2, 19, 28], "95": [1, 6], "transport": 1, "etc": [1, 11, 30, 32], "broad": [1, 2], "specif": [1, 2, 5, 6, 9, 11, 13, 18, 20, 21, 28, 32], "A": [1, 2, 5, 7, 9, 11, 12, 15, 19, 20, 21, 24, 27, 31, 32], "encompass": 1, "96": [1, 19], "protocol": [1, 2], "encrypt": [1, 2], "97": [1, 8, 9, 19], "identifi": [1, 9, 11, 17, 19, 20, 22, 26, 27, 30], "threat": 1, "vulner": 1, "potenti": [1, 2, 18, 19, 22, 24, 25, 26, 27, 28, 31], "98": [1, 8, 12, 19], "prevent": [1, 14, 18, 20, 21, 22, 30], "pattern": [1, 2, 9, 11, 19, 20, 24, 25, 26, 30], "recognit": [1, 2, 11], "99": [1, 19], "best": [1, 2, 5, 19, 31, 32], "100": [1, 5, 6, 8, 9, 12, 13, 14, 19, 30, 32], "studi": [1, 12, 31], "incid": 1, "real": [1, 2, 14, 20, 28, 30, 31, 32], "forens": [1, 2], "post": [1, 2, 20, 28], "101": [1, 8], "guidanc": [1, 2], "scope": [1, 2, 8, 9], "definit": [1, 2, 9, 12, 14, 19, 32], "feasibl": [1, 2], "102": 1, "104": 1, "throughout": [1, 5, 9], "cours": [1, 2, 11, 12, 17], "problem": [1, 2, 7, 9, 11, 12, 14, 15, 17, 19, 
20, 21, 22, 24, 25, 28, 30], "solv": [1, 2, 6, 7, 9, 11, 12, 30], "105": 1, "final": [1, 6, 8, 9, 32], "present": [1, 7, 9, 15, 22, 24, 25, 26, 28, 32], "result": [1, 2, 5, 6, 8, 9, 11, 12, 19, 20, 21, 22, 24, 25, 26, 27, 31, 32], "googl": [2, 5], "edu": 2, "interact": [2, 5, 9, 11, 12, 28, 30, 31, 32], "cover": [2, 12], "realpython": [2, 26, 27], "demonstr": [2, 9, 19, 22, 28, 30], "code": [2, 5, 6, 7, 9, 17, 18, 21, 22, 24, 25, 27, 30, 32], "execut": [2, 5, 7, 8, 9, 32], "comment": [2, 5], "express": [2, 5, 6, 8, 11, 12, 13, 31], "exampl": [2, 5, 6, 9, 15, 21, 31, 32], "numpi": [2, 5, 11, 12, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 27, 28, 30, 32], "np": [2, 9, 11, 12, 13, 14, 15, 17, 19, 20, 21, 28, 30, 32], "number": [2, 5, 6, 8, 11, 12, 13, 15, 17, 18, 19, 20, 22, 24, 25, 26, 27, 28, 30, 32], "arrai": [2, 9, 11, 12, 15, 17, 30, 32], "w3school": 2, "python_datatyp": 2, "asp": 2, "document": [2, 9, 11, 19, 20, 26, 27, 28, 32], "tutorialspoint": 2, "python_data_structur": 2, "index": [2, 7, 9, 11, 21, 27, 28], "htm": 2, "string": [2, 5, 6, 7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30, 32], "list": [2, 6, 7, 8, 9, 11, 15, 25, 26, 28], "dictionari": [2, 7, 25], "python_oper": 2, "detail": [2, 9, 15, 19, 22, 27, 31], "comparison": [2, 17, 20, 32], "usag": [2, 7, 17, 18, 19, 20, 27, 28, 31], "check": [2, 6, 7, 8, 9, 13, 17, 19, 20, 21, 24, 27, 28, 31, 32], "practic": [2, 9, 11, 12, 15, 19, 23, 30, 32, 33], "convers": 2, "int": [2, 5, 7, 9], "float_vari": 2, "compar": [2, 5, 6, 18, 20, 21, 22, 24, 26, 28, 30, 31], "dataquest": 2, "io": [2, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28], "python_while_loop": 2, "break": [2, 9, 20, 28], "gloss_python_for_nest": 2, "nest": 2, "iter": [2, 7, 8, 20, 28, 32], "over": [2, 6, 7, 8, 9, 11, 12, 13, 14, 15, 19, 28, 31, 32], "sum": [2, 5, 11, 12, 14, 20, 21, 22, 26, 27, 28, 30, 31], "multi": [2, 17, 19], "counter": 2, "gloss_python_els": 2, "gloss_python_elif": 2, "programiz": 2, "pariti": 2, "modifi": [2, 5, 7, 9, 21], "within": [2, 5, 9, 
12, 18, 19, 22, 26, 27, 28, 30], "doc": [2, 31], "org": [2, 5, 13, 15, 17, 19, 25, 27, 28, 31, 32], "es": 2, "html": [2, 19, 25, 26, 27, 28, 31, 32], "offici": 2, "creation": 2, "call": [2, 7, 9, 11, 12, 22, 24, 32], "refer": [2, 5, 6, 8, 11, 12, 30, 31], "guid": [2, 18, 24, 25, 31, 32], "python_modul": 2, "packag": [2, 7, 9, 17, 28, 30], "access": [2, 5, 9, 12, 17, 24], "area": [2, 13, 14, 18, 26], "input": [2, 6, 7, 9, 12, 13, 21, 28, 30, 32], "sqrt": [2, 11, 15, 17, 27], "panda": [2, 5, 9, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "m": [2, 6, 12, 30], "youtub": [2, 15], "watch": [2, 15], "v": [2, 11, 13, 15, 27], "fnk_zzamoss": 2, "khanacademi": [2, 15], "free": [2, 5, 7, 9, 12, 19], "onlin": [2, 30], "exercis": [2, 7, 12, 24, 28, 30], "bvanderlei": 2, "librari": [2, 5, 14, 17, 18, 19, 20, 24, 25, 26, 30], "subtract": [2, 5, 7, 13, 21, 30], "scalar": [2, 12], "dot": [2, 9, 25], "magnitud": [2, 12, 32], "matplotlib": [2, 9, 11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 31, 32], "kyb8iza5au": 2, "mathsisfun": 2, "geeksforgeek": [2, 17, 25, 27, 28], "manipul": [2, 6, 7, 11], "transpos": 2, "invers": 2, "determin": [2, 6, 8, 11, 12, 13, 17, 28, 30, 32], "differenti": [2, 14], "dc": 2, "diff": [2, 13], "intro": [2, 32], "askpython": 2, "sympi": [2, 13, 14], "symbol": [2, 5, 12, 13, 14], "wuvtyaankzm": 2, "composit": 2, "tangent": 2, "line": [2, 5, 7, 8, 9, 12, 17, 19, 22, 24, 25, 26, 31, 32], "ic": 2, "2i44y9hfq4q": 2, "integrand": 2, "simpson": 2, "find": [2, 9, 11, 12, 13, 14, 17, 18, 20, 24, 26, 27, 28, 30, 32], "volum": [2, 11, 13], "done": [2, 7, 9, 18, 31], "lwq1zw": 2, "xhbe": 2, "scipi": [2, 15, 17, 19, 24, 25, 27], "stat": [2, 15, 17, 19, 24, 25], "from": [2, 5, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "median": [2, 15, 17, 19, 21, 26, 31, 32], "standard": [2, 6, 15, 18, 20, 22, 25, 26, 28, 31, 32], "deviat": [2, 15, 21, 22, 25, 26, 28], "boxplot": [2, 21, 26], "hypothesi": [2, 15, 27], 
"scienc": [2, 5, 9, 12, 14, 18, 24, 26, 28, 30, 32], "mode": [2, 15, 20, 21, 26, 31], "outlier": [2, 17, 19, 20, 21, 24, 25, 26, 27, 31], "determinist": 2, "analyz": [2, 11, 13, 15, 17, 19, 20, 22, 25, 26, 27, 28, 32], "impact": [2, 7, 9, 18, 19, 21, 22, 24, 28], "scikit": [2, 5, 9, 18, 20, 21, 22, 24, 25, 31], "vs": [2, 9, 20, 21, 26, 31, 32], "each": [2, 5, 7, 8, 9, 12, 15, 18, 19, 20, 22, 25, 26, 27, 28, 30, 31, 32], "kaggl": [2, 17, 18, 19, 20, 21, 24], "engin": [2, 12, 13, 14, 17, 18], "One": [2, 13], "between": [2, 6, 7, 8, 9, 11, 12, 13, 14, 18, 19, 20, 21, 22, 24, 27, 28, 31, 32], "cross": [2, 28, 32], "In": [2, 5, 6, 7, 8, 9, 11, 12, 13, 14, 20, 22, 24, 27, 28, 30, 31, 32], "aspect": [2, 5, 8, 28, 31, 32, 33], "rang": [2, 6, 8, 9, 11, 15, 21, 24, 25, 26, 28, 30], "skew": [2, 17, 19, 20, 25, 26, 27], "galleri": 2, "showcas": 2, "overal": [2, 18, 20, 28], "pearson": [2, 28], "spearman": 2, "heatmap": [2, 19], "wrangl": 2, "hous": [2, 32], "seaborn": [2, 19, 21, 22, 24, 25, 26, 27, 31], "pairplot": [2, 24, 25, 31], "price": [2, 6, 9, 13], "than": [2, 5, 6, 7, 8, 9, 11, 12, 17, 25, 26, 28, 30, 31, 32], "independ": [2, 12, 13, 15, 18, 22, 28, 30, 31, 32], "how": [2, 5, 6, 7, 9, 11, 13, 14, 15, 18, 19, 21, 22, 24, 25, 26, 27, 28, 30, 31], "influenc": [2, 18, 19, 20, 22, 25, 27, 31], "With": [2, 5, 9, 32], "relationship": [2, 11, 13, 19, 20, 21, 22, 24, 25, 27, 28, 30, 31, 32], "foundat": [2, 4, 6, 10, 11, 14, 15, 16, 17, 18, 25, 33], "accuraci": [2, 18, 21, 22, 25], "efficaci": 2, "limit": [2, 9, 13, 18, 32], "appropri": [2, 18, 20, 21, 24, 25, 30, 31, 32], "deal": [2, 5, 7, 18, 20, 28, 30, 31, 32], "abil": [2, 19], "titan": [2, 20, 21], "outcom": [2, 9, 15, 30, 31], "confus": [2, 9, 18, 19], "datacamp": 2, "provid": [2, 5, 6, 7, 9, 11, 12, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 30, 31, 32], "theoret": [2, 24, 28], "path": [2, 18, 19, 22], "assumpt": [2, 20, 24, 27, 28, 31, 32], "conceptu": 2, "masteri": [2, 15], "delv": [2, 6, 22, 25, 26, 27, 28], 
"underpin": [2, 25, 27], "github": [2, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 32], "repositori": 2, "investig": [2, 17, 19, 24, 30], "analyt": [2, 22, 31], "vidhya": 2, "articl": [2, 5, 20, 21], "choos": [2, 9, 14, 18, 20, 21, 24, 25, 26, 27, 28, 32], "nick": 2, "mccullum": 2, "minim": [2, 18, 30, 32], "sse": [2, 30], "built": [2, 5, 28], "beginn": [2, 9], "iri": 2, "also": [2, 5, 6, 8, 9, 11, 14, 18, 19, 20, 24, 25, 26, 28, 32], "group": [2, 6, 17, 18, 19, 26, 28], "point": [2, 5, 7, 9, 11, 13, 14, 15, 18, 19, 20, 24, 25, 26, 27, 30, 32], "recalcul": 2, "format": [2, 9, 17, 30, 31], "abus": 2, "agglom": 2, "divis": [2, 5, 6, 13], "form": [2, 7, 8, 9, 11, 13, 30, 32], "repres": [2, 5, 6, 9, 12, 13, 14, 17, 18, 19, 20, 22, 24, 25, 26, 28, 30, 31, 32], "paramet": [2, 15, 18, 20, 24, 28, 30, 32], "epsilon": [2, 30, 31, 32], "ep": 2, "minpt": 2, "anoth": [2, 5, 9, 11, 27, 28], "found": [2, 5, 7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30, 32], "renesh": 2, "bedr": 2, "blog": [2, 17, 18, 20, 21, 22, 24, 25, 28], "which": [2, 5, 6, 7, 8, 9, 11, 13, 17, 19, 20, 21, 22, 26, 27, 30, 31, 32], "\u03b5": 2, "vari": [2, 7, 9, 13, 18, 19, 28], "For": [2, 5, 8, 9, 11, 12, 13, 14, 18, 19, 20, 21, 22, 24, 26, 30], "thorough": [2, 13, 15, 24, 27], "excel": [2, 14, 19], "plu": 2, "breast": 2, "cancer": 2, "cifar": 2, "scratch": 2, "necessari": [2, 7, 9, 12, 13, 14, 17, 18, 20, 24, 25, 26, 30, 31, 32], "kindson": 2, "geniu": 2, "particularli": [2, 5, 6, 7, 11, 14, 18, 19, 20, 28, 30, 31, 32], "underli": [2, 19, 21, 24, 28, 31], "benefici": [2, 5, 19, 20, 25, 31], "those": [2, 12, 19, 20, 21, 30, 31], "look": [2, 6, 19, 20, 22, 25, 26, 28, 30, 31], "can": [2, 5, 6, 7, 8, 9, 11, 12, 13, 17, 18, 19, 20, 22, 24, 25, 26, 27, 28, 30, 31, 32], "decompos": 2, "constitu": 2, "u": [2, 11, 13], "sigma": [2, 15, 17, 18, 30], "\u03c3": [2, 15, 17, 21], "compress": [2, 9, 12], "nois": [2, 20, 26], "To": [2, 9, 11, 12, 13, 19, 20, 21, 30, 32], "recommend": [2, 9, 19, 20], "where": [2, 5, 6, 
8, 9, 11, 12, 13, 14, 15, 18, 19, 20, 21, 22, 27, 28, 30, 31, 32], "ll": [2, 5, 6, 9, 12, 13, 17, 22, 26, 27, 28, 32], "lower": [2, 9, 18, 19, 26, 28, 30, 32], "precursor": 2, "avail": [2, 9, 30], "toward": [2, 19, 30], "often": [2, 5, 6, 7, 8, 9, 11, 12, 13, 17, 20, 26, 28, 30, 32], "have": [2, 5, 6, 9, 11, 12, 13, 19, 20, 21, 22, 28, 30, 31, 32], "discrimin": [2, 21], "class": [2, 7, 17, 18, 22, 28, 31, 32], "bias": [2, 18, 19], "bryn": 2, "mawr": 2, "artificial_neural_network": 2, "ipynb": 2, "relu": 2, "walk": 2, "tensorflow": 2, "kera": [2, 9], "first": [2, 5, 6, 11, 14, 17, 19, 21, 24, 26, 30, 32], "adjust": [2, 11, 21, 28, 30, 31, 32], "relianc": 2, "choic": [2, 5, 7, 9, 20, 27, 28, 32], "crucial": [2, 5, 6, 7, 11, 12, 13, 14, 15, 18, 19, 20, 22, 26, 27, 28, 30, 31], "opendatasci": 2, "emphas": [2, 21], "consid": [2, 8, 9, 13, 14, 17, 19, 20, 21, 25, 26, 27, 30, 31], "size": [2, 9, 11, 12, 18, 19, 24, 28, 30, 32], "varieti": [2, 18], "when": [2, 5, 6, 7, 8, 9, 11, 12, 17, 18, 19, 20, 21, 22, 26, 27, 30, 31, 32], "instanc": [2, 5, 11, 14, 19, 20, 31, 32], "might": [2, 5, 7, 19, 20, 22, 25, 28, 30, 31, 32], "ideal": [2, 13, 18, 20, 21, 22, 27], "larger": [2, 20, 21, 30, 31, 32], "same": [2, 5, 7, 9, 11, 12, 18, 20, 27, 31, 32], "suggest": [2, 19, 25, 27], "most": [2, 7, 8, 9, 17, 19, 20, 22, 24, 27, 28, 30, 32], "target": [2, 7, 19, 20, 21, 27, 28, 30, 31, 32], "output": [2, 6, 9, 12, 13, 22, 24, 28, 30], "larg": [2, 7, 11, 18, 20, 22, 24, 28, 31, 32], "spread": [2, 17, 19, 20, 21, 22, 24, 25, 26], "logarithm": [2, 28], "msle": 2, "mai": [2, 6, 9, 11, 12, 22, 27, 28, 30, 32], "suitabl": [2, 12, 17, 22, 30, 31], "initi": [2, 5, 18, 24, 25, 31], "ad": [2, 9, 11, 12, 25, 28, 30, 32], "rectifi": 2, "unit": [2, 11, 21, 28, 30, 31, 32], "hidden": [2, 21], "quantiti": [2, 9, 11, 12, 14], "especi": [2, 5, 6, 7, 8, 9, 17, 19, 20, 28, 30, 32], "characterist": [2, 18, 19, 20, 22], "learnopencv": 2, "rate": [2, 11, 18, 19, 22, 26], "critic": [2, 24, 26, 28, 32], 
"signific": [2, 11, 13, 15, 17, 18, 19, 24, 28, 31], "pivot": [2, 11, 13, 14], "pytorch": [2, 9], "immens": 2, "help": [2, 7, 11, 13, 14, 15, 17, 19, 20, 21, 24, 28, 32], "These": [2, 5, 6, 7, 11, 12, 13, 19, 20], "thei": [2, 5, 6, 7, 9, 11, 12, 13, 14, 15, 19, 21, 22, 25, 26, 27, 28, 31, 32], "contribut": [2, 14, 21, 28], "dimens": [2, 12, 13], "produc": [2, 5, 24, 25], "chan": 2, "leverag": [2, 28], "pre": [2, 13, 14, 17], "new": [2, 5, 7, 11, 12, 17, 19, 28, 30, 31, 32], "touch": 2, "exist": [2, 9, 12, 13, 17, 20, 22], "them": [2, 7, 9, 11, 12, 14, 17, 26, 28, 30, 31, 32], "follow": [2, 5, 6, 8, 9, 11, 15, 21, 25, 26, 28, 31, 32], "special": [2, 5, 6, 9, 12], "kind": [2, 12, 22, 31], "complet": [2, 9, 19, 20, 21, 30], "intuit": [2, 6], "ultim": 2, "freecodecamp": 2, "variat": [2, 19], "gate": 2, "challeng": [2, 5, 22, 31], "sequenti": [2, 9], "show": [2, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "extend": [2, 26, 30, 32], "easi": [2, 6, 17, 24, 25], "Into": 2, "friendli": [2, 9], "less": [2, 6, 7, 8, 9, 19, 20, 21, 28, 30, 31], "intimid": 2, "newcom": 2, "agent": 2, "goal": [2, 7, 20, 24, 28], "openai": 2, "gym": [2, 6], "learndatasci": 2, "previous": [2, 5, 28, 30], "mention": 2, "lai": [2, 15], "groundwork": [2, 15, 30], "tradit": [2, 28], "deeper": [2, 6, 28], "mani": [2, 9, 12, 15, 20, 22, 24, 25, 28, 30, 31, 32], "accompani": [2, 9], "instruct": [2, 5], "common": [2, 9, 19, 20, 25, 31, 32], "repurpos": 2, "get": [2, 5, 6, 11, 19, 28, 30, 31, 32], "thing": [2, 7, 9, 11, 32], "two": [2, 5, 7, 9, 11, 12, 13, 17, 21, 22, 25, 26, 27, 31], "simultan": [2, 31], "competit": 2, "respons": [2, 20, 24, 32], "snippet": [2, 28, 30, 32], "translat": [2, 32], "grasp": [2, 6, 13, 19, 27], "text": [2, 5, 11, 18, 28, 30, 32], "denois": 2, "give": [2, 7, 9, 13, 14, 22, 25, 28, 30, 31, 32], "clear": [2, 7, 22, 24, 25, 32], "along": [2, 11, 13, 19, 30, 32], "back": [2, 6, 9, 31], "arxiv": 2, "essenti": [2, 5, 6, 7, 11, 12, 13, 14, 17, 18, 19, 
21, 22, 24, 27, 28, 30, 31], "keep": [2, 9, 20, 21, 24, 28, 32], "up": [2, 9, 14, 32], "paper": 2, "vast": [2, 30], "collect": [2, 6, 11, 15], "preprint": 2, "mit": [2, 12], "review": 2, "breakthrough": 2, "written": [2, 8, 9], "novel": 2, "paradigm": 2, "projectpro": 2, "across": [2, 11, 12, 13, 18, 19, 20, 21, 28, 32], "deploy": 2, "container": 2, "kubernet": 2, "ensur": [2, 5, 7, 11, 13, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 31, 32], "robust": [2, 13, 17, 19, 20, 24], "top": [2, 12, 22, 28], "neptun": [2, 28], "landscap": 2, "2023": [2, 21, 28], "cater": 2, "consider": [2, 19, 28, 33], "cloud": [2, 5, 30], "microsoft": 2, "commun": [2, 5, 18, 26, 28], "hub": 2, "host": 2, "codespac": 2, "csv": [2, 9, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "json": [2, 9], "xml": 2, "sourc": [2, 9], "convert": [2, 17, 22, 28, 31, 32], "off": [2, 19, 32], "file": [2, 7, 9, 30], "azur": 2, "cosmo": 2, "db": 2, "storag": 2, "retriev": [2, 5, 7, 9], "log": [2, 9, 26, 28], "streamlin": [2, 32], "sql": 2, "power": [2, 5, 7, 11, 15, 22, 24, 27, 28, 30, 31, 32], "bi": 2, "uva": 2, "dl": 2, "head": [2, 17, 19, 20, 21, 22, 30, 31, 32], "harvard": 2, "llm": 2, "similar": [2, 6, 7, 11, 12, 20, 25, 30, 31], "decod": 2, "examin": [2, 19, 20, 21, 26, 30, 32], "hug": 2, "face": 2, "enabl": [2, 7, 8, 9, 11, 14, 20, 26, 30, 31], "audio": 2, "upon": [2, 9], "broader": [2, 15, 28], "signal": 2, "modif": [2, 9, 18], "outsid": [2, 6, 9, 25, 26, 32], "foster": 2, "opencoursewar": [2, 12], "full": 2, "classroom": 2, "pluralsight": 2, "mitig": 2, "kdnugget": [2, 28], "user": [2, 7, 9], "close": [2, 19, 20, 27, 30], "pertain": 2, "regulatori": 2, "adher": 2, "coursera": [2, 12], "care": [2, 18, 20], "benefit": [2, 11, 31, 32], "stanford": 2, "patient": 2, "visit": 2, "lab": 2, "procedur": [2, 9, 30], "univers": 2, "innov": 2, "extrapol": 2, "though": [2, 9, 32], "capabl": [2, 8, 9, 19], "person": [2, 6], "centric": 2, "modern": 2, "reshap": [2, 30, 32], "cryptograph": 2, "recogn": [2, 
13], "ibm": 2, "forb": 2, "driven": [2, 15, 20], "mckinsei": 2, "highlight": [2, 13, 26, 30], "infosecur": 2, "magazin": 2, "report": [2, 18, 20, 27], "probabilist": 2, "viabil": 2, "realist": 2, "edx": 2, "advic": 2, "idea": [2, 9, 13, 31], "engag": [2, 27], "inde": 2, "tip": [2, 5], "sciencedirect": 2, "summar": [2, 9, 15, 24, 25, 26, 30], "synthesi": 2, "wai": [2, 6, 7, 8, 9, 11, 12, 13, 20, 28, 32], "clearli": [2, 24, 26], "data": [4, 5, 8, 9, 12, 14, 25, 26, 27, 29, 31, 32, 33], "3": [4, 5, 6, 8, 9, 12, 14, 19, 30, 31, 32, 33], "4": [4, 5, 7, 9, 12, 14, 17, 30, 31, 32, 33], "5": [4, 5, 6, 7, 8, 12, 14, 15, 17, 25, 26, 28, 30, 32, 33], "what": [5, 6, 7, 8, 9, 19, 22, 25, 28, 30, 31, 32], "machin": [5, 6, 9, 12, 13, 17, 18, 20, 21, 28, 30, 31, 32], "learn": [5, 6, 9, 12, 13, 15, 16, 17, 18, 20, 21, 22, 24, 25, 27, 28, 31, 32], "our": [5, 6, 7, 9, 13, 25, 27, 30, 32], "go": [5, 6, 9, 30], "wide": [5, 11, 19, 26, 28, 30], "due": [5, 11, 19, 22, 25, 28, 32], "readabl": [5, 7, 8, 9], "simplic": [5, 11], "rich": 5, "ecosystem": 5, "invalu": [5, 20], "preprocess": [5, 19, 22, 28, 32, 33], "analysi": [5, 6, 11, 12, 13, 14, 15, 17, 18, 20, 29, 31, 33], "colab": 5, "account": [5, 9, 20], "jupyt": [5, 9, 19, 20, 32], "notebook": [5, 9, 19, 31, 32], "allow": [5, 6, 7, 8, 9, 12, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 27, 28, 30, 31, 32], "browser": 5, "without": [5, 9, 11, 17, 21, 22, 25, 28, 30, 32], "ani": [5, 6, 9, 11, 12, 13, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 31, 32], "setup": 5, "requir": [5, 7, 8, 9, 11, 15, 17, 19, 20, 21, 22, 24, 25, 30, 31], "gpu": 5, "some": [5, 7, 9, 12, 13, 19, 20, 28, 30, 31, 32], "computation": [5, 20, 28, 32], "heavi": 5, "local": [5, 9], "option": [5, 6, 9], "don": [5, 9, 24, 25, 26, 27, 30, 31, 32], "cpu": 5, "want": [5, 7, 13, 30, 32], "acquaint": [5, 27, 30, 32], "anywai": 5, "later": [5, 30], "consist": [5, 18, 19, 20, 21, 28], "contain": [5, 9, 17, 26, 28, 31], "either": [5, 6, 9, 12, 17], "markdown": 5, "rememb": [5, 7, 22, 24, 
27, 28], "should": [5, 6, 7, 9, 18, 20, 21, 25, 28, 30, 31], "run": [5, 8, 9, 18, 28], "order": [5, 6, 7, 11, 12, 22, 28, 32], "sinc": [5, 9, 12, 19, 30, 32], "earlier": 5, "howev": [5, 9, 12, 18, 22, 28, 32], "re": [5, 6, 9, 17, 20, 28, 30, 31], "debug": 5, "rerun": [5, 19, 32], "alwai": [5, 6, 7, 9, 13, 19, 20, 21, 28, 30, 31], "appear": [5, 14, 17, 19, 25, 26], "If": [5, 6, 9, 13, 14, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30, 31, 32], "encount": [5, 6, 13, 32], "unexpect": 5, "troubleshoot": 5, "all": [5, 6, 9, 12, 15, 17, 19, 21, 22, 25, 26, 28, 30, 31, 32], "begin": [5, 11, 12, 13], "invalid": [5, 9], "incorrect": [5, 7], "occur": [5, 15, 17, 20, 31], "chang": [5, 7, 9, 11, 20, 21, 22, 27, 30, 31], "haven": 5, "been": [5, 6, 9], "propag": 5, "By": [5, 6, 11, 20, 21, 28], "runtim": 5, "menu": [5, 9], "reflect": [5, 19, 20, 22, 24], "save": [5, 9], "regularli": 5, "autosav": 5, "drive": [5, 13], "good": [5, 19, 30], "habit": 5, "manual": 5, "flexibl": [5, 7, 9], "easili": 5, "perfect": [5, 19, 22], "oper": [5, 7, 9, 10, 18, 20, 21, 32], "print": [5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "after": [5, 6, 7, 9, 12, 18, 20, 21, 22, 28, 31], "next": [5, 7, 15, 17, 19, 20, 21, 22, 24, 25, 30, 32], "block": [5, 7, 9, 32], "whitespac": [5, 8, 9], "indent": [5, 8, 9], "brace": 5, "end": [5, 6, 7, 9, 11, 12, 17, 32], "unind": 5, "amount": [5, 6, 19, 28], "must": [5, 6, 12, 27], "commonli": [5, 6, 8, 12, 13, 17, 20, 24, 27, 28], "x": [5, 6, 8, 9, 12, 13, 14, 17, 18, 19, 21, 24, 25, 27, 28, 30, 31, 32], "0": [5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "here": [5, 6, 7, 9, 13, 19, 22, 27, 30, 32], "true": [5, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 21, 24, 26, 27, 31, 32], "meaning": [5, 9, 24, 26, 27, 30, 31], "apart": [5, 9], "tab": 5, "element": [5, 6, 7, 11, 17, 19, 28, 30, 32], "excess": [5, 19], "ignor": [5, 15, 24, 26, 27, 28], "henc": 5, "b": [5, 6, 8, 9, 11, 12, 14, 
28, 30], "harder": 5, "read": [5, 6, 8, 25, 31, 32], "lack": [5, 19, 27], "parenthes": [5, 6, 9], "bracket": 5, "lengthi": 5, "total": [5, 6, 9, 14, 17, 18, 19, 26, 28], "c": [5, 8, 9, 11, 12, 13, 32], "d": [5, 13], "f": [5, 6, 7, 8, 9, 13, 14, 15, 21, 22, 24, 25, 26, 30, 31, 32], "backslash": 5, "indic": [5, 9, 11, 13, 18, 19, 21, 26, 27, 28, 30, 31], "describ": [5, 9, 11, 12, 13, 15, 17, 19, 21, 22, 24, 26, 27, 30, 32], "note": [5, 9, 12, 25, 27, 28, 30, 31, 32], "futur": [5, 30], "carri": 5, "out": [5, 6, 9, 19, 20, 26, 30, 32], "primari": [5, 20, 24], "add": [5, 9, 11, 12, 32], "operand": [5, 6], "equal": [5, 6, 9, 12, 15, 17, 21, 22, 26, 28, 30, 31, 32], "8": [5, 7, 8, 9, 10, 11, 12, 15, 17, 20, 22, 24, 30, 31, 32, 33], "right": [5, 6, 9, 11, 12, 13, 18, 20, 21, 24, 26, 28, 30, 31], "left": [5, 6, 12, 13, 26, 28, 30], "2": [5, 8, 9, 12, 14, 19, 30, 31, 32, 33], "multipli": [5, 11, 12], "15": [5, 8, 12, 16, 17, 19, 24, 25, 30, 33], "divid": [5, 17, 18, 19, 21, 26, 30], "return": [5, 6, 7, 12, 17, 28, 31], "float": [5, 9], "floor": 5, "largest": [5, 8], "whole": 5, "smaller": [5, 19, 20, 21, 32], "modulu": 5, "remaind": 5, "exponenti": 5, "rais": [5, 7, 9], "try": [5, 6, 9, 19, 20, 21, 28, 30, 32], "someth": [5, 9], "yourself": [5, 7, 27, 30], "name": [5, 7, 9, 12, 20, 21, 22, 24, 31, 32], "10": [5, 7, 8, 9, 10, 11, 12, 13, 14, 17, 19, 20, 24, 25, 26, 27, 28, 30, 32, 33], "overwrit": 5, "whatev": [5, 9], "held": 5, "shorthand": [5, 6], "increment": 5, "decrement": 5, "equival": [5, 27, 30], "wa": [5, 7, 9, 12, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30, 32], "would": [5, 9, 15, 19, 20, 21, 22, 24, 25, 28, 30, 31, 32], "now": [5, 6, 9, 30, 31], "becom": [5, 7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30, 32], "6": [5, 7, 9, 10, 12, 13, 14, 15, 17, 22, 27, 30, 32, 33], "13": [5, 8, 12, 16, 17, 19, 24, 33], "store": [5, 6, 7, 9, 25], "todai": [5, 6, 13, 31], "three": [5, 6, 7, 11, 25, 28, 30], "integ": [5, 9, 12, 22], "decim": 5, "14": [5, 7, 8, 11, 12, 16, 17, 22, 24, 33], 
"001": 5, "charact": [5, 11], "str": [5, 7, 9], "enclos": [5, 9], "quot": 5, "hello": [5, 9], "my_integ": 5, "my_float": 5, "my_str": 5, "displai": [5, 9, 12, 19, 21, 25, 31], "ask": [5, 7], "current": [5, 7, 9, 33], "There": [5, 8, 9, 18, 30], "restrict": 5, "certain": [5, 7, 8, 12, 19, 24], "ha": [5, 6, 7, 9, 11, 12, 13, 15, 17, 19, 20, 22, 26, 28, 30, 31], "guess": [5, 31], "y": [5, 9, 11, 12, 18, 19, 21, 24, 26, 27, 28, 31, 32], "hi": 5, "constant": [5, 31], "possibl": [5, 9, 15, 20, 24, 28, 30], "down": [5, 9, 20, 28], "convinc": [5, 7], "fill": [5, 12, 21, 31], "behav": [5, 20, 21, 32], "concaten": 5, "academi": [5, 11, 12], "introduct": [5, 16, 23, 26, 29, 33], "codecademi": 5, "introduc": [5, 6, 9, 20, 22, 26, 30, 32], "en": [5, 15, 27], "wikipedia": 5, "wiki": 5, "python_syntax_and_semant": 5, "previou": [6, 9], "session": 6, "laid": 6, "basic": [6, 8, 14, 16, 19, 21, 22, 23, 24, 25, 27, 29, 32, 33], "onli": [6, 7, 9, 11, 12, 17, 18, 21, 22, 24, 25, 27, 28, 31, 32], "lesson": [6, 13, 15, 18, 24, 25, 26, 27, 28, 30, 32], "stronger": 6, "appli": [6, 11, 12, 14, 18, 20, 22, 25, 27, 28, 31, 32, 33], "reason": [6, 17, 18, 20, 25, 27, 30], "boolean": 6, "bool": [6, 7], "truth": [6, 8], "fals": [6, 7, 8, 9, 18, 19, 25], "is_rain": 6, "is_sunni": 6, "none": [6, 9, 22, 32], "signifi": 6, "noth": 6, "absenc": [6, 32], "default": [6, 9, 28], "least": [6, 9, 32], "rainbow": 6, "inequ": 6, "numer": [6, 21, 22, 26, 28, 31], "greater": [6, 7], "object": [6, 9, 11, 17, 32], "ident": [6, 12], "membership": 6, "temperatur": [6, 13, 17], "warm": 6, "cat": 6, "letter": [6, 9, 12], "compound": [6, 32], "concis": [6, 7, 8, 11, 26], "n": [6, 9, 11, 12, 13, 15, 17, 18, 19, 22, 24, 25, 27, 30, 32], "cleaner": [6, 7, 32], "part": [6, 7, 9, 12, 17, 30, 32], "mathemat": [6, 9, 11, 12, 16, 25, 33], "preced": 6, "insid": [6, 9, 25, 26, 32], "circuit": [6, 12], "stop": [6, 7], "soon": [6, 8], "think": [6, 7, 9, 12, 13], "why": [6, 11, 18, 25, 27, 30], "doesn": [6, 13, 19, 22, 27, 28], 
"matter": [6, 11, 12], "similarli": [6, 13, 32], "doe": [6, 7, 9, 12, 15, 19, 27, 28, 32], "second": [6, 9, 14, 17, 26, 30, 32], "known": [6, 7, 8, 11, 30], "even": [6, 7, 17, 18, 22, 25, 30, 31, 32], "becaus": [6, 7, 9, 13, 17, 20, 21, 28, 30, 32], "alreadi": [6, 9], "satisfi": [6, 22, 30, 31], "whether": [6, 7, 11, 13, 22, 28], "scenario": [6, 8, 9, 11, 13, 14, 20], "fallback": 6, "zero": [6, 11, 13, 17, 21, 24, 30, 31, 32], "elig": 6, "discount": 6, "senior": 6, "citizen": 6, "ag": [6, 7, 21, 22, 30, 31], "older": 6, "student": [6, 24, 25], "purchas": 6, "tuesdai": 6, "everyon": 6, "take": [6, 7, 9, 12, 31, 32], "statu": [6, 9], "def": [6, 7, 9, 28, 31], "calculate_discount": 6, "is_stud": 6, "total_purchas": 6, "is_tuesdai": 6, "discount_elig": 6, "final_pric": 6, "2f": [6, 9, 18, 30, 32], "00": [6, 19, 21], "upgrad": 6, "member": 6, "year": 6, "attend": 6, "friend": 6, "automat": [6, 9, 32], "regardless": [6, 7, 31], "four": [6, 17, 28], "repeatedli": 7, "under": [7, 11, 13, 14], "repetit": 7, "backbon": 7, "script": [7, 9], "shorter": 7, "valuabl": [7, 19, 26], "repeat": [7, 9, 18, 20, 30], "lead": [7, 9, 19, 20, 22, 28, 32], "organ": [7, 9, 15], "python": [7, 9, 16, 19, 23, 29, 32, 33], "item": [7, 9, 25], "mutabl": 7, "my_list": 7, "unord": [7, 22], "pair": [7, 9, 22, 30], "my_dict": 7, "alic": 7, "len": [7, 9, 21, 28, 30], "specifi": [7, 9, 11], "beforehand": 7, "count": [7, 8, 9, 15, 17, 19, 21, 22], "warn": [7, 9], "infinit": 7, "Be": [7, 18, 20, 24, 28], "cautiou": [7, 20, 24, 28], "never": [7, 20, 21], "difficulti": 7, "straightforward": [7, 11, 13, 18, 30], "inher": [7, 22], "extern": 7, "backward": [7, 28], "tupl": [7, 9], "prefer": [7, 12, 28, 32], "prone": [7, 30], "argument": 7, "i": [7, 8, 9, 11, 12, 17, 21, 24, 25, 27, 30, 32], "nuanc": [7, 19, 22, 25], "purpos": [7, 20, 26], "exit": 7, "prematur": 7, "met": [7, 8, 32], "serv": 7, "itself": [7, 9, 11, 17, 20], "skip": 7, "move": [7, 13, 24, 28], "onto": [7, 11], "bypass": 7, "bodi": [7, 11], 
"odd": 7, "9": [7, 8, 9, 10, 11, 12, 15, 17, 19, 20, 21, 22, 24, 25, 31, 32, 33], "finish": 7, "termin": 7, "search": [7, 9], "trigger": 7, "remind": [7, 12], "content": [7, 9, 19, 24], "search_for": 7, "enumer": [7, 9, 21], "entir": [7, 9, 13, 28, 31, 32], "java": 7, "plai": [7, 11, 12, 14, 20], "emploi": [7, 12], "accomplish": 7, "divisor": 7, "is_prim": 7, "num": 7, "answer": [7, 9, 31], "correct": [7, 9, 17, 19, 22, 25, 28, 30], "immedi": [7, 9], "feedback": [7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 30], "num_quest": 7, "num1": 7, "randint": [7, 9, 12], "num2": 7, "correct_answ": 7, "user_answ": [7, 9], "stdinnotimplementederror": [7, 9], "traceback": [7, 9, 22, 24], "recent": [7, 9, 22, 24], "last": [7, 9, 17, 19, 21, 22, 24, 32], "16": [7, 8, 9, 12, 17, 19, 21, 23], "19": [7, 8, 9, 17, 23, 33], "21": [7, 8, 11, 12, 17, 21, 29, 32, 33], "book_100daysml": [7, 9], "venv": [7, 9], "lib": [7, 9], "python3": [7, 9], "11": [7, 8, 9, 11, 12, 16, 19, 21, 24], "site": [7, 9], "ipykernel": [7, 9], "kernelbas": [7, 9], "py": [7, 9, 15, 17, 19, 20, 21, 22, 24, 25, 27, 30], "1260": [7, 9], "raw_input": [7, 9], "prompt": 7, "1258": [7, 9], "_allow_stdin": [7, 9], "1259": [7, 9], "msg": [7, 9], "frontend": [7, 9], "request": [7, 9], "1261": [7, 9], "_input_request": [7, 9], "1262": [7, 9], "1263": [7, 9], "_parent_id": [7, 9], "shell": [7, 9], "1264": [7, 9], "get_par": [7, 9], "1265": [7, 9], "password": [7, 9], "1266": [7, 9], "quizz": 7, "feel": [7, 9], "action": [8, 9, 25], "branch": 8, "therebi": 8, "increas": [8, 19, 22, 30, 32], "do_someth": 8, "voila": 8, "conjunct": 8, "do_something_els": 8, "Not": [8, 11, 12, 21], "mutual": [8, 22], "exclus": [8, 22, 28], "condition1": 8, "condition2": 8, "neither": 8, "nor": 8, "do_another_th": 8, "liken": 8, "style": [8, 32], "switch": 8, "correspond": [8, 12], "taken": [8, 12], "medium": [8, 18, 21, 22, 24, 28], "compact": 8, "ternari": 8, "quick": [8, 13, 31], "singl": [8, 9, 11, 12, 17, 30, 31, 32], "vertic": 8, "align": [8, 18, 
20, 28], "classic": 8, "job": [8, 30], "interview": 8, "1": [8, 12, 14, 30, 31, 32, 33], "fizz": 8, "instead": [8, 17, 20, 21], "buzz": 8, "7": [8, 9, 10, 11, 15, 17, 20, 22, 24, 26, 31, 32, 33], "17": [8, 9, 12, 17, 19, 21, 23, 33], "entri": [8, 12, 17, 19], "celsiu": [8, 17], "below": [8, 9, 17, 19, 30, 32], "freez": 8, "inclus": [8, 25, 28], "cold": 8, "moder": [8, 19], "abov": [8, 19, 32], "categori": [8, 17, 20, 22, 24], "predefin": [8, 11], "temp": 8, "000": [8, 17, 32], "sedentari": 8, "499": 8, "lightli": 8, "500": 8, "999": 8, "veri": [8, 9, 13, 19, 31, 32], "distinct": [9, 28, 30], "situat": [9, 22], "reusabl": 9, "better": [9, 15, 17, 19, 20, 21, 22, 24, 25, 28, 30, 31], "modular": 9, "degre": [9, 17, 19, 28, 32], "reus": 9, "keyword": 9, "colon": 9, "ey": [9, 32], "peel": 9, "resum": 9, "some_funct": 9, "pass": [9, 32], "do_math": 9, "chosen": [9, 28, 31], "my_funct": 9, "empti": 9, "convent": 9, "lowercas": 9, "underscor": 9, "match": [9, 12, 32], "familiar": [9, 18, 22, 31], "directli": [9, 20, 30], "mere": [9, 28], "being": [9, 19, 30, 31, 32], "won": 9, "until": [9, 30, 32], "declar": [9, 12], "proper": 9, "john": 9, "mandatori": 9, "overridden": 9, "reorder": 9, "shuffl": [9, 18], "global": 9, "confin": 9, "shadow": 9, "do": [9, 17, 19, 20, 21, 24, 25, 26, 27, 30, 31, 32], "who": 9, "struggl": [9, 19], "explicitli": 9, "regard": 9, "bad": 9, "anti": 9, "just": [9, 11, 12, 13, 14, 28, 30, 32], "see": [9, 28, 30, 32], "didn": 9, "h": [9, 13], "stuff": [9, 31], "append": [9, 11, 28], "ones": 9, "caus": [9, 15, 17, 19, 20, 21, 22, 24, 25, 27, 30], "typeerror": 9, "send": 9, "caller": 9, "unpack": 9, "usual": [9, 12, 31], "section": [9, 26], "ran": 9, "bring": [9, 28], "sometim": 9, "batteri": 9, "web": 9, "goe": [9, 30], "heard": 9, "slow": [9, 11, 13], "circumst": 9, "popular": [9, 30], "few": [9, 18, 19, 21, 24, 25, 30, 31, 32], "constraint": [9, 32], "rust": 9, "speed": [9, 11, 13, 21], "highli": [9, 22, 26, 27, 30, 31], "compil": [9, 24], "glue": 
9, "namespac": 9, "home": [9, 30, 32], "linux": 9, "x86_64": 9, "cpython": 9, "311": 9, "gnu": 9, "so": [9, 13, 17, 20, 21, 27, 30, 31, 32], "fact": 9, "directori": 9, "pi": [9, 15], "141592653589793": 9, "pow": 9, "forc": [9, 11], "simpli": [9, 13, 30, 31, 32], "frequent": [9, 13, 17, 20], "pyplot": [9, 11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "plt": [9, 11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "dozen": 9, "exhaust": 9, "given": [9, 11, 13, 15, 19, 30, 31], "alia": 9, "leav": [9, 30], "rest": [9, 22, 31], "sole": [9, 26, 28], "sparingli": 9, "difficult": 9, "trace": 9, "come": [9, 15], "own": [9, 15], "encapsul": [9, 13, 22], "occasion": 9, "ok": 9, "greatli": 9, "star": 9, "great": [9, 32], "caution": 9, "could": [9, 19, 25, 32], "adequ": [9, 20], "As": [9, 28, 32], "homework": [9, 28], "perus": 9, "handi": 9, "lot": 9, "dice_rol": 9, "11290791626756647": 9, "servic": 9, "txt": 9, "dump": 9, "elaps": 9, "deliber": [9, 30], "sleep": 9, "datetim": 9, "calendar": 9, "timestamp": 9, "timezon": 9, "durat": [9, 11], "01": [9, 21, 32], "08": [9, 17, 19, 22], "083772": 9, "regress": [9, 15, 21, 27, 33], "far": [9, 19], "actual": [9, 11, 17, 19, 30, 31, 32], "suppos": 9, "ax": [9, 11, 24, 26, 30, 31], "column": [9, 12, 19, 20, 21, 22, 28, 30, 31], "intercept": [9, 30, 31, 32], "x_data": 9, "x1": [9, 11, 12], "x2": [9, 12], "xn": 9, "y_data": 9, "y1": [9, 11, 12], "y2": [9, 12], "yn": 9, "y_pred": 9, "quantifi": [9, 15, 27, 28], "replac": [9, 20, 22], "synthes": 9, "everyth": 9, "ve": [9, 30], "correctli": [9, 19, 22, 28, 31], "too": [9, 24, 25, 28, 32], "low": [9, 17, 19, 26, 27, 30], "attempt": 9, "made": 9, "onc": [9, 31], "successfulli": [9, 19], "messag": 9, "user_input": 9, "enter": 9, "except": [9, 32], "valueerror": 9, "pleas": [9, 15, 17, 19, 20, 21, 22, 24, 25, 30, 32], "calculate_scor": 9, "range_s": 9, "fewer": [9, 19, 22], "worst": 9, "log2": 9, "worst_case_binary_search": 9, "interpol": 9, "extrem": [9, 
17, 19, 20, 24], "guessing_gam": 9, "min_valu": 9, "max_valu": 9, "configur": [9, 18, 31, 32], "number_to_guess": 9, "user_guess": 9, "congratul": 9, "again": [9, 32], "desir": [9, 19], "20": [9, 11, 12, 17, 19, 20, 23, 24, 26, 32, 33], "record": 9, "got": [9, 30], "wrong": 9, "my": 9, "solut": [9, 11, 13, 30, 32], "disk": 9, "bonu": 9, "quickli": 9, "around": [9, 13, 19, 21, 24, 26], "example_quiz": 9, "filenam": 9, "sample_quiz": 9, "capit": [9, 12, 25], "franc": 9, "pari": 9, "wrong_answ": 9, "rome": 9, "london": 9, "open": 9, "w": 9, "load_quiz": 9, "uncom": 9, "quiz_gam": 9, "total_scor": 9, "all_answ": 9, "chr": 9, "start_tim": 9, "strip": 9, "end_tim": 9, "time_taken": 9, "correct_answer_index": 9, "assum": [9, 17, 18, 19, 20, 21, 27, 28, 30, 31], "1f": 9, "18": [9, 12, 17, 23, 33], "pick": [9, 30], "inspir": 9, "edit": 9, "delet": 9, "phone": 9, "email": 9, "interfac": 9, "command": 9, "view": [9, 18, 26], "confirm": [9, 13], "success": [9, 15], "gracefulli": 9, "inventori": 9, "remov": [9, 17, 28, 31], "id": [9, 19, 21, 28], "stock": [9, 13], "cost": [9, 13, 20, 28], "tax": 9, "mathbf": 11, "bmatrix": [11, 12], "v_1": 11, "v_2": 11, "vdot": [11, 12], "v_n": 11, "possess": 11, "length": [11, 13, 21, 28], "denot": [11, 12, 13, 14, 15, 28], "non": [11, 19, 20, 28, 31, 32], "neg": [11, 19, 26, 27, 30, 31], "orient": 11, "rel": [11, 19, 28], "frame": [11, 17, 19], "angl": [11, 30], "coordin": [11, 12], "fulli": 11, "car": [11, 13], "travel": [11, 13], "60kph": 11, "ne": 11, "paramount": 11, "scientif": 11, "disciplin": [11, 12, 15], "versatil": 11, "veloc": [11, 13], "acceler": [11, 13], "displac": 11, "motion": 11, "civil": 11, "electr": [11, 12], "indispens": [11, 15], "classif": [11, 18, 28, 30, 33], "phenomena": [11, 15], "tackl": 11, "place": [11, 18], "background": 11, "color": [11, 13, 14, 15, 18, 20, 21, 22, 24, 26, 28, 30, 31, 32], "easier": [11, 31, 32], "handwritten": 11, "digit": [11, 22], "optic": 11, "ocr": 11, "shape": [11, 12, 17, 19, 26, 27], 
"commut": [11, 12], "associ": [11, 12, 28], "therefor": [11, 13], "yield": 11, "OR": [11, 12], "x_add": 11, "sgd": 11, "dynam": 11, "progress": 11, "overshoot": 11, "ab": 11, "bx": 11, "mulitpl": 11, "ay": 11, "xa": 11, "ya": 11, "x_scalar_mult": 11, "navig": 11, "robot": 11, "linalg": [11, 12], "arctan2": 11, "radian": 11, "9272952180016122": 11, "sentiment": 11, "mathbb": 11, "dimension": [11, 22, 28, 30, 33], "cdot": [11, 12, 13], "sum_": [11, 12, 17, 25, 30, 32], "x_i": [11, 17, 27, 30], "y_i": [11, 27, 30, 32], "respect": [11, 13, 21, 27, 28, 31], "co": 11, "theta": 11, "bilinear": 11, "orthogon": 11, "perpendicular": 11, "quad": 11, "dot_product": 11, "x1_3d": 11, "y1_3d": 11, "3d": [11, 30], "surfac": 11, "light": 11, "render": [11, 19, 32], "torqu": 11, "rotat": [11, 24, 30], "origin": [11, 12, 14, 20, 21, 30, 31], "mathbi": 11, "vmatrix": 11, "j": [11, 12, 32], "x_1": [11, 30, 31, 32], "x_2": [11, 30, 31], "x_3": 11, "y_1": 11, "y_2": 11, "y_3": 11, "a_1": 11, "a_2": 11, "a_3": 11, "b_1": 11, "b_2": 11, "b_3": 11, "sin": 11, "plane": [11, 30], "neq": 11, "exert": 11, "simplifi": [11, 28, 32], "cross_product": 11, "l2": [11, 32], "_2": 11, "ldot": [11, 32], "vector_v": 11, "l2_norm": 11, "new_posit": 11, "aerospac": 11, "safeti": 11, "stabil": [11, 19, 21], "bridg": 11, "accur": [11, 24, 27, 30, 31], "analys": [11, 17, 19, 20, 24, 25, 30, 32], "big": 11, "quicker": 11, "precis": [11, 13, 18, 19, 21, 22], "abstract": 11, "infrastructur": 11, "quantum": [11, 12], "stem": 11, "approxim": [11, 19, 28], "minut": 11, "linspac": [11, 13, 14, 32], "meshgrid": 11, "circular": 11, "quiver": 11, "xlim": [11, 30], "ylim": [11, 30], "titl": [11, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "xlabel": [11, 13, 14, 18, 20, 21, 22, 24, 25, 26, 28, 30, 31, 32], "axi": [11, 18, 19, 22, 28, 30, 31], "ylabel": [11, 13, 14, 18, 20, 21, 22, 24, 25, 26, 28, 30, 31, 32], "v1": 11, "v2": 11, "v_add": 11, "v_sub": 11, "v_scalar_mult": 11, "xy": [11, 12], 
"scale_unit": 11, "green": [11, 20, 21, 30], "red": [11, 13, 21, 22, 27, 30, 31, 32], "blue": [11, 14, 20, 21, 22, 30, 31, 32], "khan": [11, 12], "rectangular": 12, "arrang": 12, "row": [12, 17, 21, 22, 24, 31], "x_": [12, 25, 32], "12": [12, 16, 17, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33], "1n": 12, "2n": [12, 32], "ddot": 12, "m1": 12, "m2": 12, "mn": 12, "physic": [12, 13, 14], "moment": [12, 13], "inertia": 12, "tensor": 12, "graph": [12, 13, 14], "among": [12, 27, 28, 30, 32], "kickoff": 12, "fantast": 12, "coupl": 12, "grid": [12, 13, 14, 25], "nonumb": 12, "z1": 12, "subscript": 12, "isn": [12, 30], "nice": 12, "notic": [12, 32], "verifi": 12, "_": 12, "ij": [12, 32], "x1_": 12, "y1_": 12, "m_add": 12, "m_sub": 12, "rather": [12, 30], "l": 12, "obtain": [12, 25, 28, 32], "th": [12, 30], "compat": 12, "inner": 12, "circ": 12, "m_sca": 12, "m_mul": 12, "4x4": 12, "communit": 12, "m_mul1": 12, "m_mul2": 12, "113": 12, "153": 12, "114": 12, "109": 12, "106": 12, "118": 12, "112": 12, "rrr": 12, "hspace": 12, "1cm": 12, "twice": 12, "notat": 12, "transposit": 12, "x_t": 12, "det": 12, "nonzero": 12, "x_inv": 12, "inv": 12, "81474977e": 12, "62949953e": 12, "12589991e": 12, "mat_x": 12, "mat_i": 12, "mat_": 12, "mat_xi": 12, "mat_xy_t": 12, "mat_xy_t2": 12, "2nd": [12, 22], "mat_xy_inv": 12, "194": 12, "322": [12, 32], "264": 12, "405": 12, "690": 12, "668": 12, "895": [12, 20, 21, 22], "1610": 12, "81926058e": 12, "93203101e": 12, "79964834e": 12, "97348241e": 12, "05242171e": 12, "95975384e": 12, "further": [12, 17, 19, 25], "resourc": 12, "link": 12, "materi": 12, "interest": [12, 13, 15, 20, 26, 27, 30], "essenc": [13, 20], "ai": [13, 14, 28, 33], "curios": 13, "willing": 13, "akin": [13, 14], "lim_": 13, "frac": [13, 17, 18, 25, 27, 30, 32], "instantan": 13, "curv": [13, 14, 18], "imagin": [13, 32], "know": [13, 14, 30], "fast": [13, 30], "growth": 13, "popul": [13, 15, 17, 18, 19, 24, 32], "particular": [13, 19], "df": [13, 18, 20, 21, 31], "dx": [13, 14], 
"2x": 13, "3x": 13, "4x": 13, "expon": [13, 30], "impli": [13, 19, 27, 28], "concern": [13, 28], "sp": [13, 14], "s_t": 13, "s_prime_t": 13, "remain": [13, 20], "fix": [13, 15, 19, 26, 30], "locat": [13, 17, 30], "t_x": 13, "livrari": 13, "t_prime_x": 13, "conveni": 13, "straight": [13, 30], "road": 13, "p": [13, 15, 24, 28], "2t": 13, "3t": 13, "4t": 13, "p_t": 13, "p_prime_t": 13, "rectangl": 13, "width": [13, 21, 26, 28], "a_x": 13, "a_prime_x": 13, "speedomet": 13, "econom": [13, 31], "revenu": 13, "busi": 13, "safe": 13, "sensit": [13, 20, 21, 24, 28, 31, 32], "aid": [13, 27], "formul": [13, 32], "assist": 13, "node": [13, 28], "abc": [13, 14], "sai": [13, 30], "value_at_x": 13, "rate_of_chang": 13, "sub": 13, "lambda": [13, 14, 32], "func_lambda": [13, 14], "lambdifi": [13, 14], "deriv_lambda": 13, "x_val": [13, 14], "y_val": [13, 14], "tangent_lin": 13, "figur": [13, 14, 18, 19, 21, 22, 25, 26, 27, 28, 30, 32], "figsiz": [13, 14, 19, 21, 22, 25, 26, 27, 30, 31, 32], "linestyl": [13, 18, 30], "dash": [13, 30], "scatter": [13, 21, 27, 30, 31, 32], "tangenc": 13, "legend": [13, 14, 18, 20, 21, 24, 28, 30, 31, 32], "distinguish": 13, "interv": [13, 14, 15, 17], "impart": 13, "mark": 13, "stride": 13, "machinelearningmasteri": [13, 18, 20, 21, 22, 27, 28], "gentl": 13, "partial": 13, "openstax": 13, "book": 13, "page": [13, 19, 32], "towardsai": 13, "net": 13, "master": [13, 22, 27], "towardsdatasci": [13, 18, 21, 22, 24], "peopl": [13, 18], "3cd913c5cf33": 13, "deepen": [14, 15, 20, 22, 25, 28], "profound": 14, "profici": [14, 15, 24], "eager": 14, "accumul": 14, "infinitesim": 14, "small": [14, 19, 32], "piec": 14, "much": [14, 28, 30], "a_b": 14, "indefinit": 14, "antideriv": 14, "famili": 14, "whose": [14, 30], "assert": 14, "a_bf": 14, "dxf": 14, "extens": [14, 31], "roc": [14, 18, 19], "deep": [14, 15, 24, 26, 33], "indefinite_integr": 14, "definite_integr": 14, "integral_lambda": 14, "fill_between": 14, "grai": [14, 30], "alpha": [14, 15, 20, 21, 26, 28, 
30, 32], "equip": [15, 27], "keen": 15, "interrel": 15, "sens": [15, 19, 22, 28, 30], "event": 15, "infer": [15, 24, 30, 31, 32], "cannot": [15, 30], "certainti": 15, "subset": [15, 18, 19, 28], "imposs": 15, "likelihood": [15, 20], "occurr": [15, 19], "confid": [15, 28], "uniform": 15, "simplest": [15, 30], "everi": [15, 19, 32], "chanc": 15, "character": 15, "\u03bc": [15, 21], "binomi": 15, "bernoulli": 15, "trial": 15, "poisson": 15, "pd": [15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "tmp": [15, 17, 19, 20, 21, 22, 24, 25, 30], "ipykernel_288453": 15, "584559657": 15, "deprecationwarn": [15, 17, 19, 20, 21, 22, 24, 25, 30], "pyarrow": [15, 17, 19, 20, 21, 22, 24, 25, 30], "major": [15, 17, 19, 20, 21, 22, 24, 25, 30], "releas": [15, 17, 19, 20, 21, 22, 24, 25, 30], "arrow": [15, 17, 19, 20, 21, 22, 24, 25, 30], "interoper": [15, 17, 19, 20, 21, 22, 24, 25, 30], "instal": [15, 17, 19, 21, 22, 24, 25, 30, 31], "dev": [15, 17, 19, 20, 21, 22, 24, 25, 30], "54466": [15, 17, 19, 20, 21, 22, 24, 25, 30], "range_": 15, "ptp": 15, "var": [15, 17, 19, 24, 25, 26], "std_dev": [15, 25], "std": [15, 17, 19, 21, 22, 24, 25], "8722813232690143": 15, "mu": [15, 18], "1000": 15, "bin": [15, 20, 24, 25, 26, 28], "hist": [15, 20, 24, 25, 26, 31], "exp": 15, "linewidth": [15, 19], "lambda_": 15, "null": [15, 17, 19, 24], "\u03bc_0": 15, "altern": [15, 22, 24], "mu_0": 15, "05": [15, 28], "t_statist": [15, 24], "p_valu": [15, 24, 28], "ttest_1samp": [15, 24], "reject": 15, "fail": [15, 28], "5222329678670935": 15, "614117254808394": 15, "rigor": 15, "probabilitycours": 15, "prefac": 15, "php": 15, "vfu": 15, "bg": 15, "bertsekas_tsitsiklis_introduction_to_prob": 15, "pdf": 15, "1uw3qmfa9ho": 15, "plul4u3cngp60hi9atjsfglzpbnj7myag6": 15, "morningsid": 15, "libguid": 15, "raw": 17, "clean": 17, "duplic": 17, "discret": [17, 28], "qualit": 17, "nomin": 17, "blood": 17, "ordin": 17, "ratio": 17, "height": [17, 26, 31], "covid": 17, "ipykernel_288486": 17, "2223182689": 
[17, 19], "datafram": [17, 18, 19, 20, 21, 22, 28, 31], "covid_data": 17, "read_csv": [17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "inspect": [17, 19], "five": [17, 18, 19, 21], "iso_cod": 17, "contin": 17, "total_cas": 17, "new_cas": 17, "new_cases_smooth": 17, "total_death": 17, "new_death": 17, "new_deaths_smooth": 17, "female_smok": 17, "male_smok": 17, "handwashing_facil": 17, "hospital_beds_per_thousand": 17, "life_expect": 17, "human_development_index": 17, "excess_mortality_cumulative_absolut": 17, "excess_mortality_cumul": 17, "excess_mort": 17, "excess_mortality_cumulative_per_million": 17, "afg": 17, "asia": 17, "afghanistan": 17, "02": [17, 21, 31], "2020": [17, 21, 22, 28], "nan": [17, 20, 21, 22], "746": 17, "511": 17, "tail": [17, 19, 26], "5813": 17, "nga": 17, "africa": 17, "nigeria": 17, "06": [17, 20, 25, 28, 32], "2022": 17, "265741": 17, "236": 17, "286": 17, "3155": 17, "949": 17, "539": 17, "5814": 17, "07": [17, 18], "5815": 17, "265816": 17, "5816": 17, "09": 17, "5817": 17, "info": [17, 19], "rangeindex": [17, 19], "5818": 17, "dtype": [17, 19, 20, 21, 22, 28, 31], "int64": [17, 19, 20, 21], "5788": 17, "float64": [17, 19, 20, 22, 31], "5638": 17, "5627": 17, "5596": 17, "total_cases_per_million": 17, "new_cases_per_million": 17, "new_cases_smoothed_per_million": 17, "total_deaths_per_million": 17, "new_deaths_per_million": 17, "new_deaths_smoothed_per_million": 17, "reproduction_r": 17, "5566": 17, "icu_pati": 17, "2610": 17, "icu_patients_per_million": 17, "hosp_pati": 17, "hosp_patients_per_million": 17, "weekly_icu_admiss": 17, "weekly_icu_admissions_per_million": 17, "weekly_hosp_admiss": 17, "934": 17, "weekly_hosp_admissions_per_million": 17, "total_test": 17, "3174": 17, "new_test": 17, "2948": 17, "total_tests_per_thousand": 17, "new_tests_per_thousand": 17, "new_tests_smooth": 17, "4114": 17, "new_tests_smoothed_per_thousand": 17, "positive_r": 17, "3440": 17, "tests_per_cas": 17, "tests_unit": 17, "4156": 17, 
"total_vaccin": 17, "2104": 17, "people_vaccin": 17, "2051": 17, "people_fully_vaccin": 17, "2004": 17, "total_boost": 17, "1170": 17, "new_vaccin": 17, "1827": 17, "new_vaccinations_smooth": 17, "3658": 17, "total_vaccinations_per_hundr": 17, "people_vaccinated_per_hundr": 17, "people_fully_vaccinated_per_hundr": 17, "total_boosters_per_hundr": 17, "new_vaccinations_smoothed_per_million": 17, "new_people_vaccinated_smooth": 17, "new_people_vaccinated_smoothed_per_hundr": 17, "stringency_index": 17, "5699": 17, "population_dens": 17, "median_ag": 17, "aged_65_old": 17, "aged_70_old": 17, "gdp_per_capita": 17, "extreme_poverti": 17, "2922": 17, "cardiovasc_death_r": 17, "diabetes_preval": 17, "4860": 17, "1913": 17, "4863": 17, "421": 17, "mb": 17, "covid_datanew": 17, "bar": [17, 18, 22, 25, 26, 27, 28, 30], "newcase_mean": 17, "8814": 17, "365761430045": 17, "middl": [17, 19, 26], "sort": [17, 25], "newcase_median": 17, "261": 17, "moderesult": 17, "modal": [17, 26], "thu": [17, 19], "newcase_mod": 17, "805": 17, "\u03c3\u00b2": [17, 21], "newcase_vari": 17, "451321915": 17, "9280954": 17, "451399502": 17, "6421969": 17, "ddof": [17, 19], "newcase_stdev": 17, "stdev": [17, 19], "21246": 17, "164421895": 17, "freedom": [17, 28, 32], "unbias": [17, 18], "mle": 17, "stackoverflow": 17, "62938495": 17, "stand": [17, 28], "alon": 17, "mislead": [17, 22, 24], "covid_newcases_max": 17, "covid_newcases_min": 17, "287149": 17, "iqr": [17, 25, 26], "sever": [17, 19, 20, 31], "fall": [17, 19, 26], "q1": [17, 19, 26], "q3": [17, 19, 26], "parametr": [17, 28], "segment": 17, "sale": 17, "depict": [17, 26], "quantil": [17, 19], "25th": [17, 19], "percentil": [17, 19], "75th": [17, 19], "3666": 17, "3642": 17, "nehalbirla": 17, "vehicl": 17, "cardekho": 17, "quantinsti": 17, "experfi": 17, "clt": 18, "sim": 18, "unknown": 18, "observ": [18, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32], "homogen": [18, 19, 28], "subgroup": 18, "proport": [18, 19, 22, 26, 28, 31], "strata": 18, 
"stratum": 18, "sklearn": [18, 19, 20, 21, 22, 28, 30, 31, 32], "model_select": [18, 19, 21, 28, 30, 31, 32], "train_test_split": [18, 19, 21, 28, 30, 31, 32], "train_set": 18, "test_set": 18, "test_siz": [18, 19, 21, 28, 30, 31, 32], "random_st": [18, 19, 20, 21, 28, 30, 31, 32], "pseudo": 18, "reproduc": 18, "softwar": 18, "talk": 18, "intern": 18, "imbalanc": [18, 19], "stratifiedshufflesplit": 18, "n_split": 18, "train_index": 18, "test_index": 18, "stratum_column": 18, "strat_train_set": 18, "loc": [18, 26, 30], "strat_test_set": 18, "fold": [18, 19], "kfold": 18, "cross_val_scor": [18, 19], "ensembl": [18, 19, 29], "randomforestclassifi": [18, 19], "kf": 18, "df_featur": 18, "df_target": 18, "cv": [18, 19], "stratifiedkfold": 18, "skf": 18, "x_train": [18, 19, 21, 28, 30, 31, 32], "x_test": [18, 19, 21, 28, 30, 31, 32], "y_train": [18, 19, 21, 28, 30, 31, 32], "y_test": [18, 19, 21, 28, 30, 31, 32], "subject": 18, "suit": [18, 30], "download": [18, 19], "wine": [18, 24], "100daysofml_notebook": [18, 21, 22], "accord": [18, 19, 28], "wine_data": [18, 19, 24, 25, 26, 27], "winequ": 18, "standardscal": [18, 19, 21, 28, 31, 32], "labelencod": [18, 19, 22, 28], "fillna": [18, 19, 20, 21, 31], "inplac": [18, 19, 20, 21, 31], "categorical_column": [18, 19], "fit_transform": [18, 19, 20, 21, 22, 28, 31, 32], "scaler": [18, 19, 21, 31, 32], "wine_data_sc": [18, 19], "drop": [18, 19, 22, 28, 31, 32], "accuracy_scor": [18, 19, 28], "confusion_matrix": [18, 19], "recal": [18, 19, 21, 22], "f1": [18, 19], "classification_report": [18, 19], "roc_curv": 18, "auc": [18, 19], "predict_proba": 18, "fpr": 18, "tpr": 18, "threshold": [18, 28], "roc_auc": 18, "darkorang": 18, "lw": 18, "navi": 18, "receiv": 18, "outlin": 18, "confidenti": 18, "conduct": [18, 19, 24, 26, 28, 31], "befor": [18, 20, 21, 22, 24, 27, 28, 32], "unseen": [18, 19, 28, 31, 32], "generaliz": 18, "leak": [18, 31], "vigil": 18, "augment": 18, "datasciencewizard": 18, "49a959c95fa1": 18, "8ef4e3a97562": 18, 
"analyticsvidhya": [18, 20, 21, 22, 25, 28], "2021": [18, 20, 25], "jfrog": 18, "ipykernel_288519": 19, "wine_qu": [19, 24, 25, 26, 27], "acid": [19, 26], "volatil": 19, "citric": 19, "residu": [19, 25, 26, 30, 32], "sugar": [19, 25, 26], "chlorid": 19, "sulfur": [19, 26], "dioxid": [19, 26], "ph": [19, 25, 26], "sulphat": 19, "alcohol": [19, 24, 25, 26], "076": 19, "9978": 19, "098": 19, "9968": 19, "04": [19, 21], "092": 19, "9970": 19, "075": 19, "9980": 19, "1138": 19, "510": 19, "99574": 19, "1592": 19, "1139": 19, "620": [19, 32], "068": 19, "99651": 19, "1593": 19, "1140": 19, "600": 19, "090": 19, "99490": 19, "1594": 19, "1141": 19, "550": 19, "062": 19, "99512": 19, "1595": 19, "1142": 19, "645": 19, "99547": 19, "1597": 19, "1143": 19, "116": 19, "kb": 19, "copi": [19, 20, 21], "wine_datanew": 19, "winequality_mean": 19, "657": 19, "winequality_median": 19, "winequality_var": 19, "6488": 19, "extent": 19, "somewhat": [19, 32], "heterogen": 19, "alongsid": 19, "holist": 19, "winequality_stdev": 19, "8058": 19, "tend": [19, 26, 32], "wider": 19, "typic": [19, 25, 32], "pronounc": 19, "pictur": 19, "winequality_max": 19, "winequality_min": 19, "maximum": [19, 21, 26], "minimum": [19, 21, 26], "highest": [19, 30], "lowest": [19, 30], "presenc": [19, 21, 22, 25, 26], "exploratori": [19, 25, 26, 28, 33], "reveal": 19, "factor": [19, 27, 28, 31, 32], "upper": [19, 26, 30], "third": [19, 26], "closer": [19, 30, 31], "half": 19, "narrow": [19, 26], "higher": [19, 28, 31, 32], "sn": [19, 21, 22, 24, 25, 26, 27, 31], "correlation_matrix": [19, 24], "corr": [19, 21, 24, 27], "annot": [19, 24, 27], "cmap": [19, 24, 27], "coolwarm": 19, "attribut": [19, 28], "decreas": 19, "6731": 19, "6815": 19, "6852": 19, "4074": 19, "5442": 19, "4947": 19, "5463": 19, "2577": 19, "4849": 19, "chemic": 19, "properti": [19, 28], "trust": [19, 32], "On": [19, 30], "unabl": [19, 32], "nbviewer": [19, 32], "nbsp": [19, 32], "randomforestclassifierifittedrandomforestclassifi": 19, 
"9782": 19, "strong": [19, 24, 27], "significantli": [19, 20, 22, 26, 27, 28], "outnumb": 19, "tell": [19, 30], "categorical_featur": 19, "x_train_scal": [19, 31], "x_test_scal": [19, 31], "diagon": 19, "No": [19, 20, 22], "misclassif": 19, "misclassifi": 19, "failur": 19, "imbal": 19, "zero_divis": 19, "229": 19, "macro": 19, "avg": 19, "breakdown": 19, "identif": 19, "poor": 19, "were": [19, 32], "resampl": 19, "underrepres": 19, "cross_val_scores_round": 19, "9825": 19, "9737": 19, "9345": 19, "9476": 19, "9605": 19, "9649": 19, "slight": 19, "fairli": 19, "stabl": [19, 31], "overli": [19, 30], "advis": 19, "intermedi": [20, 21, 22, 24, 25], "mar": 20, "missing": 20, "unobserv": 20, "titanic_data": [20, 21, 22], "isnul": [20, 21, 31], "passengerid": [20, 21, 22], "pclass": [20, 21], "sex": [20, 21, 22, 31], "892": [20, 21, 22], "kelli": [20, 21, 22], "mr": [20, 21, 22], "jame": [20, 21, 22], "male": [20, 21, 22], "893": [20, 21, 22], "wilk": [20, 21, 22, 28], "ellen": [20, 21, 22], "femal": [20, 21, 22], "894": [20, 21, 22], "myle": [20, 21, 22], "thoma": [20, 21, 22], "franci": [20, 21, 22], "wirz": [20, 21, 22], "albert": [20, 21, 22], "896": [20, 21, 22], "hirvonen": [20, 21, 22], "alexand": [20, 21, 22], "helga": [20, 21, 22], "lindqvist": [20, 21, 22], "sibsp": [20, 21, 22], "parch": [20, 21, 22], "ticket": [20, 21, 22], "fare": [20, 21, 22], "cabin": [20, 21], "surviv": [20, 21, 22], "330911": [20, 21, 22], "8292": [20, 21, 22], "363272": [20, 21, 22], "0000": [20, 21, 22], "240276": [20, 21, 22], "6875": [20, 21, 22], "315154": [20, 21, 22], "6625": [20, 21, 22], "3101298": [20, 21, 22], "2875": [20, 21, 22], "327": [20, 21], "ipykernel_288555": 20, "245541981": 20, "unduli": 20, "preserv": [20, 21, 22], "embarked_mod": 20, "retain": 20, "distort": [20, 31], "unaffect": 20, "conclus": [20, 24, 26], "684399944": 20, "futurewarn": [20, 21], "col": [20, 21, 22], "knnimput": 20, "n_neighbor": 20, "numeric_column": 20, "select_dtyp": [20, 22], "closest": 20, 
"exhibit": [20, 30], "captur": [20, 28, 32], "smooth": [20, 26], "inaccur": 20, "expens": 20, "predictor": [20, 27, 30, 31, 32], "poorli": [20, 32], "sophist": [20, 28], "intertwin": 20, "experiment": [20, 28], "enable_iterative_imput": 20, "iterativeimput": 20, "linear_model": [20, 30, 31, 32], "bayesianridg": 20, "iterative_imput": 20, "missing_valu": 20, "max_it": [20, 32], "titanic_data_imput": 20, "bayesian": 20, "incorpor": 20, "prior": 20, "belief": 20, "uncertainti": [20, 28], "posterior": 20, "robin": 20, "fashion": 20, "gaug": 20, "frequenc": [20, 22, 24, 25, 26, 28], "titanic_data_origin": 20, "dropna": 20, "hasn": 20, "alter": [20, 21, 32], "lookout": 20, "unusu": [20, 24, 26], "spike": 20, "weren": 20, "robject": 20, "importr": 20, "pandas2ri": 20, "globalenv": 20, "choosecranmirror": 20, "ind": 20, "magic": 20, "load_ext": 20, "ipython": 20, "install_packag": 20, "remot": 20, "install_github": 20, "njtiernei": 20, "naniar": 20, "r_df": 20, "mcar_test": 20, "consult": 20, "simplilearn": [20, 21], "theanalysisfactor": 20, "seven": 20, "dataaspir": 20, "\u03c3z": 21, "xx": 21, "\u03bc\u03bc": 21, "\u03c3\u03c3": 21, "center": [21, 24, 28], "pro": 21, "con": 21, "bound": [21, 28], "rescal": 21, "xnorm": 21, "xmin": 21, "xmax": 21, "xminxmin": 21, "xmaxxmax": 21, "overpow": 21, "knn": 21, "minmaxscal": 21, "load_iri": 21, "iris_data": [21, 28], "feature_nam": [21, 25], "iris_standard": 21, "min_max_scal": 21, "iris_min_max_sc": 21, "inter": 21, "comprehend": 21, "readi": 21, "iloc": [21, 26, 32], "minmaxscalermin_max_scal": 21, "sepallengthcm": [21, 28], "subplot": [21, 22, 26, 30, 31, 32], "histplot": [21, 26], "kde": [21, 26], "accordingli": 21, "sepalwidthcm": 21, "sepal": [21, 28], "snoop": 21, "petallengthcm": [21, 28], "petalwidthcm": [21, 28], "speci": [21, 28], "setosa": [21, 28], "ipykernel_288580": 21, "2131166956": 21, "dancerworld60": 21, "4bb910900ab7": 21, "awar": [21, 24, 28, 31], "e44df654f185": 21, "nsummari": 21, "nmiss": 21, "418": [21, 
22], "000000": [21, 22, 28], "332": 21, "1100": [21, 30], "500000": 21, "265550": [21, 22], "272590": 21, "447368": 21, "392344": 21, "120": 21, "810458": 21, "841838": [21, 22], "181209": 21, "896760": 21, "981429": 21, "170000": 21, "996": 21, "250000": 21, "1204": 21, "750000": 21, "1309": 21, "417": 21, "627188": 21, "385167": 21, "907576": 21, "487218": 21, "895800": 21, "454200": 21, "512": 21, "329200": 21, "1279951594": 21, "x_train_standard": 21, "x_test_standard": 21, "x_train_min_max": 21, "x_test_min_max": 21, "tight_layout": [21, 22, 26, 30, 31, 32], "scalingprint": 21, "nstatist": [21, 22], "334": 21, "262": 21, "333": 21, "269461": 21, "115763": 21, "470060": 21, "404192": 21, "909135": 21, "844961": 21, "655775": 21, "944719": 21, "937113": 21, "054690": 21, "330000": 21, "887500": 21, "340000e": 21, "620000e": 21, "330000e": 21, "233742e": 21, "711995e": 21, "127373e": 21, "722904e": 21, "267524e": 21, "001500e": 21, "001914e": 21, "001505e": 21, "504644e": 21, "036246e": 21, "983123e": 21, "319630e": 21, "367217e": 21, "231816e": 21, "006539e": 21, "658800e": 21, "130032e": 21, "873714e": 21, "073537e": 21, "617915e": 21, "606225e": 21, "136788e": 21, "982518e": 21, "186412e": 21, "201500e": 21, "634731": 21, "393627": 21, "058757": 21, "044910": 21, "072042": 21, "422481": 21, "193680": 21, "118090": 21, "104124": 21, "113315": 21, "273160": 21, "015395": 21, "352451": 21, "028213": 21, "511035": 21, "125000": 21, "063436": 21, "alexisbcook": 21, "primarili": 22, "intrins": 22, "gender": 22, "rank": 22, "school": 22, "bachelor": 22, "satisfact": 22, "unsatisfi": 22, "neutral": 22, "pose": 22, "cherbourg": 22, "queenstown": 22, "southampton": 22, "3rd": 22, "c85": 22, "c123": 22, "e46": 22, "curs": [22, 28], "elimin": [22, 28, 32], "treat": 22, "linearli": 22, "spars": [22, 32], "category_encod": 22, "ce": 22, "binaryencod": 22, "titanic_binary_encod": 22, "onehotencod": 22, "titanic_one_hot_encod": 22, "titanic_one_hot_encoded_df": 22, "toarrai": 
22, "get_feature_names_out": 22, "pclass_encod": 22, "hierarchi": 22, "leakag": 22, "dummi": 22, "trap": 22, "multicollinear": [22, 27, 31, 32], "mind": [22, 24, 30, 32], "fictiti": 22, "pairwis": [22, 24, 25], "mostli": 22, "preval": 22, "1s": 22, "mix": 22, "passeng": 22, "sink": 22, "ipykernel_288616": 22, "3916798240": 22, "modulenotfounderror": 22, "modul": [22, 33], "ndata": 22, "nuniqu": 22, "363": 22, "nbinari": 22, "value_count": 22, "nameerror": [22, 24], "embarked_c": 22, "embarked_q": 22, "embarked_": 22, "nlabel": 22, "b57": 22, "b59": 22, "b63": 22, "b66": 22, "freq": 22, "270": 22, "244019": 22, "110048": 22, "645933": 22, "430019": 22, "313324": 22, "478803": 22, "aiskunk": 22, "d6296697a40f": 22, "547707acf4e5": 22, "305f3361fd02": 22, "uncov": 24, "trend": [24, 25, 33], "draw": [24, 26, 30, 32], "adopt": 24, "ethic": [24, 33], "ipykernel_288649": 24, "955872667": [24, 25], "spot": 24, "mistak": [24, 32], "erron": 24, "summari": [24, 25, 30], "ts": [24, 25, 27], "wise": [24, 26, 31], "preliminari": 24, "carefulli": 24, "overplot": 24, "violinplot": [24, 25], "diverg": 24, "scheme": 24, "hard": 24, "vmin": 24, "vmax": 24, "diverging_palett": 24, "220": 24, "200": 24, "set_xticklabel": 24, "get_xticklabel": 24, "horizontalalign": 24, "657042869641295": 24, "6493527188260838": 24, "8058242481000952": 24, "asymmetri": [24, 26], "tailed": 24, "2867917004538591": 24, "3146639385893346": 24, "nearli": 24, "enough": 24, "claim": 24, "hypothes": [24, 25, 27], "ii": 24, "popmean": 24, "811761283140333": 24, "0619222323076622e": 24, "compel": 24, "manner": 24, "coincid": 24, "spuriou": 24, "briefli": [24, 26], "main": 24, "seller": 24, "appendix": [24, 26], "visualis": 24, "8151e63ce8f0": 24, "boadziedaniel": 24, "890dc0e79799": 24, "datasciencedojo": 24, "ipykernel_288689": 25, "heavili": 25, "mean_valu": 25, "median_valu": 25, "mode_valu": 25, "oversimplifi": 25, "realiti": [25, 30], "complic": 25, "stori": 25, "symmetri": [25, 26], "interquartil": [25, 
26], "whisker": [25, 26], "brief": 25, "clariti": 25, "sure": 25, "narr": 25, "meaningless": 25, "analysis_result": 25, "variance_valu": 25, "std_dev_valu": 25, "nstat": 25, "stat_nam": 25, "stat_valu": 25, "442111402741325": 25, "1711473380358497": 25, "0821956098764445": 25, "3110148731408575": 25, "02454362762448039": 25, "15666405977275194": 25, "5321522309711284": 25, "8385121764551762": 25, "3559174666826799": 25, "market": 25, "hcbravo": 25, "introdatasci": 25, "bookdown": 25, "econometricstutor": 25, "expand": [26, 32], "deepli": 26, "chart": 26, "symmetr": 26, "evenli": 26, "longer": 26, "peak": 26, "unimod": 26, "bimod": 26, "multimod": 26, "spiki": 26, "hide": 26, "value1": 26, "value2": 26, "valuen": 26, "skyblu": 26, "freedman": 26, "diaconi": 26, "disregard": 26, "quartil": 26, "span": 26, "q2": 26, "side": [26, 31], "reli": [26, 28, 30], "descriptive_stat": 26, "methodolog": 26, "plotli": 26, "machinelearningplu": 26, "oreilli": 26, "9781491912126": 26, "ch04": 26, "interconnected": 27, "strength": [27, 32], "direct": 27, "wherea": [27, 32], "monoton": 27, "rho": 27, "d_i": 27, "r_": 27, "rg": 27, "rg_x": 27, "rg_y": 27, "pinpoint": 27, "pearson_corr": 27, "spearman_corr": 27, "cm": 27, "causat": 27, "meet": [27, 28], "corr_matrix": 27, "surpris": 27, "thereof": 27, "deliver": 27, "stage": [27, 30], "thoughtfulli": 27, "geo": 27, "fu": 27, "berlin": 27, "de": 27, "soga": 27, "inferenti": 27, "sound": 28, "heart": 28, "elev": 28, "summat": 28, "unpredict": 28, "ss": 28, "aa": 28, "randomli": 28, "incorrectli": 28, "faster": [28, 31], "intens": 28, "jump": 28, "150": 28, "virginica": 28, "versicolor": 28, "petal": 28, "disord": 28, "decid": 28, "criterion": 28, "puriti": 28, "decisiontreeclassifi": 28, "clf_entropi": 28, "y_pred_entropi": 28, "clf_gini": 28, "y_pred_gini": 28, "importances_entropi": 28, "feature_importances_": 28, "importances_gini": 28, "9777777777777777": 28, "agre": 28, "worth": 28, "redund": 28, "tweak": 28, "prune": 28, "joint": 
28, "properli": 28, "tricki": 28, "invari": 28, "suffer": 28, "causal": [28, 30], "misinterpret": 28, "feature_select": 28, "mutual_info_classif": 28, "x_normal": 28, "mi": 28, "08486414": 28, "49537028": 28, "24562179": 28, "9858617": 28, "99351315": 28, "df1": 28, "df2": 28, "shapiro": 28, "leven": 28, "bartlett": 28, "hoc": 28, "factori": 28, "selectkbest": 28, "f_classif": 28, "k_best_featur": 28, "score_func": 28, "pvalues_": 28, "scores_": 28, "6f": 28, "588": 28, "235294": 28, "119": [28, 32], "264502": 28, "364461": 28, "1179": 28, "034328": 28, "959": 28, "324406": 28, "systemat": 28, "forward": 28, "justifi": 28, "statsmodel": 28, "api": 28, "sm": 28, "label_encod": 28, "forward_select": 28, "significance_level": 28, "initial_featur": 28, "tolist": 28, "best_featur": 28, "remaining_featur": 28, "new_pval": 28, "new_column": 28, "ol": 28, "add_const": 28, "pvalu": 28, "min_p_valu": 28, "idxmin": 28, "selected_featur": 28, "pure": 28, "accuracy_entropi": 28, "accuracy_gini": 28, "deem": 28, "argsort": [28, 32], "barh": 28, "ytick": 28, "features_to_keep_entropi": 28, "features_to_keep_gini": 28, "refin": 28, "technic": 28, "realm": [28, 30], "clf_entropy_deep": 28, "max_depth": 28, "y_pred_entropy_deep": 28, "clf_gini_deep": 28, "y_pred_gini_deep": 28, "victorzh": 28, "mlearn": 28, "82c2123bd548": 28, "codex": 28, "cd9f99a26e0d": 28, "advanc": [29, 30, 33], "pip": [30, 31], "unlabel": 30, "cornerston": 30, "importantli": 30, "contrast": 30, "counterpart": 30, "upcom": 30, "y_intercept": 30, "entail": 30, "establish": 30, "slope": 30, "indpend": 30, "hat": 30, "beta": 30, "_1": 30, "_0": 30, "isol": [30, 32], "still": [30, 32], "consequ": 30, "foot": 30, "_i": 30, "2_i": 30, "wors": 30, "linearregress": [30, 31, 32], "intercept_": [30, 32], "coef_": [30, 31, 32], "marker": 30, "o": 30, "vline": 30, "ymin": 30, "ymax": 30, "nsse": 30, "fontsiz": 30, "bbox": 30, "dict": 30, "facecolor": 30, "yellow": 30, "inferior": 30, "inferior_slop": 30, 
"inferior_intercept": 30, "inferior_predict": 30, "inferior_ss": 30, "purpl": 30, "shown": 30, "scatterplot": 30, "yet": 30, "dimenion": 30, "clinic": 30, "subspac": 30, "ambient": 30, "human": 30, "meaningfulli": 30, "teach": 30, "bend": 30, "cancel": 30, "penal": [30, 32], "2r": 30, "farther": 30, "pm": 30, "thank": 30, "strictli": [30, 31], "inclin": 30, "mine": 30, "static": 30, "anim": 30, "confabul": [30, 31], "against": 30, "publicli": 30, "toi": 30, "housing_data": 30, "squarefeet": 30, "bedroom": 30, "bathroom": 30, "850": 30, "200000": 30, "suburban": 30, "900": 30, "205000": 30, "urban": 30, "1200": 30, "210000": 30, "rural": 30, "950": 30, "215000": 30, "220000": 30, "ipykernel_288722": 30, "737031205": 30, "aim": 30, "reserv": 30, "wasn": 30, "memor": 30, "2d": 30, "suffici": 30, "footag": 30, "sq": 30, "ft": 30, "107": 30, "6641786": 30, "103044": 30, "81439951799": 30, "datapoint": 30, "x_n": [31, 32], "environment": 31, "practition": 31, "beta_0": [31, 32], "beta_1x_1": [31, 32], "beta_2x_2": [31, 32], "beta_nx_n": [31, 32], "beta_1": [31, 32], "beta_2": 31, "beta_n": [31, 32], "hold": 31, "homoscedast": [31, 32], "inflat": 31, "vif": 31, "peek": [31, 32], "hope": 31, "achiev": [31, 32], "incom": 31, "spending_scor": 31, "hopefulli": 31, "ye": 31, "customer_data": [31, 32], "x_var": 31, "y_var": 31, "reg": 31, "fig": 31, "suptitl": 31, "versu": 31, "spend": 31, "eventu": 31, "rare": 31, "x_test_scaled_df": 31, "set_titl": 31, "explanatori": 31, "disproportion": [31, 32], "penalti": [31, 32], "undesir": 31, "punish": 31, "mean_squared_error": [31, 32], "r2_score": [31, 32], "r2": [31, 32], "3183": 31, "330047035957": 31, "13751568541102366": 31, "34198373": 31, "53651751": 31, "put": 31, "predict_original_scale_datafram": 31, "input_df": 31, "input_sc": 31, "50000": 31, "crunch": 31, "31964941598494": 31, "diabet": 31, "toy_dataset": 31, "abl": 31, "load_diabet": 31, "as_fram": [31, 32], "bmi": 31, "bp": 31, "s1": 31, "s2": 31, "s3": 31, "s4": 31, 
"s5": 31, "s6": 31, "038076": 31, "050680": 31, "061696": 31, "021872": 31, "044223": 31, "034821": 31, "043401": 31, "002592": 31, "019907": 31, "017646": 31, "001882": 31, "044642": 31, "051474": 31, "026328": 31, "008449": 31, "019163": 31, "074412": 31, "039493": 31, "068332": 31, "092204": 31, "085299": 31, "044451": 31, "005670": 31, "045599": 31, "034194": 31, "032356": 31, "002861": 31, "025930": 31, "089063": 31, "011595": 31, "036656": 31, "012191": 31, "024991": 31, "036038": 31, "034309": 31, "022688": 31, "009362": 31, "005383": 31, "036385": 31, "003935": 31, "015596": 31, "008142": 31, "031988": 31, "046641": 31, "151": 31, "141": 31, "206": 31, "135": 31, "fun": [31, 32], "statolog": 31, "astut": 32, "dure": 32, "perfectli": 32, "mx": 32, "steer": 32, "unlimit": 32, "arbitrarili": 32, "unlik": 32, "beta_2x_1": 32, "beta_nx_1": 32, "polynomialfeatur": 32, "demo": 32, "seed": 32, "exactli": 32, "newaxi": 32, "linear_regressor": 32, "y_pred_linear": 32, "poly_features2": 32, "x_poly2": 32, "poly_regressor2": 32, "y_pred_poly2": 32, "poly_features3": 32, "x_poly3": 32, "poly_regressor3": 32, "y_pred_poly3": 32, "poly_features5": 32, "x_poly5": 32, "poly_regressor5": 32, "y_pred_poly5": 32, "r2_linear": 32, "r2_poly2": 32, "r2_poly3": 32, "r2_poly5": 32, "yi": 32, "sorted_axi": 32, "x_1x_2": 32, "2x_2": 32, "appar": 32, "autocorrel": 32, "violat": 32, "drawn": 32, "expans": 32, "bundl": 32, "forget": 32, "preprocessor": 32, "poli": 32, "machineri": 32, "although": 32, "deploi": 32, "reach": 32, "via": 32, "coef": 32, "x_plot": 32, "y_plot": 32, "x27": 32, "pipelineifittedpipelin": 32, "polynomialfeaturespolynomialfeatur": 32, "linearregressionlinearregress": 32, "00193104": 32, "3848762": 32, "00349368": 32, "16571691": 32, "32345315": 32, "absolut": 32, "shrink": 32, "neglig": 32, "littl": 32, "ordinari": 32, "beta_j": 32, "l1": 32, "illustr": 32, "lasso_poli": 32, "10000": 32, "55260439": 32, "72240286": 32, "90811749": 32, "66350745": 32, 
"19943027115730638": 32, "arbitrari": 32, "shrunk": 32, "trade": 32, "opposit": 32, "mainli": 32, "ridge_poli": 32, "05626925": 32, "75667935": 32, "06069885": 32, "96459941": 32, "14654769263455236": 32, "california": 32, "thought": 32, "art": 32, "starter": 32, "fetch_california_h": 32, "fetch": 32, "medinc": 32, "houseag": 32, "averoom": 32, "avebedrm": 32, "aveoccup": 32, "latitud": 32, "longitud": 32, "3252": 32, "984127": 32, "023810": 32, "555556": 32, "122": 32, "3014": 32, "238137": 32, "971880": 32, "2401": 32, "109842": 32, "2574": 32, "288136": 32, "073446": 32, "496": 32, "802260": 32, "6431": 32, "817352": 32, "073059": 32, "558": 32, "547945": 32, "8462": 32, "281853": 32, "081081": 32, "565": 32, "181467": 32, "standardscalerstandardscal": 32, "ridgeridg": 32, "2980353830641": 32, "472": 32, "3621683634644": 32, "concret": 32, "fraction": 32, "dollar": 32, "20046": 32, "6812": 32, "192201": 32, "022284": 32, "1392": 32, "877437": 32, "70k": 32, "53k": 32, "scientiast": 33, "week": 33, "supervis": 33, "unsupervis": 33, "reduct": 33, "capston": 33, "project": 33, "join": 33, "invit": 33, "v4dsssc5": 33}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"100": [0, 2, 33], "dai": [0, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32, 33], "machin": [0, 1, 2, 11, 14, 33], "learn": [0, 1, 2, 11, 14, 29, 30, 33], "challeng": [0, 1, 8, 33], "overview": [0, 2, 17, 22, 30, 33], "cours": [0, 4, 10, 16, 23, 29, 33], "structur": [0, 2, 4, 7, 8, 9, 10, 16, 23, 29, 33], "modul": [0, 1, 2, 4, 9, 10, 16, 23, 29], "1": [0, 1, 2, 4, 5, 7, 9, 10, 11, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28], "introduct": [0, 1, 2, 4, 10, 11, 12, 13, 14, 15, 17, 21, 22, 24, 25, 28, 30, 31, 32], "python": [0, 1, 2, 4, 5, 6, 8, 10, 11, 12, 13, 14, 15, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31], "basic": [0, 1, 2, 4, 5, 7, 9, 10, 11, 12, 13, 15, 17, 20, 30], "mathemat": [0, 1, 2, 4, 10, 13, 14, 15, 18, 21, 22, 27, 30], 
"week": [0, 1, 2, 4, 9, 10, 16, 23, 29], "2": [0, 1, 2, 4, 6, 7, 10, 11, 13, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28], "data": [0, 1, 2, 6, 7, 11, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 30], "preprocess": [0, 1, 2, 16, 17, 18, 21, 23, 31], "exploratori": [0, 1, 2, 16, 23, 24], "analysi": [0, 1, 2, 16, 19, 21, 22, 23, 24, 25, 26, 27, 28, 30], "3": [0, 1, 2, 7, 11, 13, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29], "4": [0, 1, 2, 8, 11, 13, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28], "supervis": [0, 1, 2, 29, 30], "regress": [0, 1, 2, 20, 28, 29, 30, 31, 32], "classif": [0, 1, 2, 19, 29], "5": [0, 1, 2, 9, 11, 13, 18, 19, 20, 21, 22, 24, 29], "6": [0, 1, 2, 11, 19, 20, 21, 24, 29], "unsupervis": [0, 1, 2, 30], "dimension": [0, 1, 2], "reduct": [0, 1, 2], "7": [0, 1, 2, 12, 19, 21], "9": [0, 1, 2, 14], "deep": [0, 1, 2, 22, 25], "foundat": [0, 1, 21, 30], "10": [0, 1, 2, 15], "12": [0, 1, 2, 18, 19], "advanc": [0, 1, 2, 11, 18, 20, 24, 26, 28, 32], "current": [0, 1, 2], "trend": [0, 1, 2], "13": [0, 1, 2, 20], "14": [0, 1, 2, 21], "practic": [0, 1, 6, 13, 18, 20, 21, 22, 24, 25, 26, 27, 28], "aspect": [0, 1], "15": [0, 1, 2, 22], "17": [0, 1, 2, 25], "8": [0, 1, 2, 13, 19, 21], "appli": [0, 1, 2, 13, 21, 24], "ai": [0, 1, 2, 9], "ethic": [0, 1, 2], "consider": [0, 1, 18, 20, 21, 22], "18": [0, 1, 2, 26], "19": [0, 1, 2, 27], "capston": [0, 1, 2], "project": [0, 1, 2, 5, 6, 7, 8, 9, 11], "20": [0, 1, 2, 28], "21": [0, 1, 2, 30], "join": 0, "our": 0, "commun": 0, "social": [0, 33], "media": [0, 33], "contact": [0, 9, 33], "daili": [1, 2, 8], "curriculum": [1, 2], "numer": [1, 2, 4, 17], "oper": [1, 2, 4, 6, 11, 12], "concept": [1, 2, 10, 13, 14, 15, 28, 30, 31], "eda": [1, 2, 23, 24, 25], "ensembl": [1, 2], "method": [1, 2, 20, 28, 30], "neural": [1, 2], "network": [1, 2], "11": [1, 2, 17], "convolut": [1, 2], "cnn": [1, 2], "recurr": [1, 2], "rnn": [1, 2], "reinforc": [1, 2], "topic": [1, 2, 11], "mlop": [1, 2], "16": [1, 2, 24], 
"etl": [1, 2], "process": [1, 2], "transform": [1, 2], "industri": [1, 2], "sector": [1, 2], "applic": [1, 2, 9, 11, 13, 14], "cybersecur": [1, 2], "resourc": [2, 5, 6, 7, 8, 11, 13, 15, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 31, 32], "jupyt": 2, "notebook": 2, "lesson": [2, 8], "syntax": [2, 5, 9], "variabl": [2, 5, 13, 20, 25], "type": [2, 6, 7, 17, 20, 21, 22], "control": [2, 7, 8], "loop": [2, 7], "condit": [2, 8], "statement": [2, 7, 8, 9], "function": [2, 9, 13], "linear": [2, 11, 12, 30, 31], "algebra": [2, 11, 12], "vector": [2, 11], "matric": [2, 12], "matrix": [2, 12, 19, 27], "calculu": [2, 13, 14], "deriv": [2, 13], "integr": [2, 14, 20], "fundament": [2, 14], "theorem": [2, 14, 24], "probabl": [2, 15], "statist": [2, 15, 17, 19, 20, 21, 22, 24, 26], "relev": [2, 15], "distribut": [2, 15, 24, 26], "handl": [2, 20], "miss": [2, 20], "normal": [2, 21], "scale": [2, 17, 21], "us": [2, 13, 14, 17, 20, 21, 27, 28, 30], "encod": [2, 22], "categor": [2, 22], "split": [2, 18, 19, 20, 21, 30], "train": [2, 18, 20, 21, 30], "test": [2, 9, 18, 20, 21, 24, 28, 30], "set": [2, 5, 20, 21], "visual": [2, 11, 20, 21, 22, 24, 25, 27, 30], "implement": [2, 11, 13, 14, 15, 20, 21, 22, 26, 28, 30, 31], "descript": [2, 13, 15, 24, 26], "techniqu": [2, 18, 19, 20, 21, 22, 24, 25, 28, 32], "correl": [2, 19, 27], "featur": [2, 22, 28], "select": [2, 28], "import": [2, 9, 11, 13, 15, 17, 21, 28, 30], "22": [2, 31], "multipl": [2, 11, 12, 31], "23": [2, 32], "polynomi": [2, 32], "lasso": [2, 32], "ridg": [2, 32], "24": 2, "model": [2, 18, 19, 20, 30, 31], "evalu": [2, 18, 20, 31], "metric": [2, 31], "25": 2, "address": 2, "overfit": 2, "underfit": 2, "26": 2, "logist": 2, "27": 2, "k": 2, "nearest": 2, "neighbor": 2, "nn": 2, "algorithm": 2, "28": 2, "support": 2, "svm": 2, "nonlinear": 2, "29": 2, "decis": [2, 28], "tree": 2, "rule": [2, 12, 13], "base": [2, 20], "30": [2, 28], "naiv": 2, "bay": 2, "classifi": 2, "31": 2, "32": 2, "bag": 2, "random": [2, 20, 28], "forest": [2, 
28], "33": 2, "boost": 2, "adaboost": 2, "34": 2, "gradient": 2, "gbm": 2, "xgboost": 2, "35": 2, "Their": 2, "36": 2, "cluster": 2, "37": 2, "mean": [2, 24, 25], "differ": [2, 13, 17, 30], "38": 2, "hierarch": 2, "39": 2, "densiti": 2, "dbscan": 2, "40": 2, "gaussian": 2, "mixtur": 2, "gmm": 2, "expect": 2, "maxim": 2, "41": 2, "pca": 2, "42": 2, "43": 2, "singular": 2, "valu": [2, 9, 19, 25], "decomposit": 2, "svd": 2, "Its": 2, "44": 2, "t": 2, "sne": 2, "45": 2, "other": 2, "46": 2, "understand": [2, 7, 9, 13, 15, 17, 20, 21, 22, 26, 27, 28, 31], "perceptron": 2, "47": 2, "feedforward": 2, "activ": [2, 11, 12, 13, 17, 21, 22, 24, 25, 26, 27, 28], "48": 2, "backpropag": 2, "49": 2, "loss": 2, "optim": 2, "50": 2, "tune": 2, "perform": [2, 19, 20], "51": 2, "layer": 2, "52": 2, "pool": 2, "architectur": 2, "53": 2, "imag": 2, "54": 2, "55": 2, "transfer": 2, "56": 2, "57": 2, "long": 2, "short": 2, "term": 2, "memori": 2, "lstm": 2, "58": 2, "build": [2, 30], "sequenc": 2, "59": 2, "time": 2, "seri": 2, "60": 2, "util": 2, "natur": [2, 28], "languag": 2, "nlp": 2, "61": 2, "62": 2, "markov": 2, "63": 2, "q": 2, "64": 2, "dqn": 2, "65": 2, "polici": 2, "66": 2, "depth": [2, 18, 19, 25, 26], "67": 2, "gener": [2, 20], "adversari": 2, "gan": 2, "68": 2, "attent": 2, "mechan": 2, "69": 2, "autoencod": 2, "70": 2, "research": 2, "emerg": 2, "ml": [2, 9], "71": 2, "lifecycl": 2, "72": 2, "version": [2, 8], "experi": 2, "track": 2, "73": 2, "ci": 2, "cd": 2, "74": 2, "monitor": 2, "mainten": 2, "75": 2, "tool": 2, "platform": 2, "76": 2, "extract": 2, "77": 2, "78": 2, "load": [2, 18, 20, 21, 22], "databas": 2, "manag": 2, "79": 2, "an": 2, "pipelin": 2, "80": 2, "technolog": 2, "81": 2, "82": 2, "self": 2, "posit": 2, "83": 2, "84": 2, "85": 2, "domain": 2, "86": 2, "bia": 2, "fair": 2, "87": 2, "privaci": 2, "secur": 2, "system": [2, 9], "88": 2, "explain": 2, "transpar": 2, "89": 2, "regul": 2, "complianc": 2, "90": 2, "make": [2, 28], "91": 2, "healthcar": 2, "92": 
2, "financ": 2, "93": 2, "retail": 2, "94": 2, "manufactur": 2, "95": 2, "transport": 2, "educ": 2, "etc": 2, "96": 2, "97": 2, "identifi": 2, "threat": 2, "vulner": 2, "98": 2, "detect": 2, "prevent": 2, "99": 2, "case": 2, "studi": 2, "incid": 2, "101": 2, "plan": 2, "102": 2, "104": 2, "develop": [2, 9], "105": 2, "final": [2, 18], "present": 2, "errata": 3, "up": [5, 20], "your": [5, 7, 8, 9, 28], "environ": 5, "hand": [5, 6, 11, 17, 21, 24, 25, 26, 27], "On": [5, 6, 11, 17, 21, 24, 31, 32], "arithmet": [5, 7, 25], "further": [5, 6, 7, 8, 11, 13, 15, 28], "more": 6, "about": 6, "logic": [6, 7], "comparison": [6, 21], "calcul": [6, 12, 13, 19, 26], "solut": [6, 7, 8, 19, 25, 26], "problem": [6, 8, 13], "why": [7, 17, 20], "collect": 7, "The": [7, 12, 13, 15, 31, 32], "while": 7, "rang": [7, 17, 19], "object": [7, 13, 14, 15, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28], "break": 7, "continu": 7, "els": 7, "claus": 7, "combin": 7, "boolean": 7, "exampl": [7, 11, 13, 17, 20, 22, 28, 30], "program": [7, 9], "prime": 7, "number": [7, 9], "checker": 7, "quiz": [7, 9], "task": [7, 24, 26], "If": 8, "thi": 8, "Then": 8, "That": 8, "otherwis": 8, "do": [8, 28], "code": [8, 11, 20, 26, 28], "block": [8, 18], "last": 8, "resort": 8, "save": 8, "word": 8, "succinct": 8, "fizzbuzz": 8, "similar": 8, "altern": 8, "temperatur": 8, "analyz": [8, 21, 30], "step": [8, 11, 12, 13, 15, 18, 20, 21, 22, 26, 28], "counter": 8, "write": 9, "first": 9, "paramet": 9, "argument": 9, "arg": 9, "return": 9, "get": 9, "new": 9, "fast": 9, "via": 9, "standard": [9, 17, 19, 21, 24], "librari": [9, 11, 13, 15, 21, 22], "highlight": 9, "everi": 9, "must": 9, "know": 9, "numpi": [9, 17], "mini": 9, "guess": 9, "game": 9, "prompt": 9, "simpl": [9, 30], "book": 9, "warehous": 9, "order": [9, 17], "food": 9, "shop": 9, "cash": 9, "regist": 9, "what": [11, 12, 13], "represent": 11, "repres": 11, "addit": [11, 12, 17, 18, 20, 21, 22, 24, 25, 26, 27, 28, 31, 32], "subtract": [11, 12], "scalar": 11, "One": 
[11, 22], "x": 11, "magnitud": 11, "direct": 11, "dot": [11, 12], "product": [11, 12, 13], "definit": [11, 30], "geometr": 11, "interpret": [11, 19, 26, 28], "properti": [11, 12], "cross": [11, 18, 19], "norm": 11, "real": [11, 13], "world": [11, 13], "comput": [11, 27], "graphic": [11, 13], "simul": 11, "2d": 11, "movement": 11, "physic": 11, "engin": 11, "scienc": [11, 15], "summari": [11, 17, 19, 21, 22], "conclud": 11, "thought": 11, "field": 11, "beginn": 11, "necessari": [11, 15, 21, 22], "creat": [11, 12, 26], "grid": 11, "defin": [11, 13], "plot": [11, 20, 24, 25, 26], "format": 11, "displai": [11, 13, 17], "master": [12, 24, 26], "core": 12, "complex": 12, "element": 12, "wise": [12, 19], "transpos": 12, "invers": 12, "flip": 12, "revers": 12, "instruct": [12, 24], "prerequisit": [13, 14, 15, 18, 20, 21, 22, 24, 25], "ar": [13, 17], "rate": 13, "chang": 13, "slope": 13, "tangent": 13, "line": [13, 30], "notat": 13, "formula": [13, 20, 28], "power": 13, "result": [13, 28], "constant": 13, "sum": 13, "quotient": 13, "A": [13, 22, 28], "view": 13, "best": [13, 18, 20, 21, 22, 24, 25, 26, 27, 28, 30], "conclus": [13, 15, 19, 25], "expand": [15, 22], "uncertainti": 15, "inferenti": [15, 24], "goal": 17, "workflow": 17, "setup": 17, "In": [17, 18, 19, 25, 26], "abov": [17, 30], "we": 17, "column": 17, "mode": [17, 24, 25], "could": 17, "you": 17, "non": 17, "would": 17, "varianc": [17, 19, 24], "deviat": [17, 19, 24], "between": [17, 30], "panda": 17, "quartil": [17, 19], "interquartil": [17, 19], "explor": [18, 19, 20, 21, 28], "valid": [18, 19], "theoret": [18, 30], "background": 18, "principl": [18, 27], "stratifi": 18, "roll": 18, "homework": [18, 19, 20, 24, 25, 26, 27], "assign": [18, 19, 20, 24, 25, 26, 27], "access": 18, "dataset": [18, 19, 20, 21, 22, 26, 27, 28, 30], "note": 18, "leakag": [18, 20, 21], "qualiti": [19, 25, 26, 27], "wine": [19, 25, 26, 27], "iqr": 19, "notabl": 19, "accuraci": [19, 28], "review": 19, "follow": 19, "overal": 19, 
"observ": 19, "report": [19, 24, 25, 26], "class": 19, "score": [19, 21], "imput": 20, "fill": 20, "ag": 20, "median": [20, 24, 25], "how": 20, "knn": 20, "mnar": 20, "Not": 20, "approach": 20, "augment": 20, "impact": 20, "histogram": [20, 24, 25, 26], "scatter": 20, "two": [20, 30], "littl": 20, "s": [20, 27, 28], "mcar": 20, "rpy2": 20, "instal": 20, "r": 20, "packag": 20, "tip": 20, "discern": 20, "comprehens": [21, 24, 26], "z": 21, "min": 21, "max": 21, "iri": [21, 28], "post": [21, 22], "analyt": [21, 28], "assess": [21, 28], "effect": 21, "implic": 22, "binari": 22, "high": 22, "cardin": 22, "hot": 22, "nomin": 22, "label": 22, "ordin": 22, "context": 22, "cabin": 22, "embark": 22, "pclass": 22, "dive": [22, 25], "titan": 22, "identif": 22, "b": 22, "c": [22, 30], "boxplot": [24, 25], "violin": [24, 25], "pair": [24, 25], "heatmap": [24, 27], "skew": 24, "kurtosi": 24, "sampl": 24, "central": [24, 25], "limit": 24, "hypothesi": 24, "tendenc": 25, "averag": 25, "middl": 25, "most": 25, "frequent": 25, "compar": 25, "measur": 25, "templat": 25, "dispers": 25, "find": 25, "discuss": 25, "box": 26, "detail": [26, 28], "requir": [26, 28], "compil": 26, "signific": 27, "pearson": 27, "spearman": 27, "coeffici": 27, "rank": 27, "common": 27, "pitfal": 27, "With": 28, "part": 28, "entropi": 28, "sum_": 28, "i": 28, "n": 28, "p_i": 28, "log_2": 28, "inform": 28, "gain": 28, "informationgain": 28, "v": 28, "frac": 28, "s_v": 28, "gini": 28, "impur": 28, "vs": 28, "when": 28, "which": 28, "conceptu": 28, "think": 28, "minut": 28, "filter": 28, "mutual": 28, "don": 28, "ts": 28, "carefulli": 28, "consid": 28, "anova": 28, "f": 28, "wrapper": 28, "stepwis": 28, "pseudo": 28, "embed": 28, "purpos": 30, "explan": 30, "equat": [30, 31], "y": 30, "mx": 30, "hyperplan": 30, "relat": 30, "dimens": 30, "fit": 30, "least": 30, "squar": 30, "scikit": 30, "matplotlib": 30, "hous": 30, "predict": 30, "price": 30, "excercis": 30, "reader": [30, 31, 32], "kei": 31, "exercis": [31, 
32], "For": [31, 32], "make_pipelin": 32}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinx": 56}}) \ No newline at end of file