diff --git a/Chapter5/better_pandas.ipynb b/Chapter5/better_pandas.ipynb index 990d160..3dd9cec 100644 --- a/Chapter5/better_pandas.ipynb +++ b/Chapter5/better_pandas.ipynb @@ -2289,6 +2289,258 @@ "[Link to Delta Lake](https://github.com/delta-io/delta)." ] }, + { + "cell_type": "markdown", + "id": "6a202591", + "metadata": {}, + "source": [ + "### From Complex SQL to Simple Merges: Delta Lake's Upsert Solution" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e655b5fa", + "metadata": { + "tags": [ + "hide-cell" + ] + }, + "outputs": [], + "source": [ + "!pip install delta-spark" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "32ae71e5", + "metadata": { + "tags": [ + "remove-cell" + ] + }, + "outputs": [], + "source": [ + "import pyspark\n", + "from delta import *\n", + "\n", + "# Configure Spark to use Delta\n", + "builder = (\n", + " pyspark.sql.SparkSession.builder.appName(\"MyApp\")\n", + " .config(\"spark.sql.extensions\", \"io.delta.sql.DeltaSparkSessionExtension\")\n", + " .config(\n", + " \"spark.sql.catalog.spark_catalog\",\n", + " \"org.apache.spark.sql.delta.catalog.DeltaCatalog\",\n", + " )\n", + ")\n", + "\n", + "spark = configure_spark_with_delta_pip(builder).getOrCreate()" + ] + }, + { + "cell_type": "markdown", + "id": "775dcae5", + "metadata": {}, + "source": [ + "Traditionally, implementing upsert (update or insert) logic requires separate UPDATE and INSERT statements or complex SQL. This approach can be error-prone and inefficient, especially for large datasets. \n", + "\n", + "Delta Lake's merge operation solves this problem by allowing you to specify different actions for matching and non-matching records in a single, declarative statement.\n", + "\n", + "Here's an example that demonstrates the power and simplicity of Delta Lake's merge operation:\n", + "\n", + "First, let's set up our initial data:\n", + "\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "ff393032", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Initial Customers:\n", + "+-----------+-----------+----------------+-------------------+\n", + "|customer_id| name| email| last_updated|\n", + "+-----------+-----------+----------------+-------------------+\n", + "| 1| John Doe|john@example.com|2023-01-01 10:00:00|\n", + "| 2| Jane Smith|jane@example.com|2023-01-02 11:00:00|\n", + "| 3|Bob Johnson| bob@example.com|2023-01-03 12:00:00|\n", + "+-----------+-----------+----------------+-------------------+\n", + "\n", + "Updates:\n", + "+-----------+-----------+--------------------+\n", + "|customer_id| name| email|\n", + "+-----------+-----------+--------------------+\n", + "| 2| Jane Doe|jane.doe@example.com|\n", + "| 3|Bob Johnson| bob@example.com|\n", + "| 4|Alice Brown| alice@example.com|\n", + "+-----------+-----------+--------------------+\n", + "\n" + ] + } + ], + "source": [ + "# Create sample data for 'customers' DataFrame\n", + "customers_data = [\n", + " (1, \"John Doe\", \"john@example.com\", \"2023-01-01 10:00:00\"),\n", + " (2, \"Jane Smith\", \"jane@example.com\", \"2023-01-02 11:00:00\"),\n", + " (3, \"Bob Johnson\", \"bob@example.com\", \"2023-01-03 12:00:00\"),\n", + "]\n", + "customers = spark.createDataFrame(\n", + " customers_data, [\"customer_id\", \"name\", \"email\", \"last_updated\"]\n", + ")\n", + "\n", + "# Create sample data for 'updates' DataFrame\n", + "updates_data = [\n", + " (2, \"Jane Doe\", \"jane.doe@example.com\"), # Existing customer with updates\n", + " (3, \"Bob Johnson\", \"bob@example.com\"), # Existing customer without changes\n", + " (4, \"Alice Brown\", \"alice@example.com\"), # New customer\n", + "]\n", + "updates = spark.createDataFrame(updates_data, [\"customer_id\", \"name\", \"email\"])\n", + "\n", + "# Show the initial data\n", + "print(\"Initial Customers:\")\n", + "customers.show()\n", + "print(\"Updates:\")\n", + "updates.show()" + ] + }, + { + "cell_type": "markdown", + "id": "acb9e489", + "metadata": {}, + "source": [ + "Next, we create a Delta table from our initial customer data:" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "0041f1d4", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Customers Delta Table created successfully\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + } + ], + "source": [ + "# Define the path where you want to save the Delta table\n", + "delta_table_path = \"customers_delta\"\n", + "\n", + "# Write the DataFrame as a Delta table\n", + "customers.write.format(\"delta\").mode(\"overwrite\").save(delta_table_path)\n", + "\n", + "# Create a DeltaTable object\n", + "customers_delta = DeltaTable.forPath(spark, delta_table_path)\n", + "\n", + "print(\"Customers Delta Table created successfully\")" + ] + }, + { + "cell_type": "markdown", + "id": "560b2a9d", + "metadata": {}, + "source": [ + "Now, here's the key part - the merge operation that handles both updates and inserts in a single statement:" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "f0626375", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + } + ], + "source": [ + "# Assume 'customers_delta' is your target table and 'updates' is your source of new data\n", + "customers_delta.alias(\"target\").merge(\n", + " updates.alias(\"source\"),\n", + " \"target.customer_id = source.customer_id\"\n", + ").whenMatchedUpdate(set={\n", + " \"name\": \"source.name\",\n", + " \"email\": \"source.email\",\n", + " \"last_updated\": \"current_timestamp()\"\n", + "}).whenNotMatchedInsert(values={\n", + " \"customer_id\": \"source.customer_id\",\n", + " \"name\": \"source.name\",\n", + " \"email\": \"source.email\",\n", + " \"last_updated\": \"current_timestamp()\"\n", + "}).execute()" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "0ed114dc", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Updated Customers Delta Table:\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "+-----------+-----------+--------------------+--------------------+\n", + "|customer_id| name| email| last_updated|\n", + "+-----------+-----------+--------------------+--------------------+\n", + "| 2| Jane Doe|jane.doe@example.com|2024-08-20 16:05:...|\n", + "| 3|Bob Johnson| bob@example.com|2024-08-20 16:05:...|\n", + "| 4|Alice Brown| alice@example.com|2024-08-20 16:05:...|\n", + "| 1| John Doe| john@example.com| 2023-01-01 10:00:00|\n", + "+-----------+-----------+--------------------+--------------------+\n", + "\n" + ] + } + ], + "source": [ + "# Verify the updated data\n", + "print(\"Updated Customers Delta Table:\")\n", + "customers_delta.toDF().show()" + ] + }, { "attachments": {}, "cell_type": "markdown", @@ -4178,7 +4430,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.4" + "version": "3.11.6" }, "toc": { "base_numbering": 1, diff --git a/docs/Chapter5/better_pandas.html b/docs/Chapter5/better_pandas.html index fe70cec..946f779 100644 --- a/docs/Chapter5/better_pandas.html +++ b/docs/Chapter5/better_pandas.html @@ -524,16 +524,17 @@

Contents

  • 6.12.9. Enforce Data Quality with Delta Lake Constraints
  • 6.12.10. Efficient Data Updates and Scanning with Delta Lake
  • 6.12.11. Simplify Table Merge Operations with Delta Lake
  • -
  • 6.12.12. The Best Way to Append Mismatched Data to Parquet Tables
  • -
  • 6.12.13. Polars: Blazing Fast DataFrame Library
  • -
  • 6.12.14. Polars: Speed Up Data Processing 12x with Lazy Execution
  • -
  • 6.12.15. Polars vs. Pandas for CSV Loading and Filtering
  • -
  • 6.12.16. Pandas vs Polars: Harnessing Parallelism for Faster Data Processing
  • -
  • 6.12.17. Simple and Expressive Data Transformation with Polars
  • -
  • 6.12.18. Harness Polars and Delta Lake for Blazing Fast Performance
  • -
  • 6.12.19. Parallel Execution of Multiple Files with Polars
  • -
  • 6.12.20. Polars’ Streaming Mode: A Solution for Large Data Sets
  • -
  • 6.12.21. Pandas vs Polars: Syntax Comparison for Data Scientists
  • +
  • 6.12.12. From Complex SQL to Simple Merges: Delta Lake’s Upsert Solution
  • +
  • 6.12.13. The Best Way to Append Mismatched Data to Parquet Tables
  • +
  • 6.12.14. Polars: Blazing Fast DataFrame Library
  • +
  • 6.12.15. Polars: Speed Up Data Processing 12x with Lazy Execution
  • +
  • 6.12.16. Polars vs. Pandas for CSV Loading and Filtering
  • +
  • 6.12.17. Pandas vs Polars: Harnessing Parallelism for Faster Data Processing
  • +
  • 6.12.18. Simple and Expressive Data Transformation with Polars
  • +
  • 6.12.19. Harness Polars and Delta Lake for Blazing Fast Performance
  • +
  • 6.12.20. Parallel Execution of Multiple Files with Polars
  • +
  • 6.12.21. Polars’ Streaming Mode: A Solution for Large Data Sets
  • +
  • 6.12.22. Pandas vs Polars: Syntax Comparison for Data Scientists
  • @@ -2037,8 +2038,159 @@

    6.12.11. Simplify Table Merge Operations

    Link to Delta Lake.

    +
    +

    6.12.12. From Complex SQL to Simple Merges: Delta Lake’s Upsert Solution#

    +
    +
    + + +Hide code cell content + +
    +
    !pip install delta-spark
    +
    +
    +
    +
    +
    +

    Traditionally, implementing upsert (update or insert) logic requires separate UPDATE and INSERT statements or complex SQL. This approach can be error-prone and inefficient, especially for large datasets.

    +

    Delta Lake’s merge operation solves this problem by allowing you to specify different actions for matching and non-matching records in a single, declarative statement.

    +

    Here’s an example that demonstrates the power and simplicity of Delta Lake’s merge operation:

    +

    First, let’s set up our initial data:

    +
    +
    +
    # Create sample data for 'customers' DataFrame
    +customers_data = [
    +    (1, "John Doe", "john@example.com", "2023-01-01 10:00:00"),
    +    (2, "Jane Smith", "jane@example.com", "2023-01-02 11:00:00"),
    +    (3, "Bob Johnson", "bob@example.com", "2023-01-03 12:00:00"),
    +]
    +customers = spark.createDataFrame(
    +    customers_data, ["customer_id", "name", "email", "last_updated"]
    +)
    +
    +# Create sample data for 'updates' DataFrame
    +updates_data = [
    +    (2, "Jane Doe", "jane.doe@example.com"),  # Existing customer with updates
    +    (3, "Bob Johnson", "bob@example.com"),  # Existing customer without changes
    +    (4, "Alice Brown", "alice@example.com"),  # New customer
    +]
    +updates = spark.createDataFrame(updates_data, ["customer_id", "name", "email"])
    +
    +# Show the initial data
    +print("Initial Customers:")
    +customers.show()
    +print("Updates:")
    +updates.show()
    +
    +
    +
    +
    +
    Initial Customers:
    ++-----------+-----------+----------------+-------------------+
    +|customer_id|       name|           email|       last_updated|
    ++-----------+-----------+----------------+-------------------+
    +|          1|   John Doe|john@example.com|2023-01-01 10:00:00|
    +|          2| Jane Smith|jane@example.com|2023-01-02 11:00:00|
    +|          3|Bob Johnson| bob@example.com|2023-01-03 12:00:00|
    ++-----------+-----------+----------------+-------------------+
    +
    +Updates:
    ++-----------+-----------+--------------------+
    +|customer_id|       name|               email|
    ++-----------+-----------+--------------------+
    +|          2|   Jane Doe|jane.doe@example.com|
    +|          3|Bob Johnson|     bob@example.com|
    +|          4|Alice Brown|   alice@example.com|
    ++-----------+-----------+--------------------+
    +
    +
    +
    +
    +

    Next, we create a Delta table from our initial customer data:

    +
    +
    +
    # Define the path where you want to save the Delta table
    +delta_table_path = "customers_delta"
    +
    +# Write the DataFrame as a Delta table
    +customers.write.format("delta").mode("overwrite").save(delta_table_path)
    +
    +# Create a DeltaTable object
    +customers_delta = DeltaTable.forPath(spark, delta_table_path)
    +
    +print("Customers Delta Table created successfully")
    +
    +
    +
    +
    +
                                                                                    
    +
    +
    +
    Customers Delta Table created successfully
    +
    +
    +
                                                                                    
    +
    +
    +
    +
    +

    Now, here’s the key part - the merge operation that handles both updates and inserts in a single statement:

    +
    +
    +
    # Assume 'customers_delta' is your target table and 'updates' is your source of new data
    +customers_delta.alias("target").merge(
    +    updates.alias("source"),
    +    "target.customer_id = source.customer_id"
    +).whenMatchedUpdate(set={
    +    "name": "source.name",
    +    "email": "source.email",
    +    "last_updated": "current_timestamp()"
    +}).whenNotMatchedInsert(values={
    +    "customer_id": "source.customer_id",
    +    "name": "source.name",
    +    "email": "source.email",
    +    "last_updated": "current_timestamp()"
    +}).execute()
    +
    +
    +
    +
    +
                                                                                    
    +
    +
    +
    +
    +
    +
    +
    # Verify the updated data
    +print("Updated Customers Delta Table:")
    +customers_delta.toDF().show()
    +
    +
    +
    +
    +
    Updated Customers Delta Table:
    +
    +
    +
                                                                                    
    +
    +
    +
    +-----------+-----------+--------------------+--------------------+
    +|customer_id|       name|               email|        last_updated|
    ++-----------+-----------+--------------------+--------------------+
    +|          2|   Jane Doe|jane.doe@example.com|2024-08-20 16:05:...|
    +|          3|Bob Johnson|     bob@example.com|2024-08-20 16:05:...|
    +|          4|Alice Brown|   alice@example.com|2024-08-20 16:05:...|
    +|          1|   John Doe|    john@example.com| 2023-01-01 10:00:00|
    ++-----------+-----------+--------------------+--------------------+
    +
    +
    +
    +
    +
    -

    6.12.12. The Best Way to Append Mismatched Data to Parquet Tables#

    +

    6.12.13. The Best Way to Append Mismatched Data to Parquet Tables#

    Appending mismatched data to a Parquet table involves reading the existing data, concatenating it with the new data, and overwriting the existing Parquet file. This approach can be expensive and may lead to schema inconsistencies.

    In the following code, the datatype of col3 is supposed to be int64 instead of float64.

    @@ -2195,7 +2347,7 @@

    6.12.12. The Best Way to Append Mismatch

    Link to Delta Lake.

    -

    6.12.13. Polars: Blazing Fast DataFrame Library#

    +

    6.12.14. Polars: Blazing Fast DataFrame Library#

    @@ -2269,7 +2421,7 @@

    6.12.13. Polars: Blazing Fast DataFrame

    Link to polars

    -

    6.12.14. Polars: Speed Up Data Processing 12x with Lazy Execution#

    +

    6.12.15. Polars: Speed Up Data Processing 12x with Lazy Execution#

    @@ -2431,7 +2583,7 @@

    6.12.14. Polars: Speed Up Data Processin

    Link to polars

    -

    6.12.15. Polars vs. Pandas for CSV Loading and Filtering#

    +

    6.12.16. Polars vs. Pandas for CSV Loading and Filtering#

    @@ -2500,7 +2652,7 @@

    6.12.15. Polars vs. Pandas for CSV Loadi

    -

    6.12.16. Pandas vs Polars: Harnessing Parallelism for Faster Data Processing#

    +

    6.12.17. Pandas vs Polars: Harnessing Parallelism for Faster Data Processing#

    @@ -2547,7 +2699,7 @@

    6.12.16. Pandas vs Polars: Harnessing Pa

    Link to Polars.

    -

    6.12.17. Simple and Expressive Data Transformation with Polars#

    +

    6.12.18. Simple and Expressive Data Transformation with Polars#

    Extract features and select only relevant features for each time series.

    @@ -2642,7 +2794,7 @@

    6.12.17. Simple and Expressive Data Tran

    -

    6.12.18. Harness Polars and Delta Lake for Blazing Fast Performance#

    +

    6.12.19. Harness Polars and Delta Lake for Blazing Fast Performance#

    @@ -2863,7 +3015,7 @@

    6.12.18. Harness Polars and Delta Lake f

    Link to delta-rs.

    -

    6.12.19. Parallel Execution of Multiple Files with Polars#

    +

    6.12.20. Parallel Execution of Multiple Files with Polars#

    @@ -2934,7 +3086,7 @@

    6.12.19. Parallel Execution of Multiple

    Link to polars

    -

    6.12.20. Polars’ Streaming Mode: A Solution for Large Data Sets#

    +

    6.12.21. Polars’ Streaming Mode: A Solution for Large Data Sets#

    @@ -2967,7 +3119,7 @@

    6.12.20. Polars’ Streaming Mode: A Sol

    Learn more about Streaming API in Polars.

    -

    6.12.21. Pandas vs Polars: Syntax Comparison for Data Scientists#

    +

    6.12.22. Pandas vs Polars: Syntax Comparison for Data Scientists#

    As a data scientist, you’re likely familiar with the popular data analysis libraries Pandas and Polars. Both provide powerful tools for working with tabular data, but how do their syntaxes compare?

    To begin, we’ll create equivalent dataframes in both Pandas and Polars:

    @@ -3285,16 +3437,17 @@

    6.12.21. Pandas vs Polars: Syntax Compar
  • 6.12.9. Enforce Data Quality with Delta Lake Constraints
  • 6.12.10. Efficient Data Updates and Scanning with Delta Lake
  • 6.12.11. Simplify Table Merge Operations with Delta Lake
  • -
  • 6.12.12. The Best Way to Append Mismatched Data to Parquet Tables
  • -
  • 6.12.13. Polars: Blazing Fast DataFrame Library
  • -
  • 6.12.14. Polars: Speed Up Data Processing 12x with Lazy Execution
  • -
  • 6.12.15. Polars vs. Pandas for CSV Loading and Filtering
  • -
  • 6.12.16. Pandas vs Polars: Harnessing Parallelism for Faster Data Processing
  • -
  • 6.12.17. Simple and Expressive Data Transformation with Polars
  • -
  • 6.12.18. Harness Polars and Delta Lake for Blazing Fast Performance
  • -
  • 6.12.19. Parallel Execution of Multiple Files with Polars
  • -
  • 6.12.20. Polars’ Streaming Mode: A Solution for Large Data Sets
  • -
  • 6.12.21. Pandas vs Polars: Syntax Comparison for Data Scientists
  • +
  • 6.12.12. From Complex SQL to Simple Merges: Delta Lake’s Upsert Solution
  • +
  • 6.12.13. The Best Way to Append Mismatched Data to Parquet Tables
  • +
  • 6.12.14. Polars: Blazing Fast DataFrame Library
  • +
  • 6.12.15. Polars: Speed Up Data Processing 12x with Lazy Execution
  • +
  • 6.12.16. Polars vs. Pandas for CSV Loading and Filtering
  • +
  • 6.12.17. Pandas vs Polars: Harnessing Parallelism for Faster Data Processing
  • +
  • 6.12.18. Simple and Expressive Data Transformation with Polars
  • +
  • 6.12.19. Harness Polars and Delta Lake for Blazing Fast Performance
  • +
  • 6.12.20. Parallel Execution of Multiple Files with Polars
  • +
  • 6.12.21. Polars’ Streaming Mode: A Solution for Large Data Sets
  • +
  • 6.12.22. Pandas vs Polars: Syntax Comparison for Data Scientists
  • diff --git a/docs/_sources/Chapter5/better_pandas.ipynb b/docs/_sources/Chapter5/better_pandas.ipynb index 990d160..3dd9cec 100644 --- a/docs/_sources/Chapter5/better_pandas.ipynb +++ b/docs/_sources/Chapter5/better_pandas.ipynb @@ -2289,6 +2289,258 @@ "[Link to Delta Lake](https://github.com/delta-io/delta)." ] }, + { + "cell_type": "markdown", + "id": "6a202591", + "metadata": {}, + "source": [ + "### From Complex SQL to Simple Merges: Delta Lake's Upsert Solution" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e655b5fa", + "metadata": { + "tags": [ + "hide-cell" + ] + }, + "outputs": [], + "source": [ + "!pip install delta-spark" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "32ae71e5", + "metadata": { + "tags": [ + "remove-cell" + ] + }, + "outputs": [], + "source": [ + "import pyspark\n", + "from delta import *\n", + "\n", + "# Configure Spark to use Delta\n", + "builder = (\n", + " pyspark.sql.SparkSession.builder.appName(\"MyApp\")\n", + " .config(\"spark.sql.extensions\", \"io.delta.sql.DeltaSparkSessionExtension\")\n", + " .config(\n", + " \"spark.sql.catalog.spark_catalog\",\n", + " \"org.apache.spark.sql.delta.catalog.DeltaCatalog\",\n", + " )\n", + ")\n", + "\n", + "spark = configure_spark_with_delta_pip(builder).getOrCreate()" + ] + }, + { + "cell_type": "markdown", + "id": "775dcae5", + "metadata": {}, + "source": [ + "Traditionally, implementing upsert (update or insert) logic requires separate UPDATE and INSERT statements or complex SQL. This approach can be error-prone and inefficient, especially for large datasets. \n", + "\n", + "Delta Lake's merge operation solves this problem by allowing you to specify different actions for matching and non-matching records in a single, declarative statement.\n", + "\n", + "Here's an example that demonstrates the power and simplicity of Delta Lake's merge operation:\n", + "\n", + "First, let's set up our initial data:\n", + "\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "ff393032", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Initial Customers:\n", + "+-----------+-----------+----------------+-------------------+\n", + "|customer_id| name| email| last_updated|\n", + "+-----------+-----------+----------------+-------------------+\n", + "| 1| John Doe|john@example.com|2023-01-01 10:00:00|\n", + "| 2| Jane Smith|jane@example.com|2023-01-02 11:00:00|\n", + "| 3|Bob Johnson| bob@example.com|2023-01-03 12:00:00|\n", + "+-----------+-----------+----------------+-------------------+\n", + "\n", + "Updates:\n", + "+-----------+-----------+--------------------+\n", + "|customer_id| name| email|\n", + "+-----------+-----------+--------------------+\n", + "| 2| Jane Doe|jane.doe@example.com|\n", + "| 3|Bob Johnson| bob@example.com|\n", + "| 4|Alice Brown| alice@example.com|\n", + "+-----------+-----------+--------------------+\n", + "\n" + ] + } + ], + "source": [ + "# Create sample data for 'customers' DataFrame\n", + "customers_data = [\n", + " (1, \"John Doe\", \"john@example.com\", \"2023-01-01 10:00:00\"),\n", + " (2, \"Jane Smith\", \"jane@example.com\", \"2023-01-02 11:00:00\"),\n", + " (3, \"Bob Johnson\", \"bob@example.com\", \"2023-01-03 12:00:00\"),\n", + "]\n", + "customers = spark.createDataFrame(\n", + " customers_data, [\"customer_id\", \"name\", \"email\", \"last_updated\"]\n", + ")\n", + "\n", + "# Create sample data for 'updates' DataFrame\n", + "updates_data = [\n", + " (2, \"Jane Doe\", \"jane.doe@example.com\"), # Existing customer with updates\n", + " (3, \"Bob Johnson\", \"bob@example.com\"), # Existing customer without changes\n", + " (4, \"Alice Brown\", \"alice@example.com\"), # New customer\n", + "]\n", + "updates = spark.createDataFrame(updates_data, [\"customer_id\", \"name\", \"email\"])\n", + "\n", + "# Show the initial data\n", + "print(\"Initial Customers:\")\n", + "customers.show()\n", + "print(\"Updates:\")\n", + "updates.show()" + ] + }, + { + "cell_type": "markdown", + "id": "acb9e489", + "metadata": {}, + "source": [ + "Next, we create a Delta table from our initial customer data:" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "0041f1d4", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Customers Delta Table created successfully\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + } + ], + "source": [ + "# Define the path where you want to save the Delta table\n", + "delta_table_path = \"customers_delta\"\n", + "\n", + "# Write the DataFrame as a Delta table\n", + "customers.write.format(\"delta\").mode(\"overwrite\").save(delta_table_path)\n", + "\n", + "# Create a DeltaTable object\n", + "customers_delta = DeltaTable.forPath(spark, delta_table_path)\n", + "\n", + "print(\"Customers Delta Table created successfully\")" + ] + }, + { + "cell_type": "markdown", + "id": "560b2a9d", + "metadata": {}, + "source": [ + "Now, here's the key part - the merge operation that handles both updates and inserts in a single statement:" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "f0626375", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + } + ], + "source": [ + "# Assume 'customers_delta' is your target table and 'updates' is your source of new data\n", + "customers_delta.alias(\"target\").merge(\n", + " updates.alias(\"source\"),\n", + " \"target.customer_id = source.customer_id\"\n", + ").whenMatchedUpdate(set={\n", + " \"name\": \"source.name\",\n", + " \"email\": \"source.email\",\n", + " \"last_updated\": \"current_timestamp()\"\n", + "}).whenNotMatchedInsert(values={\n", + " \"customer_id\": \"source.customer_id\",\n", + " \"name\": \"source.name\",\n", + " \"email\": \"source.email\",\n", + " \"last_updated\": \"current_timestamp()\"\n", + "}).execute()" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "0ed114dc", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Updated Customers Delta Table:\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + " \r" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "+-----------+-----------+--------------------+--------------------+\n", + "|customer_id| name| email| last_updated|\n", + "+-----------+-----------+--------------------+--------------------+\n", + "| 2| Jane Doe|jane.doe@example.com|2024-08-20 16:05:...|\n", + "| 3|Bob Johnson| bob@example.com|2024-08-20 16:05:...|\n", + "| 4|Alice Brown| alice@example.com|2024-08-20 16:05:...|\n", + "| 1| John Doe| john@example.com| 2023-01-01 10:00:00|\n", + "+-----------+-----------+--------------------+--------------------+\n", + "\n" + ] + } + ], + "source": [ + "# Verify the updated data\n", + "print(\"Updated Customers Delta Table:\")\n", + "customers_delta.toDF().show()" + ] + }, { "attachments": {}, "cell_type": "markdown", @@ -4178,7 +4430,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.4" + "version": "3.11.6" }, "toc": { "base_numbering": 1, diff --git a/docs/searchindex.js b/docs/searchindex.js index a125bbd..82860c0 100644 --- a/docs/searchindex.js +++ b/docs/searchindex.js @@ -1 +1 @@ -Search.setIndex({"docnames": [".pytest_cache/README", "Chapter1/Chapter1", "Chapter1/class", "Chapter1/code_speed", "Chapter1/datetime", "Chapter1/dictionary", "Chapter1/function", "Chapter1/good_practices", "Chapter1/list/apply_functions_to_elements", "Chapter1/list/get_elements", "Chapter1/list/interaction_between_2_lists", "Chapter1/list/join_iterable", "Chapter1/list/list", "Chapter1/list/unpack_iterables", "Chapter1/number", "Chapter1/python_new_features", "Chapter1/string", "Chapter2/Chapter2", "Chapter2/collections", "Chapter2/dataclasses", "Chapter2/functools", "Chapter2/itertools", "Chapter2/operator", "Chapter2/pathlib", "Chapter2/pydantic", "Chapter2/pydash", "Chapter2/sympy", "Chapter2/typing", "Chapter3/Chapter3", "Chapter3/change_values", "Chapter3/combine_dataframes", "Chapter3/create_dataframe", "Chapter3/data_types", "Chapter3/date_time", "Chapter3/filter", "Chapter3/get_values", "Chapter3/sort_dataframe", "Chapter3/string", "Chapter3/style_dataframe", "Chapter3/testing", "Chapter3/transform_dataframe", "Chapter4/Chapter4", "Chapter4/Numpy", "Chapter5/.pytest_cache/README", "Chapter5/Chapter5", "Chapter5/SQL", "Chapter5/best_python_practice_tools", "Chapter5/better_pandas", "Chapter5/feature_engineer", "Chapter5/feature_extraction", "Chapter5/get_data", "Chapter5/llm", "Chapter5/machine_learning", "Chapter5/manage_data", "Chapter5/natural_language_processing", "Chapter5/sharing_downloading", "Chapter5/spark", "Chapter5/speed_up_code", "Chapter5/testing", "Chapter5/time_series", "Chapter5/visualization", "Chapter6/Chapter6", "Chapter6/alternative_approach", "Chapter6/better_outputs", "Chapter6/code_review", "Chapter6/env_management", "Chapter6/git_github", "Chapter6/logging_debugging", "Chapter6/workflow_automation", "Chapter7/.pytest_cache/README", "Chapter7/Chapter7", "Chapter7/example_notebook", "Chapter7/example_notebook2", "Chapter7/jupyter_notebook", "README", "gpt_scripts/.pytest_cache/README", "how_to_read"], "filenames": [".pytest_cache/README.md", "Chapter1/Chapter1.md", "Chapter1/class.ipynb", "Chapter1/code_speed.ipynb", "Chapter1/datetime.ipynb", "Chapter1/dictionary.ipynb", "Chapter1/function.ipynb", "Chapter1/good_practices.ipynb", "Chapter1/list/apply_functions_to_elements.ipynb", "Chapter1/list/get_elements.ipynb", "Chapter1/list/interaction_between_2_lists.ipynb", "Chapter1/list/join_iterable.ipynb", "Chapter1/list/list.md", "Chapter1/list/unpack_iterables.ipynb", "Chapter1/number.ipynb", "Chapter1/python_new_features.ipynb", "Chapter1/string.ipynb", "Chapter2/Chapter2.md", "Chapter2/collections.ipynb", "Chapter2/dataclasses.ipynb", "Chapter2/functools.ipynb", "Chapter2/itertools.ipynb", "Chapter2/operator.ipynb", "Chapter2/pathlib.ipynb", "Chapter2/pydantic.ipynb", "Chapter2/pydash.ipynb", "Chapter2/sympy.ipynb", "Chapter2/typing.ipynb", "Chapter3/Chapter3.md", "Chapter3/change_values.ipynb", "Chapter3/combine_dataframes.ipynb", "Chapter3/create_dataframe.ipynb", "Chapter3/data_types.ipynb", "Chapter3/date_time.ipynb", "Chapter3/filter.ipynb", "Chapter3/get_values.ipynb", "Chapter3/sort_dataframe.ipynb", "Chapter3/string.ipynb", "Chapter3/style_dataframe.ipynb", "Chapter3/testing.ipynb", "Chapter3/transform_dataframe.ipynb", "Chapter4/Chapter4.md", "Chapter4/Numpy.ipynb", "Chapter5/.pytest_cache/README.md", "Chapter5/Chapter5.md", "Chapter5/SQL.ipynb", "Chapter5/best_python_practice_tools.ipynb", "Chapter5/better_pandas.ipynb", "Chapter5/feature_engineer.ipynb", "Chapter5/feature_extraction.ipynb", "Chapter5/get_data.ipynb", "Chapter5/llm.ipynb", "Chapter5/machine_learning.ipynb", "Chapter5/manage_data.ipynb", "Chapter5/natural_language_processing.ipynb", "Chapter5/sharing_downloading.ipynb", "Chapter5/spark.ipynb", "Chapter5/speed_up_code.ipynb", "Chapter5/testing.ipynb", "Chapter5/time_series.ipynb", "Chapter5/visualization.ipynb", "Chapter6/Chapter6.md", "Chapter6/alternative_approach.md", "Chapter6/better_outputs.ipynb", "Chapter6/code_review.ipynb", "Chapter6/env_management.ipynb", "Chapter6/git_github.ipynb", "Chapter6/logging_debugging.ipynb", "Chapter6/workflow_automation.ipynb", "Chapter7/.pytest_cache/README.md", "Chapter7/Chapter7.md", "Chapter7/example_notebook.ipynb", "Chapter7/example_notebook2.ipynb", "Chapter7/jupyter_notebook.ipynb", "README.md", "gpt_scripts/.pytest_cache/README.md", "how_to_read.md"], "titles": ["pytest cache directory", "2. Python Built-in Methods", "2.6. Classes", "2.8. Code Speed", "2.7. Datetime", "2.4. Dictionary", "2.5. Function", "2.9. Good Python Practices", "2.3.5. Apply Functions to Elements in a List", "2.3.1. Get Elements", "2.3.4. Interaction Between 2 Lists", "2.3.3. Join Iterables", "2.3. List", "2.3.2. Unpack Iterables", "2.2. Number", "2.10. New Features in Python", "2.1. String", "3. Python Utility Libraries", "3.1. Collections", "3.7. Data Classes", "3.3. Functools", "3.2. Itertools", "3.6. Operator", "3.9. pathlib", "3.10. Pydantic", "3.4. Pydash", "3.5. SymPy", "3.8. Typing", "4. Pandas", "4.1. Change Values", "4.6. Combine Multiple DataFrames", "4.5. Create a DataFrame", "4.8. Manipulate a DataFrame Using Data Types", "4.3. Work with Datetime", "4.7. Filter Rows or Columns", "4.2. Get Certain Values From a DataFrame", "4.9. Sort Rows or Columns of a DataFrame", "4.10. Work with String", "4.11. Style a DataFrame", "4.12. Test", "4.4. Transform a DataFrame", "5. NumPy", "5.1. NumPy", "pytest cache directory", "6. Data Science Tools", "6.14. SQL Libraries", "6.11. Tools for Best Python Practices", "6.12. Better Pandas", "6.2. Feature Engineer", "6.1. Feature Extraction", "6.3. Get Data", "6.16. Large Language Model (LLM)", "6.5. Machine Learning", "6.4. Manage Data", "6.6. Natural Language Processing", "6.8. Sharing and Downloading", "6.15. PySpark", "6.9. Tools to Speed Up Code", "6.13. Testing", "6.7. Time Series", "6.10. Visualization", "7. Cool Tools", "7.1. Alternative Approach", "7.5. Better Outputs", "7.3. Code Review", "7.7. Environment Management", "7.6. Git and GitHub", "7.4. Logging and Debugging", "7.2. Workflow Automation", "pytest cache directory", "8. Jupyter Notebook", "<no title>", "<no title>", "8.1. Jupyter Notebook", "What Should You Expect From This Book?", "pytest cache directory", "1. How to Read This Book"], "terms": {"thi": [0, 1, 2, 3, 5, 6, 7, 9, 13, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 73, 75], "contain": [0, 27, 32, 43, 47, 48, 50, 54, 58, 59, 65, 67, 68, 69, 73, 75], "data": [0, 3, 4, 5, 7, 15, 20, 23, 28, 29, 34, 43, 46, 57, 61, 62, 63, 65, 66, 67, 68, 69, 70, 74, 75], "from": [0, 2, 3, 4, 7, 10, 13, 14, 15, 16, 18, 19, 20, 21, 24, 25, 26, 27, 29, 30, 32, 33, 39, 43, 46, 48, 53, 56, 57, 58, 60, 62, 65, 67, 69, 73, 75, 76], "s": [0, 2, 4, 15, 19, 23, 26, 29, 31, 33, 36, 38, 43, 45, 46, 47, 53, 54, 55, 56, 58, 60, 62, 63, 65, 68, 69, 75], "plugin": [0, 43, 58, 69, 73, 75], "which": [0, 5, 7, 8, 16, 19, 25, 27, 29, 31, 32, 35, 42, 43, 45, 47, 48, 49, 51, 52, 53, 54, 56, 58, 59, 60, 62, 64, 65, 67, 69, 73, 75], "provid": [0, 2, 4, 6, 15, 16, 24, 26, 32, 34, 43, 45, 47, 50, 51, 52, 53, 54, 55, 58, 59, 60, 62, 63, 69, 73, 75], "lf": [0, 43, 48, 69, 75], "ff": [0, 43, 69, 75], "option": [0, 9, 18, 29, 31, 38, 43, 45, 46, 47, 49, 50, 52, 54, 57, 62, 63, 65, 68, 69, 73, 75], "well": [0, 2, 43, 48, 52, 54, 60, 66, 69, 75], "fixtur": [0, 43, 56, 59, 69, 75], "do": [0, 4, 9, 14, 15, 16, 22, 25, 26, 27, 29, 31, 34, 38, 43, 45, 47, 48, 50, 52, 54, 57, 58, 59, 60, 62, 63, 65, 67, 68, 69, 74, 75], "commit": [0, 43, 45, 48, 51, 53, 58, 64, 69, 73, 75], "version": [0, 26, 36, 43, 46, 48, 50, 52, 54, 58, 59, 60, 62, 64, 65, 67, 68, 69, 75], "control": [0, 2, 7, 43, 46, 51, 60, 69, 75], "see": [0, 3, 7, 16, 26, 29, 31, 43, 46, 47, 48, 50, 52, 54, 57, 58, 59, 60, 63, 65, 67, 68, 69, 73, 75], "doc": [0, 23, 29, 43, 46, 52, 54, 60, 68, 69, 73, 75], "more": [0, 2, 8, 9, 13, 15, 18, 20, 24, 32, 35, 38, 40, 42, 43, 45, 46, 47, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 66, 67, 68, 69, 73, 74, 75], "inform": [0, 7, 24, 25, 43, 47, 48, 49, 50, 51, 52, 60, 65, 67, 68, 69, 75], "chapter": [1, 17, 28, 41, 44, 61, 70], "cover": [1, 17, 28, 40, 44, 46, 47, 48, 50, 53, 54, 55, 57, 60, 61, 62, 64, 68, 70, 73], "some": [1, 2, 3, 7, 11, 15, 18, 20, 21, 22, 24, 25, 26, 27, 28, 29, 31, 35, 40, 41, 44, 46, 48, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 61, 62, 63, 64, 66, 68, 70, 73, 74], "us": [1, 3, 8, 9, 10, 11, 13, 15, 18, 19, 20, 22, 23, 26, 28, 35, 36, 37, 38, 39, 41, 44, 51, 52, 53, 54, 55, 56, 57, 59, 61, 63, 64, 65, 74, 76], "librari": [1, 18, 20, 21, 22, 23, 25, 26, 28, 48, 49, 50, 51, 52, 53, 54, 56, 57, 60, 62, 64, 65, 67, 70, 73, 74], "have": [2, 4, 5, 13, 15, 21, 25, 26, 27, 29, 31, 33, 38, 40, 47, 48, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "you": [2, 3, 4, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 73, 76], "ever": [2, 4, 7, 26, 31, 33, 38, 50, 57, 58, 60, 62, 63, 65, 67, 73], "had": [2, 32, 52, 54, 58, 59], "multipl": [2, 6, 15, 24, 27, 48, 50, 51, 52, 54, 59, 60, 62, 64, 67, 73, 74], "similar": [2, 20, 30, 47, 52, 54, 58, 59, 64, 67], "In": [2, 4, 5, 6, 7, 8, 9, 11, 14, 15, 16, 18, 19, 20, 21, 24, 27, 29, 30, 31, 32, 33, 34, 35, 39, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 64, 67, 68, 73], "code": [5, 8, 9, 11, 13, 14, 18, 19, 20, 25, 26, 27, 30, 31, 32, 33, 35, 37, 42, 47, 51, 53, 62, 65, 74, 76], "below": [2, 4, 5, 6, 7, 8, 9, 11, 14, 16, 18, 19, 20, 21, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 68, 73], "dachshund": [2, 19, 27, 50], "poodl": 2, "color": [2, 5, 19, 25, 48, 52, 53, 54, 55, 59, 60, 63, 67], "show_info": 2, "def": [2, 3, 6, 7, 8, 9, 14, 15, 18, 19, 20, 21, 25, 27, 29, 34, 38, 40, 46, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 72, 73], "__init__": [2, 19, 24, 27, 57, 58, 62, 64, 65], "self": [2, 19, 27, 34, 39, 52, 58, 59, 62, 64, 67, 68], "str": [2, 3, 7, 8, 15, 16, 19, 24, 27, 29, 38, 40, 45, 47, 48, 50, 51, 55, 58, 59, 60, 63, 64, 67], "print": [2, 3, 4, 6, 7, 9, 10, 11, 13, 14, 15, 18, 20, 21, 23, 27, 29, 30, 31, 32, 34, 35, 40, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 62, 63, 64, 65, 68, 73], "f": [2, 3, 4, 6, 7, 9, 11, 15, 19, 20, 23, 25, 31, 32, 39, 40, 42, 45, 46, 47, 48, 50, 51, 52, 53, 54, 57, 58, 59, 60, 62, 63, 65, 67, 68, 73], "bim": [2, 15, 19, 24, 27], "black": [2, 19, 54, 59, 73], "If": [2, 3, 5, 6, 8, 9, 11, 13, 14, 16, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74, 76], "so": [2, 7, 19, 21, 27, 42, 47, 48, 50, 52, 54, 60, 62, 63, 65, 66, 68], "organ": [2, 18, 48, 51, 52, 54], "allow": [2, 3, 6, 9, 11, 14, 15, 16, 18, 21, 25, 26, 27, 29, 31, 33, 38, 40, 45, 46, 47, 48, 49, 50, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73, 74], "defin": [2, 6, 15, 31, 45, 48, 49, 52, 55, 56, 58, 59, 62, 63, 64, 68], "parent": [2, 27, 57, 67], "child": 2, "all": [2, 10, 15, 16, 18, 21, 25, 26, 33, 40, 45, 46, 47, 48, 49, 50, 52, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 76], "super": [2, 66, 67], "make": [2, 5, 6, 13, 15, 20, 23, 24, 26, 27, 45, 46, 47, 48, 49, 50, 51, 52, 54, 58, 59, 60, 62, 64, 66, 67, 68, 73, 74], "its": [2, 3, 7, 16, 19, 25, 26, 32, 38, 45, 49, 50, 52, 54, 60, 63, 65, 67, 73], "we": [2, 3, 7, 13, 14, 16, 20, 25, 26, 27, 31, 32, 34, 45, 46, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 60, 68, 73], "dog": [2, 19, 24, 27, 48, 50, 54, 58, 60, 62, 67], "With": [2, 19, 20, 26, 32, 45, 49, 50, 51, 52, 53, 54, 56, 59, 60, 63, 65, 66, 67, 73], "avoid": [2, 6, 15, 25, 31, 47, 48, 58, 64, 65], "repeat": [2, 6, 7, 15, 25, 52, 54], "same": [2, 6, 7, 11, 13, 15, 16, 21, 22, 25, 30, 31, 34, 35, 40, 42, 48, 52, 54, 56, 57, 60, 62, 65, 67, 68], "piec": [2, 6, 7, 54, 57, 60, 74], "time": [2, 4, 6, 7, 9, 18, 21, 31, 32, 45, 46, 47, 51, 54, 60, 62, 63, 65, 66, 73], "type_": [2, 52], "type": [2, 5, 19, 24, 26, 34, 40, 45, 46, 47, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 73], "coco": 2, "brown": [2, 50, 52], "learn": [2, 24, 26, 47, 49, 50, 54, 56, 58, 60], "about": [2, 3, 7, 13, 24, 46, 47, 48, 49, 52, 53, 54, 55, 56, 58, 59, 62, 63, 65, 66, 67, 68], "here": [2, 16, 37, 47, 49, 50, 52, 53, 54, 55, 56, 58, 60, 62, 63, 64, 66, 67, 68, 73], "sometim": [14, 19, 25, 29, 31, 38, 42, 48, 49, 52, 58, 59, 60, 64, 65, 66, 67, 68], "might": [2, 7, 14, 19, 25, 29, 32, 34, 38, 42, 46, 48, 49, 52, 54, 57, 58, 59, 60, 63, 64, 65, 66, 67, 68], "want": [2, 3, 4, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "differ": [2, 6, 7, 15, 16, 18, 27, 29, 32, 45, 47, 48, 49, 52, 54, 55, 56, 57, 59, 60, 64, 65, 68], "But": [25, 26, 54, 59], "those": [7, 10, 42, 48, 50, 51, 53, 54, 59, 67, 68, 73], "can": [2, 3, 4, 5, 6, 7, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 38, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74, 76], "slightli": [], "each": [3, 7, 9, 11, 18, 21, 25, 31, 39, 45, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 65, 67, 68, 74], "good": [6, 18, 25, 46, 48, 50, 54, 58, 64], "an": [2, 4, 5, 13, 14, 19, 20, 24, 25, 31, 32, 34, 38, 40, 45, 46, 47, 48, 51, 53, 56, 57, 58, 59, 62, 63, 64, 66, 67, 76], "one": [6, 7, 15, 16, 18, 21, 25, 26, 27, 29, 30, 31, 33, 34, 35, 37, 40, 42, 45, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 66, 67, 68, 73, 74], "The": [2, 5, 14, 15, 23, 25, 26, 29, 31, 32, 36, 37, 38, 40, 42, 46, 48, 50, 51, 52, 55, 56, 62, 63, 65, 66, 67, 68], "subclass": [2, 27, 62], "abc": [2, 27], "import": [2, 3, 4, 6, 7, 9, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 67, 71], "abstractmethod": 2, "anim": [50, 62], "name": [2, 5, 6, 15, 18, 19, 24, 25, 30, 33, 35, 39, 42, 45, 46, 47, 48, 50, 51, 52, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73], "make_sound": [], "pass": [2, 8, 18, 29, 45, 46, 47, 50, 52, 54, 58, 64, 65, 73], "sai": 68, "woof": 27, "cat": [2, 29, 34, 36, 45, 47, 48, 52, 56, 58, 60, 64], "meow": 60, "pepper": [5, 15, 19, 50, 54], "bella": [], "when": [2, 4, 5, 8, 14, 15, 16, 19, 21, 24, 25, 26, 27, 29, 34, 38, 40, 45, 46, 47, 50, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 73], "special": [48, 50, 53, 57], "anoth": [2, 7, 11, 14, 25, 26, 40, 47, 48, 50, 54, 58, 59, 60, 65, 68], "follow": [2, 6, 7, 15, 23, 29, 31, 32, 45, 47, 51, 52, 54, 56, 58, 59, 63, 64, 65, 66, 67, 68, 73], "exampl": [2, 3, 7, 14, 15, 21, 27, 29, 31, 32, 34, 35, 38, 40, 42, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 68, 73], "wholemilk": [], "repres": [13, 26, 29, 47, 52, 54, 67, 73], "specif": [7, 9, 24, 35, 45, 46, 47, 48, 50, 52, 57, 59, 60, 62, 63, 65], "milk": [50, 51, 54], "fat_cont": [], "float": [2, 6, 7, 14, 15, 21, 24, 27, 32, 34, 45, 51, 52, 58, 59, 62, 63, 64, 67, 68, 72, 73], "prepar": [51, 52, 54, 60, 67], "serv": [2, 47, 50, 67], "whole": [], "3": [2, 3, 6, 7, 8, 9, 13, 14, 16, 18, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 53, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 71, 73], "5": [2, 3, 4, 6, 7, 8, 9, 11, 14, 15, 16, 19, 20, 21, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "cream": [54, 62], "On": [24, 46, 47, 50, 52, 54, 57, 58], "other": [2, 7, 15, 19, 24, 33, 37, 39, 46, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 66, 68, 73, 74], "hand": [24, 47, 50, 59, 73], "form": [26, 40, 54], "ha": [2, 6, 14, 27, 31, 32, 45, 47, 48, 50, 52, 54, 55, 59, 60, 63, 67, 74], "relationship": [40, 60], "milktea": 51, "By": [2, 7, 31, 32, 40, 48, 50, 52, 54, 56, 58, 59, 64, 65], "enabl": [15, 21, 45, 47, 48, 51, 52, 53, 54, 56, 60, 62, 65, 68], "substitut": 45, "impact": [52, 58, 59], "reus": [6, 56, 58], "cake": [], "sugar_percentag": [], "sugar": [50, 54, 67], "milk_tea": [], "10": [2, 3, 6, 7, 8, 9, 16, 19, 21, 24, 27, 31, 33, 35, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "instanti": [2, 47, 52, 54, 58, 59, 60], "oper": [2, 13, 14, 27, 31, 33, 50, 53, 58, 59, 62, 64, 65, 67], "while": [2, 3, 6, 25, 27, 29, 35, 40, 45, 47, 48, 50, 51, 53, 56, 57, 58, 59, 60, 62, 63, 68], "doesn": [2, 21, 29, 48, 51, 63, 68], "t": [2, 13, 19, 20, 21, 25, 26, 27, 29, 45, 47, 48, 49, 50, 51, 52, 54, 58, 60, 62, 63, 65, 67, 68, 73], "altern": [2, 5, 25, 48, 52], "construct": [2, 47, 48, 52, 67], "from_csv": 2, "read": [2, 6, 13, 21, 23, 42, 47, 48, 50, 51, 54, 56, 58, 59, 62, 63], "csv": [2, 3, 7, 48, 54, 59, 60, 63, 66, 68], "file": [2, 3, 15, 21, 24, 27, 31, 38, 39, 42, 45, 52, 53, 54, 59, 60, 63, 67], "panda": [2, 3, 6, 7, 10, 39, 48, 49, 52, 53, 54, 55, 59, 60, 63, 64, 65, 71, 73, 74], "pd": [2, 3, 6, 7, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 45, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 64, 65, 67, 71, 73], "dataanalyz": 2, "analyz": [2, 16, 40, 45, 47, 59], "shape": [2, 31, 42, 47, 49, 52, 59, 60, 73], "classmethod": 2, "cl": 2, "csv_path": 2, "read_csv": [2, 7, 31, 33, 47, 48, 54, 59, 60], "return": [2, 3, 5, 7, 8, 9, 14, 15, 16, 19, 20, 21, 25, 27, 29, 31, 34, 35, 36, 38, 40, 47, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 72, 73], "datafram": [2, 3, 6, 7, 52, 53, 54, 55, 59, 60, 63, 64, 65, 67, 73], "1": [2, 3, 4, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 68, 71, 73], "2": [2, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 24, 25, 26, 27, 29, 30, 33, 34, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 51, 52, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 71, 73], "b": [2, 6, 7, 8, 11, 13, 14, 16, 18, 20, 21, 25, 29, 30, 31, 32, 33, 34, 35, 38, 40, 42, 45, 47, 48, 49, 52, 54, 56, 58, 60, 62, 63, 64, 65, 67, 68, 73], "4": [2, 3, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 20, 21, 25, 26, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 71, 73], "6": [2, 3, 6, 7, 8, 11, 14, 16, 19, 20, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 73], "csv_file_path": 2, "default": [2, 16, 30, 31, 40, 45, 46, 47, 48, 52, 53, 56, 58, 60, 65, 73], "valu": [2, 6, 15, 16, 19, 20, 30, 31, 32, 39, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 60, 62, 63, 64, 67], "attribute_nam": 2, "simpli": [2, 19, 26, 29, 33, 42, 47, 48, 49, 50, 55, 57, 58, 60, 66, 67, 73, 76], "howev": [2, 6, 7, 11, 19, 21, 25, 34, 35, 45, 46, 52, 53, 56, 58, 59, 60, 62, 68, 73], "found": [2, 7, 16, 27, 45, 47, 48, 58, 60, 63, 65, 67, 76], "food": [2, 15, 18, 48, 54, 57, 62], "appl": [2, 5, 6, 8, 11, 15, 16, 18, 21, 22, 25, 27, 29, 30, 34, 35, 37, 40, 45, 47, 51, 52, 53, 54, 56, 58, 60, 62, 64], "red": [2, 5, 25, 38, 50, 52, 53, 63], "yellow": [2, 5, 48, 50, 53, 54, 60], "flavor": [2, 50, 52, 54, 62], "sweet": [2, 5, 25, 52, 58, 62], "attributeerror": [2, 6, 68], "traceback": [2, 5, 6, 7, 11, 19, 21, 24, 25, 34, 39, 42, 64, 68], "most": [2, 5, 6, 7, 11, 15, 19, 21, 24, 25, 26, 34, 39, 42, 45, 48, 52, 54, 62, 64, 67, 68], "recent": [2, 5, 6, 7, 11, 15, 19, 21, 24, 25, 34, 39, 42, 54, 64, 67, 68], "last": [2, 5, 6, 7, 11, 15, 19, 21, 24, 25, 27, 34, 39, 42, 48, 50, 58, 64, 67, 68, 73], "tmp": [2, 21, 34, 47, 67], "ipykernel_337430": 2, "3178150741": 2, "py": [2, 7, 15, 21, 24, 27, 29, 34, 36, 39, 42, 46, 52, 54, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "modul": [2, 15, 18, 19, 21, 22, 25, 27, 34, 50, 52, 57, 67, 68, 73], "dataload": 2, "data_dir": [2, 46], "data_load": 2, "my_data_dir": 2, "even": [2, 7, 8, 32, 52, 54, 58, 68, 73], "thei": [2, 3, 7, 29, 34, 39, 46, 50, 51, 52, 54, 56, 58, 59, 60, 62, 67, 73, 74], "ar": [2, 3, 5, 6, 7, 11, 13, 14, 16, 21, 27, 29, 30, 32, 33, 34, 35, 37, 45, 46, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 73, 74], "equal": [2, 26, 52, 65], "becaus": [2, 3, 5, 6, 7, 16, 21, 23, 26, 34, 50, 54, 58, 65, 68, 74], "store": [2, 3, 11, 19, 25, 32, 40, 47, 50, 52, 58, 59, 60, 62, 67], "separ": [2, 7, 11, 14, 29, 35, 45, 46, 53, 58, 65, 67, 73], "locat": [2, 5, 15, 40, 48, 52, 53, 54, 58, 68], "To": [2, 3, 5, 6, 7, 8, 10, 11, 14, 16, 19, 21, 22, 25, 26, 29, 30, 31, 33, 34, 35, 37, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73], "how": [2, 4, 7, 14, 16, 25, 27, 30, 33, 34, 37, 39, 45, 46, 47, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 64, 65, 66, 67, 73], "should": [2, 24, 45, 46, 52, 54, 57, 58, 59, 60, 63, 65, 66, 67, 68, 73], "compar": [2, 4, 18, 32, 38, 45, 47, 52, 54, 56, 57, 58, 59, 60, 62, 64, 68, 73], "__eq__": [2, 19], "dog1": 2, "dog2": 2, "fals": [2, 3, 7, 8, 18, 31, 33, 34, 42, 45, 47, 48, 54, 55, 56, 58, 59, 60, 63, 64, 67, 68], "true": [2, 6, 7, 9, 14, 15, 18, 23, 24, 31, 32, 34, 35, 36, 39, 40, 42, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 64, 67, 68, 73], "access": [2, 7, 18, 22, 31, 37, 46, 47, 52, 54, 58, 74], "ani": [2, 6, 7, 34, 47, 48, 50, 57, 58, 59, 60, 64, 66, 68, 74, 76], "fit": [2, 47, 48, 49, 50, 52, 54, 58, 59, 60], "find": [2, 4, 7, 8, 26, 29, 46, 48, 53, 54, 60, 66, 67], "redund": [2, 7], "That": [2, 16, 19, 25, 26, 38, 46, 50, 52, 54, 57, 58, 59, 60, 63, 65, 66, 67, 68, 73, 76], "turn": [2, 5, 10, 25, 29, 31, 38, 50, 54, 68], "need": [2, 6, 7, 11, 15, 16, 18, 19, 20, 21, 22, 25, 45, 47, 48, 49, 50, 52, 53, 54, 55, 58, 59, 60, 65, 66, 67, 73], "staticmethod": 2, "now": [2, 7, 19, 23, 26, 27, 29, 31, 32, 34, 37, 47, 48, 52, 54, 58, 59, 60, 65, 66, 67, 68, 73], "re": [2, 6, 14, 20, 26, 27, 36, 47, 50, 52, 58, 59, 62, 64, 67, 68], "processtext": 2, "text_column": 2, "remove_url": 2, "sampl": [2, 29, 45, 47, 48, 51, 52, 56, 57, 58, 59, 60, 64, 67, 68, 73], "replac": [2, 7, 15, 25, 27, 37, 48, 49, 52, 56, 58, 59, 64, 66, 67], "url": [2, 7, 50, 54, 55, 62, 65, 73], "empti": [2, 5, 52, 58, 64, 66, 68], "space": [2, 16, 45, 48, 54, 67, 73], "sub": [2, 26, 31, 60, 65, 67], "r": [2, 16, 23, 47, 48, 52, 55, 62, 63, 68], "http": [2, 24, 29, 31, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 58, 59, 60, 62, 64, 65, 66, 68, 73], "text": [2, 7, 8, 16, 23, 45, 50, 51, 55, 58, 59, 62, 67, 68], "my": [2, 18, 23, 29, 33, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 58, 60, 62, 63, 65, 66, 67, 68, 73, 74], "favorit": [2, 46, 50], "page": [2, 31, 49, 52, 60, 63], "www": [2, 50, 54], "googl": [2, 48, 54, 59, 68, 76], "com": [2, 31, 34, 45, 47, 48, 49, 50, 54, 55, 59, 60, 62, 64, 66, 68, 73], "restrict": [2, 59], "extern": [2, 24, 73], "modif": 2, "outsid": [2, 18], "doubl": [2, 50, 56], "underscor": 2, "help": [2, 6, 32, 42, 45, 46, 47, 52, 54, 56, 58, 59, 60, 63, 67, 68, 73], "chanc": [2, 52, 59], "unintend": [2, 7], "alter": [2, 6, 47], "groceri": [2, 11, 27, 51], "item": [2, 7, 9, 13, 29, 34, 38, 48, 50, 51, 52, 54, 56, 58, 62, 68, 73], "price": [2, 5, 6, 7, 8, 11, 15, 16, 21, 25, 31, 33, 34, 35, 37, 38, 40, 45, 47, 48, 51, 52, 56, 58, 62, 64], "__price": 2, "get_pric": [2, 15, 25, 27, 62], "grocery_item": [2, 51], "99": [2, 15, 59, 63], "directli": [2, 6, 52, 59, 67, 68, 73, 76], "cell": [2, 5, 6, 7, 11, 19, 24, 39, 42, 50, 52, 59, 63, 64, 67, 68, 73], "line": [2, 5, 6, 11, 15, 18, 19, 21, 24, 25, 26, 29, 31, 39, 42, 45, 47, 53, 60, 66], "18": [2, 26, 33, 47, 48, 49, 50, 57, 59, 60, 65, 67, 68], "15": [2, 14, 16, 26, 31, 33, 35, 42, 47, 48, 49, 50, 52, 56, 57, 58, 59, 60, 68], "17": [2, 4, 35, 47, 48, 49, 50, 56, 59, 60, 63, 64, 67, 68], "behavior": [5, 6, 30, 50, 58, 59], "execut": [6, 7, 31, 45, 50, 51, 53, 56, 57, 62, 64, 73, 76], "set": [2, 6, 15, 21, 22, 27, 29, 33, 48, 50, 51, 52, 53, 54, 56, 59, 60, 64, 65, 67, 68, 73], "onli": [2, 5, 8, 13, 14, 16, 20, 21, 25, 27, 29, 30, 37, 42, 45, 46, 47, 50, 51, 52, 54, 56, 57, 59, 62, 63, 64, 65, 67, 68, 73], "fruit": [5, 8, 11, 18, 21, 22, 25, 27, 34, 35, 37, 40, 45, 47, 51, 53, 56, 58, 60, 62, 64], "_color": [], "isinst": [7, 8, 14, 15, 19, 20, 51, 58, 68], "els": [2, 4, 5, 8, 15, 18, 20, 27, 29, 38, 48, 56, 57, 58, 59, 63, 67, 68], "rais": [2, 7, 11, 15, 19, 20, 27, 34, 39, 42, 58, 63, 64, 67, 68], "must": [7, 19, 21, 45, 47, 52, 68], "var": [7, 16, 29, 67, 68], "folder": [23, 29, 58, 65, 66, 67, 68, 73], "5w": [29, 67], "fg65_rp17lz39z89p0nkv8ch0000gn": [29, 67], "ipykernel_78260": [], "1033431134": [], "3888926808": [], "14": [7, 27, 31, 33, 35, 47, 48, 49, 50, 54, 56, 57, 58, 59, 60, 67, 68], "16": [2, 8, 14, 21, 31, 33, 47, 48, 49, 52, 57, 59, 60, 62, 63, 65, 67, 68, 73], "show": [2, 3, 7, 14, 15, 18, 20, 21, 22, 31, 33, 37, 39, 41, 42, 46, 47, 50, 52, 54, 55, 56, 59, 60, 63, 64, 65, 66, 67, 68, 73], "readabl": [5, 8, 20, 27, 29, 49, 54, 58, 68, 74], "output": [2, 7, 16, 26, 38, 42, 45, 46, 47, 48, 50, 52, 54, 55, 57, 58, 59, 60, 64, 65, 67, 68, 73], "displai": [2, 14, 16, 49, 56, 59, 62], "debug": [2, 15, 47, 52, 64, 65, 68], "str__": 2, "i": [2, 3, 7, 8, 9, 11, 14, 16, 18, 19, 20, 21, 25, 29, 30, 31, 32, 33, 35, 42, 45, 48, 49, 50, 52, 54, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "ag": [2, 15, 19, 24, 45, 48, 50, 55, 56, 58, 59, 60, 62, 68], "int": [2, 3, 6, 7, 9, 14, 15, 19, 24, 27, 45, 47, 51, 53, 54, 55, 57, 58, 60, 63, 64, 67, 68], "7": [2, 3, 6, 7, 16, 19, 20, 25, 29, 30, 31, 33, 34, 35, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "pip": [2, 3, 24, 25, 26, 27, 29, 31, 32, 38, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 67, 68, 73], "instal": [2, 3, 24, 25, 26, 27, 29, 31, 32, 38, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "memory_profil": [2, 64], "flexibl": [2, 28, 56, 63], "dictionari": [2, 6, 40, 56, 59, 74], "structur": [2, 7, 23, 54, 56, 59, 63, 65, 68], "lot": [2, 25, 48, 50, 53, 58, 60, 65], "effici": [2, 13, 18, 20, 22, 53, 56, 59, 62, 63, 68, 73, 74], "reserv": 2, "ahead": 2, "signific": [2, 31, 32, 52, 58, 59], "reduc": [2, 15, 33, 46, 50, 56, 57, 58, 60], "writefil": [2, 7, 15, 27, 45, 46, 52, 54, 57, 58, 63, 64, 65, 67, 68, 73], "without_slot": 2, "random": [2, 3, 7, 18, 31, 32, 33, 47, 48, 49, 52, 57, 58, 59, 60, 65, 68, 73], "randint": [2, 3, 7, 18, 32, 33, 47, 57, 58, 73], "profil": [2, 47, 48, 50, 53, 58, 64, 65], "main": [2, 7, 24, 46, 47, 50, 54, 58, 59, 63, 64, 65, 67, 68], "0": [2, 3, 4, 6, 7, 8, 9, 13, 14, 15, 16, 18, 21, 24, 25, 26, 29, 30, 34, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "30": [2, 4, 16, 26, 31, 45, 47, 48, 49, 50, 52, 56, 57, 58, 59, 60, 62, 63, 67, 68, 73], "_": [2, 13, 15, 16, 18, 32, 50, 52, 57, 58, 60, 62, 63], "rang": [2, 3, 7, 9, 16, 18, 27, 31, 32, 47, 48, 51, 52, 57, 58, 59, 60, 64, 73], "100000": [2, 31, 58], "__name__": [2, 27, 46, 58, 63, 64, 67, 68], "__main__": [2, 27, 46, 58, 63, 64, 67, 68], "m": [2, 4, 16, 27, 32, 35, 40, 45, 48, 50, 53, 54, 57, 58, 59, 60, 64, 73], "filenam": [2, 57, 58, 64, 67, 68], "mem": [2, 64], "increment": [2, 47, 64], "occurr": [2, 16, 34, 48, 60, 64, 67], "content": [2, 18, 47, 49, 50, 52, 54, 64, 66, 73], "41": [2, 31, 45, 47, 48, 49, 59, 64, 67], "mib": [2, 64], "11": [2, 3, 4, 7, 16, 19, 20, 24, 27, 29, 31, 33, 35, 40, 45, 47, 48, 49, 50, 52, 54, 56, 58, 59, 60, 63, 64, 65, 67, 68, 73], "12": [2, 3, 14, 16, 19, 23, 27, 31, 32, 33, 35, 40, 47, 48, 49, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "57": [2, 48, 59, 60, 63, 68], "8": [2, 3, 6, 7, 8, 15, 16, 20, 21, 25, 27, 30, 31, 33, 34, 36, 38, 40, 42, 47, 48, 49, 50, 52, 53, 54, 56, 58, 59, 60, 63, 64, 65, 67, 68, 73], "100003": 2, "with_slot": 2, "__slots__": 2, "13": [2, 29, 31, 33, 35, 48, 49, 52, 54, 56, 58, 59, 60, 67, 68], "46": [2, 31, 47, 48, 50, 67, 68], "section": [3, 7, 15, 18, 20, 21, 22, 31, 35, 39, 40, 46, 47, 48, 50, 53, 54, 55, 57, 59, 60, 62, 64, 66, 68, 73, 74], "wai": [3, 5, 7, 13, 15, 18, 25, 29, 31, 33, 34, 48, 50, 52, 54, 57, 58, 59, 62, 63, 66, 67, 74], "up": [3, 7, 9, 16, 26, 35, 45, 48, 50, 51, 52, 54, 58, 59, 60, 62, 65, 66, 68, 73], "track": [3, 6, 7, 53, 54, 58, 68], "perform": [3, 7, 29, 31, 40, 52, 54, 56, 60], "your": [3, 4, 6, 15, 25, 26, 32, 33, 34, 35, 37, 42, 46, 48, 50, 51, 56, 59, 62, 63, 65, 74, 76], "python": [3, 8, 19, 20, 22, 23, 26, 35, 41, 51, 56, 73, 74], "run": [3, 7, 9, 25, 31, 46, 47, 50, 52, 54, 57, 59, 60, 62, 63, 64, 65, 66, 67, 74, 76], "faster": [3, 9, 15, 18, 31, 45, 58], "consid": [3, 6, 7, 15, 18, 47, 48, 49, 51, 52, 54, 57, 58, 59, 64, 73], "joblib": [2, 3, 52], "parallel": [3, 56, 60], "It": [2, 3, 7, 15, 16, 26, 34, 40, 46, 50, 52, 54, 58, 59, 60, 62, 63, 65, 66, 68, 73], "easili": [3, 16, 23, 49, 53, 54, 55, 60, 63, 66], "sever": [3, 7, 15, 25, 52, 58, 63], "onc": [3, 6, 7, 25, 50, 52, 54, 55, 59, 68], "own": [3, 25, 37, 50, 63, 67], "processor": [3, 52, 64, 73], "delai": [3, 47], "multiprocess": [3, 47], "add_thre": 3, "num": [3, 6, 7, 8, 9, 11, 14, 15, 16, 21, 35, 40, 42, 47, 52, 57, 58, 62, 64, 67, 68, 73], "num_cor": 3, "cpu_count": [3, 47], "result": [3, 7, 13, 20, 29, 31, 32, 34, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 62, 63, 64, 65, 67, 68], "n_job": [3, 59], "9": [2, 3, 6, 7, 14, 15, 19, 24, 27, 29, 31, 33, 34, 35, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "try": [3, 9, 26, 29, 39, 40, 42, 47, 48, 49, 50, 51, 52, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68], "timeit": [3, 7, 9, 18, 31, 45, 47, 57], "also": [3, 7, 9, 16, 24, 25, 26, 29, 31, 33, 38, 42, 46, 47, 48, 49, 51, 52, 53, 54, 56, 58, 59, 60, 62, 63, 64, 65, 66, 67, 73, 74], "specifi": [3, 6, 16, 19, 25, 38, 40, 42, 46, 47, 48, 55, 58, 59, 60, 62, 65, 67, 68, 73], "number": [3, 4, 7, 8, 9, 21, 26, 29, 31, 32, 47, 48, 52, 56, 57, 58, 59, 62, 63, 64, 67, 68], "rerun": [3, 52], "get": [3, 10, 11, 18, 21, 26, 31, 32, 34, 37, 46, 47, 48, 51, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 67, 68, 74], "better": [3, 5, 7, 29, 31, 52, 54, 58, 59], "estim": 3, "func": [3, 6, 47, 62, 64, 67, 68], "comprehens": [3, 22, 54, 64], "l": [3, 8, 9, 13, 25, 27, 32, 34, 35, 38, 40, 48, 64, 68], "10_000": [3, 59, 68], "func2": 3, "list": [3, 14, 15, 19, 20, 27, 29, 33, 35, 48, 51, 52, 58, 59, 60, 62, 63, 64, 65, 68, 73], "expsiz": [3, 9], "1000": [3, 6, 7, 9, 18, 31, 47, 48, 49, 52, 59, 60], "time1": 3, "time2": 3, "6299518653018685": 3, "than": [3, 9, 11, 18, 24, 31, 32, 34, 35, 42, 45, 47, 49, 52, 54, 56, 57, 58, 59, 60, 68, 74], "averag": [3, 6, 47, 48, 52, 57, 58, 59], "pyarrow": [3, 57], "instead": [2, 3, 5, 6, 8, 18, 21, 22, 25, 26, 27, 29, 31, 32, 33, 34, 35, 37, 40, 42, 47, 48, 52, 54, 57, 58, 59, 62, 64, 65, 66, 67, 73], "compress": 3, "take": [3, 4, 6, 18, 26, 32, 54, 57, 58, 59, 60, 62, 67, 68], "less": [3, 5, 24, 32, 42, 54, 58, 67], "memori": [3, 21, 31, 33, 45, 47, 52, 53, 54, 59], "uncompress": 3, "For": [2, 3, 14, 24, 31, 38, 40, 47, 48, 50, 52, 56, 57, 58, 59, 60, 62, 64, 65, 66, 68, 73], "million": [3, 31, 45, 47, 50, 54], "row": [3, 31, 32, 38, 45, 47, 48, 49, 51, 52, 53, 56, 57, 59], "column": [3, 7, 39, 45, 47, 48, 49, 52, 53, 54, 57, 58, 60, 63, 65, 73], "189": 3, "59": [3, 4, 32, 48, 49, 57, 60, 63, 67, 68], "mb": [3, 32, 52], "around": [3, 50, 60], "78": [3, 49, 57, 59, 67, 68], "96": [3, 48, 49, 52, 59, 60], "approxim": [3, 26, 31, 32, 45, 47, 54], "110": 3, "63": [3, 45, 48, 49, 58, 59, 60, 67], "storag": [3, 45, 47, 52, 53, 55], "numpi": [3, 10, 29, 31, 32, 33, 34, 38, 47, 48, 49, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64, 65, 66, 67, 71, 73, 74], "np": [3, 29, 31, 32, 34, 38, 47, 48, 49, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 71, 73], "creat": [3, 6, 15, 19, 20, 21, 26, 27, 29, 32, 33, 37, 47, 48, 51, 53, 55, 56, 57, 59, 62, 66, 67, 73], "seed": [3, 9, 18, 32, 47, 48, 52, 54, 57, 59, 60], "123": [3, 46, 52, 57, 59], "size": [3, 32, 34, 47, 48, 49, 52, 54, 55, 56, 58, 59, 60, 63, 67, 74], "1000000": [3, 14, 32, 47], "df": [3, 6, 7, 29, 31, 32, 33, 36, 37, 38, 39, 40, 45, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 63, 65, 67, 73], "col": [3, 29, 36, 47, 54, 56], "write": [3, 23, 25, 38, 42, 46, 47, 54, 57, 59, 60, 63, 64, 65, 66, 67, 68], "to_parquet": [3, 31, 47], "to_csv": [3, 31, 33, 45, 60, 63], "index": [3, 9, 13, 21, 22, 29, 31, 32, 35, 40, 45, 48, 50, 52, 53, 54, 58, 59, 67, 73], "os": [3, 23, 46, 47, 50, 51, 58, 73], "path": [3, 45, 46, 47, 49, 52, 53, 54, 58, 65, 68, 73], "getsiz": 3, "82805080": 3, "198796161": 3, "event": [4, 50, 59, 62, 68], "certain": [4, 19, 25, 32, 48, 50, 54, 58, 62, 67, 68], "minut": [4, 50, 58, 67, 74], "finish": [4, 7, 45, 52, 54, 57, 62], "determin": [4, 48, 54], "sum": [4, 7, 8, 25, 29, 33, 40, 45, 47, 52, 54, 56, 58, 59, 63, 64], "trick": [4, 26, 66, 74], "begin": [4, 38, 42, 46, 47, 50, 52, 63, 73], "2020": [4, 33, 37, 54, 59, 60, 65], "01": [4, 7, 21, 33, 45, 47, 48, 49, 50, 52, 58, 59, 60, 67, 73], "03": [4, 16, 33, 47, 48, 49, 50, 52, 54, 56, 58, 59, 60, 67, 73], "23": [4, 33, 35, 47, 48, 49, 52, 54, 56, 59, 60, 63, 67, 68], "00": [4, 33, 40, 42, 47, 48, 49, 50, 52, 54, 55, 58, 59, 60, 67, 68, 73], "duration_in_minut": 4, "2500": 4, "strptime": [4, 59, 67], "y": [2, 4, 7, 21, 26, 30, 32, 40, 42, 45, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 63, 64, 65, 73], "d": [4, 7, 11, 16, 18, 33, 35, 40, 42, 47, 48, 49, 50, 52, 53, 54, 56, 58, 59, 60, 62, 63, 67], "h": [4, 40, 47, 48, 52, 59, 60], "dai": [4, 16, 31, 33, 47, 48, 50, 52, 54, 58, 60, 67, 68], "39": [4, 48, 49, 57, 58, 59, 65, 73], "seri": [4, 32, 39, 47, 48, 50, 56, 58, 65, 73], "calendar": [4, 59], "monthrang": 4, "year": [4, 15, 37, 47, 48, 50, 54, 55, 59, 60, 67, 73], "like": [4, 7, 9, 18, 25, 26, 32, 33, 34, 38, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 57, 58, 60, 62, 63, 64, 65, 66, 67, 68, 73], "subtract": [4, 52, 59], "date1": 4, "2022": [4, 16, 33, 50, 54, 59, 73], "date2": 4, "diff": [4, 10, 26, 39, 62, 64, 65, 66, 68, 73], "apart": [4, 48], "304": 4, "method": [5, 9, 10, 16, 18, 21, 22, 23, 26, 28, 29, 32, 33, 34, 35, 36, 37, 40, 41, 45, 47, 48, 49, 50, 54, 56, 57, 59, 62, 64, 67, 74], "birth_year": 5, "ben": [5, 40, 60, 62], "1997": 5, "new_birth_year": 5, "michael": [5, 32, 50], "1993": 5, "lauren": [5, 40], "1999": 5, "josh": [5, 40, 60, 62], "1990": [5, 31], "olivia": [5, 50], "1991": 5, "appli": [2, 5, 6, 7, 10, 25, 31, 32, 38, 42, 48, 56, 59, 60, 62, 67, 68], "alex": [5, 47, 56], "2000": [5, 31, 50, 59], "oliv": [5, 18, 50, 57], "1995": 5, "add": [5, 6, 7, 11, 20, 25, 26, 30, 31, 40, 45, 46, 48, 50, 51, 53, 54, 55, 58, 62, 63, 64, 65, 66, 68, 72, 73], "max_val": 5, "sinc": [5, 7, 27, 33, 34, 35, 47, 52, 54, 58, 59, 60, 63, 64, 65, 68], "meeting3": 5, "onlin": 5, "meeting1": 5, "room1": 5, "meeting2": 5, "room2": 5, "assum": [2, 5, 48, 51, 58], "extract": [5, 9, 13, 15, 31, 46, 47, 52, 58, 66], "attr": [5, 18, 65], "tast": [5, 25, 27, 50], "orang": [5, 6, 8, 11, 15, 18, 21, 22, 25, 27, 30, 34, 35, 37, 40, 45, 47, 49, 50, 53, 56, 58, 64], "sour": [5, 27], "grape": [5, 8, 11, 15, 21, 22, 25, 27, 34, 35, 37, 64], "purpl": 5, "banana": [5, 8, 16, 21, 22, 45, 47, 51, 53, 54, 56, 58], "statement": [5, 6, 8, 20, 29, 34, 42, 54, 56, 67, 68], "handl": [5, 15, 23, 46, 47, 52, 53, 56, 58, 67, 68], "lengthi": [5, 7, 21, 34, 54], "unknown": [5, 15], "A": [2, 5, 6, 13, 16, 29, 30, 31, 33, 34, 38, 40, 48, 52, 54, 56, 57, 63, 64, 65], "twice": [5, 7, 15, 42], "abov": [5, 14, 15, 16, 25, 27, 38, 42, 48, 50, 52, 54, 56, 58, 59, 60, 63, 64, 66, 68, 73], "first": [5, 16, 20, 21, 27, 29, 30, 31, 32, 35, 42, 47, 48, 50, 52, 54, 58, 59, 60, 68], "second": [5, 25, 27, 29, 42, 47, 48, 50, 54, 57, 58, 59, 62, 67, 68], "either": [5, 6, 16, 23, 27, 32, 34, 35, 42, 48, 54, 58, 62, 76], "furnitur": 5, "bed": 5, "tabl": [5, 38, 51, 55, 56, 58, 67], "chair": [5, 50], "loc1": 5, "ikea": 5, "furniture_loc": 5, "vice": 5, "versa": 5, "combin": [5, 11, 40, 45, 47, 48, 49, 50, 51, 56, 59, 60, 62, 67, 73], "green": [5, 25, 38, 48, 50, 51, 59, 63], "onion": [5, 50], "pair": [5, 11, 55, 60], "dict_item": [5, 18, 48], "switch": [5, 53, 67], "loop": [5, 8, 18, 25, 31, 45, 47, 67, 68], "v": [5, 24, 50, 58, 59], "k": [5, 9, 52, 54, 59, 64], "befor": [5, 15, 24, 27, 31, 38, 45, 47, 50, 52, 54, 56, 57, 58, 59, 64, 65, 66, 67, 68], "common": [5, 6, 10, 13, 15, 16, 26, 31, 37, 40, 48, 52, 57, 58, 59], "approach": [2, 5, 7, 15, 21, 26, 29, 47, 48, 52, 54, 58, 63], "modifi": [2, 5, 6, 29, 47, 56, 62, 66, 67], "origin": [5, 7, 26, 31, 32, 34, 40, 42, 46, 47, 48, 50, 52, 58, 59, 66, 68], "lead": [2, 5, 6, 7, 11, 15, 16, 29, 47, 48, 52, 56, 58, 59, 60, 62, 67, 73], "unexpect": [5, 29, 59, 60], "place": [5, 7, 50, 52, 54, 59, 67, 68], "accept": [2, 5, 6, 52, 63], "hashabl": 5, "give": [5, 7, 25, 27, 38, 42, 46, 48, 52, 58, 59, 63], "typeerror": [5, 6, 7, 21, 51, 63], "call": [5, 6, 7, 11, 14, 15, 18, 19, 21, 24, 25, 27, 34, 39, 42, 46, 47, 48, 49, 50, 51, 54, 56, 57, 58, 59, 60, 64, 67], "unhash": 5, "tupl": [5, 7, 18, 21, 34, 52, 62, 64, 67], "work": [5, 14, 20, 21, 24, 26, 29, 34, 46, 47, 48, 49, 50, 52, 53, 54, 57, 60, 62, 63, 64, 65, 66, 73, 74], "immut": 5, "ad": [6, 7, 26, 47, 50, 54, 56, 58, 59, 62, 64, 67, 68], "mai": [2, 6, 24, 47, 48, 50, 52, 58, 59, 60, 64, 68], "introduc": [6, 7, 45, 74], "unnecessari": [6, 47, 56, 64], "complex": [6, 15, 45, 47, 48, 52, 58, 59, 62, 67], "condit": [6, 47, 48, 50, 52, 62], "simpler": [6, 22, 23, 50, 56], "easier": [6, 7, 13, 15, 23, 26, 31, 45, 48, 52, 58, 60, 62], "get_discount": 6, "100": [2, 6, 7, 9, 16, 18, 21, 29, 31, 32, 39, 47, 48, 49, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 73], "20": [2, 6, 7, 33, 35, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 64, 65, 68, 73], "50": [2, 6, 45, 48, 49, 51, 52, 54, 56, 58, 59, 60], "necessari": [6, 40, 50, 54, 57], "doe": [6, 7, 21, 47, 48, 50, 52, 56, 58, 59, 68], "requir": [6, 21, 24, 33, 45, 47, 48, 51, 52, 53, 56, 58, 63, 67], "even_numb": 6, "filter": [6, 7, 25, 45, 52, 54, 56, 60, 68], "variou": [6, 27, 45, 52, 56, 57, 58, 63, 65, 73], "part": [6, 48, 57, 58, 67], "is_even": [6, 57], "arg": [6, 27, 36, 46, 51, 52, 54, 62, 63, 67, 68], "kwarg": [2, 6, 36, 62, 67, 68], "variabl": [6, 7, 13, 19, 26, 27, 40, 45, 46, 48, 54, 56, 58, 59, 60, 64, 67, 68, 73], "keyword": [11, 24, 45, 46], "multipli": [6, 8, 21, 27, 42], "add_to_ord": 6, "new_ord": 6, "cart": 6, "updat": [6, 7, 49, 60, 65, 66, 73, 74], "kiwi": 6, "keep": [6, 7, 30, 31, 40, 47, 48, 50, 51, 58, 66], "clean": [6, 48, 59, 60, 63, 64, 65], "without": [6, 7, 14, 15, 19, 21, 25, 31, 32, 34, 45, 47, 48, 52, 54, 56, 58, 59, 60, 65, 66, 67, 68, 73], "time_func": 6, "wrapper": [6, 48, 62, 67], "start": [6, 7, 8, 11, 16, 26, 32, 33, 35, 42, 47, 48, 50, 52, 54, 57, 58, 59, 60, 62, 63, 65, 67, 73], "end": [6, 7, 25, 33, 37, 38, 42, 50, 56, 57, 59, 60, 63, 67, 73], "elaps": [6, 59], "3f": [6, 52], "ms": [6, 31, 45, 47, 57, 59], "num1": [6, 7, 20, 34, 47, 48, 58, 63, 68, 72, 73], "num2": [6, 7, 20, 47, 48, 58, 63, 68, 72, 73], "006m": 6, "027m": 6, "includ": [7, 38, 40, 47, 48, 50, 51, 52, 54, 58, 59, 62, 64, 65, 67, 73, 74], "best": [7, 48, 51, 54, 59, 64], "bad": [7, 54, 58, 64, 68], "vagu": [7, 48], "x": [2, 7, 8, 20, 21, 26, 29, 30, 32, 40, 42, 45, 47, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 67, 73], "z": [7, 30, 40, 48, 64], "role": [7, 58, 60], "declar": [7, 15, 63], "hint": [7, 19, 63, 64], "obviou": 7, "num_memb": 7, "num_guest": 7, "sum_": 7, "confus": [7, 58, 67], "understand": [6, 7, 13, 15, 23, 45, 46, 54, 57, 58, 60, 64, 65, 66, 67], "circle_area": 7, "thu": [7, 14, 26, 31, 47, 52, 56, 58, 65], "them": [7, 14, 16, 27, 29, 32, 46, 48, 49, 52, 54, 56, 57, 58, 59, 62, 64, 65, 66, 74], "pi": [7, 15, 26, 60], "radiu": [7, 15], "too": [7, 48, 54, 58], "improv": [7, 27, 30, 31, 56, 60, 62, 63, 64, 68, 70, 73], "both": [7, 9, 30, 34, 40, 45, 47, 51, 52, 54, 56, 57, 58, 59, 65, 67], "At": [7, 73], "least": [7, 42, 48, 52, 54, 68], "clearer": 7, "x_is_even_and_neg": 7, "y_is_odd_and_posit": 7, "chang": [2, 7, 16, 19, 31, 32, 33, 38, 45, 46, 47, 51, 52, 53, 54, 56, 57, 58, 60, 62, 64, 66, 73], "rememb": [7, 26, 48], "otherwis": [2, 7, 16, 58, 63, 67], "bug": [7, 11], "our": [7, 13, 26, 47, 48, 50, 52, 54, 58, 59, 60], "date": [7, 45, 47, 48, 50, 51, 54, 58, 60, 67, 73], "2021": [7, 16, 33, 37, 45, 48, 50, 52, 57, 59, 65, 73], "arrai": [7, 25, 34, 36, 45, 48, 52, 58, 59, 60, 63, 67, 73], "datetim": [7, 16, 24, 47, 48, 50, 58, 67], "val1": [7, 56, 58], "val2": [7, 56, 58], "iloc": [7, 29, 31, 32, 39, 53, 59, 60], "subset_x": 7, "subset_i": 7, "filt": 7, "futur": [7, 36, 47, 48, 59, 67, 68], "return_two": 7, "care": [7, 13, 14, 58], "hello": [7, 15, 23, 50, 51, 63, 67, 68], "difficult": [7, 14, 50, 52, 58, 59, 60, 62, 73], "hardcod": 7, "imposs": 7, "discern": 7, "mean": [2, 7, 15, 31, 32, 33, 40, 45, 47, 48, 52, 53, 54, 56, 58, 59, 60, 64, 76], "addit": [7, 24, 32, 45, 47, 57, 58, 65], "context": [2, 7, 48, 54, 58, 67, 68], "comment": [7, 66], "price_differ": 7, "transpar": 7, "maintain": [7, 45, 47, 50], "built": [7, 14, 18, 20, 21, 22, 24, 47, 52, 57, 58, 59, 60, 62, 63, 67], "instantli": 7, "januari": [7, 47, 67], "rest": [7, 31, 50, 66], "februari": [7, 47, 50], "len": [7, 15, 47, 54, 58, 59, 60, 63, 64, 68], "particular": [7, 33, 47, 58, 59], "thing": [7, 15, 22, 26, 48, 50, 54, 57, 58, 59, 62, 65], "know": [7, 26, 49, 50, 52, 54, 58, 59, 62, 67], "yet": [7, 59], "put": [7, 46, 55, 68], "high": [7, 26, 47, 48, 50, 54, 56, 57, 59], "level": [7, 47, 48, 54, 56, 57, 59, 67], "go": [2, 7, 26, 29, 48, 50, 51, 54, 60, 66], "back": [7, 14, 26, 50, 58], "prevent": [7, 31, 47, 50, 58], "thought": [7, 58], "being": [7, 16, 46, 48, 50, 67, 73], "disrupt": 7, "say_hello": 7, "ask_to_sign_in": 7, "is_us": 7, "bool": [7, 34, 67, 68], "new": [7, 31, 33, 36, 40, 42, 45, 47, 48, 49, 52, 53, 54, 56, 58, 59, 60, 64, 65, 66, 67, 68, 73, 74], "old": [7, 48, 67], "point": [7, 33, 48, 49, 50, 52, 54, 58, 60, 66, 68], "l1": [7, 52], "l2": [7, 52], "append": [2, 7, 18, 56, 57, 60, 64], "shallow": 7, "deep": [7, 32, 50, 54], "children": [7, 50, 54, 59], "becom": [6, 7, 45, 50, 56, 58, 59, 64], "l3": 7, "stai": [7, 9], "inadvert": 7, "append_four": 7, "nums1": 7, "produc": [7, 47, 51, 52, 59, 62], "much": [7, 39, 48, 52, 58, 59, 60, 63, 66, 73], "cleaner": [7, 15, 56, 58, 62, 73], "arr": [7, 42, 73], "c": [2, 6, 7, 8, 11, 13, 18, 29, 30, 32, 34, 35, 40, 45, 47, 48, 49, 52, 54, 56, 58, 59, 60, 63, 67], "e": [7, 37, 40, 49, 52, 55, 58, 59, 60, 65, 68], "val": [7, 29, 30, 32, 33, 56, 59], "shorten": [7, 34], "between": [7, 15, 30, 40, 45, 47, 48, 51, 52, 54, 55, 56, 57, 59, 64, 65, 67, 68], "two": [7, 9, 16, 18, 20, 21, 33, 35, 38, 40, 47, 48, 53, 54, 56, 59, 60, 68, 73], "char": [7, 18, 21, 67], "10000": [7, 9, 47, 57], "411": [7, 59], "\u00b5s": [7, 31, 45, 47], "98": [7, 47, 49, 54, 59], "per": [7, 15, 31, 45, 47, 48, 54, 59, 74], "std": [2, 7, 31, 45, 47, 59], "dev": [7, 24, 31, 45, 47, 52, 73], "000": [7, 16, 45, 47, 57, 59], "60": [7, 31, 48, 49, 50, 51, 52, 54, 55, 58, 59, 60, 64], "process_data": [7, 20, 63, 68, 73], "violat": [7, 47], "principl": 7, "featur": [7, 32, 46, 47, 50, 58, 60], "although": [7, 52], "explain": [7, 56, 60, 64], "block": [7, 52, 68], "test": [7, 47, 48, 53, 57, 59, 60, 64], "unit": [7, 15, 27, 49, 50, 59], "insid": [7, 16, 23, 58, 60, 62, 68, 73], "challeng": [7, 21, 45, 48, 49, 54, 56, 58, 59, 62, 64], "axi": [6, 7, 29, 32, 34, 35, 40, 42, 47, 49, 50, 52, 59, 60], "split": [7, 40, 52, 54, 59, 60, 67], "smaller": [7, 31, 35, 42, 49, 57, 58], "revis": [7, 64], "accomplish": 7, "These": [7, 52, 58, 62], "pipe": [2, 7, 47, 48, 54, 67], "order": [6, 7, 16, 21, 32, 40, 42, 52, 54, 56, 57, 58, 60, 62, 63], "achiev": [7, 13, 20, 47, 54, 58, 59], "desir": [7, 51, 58], "comprehend": [7, 45, 54, 56, 64], "create_a_copi": 7, "add_new_featur": 7, "add_on": [7, 62], "sum_all_column": 7, "As": [7, 32, 47, 48, 50, 52, 56, 64], "increas": [7, 16, 29, 33, 52, 59, 64], "purpos": [6, 7, 27, 47, 54, 59], "numer": [7, 24, 32, 47, 48, 54, 64, 66, 67, 68], "develop": [7, 15, 27, 48, 52, 64, 68, 74], "bundl": 7, "relat": [7, 50, 57, 59, 68], "cohes": 7, "dataclass": [7, 19, 24], "pydant": [7, 45, 51], "model": [2, 7, 38, 45, 48, 49, 53, 63, 68, 73], "zip_path": 7, "raw_train_path": 7, "raw_test_path": 7, "processed_train_path": 7, "processed_test_path": 7, "none": [2, 6, 7, 27, 30, 32, 34, 39, 45, 46, 48, 50, 52, 54, 57, 58, 60, 62, 64, 67, 68], "class": [7, 15, 18, 32, 33, 45, 47, 48, 51, 52, 54, 55, 56, 57, 59, 62, 64, 67, 74], "rawloc": 7, "path_train": 7, "path_test": 7, "processedloc": 7, "raw_loc": 7, "processed_loc": 7, "get_data": [7, 57, 58, 65, 68], "is_csv": 7, "read_pickl": [7, 48], "pkl": [2, 7, 48, 52, 59], "yourself": [7, 64], "get_csv_data": 7, "get_pickle_data": 7, "short": [7, 48, 50, 59, 62, 67, 68, 73], "purchas": 7, "shipping_fe": 7, "simplifi": [7, 54, 60, 68, 73], "group": [7, 14, 27, 45, 47, 48, 50, 52, 58, 59, 60, 64], "within": [2, 7, 47, 48, 49, 52, 54, 56, 58, 59, 66], "instanc": [7, 19, 48, 52, 54, 56, 58, 59], "is_numb": 7, "flow": [7, 57, 62, 67, 68], "program": [7, 48, 50, 52, 57, 64, 68], "base": [2, 7, 15, 27, 35, 38, 45, 51, 54, 56, 59, 60, 63, 64], "evalu": [7, 25, 34, 52, 59], "encount": [7, 34, 68], "actual": [7, 52, 53, 58, 59, 64, 68], "occur": [7, 29, 47, 54, 59, 60, 68], "possibl": [7, 9, 32, 47, 50, 51, 59], "low": [7, 31, 32, 47, 56, 59], "enhanc": [7, 47, 49, 51, 52, 59, 62], "speed": [7, 9, 31, 32, 54, 62], "divis": [7, 48, 58], "zero": [7, 53, 58, 60, 67], "zerodivisionerror": [7, 68], "explicit": [7, 45, 54, 63], "precis": [7, 32, 47, 50, 52, 68], "caus": [7, 29, 33, 54, 56], "consequ": 7, "messag": [7, 24, 39, 57, 58, 62, 63, 64, 67, 68], "cannot": [2, 7, 19, 21, 25, 26, 27], "divid": [7, 14, 26, 48, 50, 56, 58, 68], "though": [7, 32, 52], "accur": [7, 48, 54, 58, 59, 68], "22": [7, 18, 31, 33, 35, 47, 48, 49, 50, 52, 54, 59, 60, 65, 68, 73], "unsupport": 7, "operand": 7, "potenti": [2, 7, 11, 32, 47, 50, 52], "problemat": 7, "post": [7, 16, 31, 48, 50, 52, 54, 59], "success": [7, 52, 58, 68], "action": [7, 48, 52, 56, 60, 66], "messi": [7, 66, 73], "harder": [7, 58, 68], "clear": [7, 15, 52, 58, 62], "sum_num": 7, "mean_num": 7, "unintention": 7, "trigger": 7, "process": [2, 7, 20, 31, 32, 37, 45, 46, 48, 50, 51, 52, 57, 58, 59, 60, 62, 64, 67, 68, 73], "overwrit": [7, 46, 52, 54, 58, 64, 65, 73], "if__name__": 7, "uppercas": [8, 56, 67], "abcd": [8, 11], "isupp": [8, 67], "satisfi": [8, 42, 48, 67], "given": [6, 8, 33, 51, 52, 54, 58, 59, 65, 67, 68, 73], "lambda": [8, 18, 21, 25, 29, 40, 47, 54, 57, 62, 64], "everi": [8, 21, 33, 47, 54, 58, 64, 66, 67, 68, 73, 74], "kei": [8, 30, 33, 34, 35, 45, 47, 48, 51, 53, 54, 55, 56, 58], "paramet": [8, 9, 21, 31, 32, 33, 36, 46, 49, 52, 56, 65, 68, 73], "by_lett": 8, "revers": [9, 40], "by_pric": 8, "whether": [23, 34, 42, 48, 52, 56, 58, 59, 67], "check_mention_fruit_1": 8, "got": [8, 14, 29, 33, 50, 54, 64], "check_mention_fruit_2": 8, "besid": [9, 49], "home": [9, 36, 47, 50, 52, 53, 54, 55, 58, 60, 65, 67, 73], "wa": [9, 32, 47, 54, 58, 66], "pick": [9, 54, 64], "to_do_tonight": 9, "attend": [9, 59], "parti": 9, "exercis": [9, 31, 60], "weigh": 9, "ten": [9, 19, 24, 63], "random_num": 9, "larg": [9, 16, 29, 36, 40, 48, 50, 52, 54, 56, 58, 59, 60], "sort": [9, 21, 32, 42, 48, 54, 56, 73], "get_n_max_sort": 9, "get_n_max_heapq": 9, "nlargest": [9, 40], "time_sort": 9, "global": [9, 18, 67], "time_heapq": 9, "ratio": [9, 16, 54, 57, 59], "round": [9, 47, 50, 52, 57, 58, 62], "experi": [9, 18, 21, 47, 48, 49, 52, 54, 57, 58, 59, 60, 70], "827": 9, "obtain": [10, 23, 35, 45, 48, 52, 59, 74], "uniqu": [10, 40, 48, 50, 54, 55, 59], "element": [10, 13, 27, 40, 50, 58, 60, 62, 63, 67], "convert": [10, 29, 31, 32, 37, 45, 48, 50, 53, 55, 56, 60, 63, 64, 67, 68, 73], "requirement1": 10, "statsmodel": [10, 52], "requirement2": 10, "matplotlib": [10, 42, 52, 54, 59], "fruits_str": 11, "todai": [11, 16, 24, 29, 52, 54, 58, 60, 67], "comb": [11, 21], "nums_2": 11, "chars_2": 11, "assign": [2, 13, 19, 48, 56, 57], "simultan": [13, 56, 57], "practic": [13, 51, 58, 68], "longer": [11, 13, 50, 58, 65, 68], "subset": [13, 31, 40, 47, 48, 54, 59, 60], "splat": 13, "don": [13, 19, 20, 26, 48, 58, 60, 65, 73], "normal": [14, 18, 20, 21, 22, 25, 26, 35, 48, 49, 52, 54], "6666666666666665": 14, "prefer": [14, 23, 35, 50, 56], "There": [14, 29, 52, 54, 58, 59, 68], "function": [14, 22, 24, 37, 45, 48, 51, 52, 54, 56, 57, 59, 60, 73, 74], "exactli": [14, 26, 47, 48, 50, 52, 54, 59, 60, 62, 67], "3752999689475413": 14, "2251799813685248": 14, "cool": [14, 25, 26, 48, 54, 60, 65], "limit": [14, 16, 21, 32, 45, 48, 51], "limit_denomin": 14, "object": [6, 14, 18, 26, 29, 31, 32, 33, 34, 35, 36, 37, 39, 45, 47, 48, 52, 53, 54, 59, 60, 62, 68, 73], "again": [14, 49, 68], "figur": [14, 26, 48, 49, 52, 54, 59, 67], "out": [14, 26, 31, 34, 47, 48, 50, 54, 59, 62, 64, 66, 67, 68], "mani": [14, 33, 50, 51, 52, 53, 60, 66, 67, 68], "digit": [14, 16, 45, 48, 54, 62, 67], "visual": [14, 49, 59, 63, 66, 73], "thousand": [14, 16, 48, 54], "large_num": 14, "1_000_000": [14, 32, 47], "integ": [14, 16, 19, 21, 24, 27, 32, 45, 49, 51, 64, 68], "check": [14, 15, 24, 27, 31, 47, 50, 52, 65, 66, 67, 68, 73], "remaind": 14, "n": [14, 21, 31, 39, 42, 47, 48, 50, 52, 53, 54, 55, 58, 59, 60, 63, 64, 65, 67, 68], "select": [14, 29, 31, 45, 47, 48, 50, 51, 52, 54, 56, 58, 59, 62], "whose": [14, 29, 33, 34, 35, 37, 42, 60], "get_multiples_of_n": 14, "elif": [2, 6, 15, 34, 56, 58, 59, 68], "case": [15, 21, 37, 38, 42, 45, 48, 52, 54, 56, 59, 67, 73, 74], "get_youngest_pet": 15, "pet_info": 15, "age1": 15, "age2": 15, "min": [15, 31, 32, 40, 45, 47, 53, 58, 67], "dict": [15, 20, 27, 45, 47, 51, 54, 59, 62], "pet_info1": 15, "pet_info2": 15, "compon": [15, 52, 54, 59, 60], "comput": [15, 25, 26, 32, 41, 47, 48, 49, 52, 54, 56, 57, 58, 68], "meaning": [2, 15, 48, 58, 59], "math": [15, 18, 26, 42, 64, 68], "diamet": 15, "circl": [15, 49], "area": [15, 52, 54, 59, 60, 66], "error": [2, 6, 15, 19, 24, 27, 29, 34, 42, 45, 52, 54, 62, 63, 64, 67, 68, 76], "quickli": [15, 31, 47, 48, 50, 52, 54, 60, 67], "identifi": [15, 45, 52, 54, 58, 59, 64, 67, 68], "exact": [15, 48, 49, 52, 54, 58, 62], "illustr": [15, 59], "trackback_test": 15, "greet": 15, "greetng": 15, "typo": [15, 48], "khuyen": [15, 16, 18, 23, 36, 40, 42, 47, 52, 54, 55, 58, 60, 65, 67, 68, 73, 74], "user": [15, 23, 42, 45, 47, 48, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 63, 65, 67, 68, 73], "khuyentran": [15, 52, 54, 55, 58, 59, 60, 67, 73], "book": [15, 23, 24, 34, 36, 39, 42, 47, 48, 50, 52, 54, 55, 58, 60, 63, 64, 65, 67, 68, 73], "efficient_python_tricks_and_tools_for_data_scientist": [15, 23, 42, 52, 58, 73], "chapter1": 15, "nameerror": 15, "did": 15, "shown": [16, 42, 58], "3123": 16, "1f": [16, 38], "2f": [16, 32, 47, 52, 54, 67], "31": [16, 47, 48, 49, 50, 53, 58, 59, 60, 65, 67, 68, 73], "curli": 16, "bracket": [16, 25, 34, 63], "45": [16, 32, 45, 47, 48, 49, 56, 59, 60, 67, 68], "p": [16, 45, 49, 52, 54, 59, 60, 68, 73], "pm": [16, 51, 59, 60], "saturdai": [16, 50, 59], "02": [16, 33, 48, 49, 50, 52, 58, 59, 60, 63, 73], "hour": [16, 33, 47, 48, 58, 59, 60, 67, 68], "am": [16, 48, 54, 58, 60], "wake": 16, "08": [16, 48, 49, 52, 54, 58, 59, 60, 67, 68, 73], "09": [16, 33, 48, 49, 50, 52, 55, 56, 57, 58, 59, 60, 62, 68, 73], "100000000": 16, "total": [16, 32, 33, 45, 48, 56, 57, 58, 59, 60], "itertool": [16, 17, 52, 62], "permut": 16, "j": [16, 21, 48], "sentenc": [16, 50, 54, 58], "nice": [16, 19, 21, 25, 26, 46, 47, 48, 50, 54, 55, 58, 65, 67, 68, 73], "No": [16, 50, 51, 52, 54, 58, 60], "stop": [16, 42, 54, 57, 60], "posit": [6, 16, 21, 35, 38, 45, 47, 49, 51, 52, 54, 59, 73], "search": [16, 46, 49, 59, 64], "pattern": [16, 25, 40, 50, 59, 60], "swap": [2, 16, 62], "sundai": 16, "match_pattern": 16, "sent": [16, 54], "nice_dai": 16, "regrex": 16, "veri": [16, 19, 48, 50, 52, 54, 59, 61, 68], "long": [16, 40, 45, 47, 50, 54, 57, 58, 59, 63, 67], "break": [16, 45, 67, 68], "parenthes": 16, "backslash": 16, "made": [16, 50, 54, 63, 66], "ident": [16, 26, 56, 58], "mayb": 16, "grammar": 16, "three": [16, 50, 59, 60, 63, 67], "cross": [16, 50, 52], "drop": [16, 29, 40, 46, 52, 59], "come": [16, 19, 25, 26, 46, 48, 49, 50, 52, 54, 57, 58, 59, 60, 65, 66, 67, 68, 73], "handi": [16, 19, 25, 26, 46, 48, 50, 52, 54, 57, 58, 59, 60, 65, 66, 67, 68, 73], "text1": 16, "text2": 16, "khuen": 16, "9523809523809523": 16, "tool": [16, 24, 28, 50, 51, 52, 55, 60, 62, 64, 66, 68, 70, 73, 74], "pencil": 16, "pen": [16, 59], "erasor": 16, "ink": 16, "pencel": 16, "closer": [16, 50, 54], "argument": [11, 16, 24, 27, 35, 47, 52, 54, 58, 60, 63, 65, 67, 68], "cutoff": [16, 48, 59], "collect": [17, 40, 47, 48, 52, 54, 56, 58, 59, 60, 67, 68, 73], "functool": 17, "pydash": 17, "deal": [15, 18, 26, 31, 48, 50, 59, 66], "slow": [18, 58], "ineffici": [18, 21, 32], "char_list": 18, "custom_count": 18, "list_": 18, "char_count": 18, "custom": [18, 33, 45, 50, 54, 56, 58, 63, 65, 67, 68, 73], "num_list": [18, 21], "numexp": 18, "custom_tim": 18, "counter_tim": 18, "6199148843686806": 18, "small": [18, 36, 40, 47, 48, 50, 52, 57, 59], "manag": [18, 48, 50, 52, 54, 56, 58, 66], "project": [18, 44, 45, 50, 52, 54, 57, 58, 60, 63, 66, 68, 73, 74], "person": [18, 54], "attribut": [6, 15, 18, 19, 27, 67, 73], "gender": [18, 48, 50, 54, 60], "male": [18, 50, 60], "femal": [18, 50, 60], "just": [2, 18, 25, 50, 51, 52, 53, 54, 59, 60, 63, 65, 66, 68, 73], "obj": [2, 18, 34, 39], "b23": 18, "physic": [18, 47, 56, 73], "d24": 18, "spanish": [18, 48], "cleanest": 18, "food_pric": 18, "ignor": [18, 27, 31, 48, 52, 54, 56, 58, 60, 62, 65, 68, 73], "unordered1": 18, "unordered2": 18, "ordered1": 18, "ordered2": 18, "across": [2, 18, 45, 47, 48, 49, 52, 56, 59, 62, 67], "tomato": 18, "veggi": 18, "carrot": [18, 50, 51], "map": [18, 21, 25, 47, 48, 49, 54, 67, 68], "avail": [19, 27, 47, 48, 50, 52, 59, 65, 67], "represent": [19, 52, 54, 59], "few": [19, 47, 48, 50, 52, 53, 54, 55, 56, 57, 59, 60], "decor": [2, 19, 27, 48, 57, 58, 63, 67, 68], "top": [19, 47, 50, 51, 52, 54, 56, 59, 60, 63, 68, 76], "dataclassdog": 19, "appropri": [19, 20, 58, 73], "__repr__": 19, "present": [19, 47, 50, 54, 58, 59, 63, 67], "cumbersom": [19, 53, 58, 65], "anybodi": 19, "adjust": [19, 35, 47, 52, 56, 63], "throw": [19, 29, 50], "golden": [19, 50], "frozeninstanceerror": 19, "ipython": [19, 25, 48, 62, 67], "input": [15, 19, 24, 25, 45, 46, 51, 52, 56, 59, 60, 63, 67, 68, 73], "0d6f339835b8": 19, "string": [19, 24, 27, 33, 40, 46, 48, 50, 53, 57, 63, 67, 73], "__setattr__": 19, "field": [19, 45, 50, 54, 62, 67, 74], "implement": [19, 20, 24, 29, 52, 54, 58, 59, 68, 73], "automat": [19, 24, 32, 45, 47, 50, 52, 54, 57, 58, 67, 73], "___init__": 19, "initi": [19, 25, 47, 48, 49, 50, 52, 53, 58, 59, 65], "__post_init__": 19, "info": [19, 32, 33, 47, 51, 52, 54, 57, 58, 59, 62, 65, 67, 68, 73], "zip": [19, 52, 54, 55, 59, 64], "fix": [20, 33, 45, 54, 58, 59, 68, 73], "linear_func": 20, "linear_func_parti": 20, "data2": 20, "process_dict": 20, "process_list": 20, "choos": [20, 32, 34, 52, 57], "right": [20, 26, 39, 40, 62, 63, 66, 67, 73, 76], "process_data2": 20, "notimplementederror": 20, "pleas": [20, 47, 50, 52, 55, 60], "regist": [20, 50, 56, 60, 67], "process_dict2": 20, "process_list2": 20, "left": [20, 26, 39, 40, 59, 62, 63, 67, 73], "singl": [20, 29, 45, 47, 48, 52, 56, 59, 63, 68], "add_num": 20, "matter": [21, 48], "naiv": [21, 67], "param": [21, 47, 52, 58], "learning_r": 21, "1e": [21, 52, 59], "batch_siz": 21, "32": [21, 45, 47, 48, 49, 50, 52, 59, 60, 62, 65, 68], "64": [21, 48, 49, 57, 59], "001": [21, 49, 57, 60, 62], "ipykernel_38110": 21, "240000324": 21, "miss": [21, 32, 38, 50, 54, 58], "lemon": 21, "chosen": 21, "ipykernel_40588": 21, "2755098589": 21, "indic": [8, 21, 22, 42, 50, 52, 54, 56, 58, 59], "slice": [21, 29, 50], "key_func": 21, "aggreg": [11, 21, 45, 56, 59], "fill": [21, 30, 54, 67], "fillvalu": 21, "word": [21, 34, 48, 58, 60, 62, 67], "abcnic": 21, "upper": [21, 34, 35, 45, 48, 52, 53, 54, 56, 59, 60, 67], "islow": [21, 67], "join": [21, 23, 37, 40, 42, 45, 47, 54, 67], "export": [22, 52, 60, 63, 65, 73], "correspond": [6, 22, 47, 48, 62, 67], "intrins": 22, "syntax": [15, 22, 49, 55, 56, 62, 63, 66], "easi": [23, 24, 28, 47, 48, 49, 50, 51, 54, 55, 57, 58, 60, 62, 63, 64, 66, 68], "choic": [23, 32, 47, 51, 56, 63, 68], "exist": [23, 45, 47, 51, 59, 60, 62, 65, 68, 73], "makedir": [23, 47], "new_fil": 23, "txt": [23, 46, 52, 58, 60], "open": [21, 23, 28, 48, 50, 52, 59, 62, 65, 67, 73, 74], "w": [23, 48, 52, 62], "world": [23, 31, 50, 51, 54, 59, 63, 68], "mkdir": [23, 58, 68, 73], "exist_ok": [23, 47, 68], "write_text": [23, 58, 68], "read_text": [23, 45, 58], "document": [23, 29, 49, 52, 54, 60, 67, 68], "pictur": [23, 48, 50], "manipul": [23, 28, 45, 47, 56, 60, 63], "touch": [23, 58], "tree": [23, 52, 58, 64], "grep": 23, "grandpar": 23, "cwd": 23, "chapter2": 23, "relative_to": 23, "nlp": 23, "scienc": [23, 47, 48, 49, 50, 52, 54, 60, 61, 66, 74], "root": [23, 26, 52, 54, 58, 67], "posixpath": [23, 58], "samefil": 23, "absolut": [23, 42, 52, 59], "ipynb": [23, 42, 60, 68, 73], "kitchen": [25, 68], "sink": 25, "util": [25, 42, 45, 47, 54, 58, 59, 63, 65, 67, 68], "stuff": [25, 48], "py_": 25, "ye": [25, 26, 60, 66], "could": [25, 26, 38, 47, 48, 49, 54, 60, 63, 65, 66, 67, 73], "done": [25, 26, 38, 52, 66, 73], "walmart": [25, 40, 58, 62], "season": [25, 50, 54, 59, 60], "in_season": 25, "aldi": [25, 40, 58, 62], "out_of_season": 25, "wouldn": [25, 26, 46, 47, 48, 54, 58, 60, 65, 67, 68, 73], "dot": [25, 60], "notat": 25, "filter_fruit": 25, "valueerror": [2, 11, 15, 19, 25, 42, 58, 67, 68], "b01bf8b7ae1a": 25, "0x7f9880491310": 25, "find_index": 25, "what": [25, 32, 47, 48, 50, 51, 52, 53, 54, 58, 60, 62, 65, 66, 67], "filter_": 25, "map_": 25, "bought": 25, "reject": [25, 47], "startswith": [25, 67], "0x7f027895d1f0": 25, "note": [25, 32, 52, 59], "final": [25, 56, 59, 68], "lazi": 25, "hold": [25, 55, 59], "express": [25, 26, 50, 54, 55, 60, 68], "until": [25, 47, 50, 54, 56, 58, 68], "total_pric": 25, "wish": [26, 62, 63, 67], "algebra": 26, "eq": 26, "bore": 26, "mathemat": 26, "let": [26, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 63, 65, 68], "over": [21, 26, 29, 45, 54, 59, 73, 74], "amaz": 26, "squar": [26, 48, 60], "decim": [26, 42, 52, 58, 63, 67], "242640687119285": 26, "sqrt": [26, 51, 63, 68], "displaystyl": [26, 63, 73], "tri": [26, 31, 54, 73], "fraction": [26, 48, 53], "25": [26, 31, 33, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 62, 64, 68], "6666666666666667": 26, "frac": [26, 63], "ration": 26, "real": [26, 45, 51, 54, 58], "power": [26, 28, 45, 47, 51, 52, 58, 62, 65, 66, 68], "abil": [26, 54], "expr": 26, "term": [26, 49, 52, 54, 59, 63], "happen": [26, 47, 58, 67], "aha": 26, "remain": [11, 26, 50, 52, 58], "unevalu": 26, "why": [26, 50, 52, 53, 54, 63, 74], "would": [26, 32, 47, 48, 52, 54, 58, 59], "kind": [26, 31, 32], "school": [26, 48, 50], "life": [26, 48], "expans": 26, "pretti": [26, 45], "isn": 26, "One": [26, 32, 38], "question": [26, 48, 50, 52, 58, 59], "luckili": [26, 48, 60, 73], "6x": 26, "fun": [26, 48, 50], "look": [26, 48, 50, 52, 54, 58, 59, 60, 65, 67, 73], "trigsimp": 26, "sec": [26, 49, 59, 67], "co": [26, 54], "sin": [26, 60, 63], "tan": 26, "cot": 26, "calculu": 26, "worri": 26, "infin": 26, "oo": 26, "factori": [26, 67], "rewrit": [26, 45, 47, 56, 58], "past": [26, 38, 42, 47, 50, 59], "notebook": [26, 38, 42, 52, 59, 65, 67, 74, 76], "markdown": [26, 42, 55, 63, 65, 67, 73], "sure": [27, 52, 54, 58, 73], "correct": [27, 45, 48, 52, 54, 56, 58, 64, 68], "mypi": 27, "callable_exampl": 27, "multiply_then_divide_by_two": 27, "multiply_func": 27, "static": [27, 58], "checker": 27, "inde": 27, "1m": [27, 54, 58, 64, 65, 67, 73], "32msuccess": 27, "issu": [6, 27, 32, 33, 54, 56, 58, 64, 66, 76], "sourc": [24, 27, 28, 47, 48, 54, 59, 60, 62, 63, 64, 65, 66, 67, 68, 74, 76], "fruit_typ": 27, "make_fruit": 27, "type_example_wrong": 27, "31merror": [27, 64, 67], "33m": [27, 58, 67, 73], "incompat": [27, 64, 65], "expect": [27, 52, 59, 64, 68, 73], "31mfound": [27, 64], "type_example_right": 27, "measur": [27, 48, 54, 73], "typing_annot": 27, "get_height_in_feet": 27, "height": [27, 48, 60], "meter": 27, "28084": 27, "typecheck": 27, "safe": [27, 52], "shouldn": 27, "typing_fin": 27, "bark": [27, 58, 60], "ruff": 27, "overrid": 27, "previous": [27, 32, 56], "misc": 27, "typing_liter": 27, "share": [2, 27, 50, 52, 65, 66, 74], "scalabl": [27, 59], "last_int": 27, "last_str": 27, "gener": [27, 31, 32, 47, 48, 51, 52, 64, 66], "adapt": 27, "invok": [27, 56], "infer": [27, 32, 45, 52, 58, 59, 68], "typevar_exampl": 27, "dict_valu": 27, "fast": [28, 48, 50, 53, 68], "analysi": [28, 45, 47, 54, 63, 65, 67], "textblob": [29, 52, 58], "get_sum": 29, "get_diff": [], "col1": [29, 31, 32, 34, 36, 38, 39, 40, 47, 49, 57, 58, 67], "col2": [29, 31, 32, 34, 36, 38, 39, 40, 47, 49, 57, 58, 67], "along": [29, 40, 48, 49, 65], "applymap": 29, "fail": [2, 6, 29, 64, 65, 68, 73], "everyth": [29, 57], "col3": [29, 32, 40, 47, 49], "col4": 29, "103": [29, 57], "309": [29, 58], "204": 29, "816": 29, "dtype": [29, 31, 33, 34, 35, 37, 39, 40, 47, 48, 52, 53, 54, 57, 58, 59, 73], "int64": [29, 31, 32, 33, 34, 35, 40, 45, 47, 52, 57, 59, 73], "insert": [29, 40, 45, 47, 49, 51, 57, 58, 59, 67, 73], "format": [15, 29, 32, 40, 45, 47, 48, 50, 51, 55, 59, 60, 62, 63, 67, 68, 73], "berri": [29, 54], "cherri": [29, 50], "garden": 29, "comma": [29, 65, 73], "fillna": [29, 54], "ffill": 29, "stand": [29, 73], "nan": [29, 30, 33, 35, 38, 40, 47, 48, 53, 54, 58, 60, 73], "mode": [29, 59, 60, 65, 67], "astyp": [29, 32, 36, 60], "encoded_col1": 29, "involv": [29, 47, 52, 54, 56, 58], "intend": [29, 50, 56, 68], "copi": [29, 38, 42, 45, 48, 53, 67], "ipykernel_77093": 29, "431778579": 29, "settingwithcopywarn": 29, "loc": [29, 30, 33, 34, 37, 49, 59], "row_index": 29, "col_index": 29, "caveat": 29, "pydata": 29, "org": [29, 31, 47, 52, 62, 73], "stabl": [29, 60, 73], "user_guid": 29, "html": [29, 48, 50, 52, 59, 60, 63, 73], "view": [29, 31, 46, 47, 49, 53, 54, 55, 57, 60, 65, 66, 74], "versu": 29, "chained_assign": 29, "settingwithcopyerror": 29, "non": [30, 32, 33, 34, 57, 58, 65, 67, 68], "store1": 30, "store2": 30, "df1": [30, 31, 35, 39, 40, 47, 48], "key1": 30, "df2": [30, 31, 35, 39, 40, 47], "key2": 30, "left_on": [30, 48], "right_on": [30, 48], "value_x": 30, "value_i": 30, "a_x": [], "a_i": [], "belong": [52, 60], "left_kei": [], "right_kei": [], "a_left": [], "a_right": [], "_left": [], "_right": [], "match": [24, 30, 34, 35, 47, 52, 56, 58, 59, 60, 63, 65, 68], "outer": [30, 40], "v1": [30, 45, 54, 64], "v2": [30, 54, 64], "tip": [31, 48, 60, 74], "load": [2, 21, 31, 45, 46, 50, 52, 54, 55, 56, 57, 59, 60, 68, 73], "queri": [31, 45, 49, 51, 55, 58, 59, 65, 73], "push": [31, 53], "down": [31, 50, 68], "filer": 31, "engin": [31, 45, 56, 57, 62, 68], "optim": [31, 45, 49, 50, 52, 57, 59, 60, 64], "dataset": [2, 21, 29, 31, 32, 34, 47, 49, 56, 57, 58, 59, 60], "113": [31, 49], "file_path": [2, 31], "num_row": [31, 47], "100_000_000": 31, "id": [30, 31, 45, 46, 47, 50, 51, 54, 55, 56, 59, 60, 64, 68, 73], "rand": [31, 47, 60], "row_group_s": 31, "2_000_000": 31, "read_parquet": [31, 45, 47], "50000": [31, 48], "106": [31, 58], "19": [31, 33, 45, 47, 48, 49, 59, 60, 65, 67, 68, 73], "414": [31, 59], "index_col": [31, 59], "download": [31, 45, 50, 52, 54, 60, 67, 76], "github": [31, 38, 45, 48, 49, 52, 54, 60, 62, 64, 73, 76], "click": [31, 49, 54, 55, 60, 67, 73, 76], "raw": [31, 47, 48, 50, 52, 59, 60, 66], "link": [31, 33, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "githubusercont": [31, 47, 48, 59, 60, 66], "mwaskom": [31, 47], "seaborn": [31, 47, 48, 52, 54, 65], "master": [31, 47, 48, 58, 59, 60, 66], "head": [31, 47, 48, 49, 50, 53, 54, 58, 59, 60, 62, 63, 68], "diet": [31, 48], "puls": 31, "fat": [31, 54], "85": [31, 48, 49, 54, 59], "88": [31, 47, 48, 49, 50, 57, 58, 67, 73], "90": [6, 31, 47, 48, 52, 54, 59, 64], "92": [31, 49, 54, 59, 60], "consum": [2, 31, 32, 47, 50, 52, 54, 58, 60, 63, 67], "amount": [31, 48, 52, 56, 59], "chunksiz": [31, 47], "5495": 31, "warn": [31, 47, 48, 52, 54, 56, 58, 60, 62, 67, 68, 73], "filterwarn": 31, "flight_data_2018_to_2022": 31, "33": [31, 42, 48, 49, 58, 59, 68], "58": [31, 47, 48, 49, 52, 56, 57, 59, 60, 63, 68, 73], "563737": 31, "120": [31, 48, 59, 67, 68], "424": [31, 57], "portion": [21, 31, 57], "df_chunk": 31, "df_": [31, 40, 57], "63737": 31, "read_html": 31, "wikipedia": 31, "en": [31, 50, 54, 60, 73], "wiki": 31, "poverti": 31, "region": [31, 59, 60], "94": [31, 47, 48, 49, 59], "95": [31, 34, 47, 48, 49, 52, 58, 59, 60, 62], "2002": [31, 50, 59], "2004": [31, 50, 59], "1981": 31, "2008": [31, 50], "2010": [31, 48, 59], "2015": [31, 50, 59], "2018": [31, 33, 50], "east": [31, 48, 50, 60], "asia": [31, 48, 59, 63], "pacif": [31, 48], "77": [31, 45, 59, 60, 62, 67, 68], "80": [6, 31, 48, 49, 52, 59, 60, 62, 64], "34": [31, 38, 48, 49, 56, 59, 60, 65, 68, 73], "europ": [31, 59], "central": [31, 48, 50, 59, 60], "latin": 31, "america": [31, 59], "caribbean": 31, "middl": 31, "north": [31, 48, 49, 50, 59], "africa": [31, 63], "south": [31, 48, 50, 59, 60], "35": [31, 35, 45, 48, 49, 52, 54, 56, 57, 59, 60, 62, 65], "61": [31, 48, 49, 59], "36": [31, 48, 49, 50, 52, 56, 57, 59, 60, 62], "49": [31, 42, 47, 48, 49, 56, 58, 59, 60, 62, 64, 68, 73], "26": [31, 48, 49, 50, 57, 58, 59, 60], "saharan": 31, "42": [2, 31, 32, 47, 48, 52, 60, 68], "51": [31, 48, 49, 52, 56, 60, 62], "47": [31, 48, 58, 59, 60, 68, 73], "54": [31, 50, 54, 56, 57, 59, 62], "40": [31, 47, 48, 49, 50, 52, 58, 59, 60, 62, 68], "52": [31, 39, 48, 49, 59, 60], "27": [31, 32, 33, 48, 49, 58, 59, 60, 73], "refer": [31, 54, 57, 62, 63, 68], "affect": [31, 59, 60], "df3": [31, 47], "been": [31, 52, 55, 59, 66, 67], "offer": [24, 31, 32, 47, 51, 53, 58, 59, 62, 63], "copy_on_writ": 31, "manual": [24, 32, 45, 48, 50, 52, 57, 63, 64, 66, 68], "data_typ": 32, "core": [32, 33, 34, 36, 46, 47, 48, 49, 57, 58, 59, 60, 62, 67, 73], "frame": [32, 33, 39, 42, 57, 60, 67], "rangeindex": [32, 33, 57], "entri": [21, 32, 33, 48, 57], "null": [32, 33, 35, 51, 52, 53, 57, 58], "count": [32, 33, 40, 45, 48, 53, 54, 56, 57, 60, 62, 67], "float64": [32, 35, 47, 52, 57, 58, 59], "200": [2, 32, 47, 48, 52, 57, 59], "byte": [32, 33, 50, 52, 57], "cardin": [32, 48, 53], "categori": [32, 34, 36, 47, 49, 51, 52, 54, 56, 59, 60], "sklearn": [2, 32, 48, 49, 50, 53, 54, 57, 58, 60, 64, 67, 73], "load_iri": [32, 48, 52, 53], "as_fram": [32, 49, 50, 52, 53, 57, 60], "return_x_i": [32, 48, 52, 53, 57], "concat": [32, 40, 47, 49, 50, 52, 56], "target": [32, 45, 47, 48, 49, 52, 59, 60, 68], "memory_usag": 32, "128": [32, 48, 59, 68], "sepal": 32, "length": [11, 32, 34, 52, 54, 59, 67], "cm": 32, "1200": 32, "width": [32, 60, 67], "petal": 32, "282": [32, 68], "almost": 32, "fifth": 32, "tell": [24, 32, 48, 52, 60], "smallest": [32, 42], "Or": 32, "sort_valu": [32, 36, 48, 56, 63], "mix": [32, 52, 63], "slower": 32, "still": [32, 58, 59, 68], "after": [31, 32, 48, 49, 50, 54, 57, 59, 64, 65, 67, 73], "remov": [32, 36, 47, 48, 50, 54, 58, 60, 62, 63, 67, 73], "save": [32, 45, 46, 47, 50, 52, 58, 60, 63, 65, 66, 68, 73], "random_numb": 32, "132": [32, 47, 48, 49, 59, 68], "35960884": 32, "inferred_df": 32, "8000000": 32, "loss": [32, 47, 60, 68], "s1": 32, "integr": [32, 47, 48, 50, 53, 58, 63], "apach": [32, 47, 52], "arrow": [32, 45], "solv": [32, 53, 62, 63, 65], "s2": 32, "extra": [33, 47, 48, 65, 73], "step": [2, 33, 48, 52, 53, 54, 59, 60, 62, 66, 67], "date_column_1": 33, "date_column_2": 33, "datetime64": [31, 33], "ns": [31, 33, 58, 60], "usag": [33, 46, 51, 52, 56, 63, 65, 73], "176": [33, 57, 60], "month": [15, 33, 47, 48, 50, 59, 60, 66, 67, 74], "tseri": 33, "offset": [33, 50, 59], "bdai": 33, "ts": 33, "2024": [24, 33, 52, 58, 59, 67], "busi": [33, 59], "simpl": [33, 45, 48, 49, 50, 52, 54, 55, 59, 60, 63], "move": [33, 50, 59], "time_period": 33, "21": [2, 33, 35, 45, 47, 48, 49, 50, 52, 57, 59, 60, 63, 65], "24": [33, 47, 48, 49, 50, 52, 56, 57, 59, 60, 63, 67], "set_index": [33, 59], "imagin": [2, 24, 33, 48, 52, 57, 73], "groupbi": [33, 34, 45, 47, 48, 56, 58, 59], "instruct": [33, 48, 50, 53], "freq": [33, 47, 52, 54, 59, 73], "1w": 33, "week": [33, 48, 58, 59, 60, 67, 68], "to_datetim": [31, 33, 48, 50, 59], "easiest": [33, 50], "05": [24, 33, 34, 47, 48, 49, 50, 52, 54, 58, 59, 60, 73], "exclud": [33, 48, 54, 58], "datetimeindex": 33, "2019": [33, 48, 54, 60], "problem": [33, 50, 52, 53, 58], "date_rang": [33, 47, 60, 73], "07": [33, 47, 48, 49, 50, 56, 58, 59, 60, 63, 73], "new_index": 33, "conform": 33, "new_": 33, "fill_valu": 33, "comparison": [33, 38, 54, 63, 65, 67], "filtered_df": 33, "record": [33, 35, 47, 48, 57, 60], "04": [33, 47, 48, 49, 50, 52, 56, 57, 59, 60, 62, 73], "06": [33, 47, 48, 49, 50, 52, 56, 58, 59, 60, 68, 73], "2d": [33, 54, 60, 73], "dropna": [2, 33, 35, 48, 60, 64], "fastest": [34, 50], "attempt": [2, 34, 47, 64, 68], "o": [34, 47, 48, 59], "shorter": [11, 34], "indexingerror": 34, "ipykernel_791962": 34, "4076731999": 34, "venv": [24, 34, 36, 39, 42, 47, 54, 58, 60, 64, 65, 67, 68], "lib": [24, 34, 36, 39, 42, 47, 54, 59, 60, 64, 65, 67, 68, 73], "python3": [24, 34, 36, 39, 42, 47, 54, 58, 59, 60, 64, 65, 67, 68, 73], "site": [24, 34, 36, 39, 42, 47, 54, 59, 60, 64, 65, 67, 68, 73], "packag": [24, 34, 36, 39, 41, 42, 47, 54, 59, 60, 62, 63, 64, 66, 67, 68], "__getitem__": 34, "929": 34, "930": [34, 59], "maybe_cal": 34, "apply_if_cal": [34, 57], "931": 34, "_getitem_axi": 34, "932": 34, "933": 34, "_is_scalar_access": 34, "1142": 34, "_get_slice_axi": 34, "1143": 34, "is_bool_index": 34, "1144": 34, "_getbool_axi": 34, "1145": 34, "is_list_like_index": 34, "1146": 34, "946": 34, "caller": [6, 34], "respons": [34, 50, 52, 58, 59], "ensur": [34, 40, 45, 47, 48, 52, 53, 55, 56, 58, 59, 68], "947": 34, "label": [34, 35, 40, 45, 49, 51, 52, 54, 56, 59, 60, 63], "_get_axi": 34, "948": 34, "check_bool_index": 34, "949": [34, 68], "ind": 34, "nonzero": 34, "950": 34, "_take_with_is_copi": 34, "2386": 34, "mask": [34, 37, 54], "isna": [34, 58], "_valu": 34, "2387": 34, "2388": 34, "2389": 34, "unalign": 34, "2390": 34, "charact": [34, 49, 67], "cat1": [34, 47, 48], "cat2": [34, 47, 48], "user1": [34, 45, 55, 62], "user2": [34, 45, 62], "user3": [34, 45], "is_all_nan": 34, "unusu": 34, "distort": 34, "statist": [34, 40, 47, 48, 52, 53, 57, 58, 59, 65, 67], "analys": [34, 52], "col0": 34, "trim": [34, 56], "quantil": 34, "lower": [34, 35, 37, 52, 53, 54, 56, 59, 67], "threshold": [34, 48, 52, 54], "bound": [35, 52, 59, 67], "larger": [35, 45, 47], "75": [35, 40, 47, 48, 49, 50, 51, 58, 59, 60, 67], "71": [35, 48, 49, 50, 68], "750000": 35, "714286": 35, "period": [35, 52, 59, 68], "diff2": 35, "leav": [35, 47, 60], "processed_df": [35, 56], "orient": [35, 48], "value_count": 35, "500000": [35, 48], "333333": [35, 53], "166667": 35, "943880": 35, "845154": 35, "roughli": [35, 54], "q": [35, 45, 47, 49, 59, 60], "999": [35, 49, 52], "667": 35, "max": [35, 40, 45, 47, 50, 52, 53, 58, 59, 67], "medium": [36, 50, 56], "mini": 36, "ordered_s": 36, "inplac": [36, 64], "2630": 36, "futurewarn": [36, 48, 52, 54, 56, 60], "deprec": 36, "unus": [36, 64, 73], "alwai": [36, 48, 52, 68], "oranga": 37, "appla": 37, "grapa": 37, "pricel": 37, "price2": [37, 58], "bunni": 37, "monkei": 37, "funni": [37, 50], "flower": [37, 67], "sub_str": 37, "ny": [37, 48], "ey": [37, 50], "join_str": 37, "neg": [2, 38, 45, 47, 49, 51, 52, 54, 58], "ones": [38, 47, 48, 52, 65, 73], "highlight_numb": 38, "white": [38, 50, 60], "nbsp": [38, 58], "predict": [2, 38, 45, 48, 51, 54, 58, 60], "predictions_1": 38, "predictions_2": 38, "real_label": 38, "highlight_cel": 38, "background_gradi": 38, "cmap": [38, 48, 60], "plasma": 38, "excel": [6, 38, 53, 54, 63], "sheet": [38, 53], "titl": [24, 38, 48, 49, 50, 52, 54, 59, 60, 63, 67, 68], "na_rep": 38, "to_excel": [38, 63], "formatted_fil": 38, "xlsx": 38, "tabul": 38, "readm": 38, "jupyt": [38, 42, 52, 59, 68, 74, 76], "tablefmt": 38, "grid": [38, 52, 60], "to_latex": 38, "editor": [38, 54, 60], "tabular": [38, 47, 49, 52, 57, 58, 59], "lrr": 38, "set_table_styl": 38, "selector": [38, 60], "toprul": 38, "prop": 38, "hline": 38, "midrul": 38, "bottomrul": 38, "column_format": 38, "assert_frame_equ": 39, "coll": [39, 40], "assertionerror": [39, 42, 58, 73], "skip": [39, 42, 62, 67], "hidden": [39, 42, 57, 58], "_lib": 39, "pyx": 39, "assert_almost_equ": 39, "167": 39, "_test": 39, "assert": [39, 42, 51, 56, 68, 73], "679": [39, 59], "raise_assert_detail": 39, "index_valu": 39, "676": [39, 47, 59], "677": [39, 59], "msg": [39, 42], "66": [39, 48, 58, 68], "66667": 39, "check_lik": 39, "align": [39, 58, 59], "counter": [40, 48, 54], "count_two": 40, "median": [40, 48, 52, 53, 58, 59], "etc": [40, 45, 49, 50, 52, 58, 64, 68], "g": [40, 48, 50, 52, 55, 58, 59, 65], "reset_index": [40, 59], "agg_method": 40, "mean_pric": 40, "summar": [40, 60], "aggfunc": 40, "compos": [40, 48, 52], "wide": [32, 40, 58, 59, 74], "costco": 40, "id_var": 40, "value_var": 40, "var_nam": 40, "network": [40, 54, 58, 59], "thinh": 40, "friends1": 40, "person1": 40, "person2": 40, "friends2": 40, "symmetr": 40, "friend": 40, "multiindex": 40, "stacked_df": 40, "nstack": 40, "get_dummi": [2, 40], "sep": [40, 67], "often": [15, 40, 45, 48, 50, 52, 53, 54, 56, 58, 59, 67, 68], "ax": [40, 49, 52, 54, 59, 60], "scientif": [41, 60], "multi": [42, 52, 60], "dimension": [42, 54], "new_arr": 42, "new_row_posit": 42, "fewer": [42, 74], "mask_al": 42, "AT": 42, "mask_ani": 42, "largest": [42, 52, 63], "argmax": 42, "highest": [42, 47], "probabl": [42, 48, 52, 59], "array_to_latex": 42, "a2l": 42, "to_ltx": 42, "bmatrix": 42, "greater": [24, 42, 56], "pyplot": [42, 52, 54, 59, 60], "plt": [42, 52, 54, 59, 60], "22222222": 42, "44444444": 42, "66666667": 42, "88888889": 42, "11111111": 42, "33333333": 42, "55555556": 42, "77777778": 42, "arang": [42, 52, 59, 60], "plot": [42, 48, 49, 50, 55, 59, 64], "assert_array_equ": 42, "arr1": 42, "arr2": 42, "chapter4": [42, 55, 58], "48": [42, 48, 52, 57, 59, 60, 73], "href": 42, "vscode": [42, 67], "ch0000052": 42, "truth": 42, "ambigu": 42, "ch0000053": 42, "_privat": 42, "844": 42, "assert_array_compar": 42, "err_msg": 42, "verbos": [42, 52, 54, 63], "header": [42, 45, 54, 63], "equal_nan": 42, "equal_inf": 42, "839": 42, "840": [42, 57], "remark": 42, "841": 42, "build_err_msg": 42, "ox": 42, "oy": 42, "842": 42, "843": 42, "845": [42, 49], "except": [15, 42, 51, 52, 62, 68], "846": 42, "mismatch": [42, 52], "rel": [42, 52, 54, 59], "222": [42, 57, 59], "221": [42, 68], "support": [45, 50, 51, 52, 54, 59, 62, 63, 73], "my_tabl": 45, "where": [45, 47, 48, 51, 52, 56, 59, 60, 62, 64, 67, 73], "start_dat": [31, 45, 47, 58], "pathlib": [45, 58, 68], "placehold": 45, "preprocess": [45, 52, 58, 59, 60], "rich": 45, "connect": [45, 51, 53, 58, 60, 73], "sqlalchemi": 45, "read_sql": 45, "create_engin": 45, "usernam": [45, 46, 50, 53, 54, 66], "password": [45, 46, 50, 53, 54], "host": [45, 49, 50, 53], "port": [45, 47, 49], "database_nam": 45, "table_nam": 45, "fugu": 45, "interfac": [2, 45, 47], "fugue_sql": 45, "fsql": 45, "input_df": [45, 47], "pandasdatafram": 45, "sqlite3": [45, 51], "conn": [45, 51], "db": [45, 51, 58], "cursor": [45, 51, 58], "create_table_sql": 45, "IF": [45, 48, 51], "NOT": [45, 51], "membership": 45, "primari": [2, 45, 51, 58], "autoincr": [45, 51], "activ": [45, 60, 65, 68], "insert_rows_sql": 45, "INTO": [45, 51, 58], "john": [32, 45, 47, 49, 51, 56, 58, 68], "jane": [45, 47, 56, 58], "mike": [45, 51], "close": [45, 50, 51, 54, 59, 67], "har": 45, "leverag": [29, 45, 47, 54, 58, 66], "annot": [45, 48, 51, 54, 63], "intuit": [45, 56, 59, 62], "session": [45, 73, 76], "primary_kei": 45, "through": [2, 45, 53, 54, 56, 58, 59, 60, 62, 64, 68, 73], "coercion": 45, "sqlite": [45, 51, 63], "metadata": [47, 54, 67], "create_al": 45, "lint": 45, "consist": [2, 45, 47, 48, 49, 52, 54, 58, 59], "style": [45, 56, 67, 73], "convent": 45, "free": [45, 50, 54, 58, 59, 76], "focu": 45, "task": [45, 47, 50, 51, 52, 54, 57, 58, 59, 60, 62, 67, 68, 73], "dialect": 45, "ansi": 45, "mysql": 45, "bigqueri": 45, "databrick": 45, "oracl": 45, "teradata": 45, "sqlfluff_exampl": 45, "AS": [45, 56], "foo": [45, 56, 63], "bar": [45, 54, 56, 60], "postgr": [45, 58], "30m": 45, "1msqlfluff_exampl": 45, "0m": [45, 52, 54, 56, 57, 58, 60, 63, 64, 65, 67, 73], "31mfail": 45, "34ml": 45, "lt09": 45, "0mselect": 45, "unless": 45, "34m": [45, 52, 54, 63], "0monli": 45, "1mlayout": 45, "select_target": 45, "st06": 45, "wildcard": 45, "calcul": [45, 57, 59, 60], "0mand": 45, "1mstructur": 45, "column_ord": 45, "lt02": 45, "0mexpect": 45, "indent": 45, "lt01": 45, "whitespac": [45, 54, 63, 67], "nake": 45, "0mbinari": 45, "binari": [45, 52], "cp01": 45, "0mkeyword": 45, "1mcapitalis": 45, "seamlessli": [45, 48, 52, 58, 59], "sentiment": [45, 51, 52, 54, 58], "pgml": 45, "transform": [45, 49, 51, 52, 54, 56, 58, 59, 60, 67], "classif": [45, 52, 58], "love": [45, 48, 50, 54], "amazingli": 45, "ml": [45, 64], "hate": 45, "mundan": 45, "thankless": 45, "score": [6, 45, 48, 52, 54, 58, 60], "9995759129524232": 45, "9903519749641418": 45, "train": [45, 49, 52, 53, 54, 60, 68], "relation_nam": 45, "y_column_nam": 45, "algorithm": [45, 52, 54, 59, 60], "xgboost": 45, "hyperparam": 45, "n_estim": [45, 58], "imag": [45, 50, 60, 65, 73], "quiet": [45, 55, 64], "wget": [45, 47, 54], "cwida": 45, "releas": [45, 47, 54, 57, 73], "lineitemsf1": 45, "snappi": 45, "parquet": [45, 56], "empow": 45, "scientist": [45, 50, 52, 53, 54, 59, 68, 70, 74], "capabl": [2, 45, 54, 56, 68], "alongsid": 45, "tradit": [15, 45, 52, 58, 59], "system": [45, 46, 50, 51, 54, 57, 58, 73], "demand": [45, 59], "dbm": 45, "server": [45, 52, 53, 57, 65, 73], "workflow": [45, 48, 60, 66], "mydf": 45, "to_df": 45, "nearli": [45, 59], "l_returnflag": 45, "agg": [45, 47, 56, 58], "l_extendedpric": 45, "avg": [45, 47, 56, 58, 59], "226": 45, "BY": 45, "37": [45, 48, 49, 56, 60], "deltalak": [45, 47], "delta": [45, 58], "lake": 45, "2906": 45, "writer": [45, 47], "write_deltalak": [45, 47], "delta_lak": [45, 47], "deltat": [45, 47], "quack": 45, "to_panda": [45, 47, 53], "l_quantiti": 45, "108": 45, "to_pyarrow_dataset": 45, "954": 45, "downstream": 45, "sql_queri": [], "employee_nam": 47, "department_nam": 48, "employe": [47, 56, 57], "depart": [48, 56], "ON": 45, "department_id": [], "pars": [24, 54, 59, 63, 67], "token": [54, 55], "newlin": [], "0x10a13e4c0": [], "dml": [], "0x10a1ae040": [], "0x10a1ae100": [], "identifierlist": [], "empl": [], "0x10a198e40": [], "0x10a1ae580": [], "0x10a1ae5e0": [], "0x10a1ae640": [], "emploi": [], "0x10a198c10": [], "0x10a1ae7c0": [], "0x10a1ae820": [], "0x10a1ae880": [], "0x10a198cf0": [], "0x10a1aea00": [], "0x10a1aea60": [], "0x10a1aeac0": [], "depa": [], "0x10a198dd0": [], "0x10a1aee80": [], "get_real_nam": [], "get_identifi": [], "encourag": 46, "script": [46, 55, 65, 73], "wast": 46, "reproduc": [46, 47, 48, 52, 58], "config": [46, 47, 52, 59, 60, 64, 67, 73], "configur": [46, 47, 52, 60, 67], "yaml": [46, 52, 55, 64, 68, 73], "data1": [46, 73], "drop_featur": 46, "iid": 46, "idg": 46, "wave": 46, "categorical_var": 46, "undergra": 46, "zipcod": 46, "seper": 46, "config_nam": 46, "termin": [46, 52, 54, 57, 58, 63, 64, 65, 68, 73], "hydra_exampl": 46, "userwarn": [46, 52, 60, 62], "config_path": 46, "cc": 46, "next": [46, 47, 48, 52, 54, 56, 59, 60, 65], "upgrad": [46, 59], "0_to_1": 46, "changes_to_hydra_main_config_path": 46, "articl": [46, 48, 49, 50, 52, 53, 55, 58, 62, 63, 65, 67, 74], "environ": [48, 51, 52, 54, 57, 58, 67, 68, 73], "load_dotenv": 46, "getenv": 46, "spend": [46, 48, 59], "docstr": 46, "docopt_exampl": 46, "dir": [46, 53, 65, 73], "directori": [46, 47, 53, 63, 65, 66, 67, 68, 73], "input_text": [46, 54], "__doc__": [46, 67], "argv": 46, "input_path": 46, "litt": 47, "bit": 47, "sleep": [47, 54, 57, 58, 62, 67, 68], "progress_appli": 47, "cpu": [47, 53, 54, 57, 73], "progress_bar": 47, "parallel_appli": 47, "worker": [47, 48, 54, 56, 68], "standard": [47, 52, 57, 58, 59, 62, 65, 67, 73], "transfer": [47, 53, 59], "3025": 47, "324": 47, "441": [47, 48], "6561": 47, "5329": 47, "2025": 47, "4900": 47, "1024": [32, 47, 53, 54], "5776": 47, "8100": 47, "3364": 47, "9995": 47, "4761": 47, "9996": 47, "3721": 47, "6889": 47, "9997": 47, "4225": 47, "9025": 47, "1156": 47, "9998": 47, "361": [47, 68], "529": [47, 49, 59], "9999": [47, 67], "5041": 47, "81": [47, 48, 49, 50, 59, 60, 73], "Not": [47, 52], "flight": 47, "passeng": [47, 48, 59, 60], "1949": [47, 50], "112": [47, 49], "118": [47, 49, 68], "march": [47, 48], "april": [47, 50], "129": [47, 48, 57, 67, 68], "121": [47, 49, 57, 59, 60], "june": [47, 51], "135": [47, 48, 57, 68], "juli": [47, 50, 60], "148": [47, 49, 62, 68], "august": 47, "septemb": 47, "136": [47, 48, 68], "octob": 47, "119": [47, 52, 59], "to_markdown": [47, 63], "llm": 47, "openai": [47, 51], "api_token": 47, "your_api_token": 47, "pandas_ai": 47, "convers": [47, 58, 64], "prompt": 47, "five": [47, 50], "1960": [47, 59], "5714": 47, "1959": 47, "5140": 47, "1958": 47, "4572": 47, "1957": 47, "4421": 47, "1956": 47, "3939": 47, "span": [47, 73], "pyspark": [47, 52, 59], "workload": [47, 56], "fugue_spark": 47, "sparkexecutionengin": 47, "map_pric": 47, "map_price_to_fruit": 47, "schema": [45, 47, 52, 58], "hostnam": [47, 53], "7740": 47, "resolv": [47, 52], "loopback": 47, "address": [45, 47, 49, 50, 56, 58, 68], "127": [47, 48, 49, 52, 57, 68], "192": [47, 54, 60, 62], "168": [47, 54], "wlp111s0": 47, "spark_local_ip": 47, "bind": 47, "illeg": 47, "reflect": [47, 59], "unsaf": 47, "platform": [47, 48, 52, 56, 58, 67, 73], "jar": [47, 54], "unsafe_2": 47, "constructor": 47, "java": [47, 56], "nio": 47, "directbytebuff": 47, "report": [47, 50, 52, 53, 55, 57, 59, 60, 64], "further": [24, 47, 54, 58, 64, 74], "deni": 47, "nativecodeload": [47, 56], "unabl": [24, 47, 52, 56], "nativ": [47, 56, 59, 68], "hadoop": [47, 56], "builtin": [47, 56], "applic": [47, 48, 51, 52, 54, 56, 58, 63, 64, 67, 68, 73, 74], "log4j": 47, "properti": [2, 47, 67], "log": [21, 47, 56, 59, 68], "sc": [47, 56], "setloglevel": [47, 56], "newlevel": [47, 56], "sparkr": [47, 56], "servic": [47, 48, 49, 64], "sparkui": 47, "4040": 47, "4041": 47, "stage": [47, 56, 66], "essenti": [47, 52, 54], "undo": [47, 58], "mistak": 47, "review": [47, 51, 66], "audit": 47, "transact": [47, 48, 50], "travel": [47, 48], "4719861e": 47, "1d3a": 47, "49f8": 47, "8870": 47, "225e4e46e3a0": 47, "_delta_log": 47, "00000000000000000000": 47, "json": [47, 50, 52, 55, 58, 63, 68], "dt": [47, 48], "current": [2, 47, 48, 50, 52, 58, 59, 65, 66, 67, 68, 73, 74], "creation": [31, 45, 47], "get_add_act": 47, "flatten": [47, 62], "size_byt": 47, "a6738752": 47, "efca": 47, "4577": 47, "8cbf": 47, "9c69b404f2ee": 47, "1654": 47, "7a6df896": 47, "715a": 47, "4d4a": 47, "b210": 47, "b12e3fe57bc6": 47, "modification_tim": 47, "data_chang": 47, "num_record": 47, "null_count": 47, "2023": [47, 54, 58, 67], "479": [47, 59], "657": [47, 59, 68], "prior": [47, 56], "dt0": 47, "rs": [45, 47], "segment": [47, 54], "rather": [31, 47, 48, 49, 54, 56, 59], "entir": [21, 47, 48, 52, 56, 68], "retriev": [47, 53, 54, 56], "complet": [47, 57, 58, 59, 62, 65, 68], "hourli": [47, 59, 68], "sale": [47, 52, 56, 59], "end_dat": [31, 47, 58], "784": [47, 59], "659": [47, 59, 68], "729": 47, "292": 47, "935": [47, 68], "table_path": 47, "79": [47, 48, 49, 50, 52, 56, 60, 68], "62": [47, 48, 59, 67], "delta_lake2": 47, "partition_bi": 47, "181": 47, "yesterdai": 47, "workaround": 47, "solut": [48, 51, 52], "a6813d0c": 47, "157b": 47, "4ca6": 47, "8b3c": 47, "8d5afd51947c": 47, "untouch": 47, "partition_filt": 47, "00000000000000000001": 47, "b5c9640f": 47, "f386": 47, "4754": 47, "b28f": 47, "90e361ab4320": 47, "disk": [45, 47, 59], "intens": [47, 57], "5000": [47, 52, 54, 56, 58], "6000": [47, 56], "employee_id": 47, "salari": [47, 56], "8000": [47, 52], "existing_data": 47, "recreat": [47, 52], "retain": [47, 56], "columnar": 47, "benefit": [47, 48], "u": [47, 49, 51, 52, 55, 56, 57, 58, 59, 60, 62, 65, 68, 73], "ingest": 47, "accumul": 47, "surg": 47, "compact": 47, "expand": [47, 64, 67], "data_url": 47, "gist": [47, 66], "khuyentran1401": [47, 48, 49, 52, 62, 66], "458905fc5c630d7a1f7a510a04e5e0f9": 47, "5b2d760011c9255a68eb08b83b3b8759ffa25d5c": 47, "numfilesad": 47, "numfilesremov": 47, "filesad": 47, "278115": 47, "totalfil": 47, "totals": 47, "filesremov": 47, "5712": 47, "5717": 47, "5715": 47, "571580": 47, "partitionsoptim": 47, "numbatch": 47, "totalconsideredfil": 47, "totalfilesskip": 47, "preserveinsertionord": 47, "dure": [47, 50, 52, 53, 55, 58, 59, 68], "demonstr": [47, 48, 52, 54, 56, 58, 59], "last_talk": 47, "people_t": 47, "new_df": [47, 48, 56, 57], "older": 47, "statu": [2, 47, 48, 58], "builder": [47, 52, 56, 59], "sql": [47, 52, 54, 59], "sparksess": [47, 52, 56, 59], "appnam": 47, "myapp": 47, "extens": [47, 48, 52, 68, 73], "io": [47, 50, 52, 54, 60], "deltasparksessionextens": 47, "catalog": 47, "spark_catalog": 47, "deltacatalog": 47, "configure_spark_with_delta_pip": 47, "getorcr": [47, 52, 56, 59], "interview": 47, "createdatafram": [47, 52, 56, 59], "todf": 47, "compani": [47, 48, 49, 50, 52], "repartit": 47, "forpath": 47, "new_data": [47, 48], "one_month_ago": 47, "current_d": 47, "interv": [47, 49, 50], "alia": [47, 56], "whenmatchedupd": 47, "whennotmatchedbysourceupd": 47, "concaten": [47, 57, 67], "expens": [47, 57, 58, 59], "inconsist": [47, 56, 59, 67], "datatyp": [31, 32, 47], "suppos": 47, "filepath": 47, "concat_df": 47, "effortlessli": [47, 51, 60, 73], "preserv": [47, 62], "mergeschema": 47, "pandas_api": 47, "api": [47, 52, 53, 58, 59, 68], "pl": 47, "pandas_df1": 47, "value1": [47, 58], "pandas_df2": 47, "value2": [47, 58], "polars_df1": 47, "from_panda": 47, "polars_df2": 47, "start_tim": [47, 62], "pandas_merg": 47, "pandas_tim": [47, 57], "polars_merg": 47, "polars_tim": 47, "6f": 47, "604390": 47, "079080": 47, "lightn": 47, "machin": [2, 47, 48, 49, 53, 58, 59, 60, 73], "eager": 47, "immedi": [47, 54, 62, 68], "contrast": [45, 47, 52, 53, 56, 59], "defer": 47, "10_000_000": 47, "categor": [47, 58], "7292": 47, "7849": 47, "93": [47, 48, 49, 52, 59], "6940": 47, "1265": 47, "2509": 47, "70": [6, 47, 48, 59, 60, 68], "706": [47, 57], "pl_df": 47, "428": [47, 59], "airport": 47, "datahub": 47, "unwant": 47, "scan_csv": 47, "acceler": 47, "particularli": [15, 24, 47, 48], "57k": 47, "heliport": 47, "contin": [47, 55], "eu": 47, "143": [47, 48, 57, 68], "594": 47, "written": [47, 48, 54, 76], "rust": 47, "acid": [47, 50], "enforc": 48, "exception": 47, "moreov": [47, 54], "seamless": [47, 59], "category_col1": 47, "numeric_col1": 47, "tail": [47, 48, 52, 59, 62], "9999995": 47, "9999996": 47, "9999997": 47, "9999998": 47, "87": [47, 49], "9999999": 47, "277": [47, 68], "55": [47, 48, 49, 50, 52, 54, 59, 60], "save_path": 47, "bear_delta_lak": 47, "latest": [47, 50, 59, 65, 66], "read_delta": 47, "i64": 47, "43": [47, 48, 49, 52, 54], "882": 47, "38": [45, 47, 48, 49, 52, 56, 57, 58, 59, 67], "train_test_split": [48, 52, 53, 59, 64], "proport": [48, 60], "model_select": [48, 52, 53, 59, 64], "bincount": [48, 57], "x_train": [48, 52, 53], "x_test": [48, 52, 53, 59], "y_train": [48, 52, 53], "y_test": [48, 52, 53, 59, 60], "random_st": [2, 48, 52, 58, 64], "randomli": [48, 52], "bias": [48, 58], "customer_id": [48, 56], "train_data": [48, 52], "test_data": [47, 48, 52, 56, 59], "test_siz": [48, 52, 64], "cutoff_d": 48, "feature_engin": 48, "dropcorrelatedfeatur": 48, "make_classif": [48, 52], "n_sampl": [2, 48, 52, 59], "n_featur": [2, 48, 52, 59], "n_redund": [48, 52], "n_clusters_per_class": [48, 52], "class_sep": [48, 52], "trabsform": 48, "colnam": 48, "var_": 48, "var_0": 48, "var_1": [48, 67], "var_2": [48, 67], "var_3": [48, 67], "var_4": 48, "var_5": 48, "corr": 48, "000000": [47, 48, 53, 59], "938936": 48, "874845": 48, "654745": 48, "tr": 48, "pearson": 48, "xt": 48, "fit_transform": [48, 49, 52, 54, 58, 60], "correlated_feature_sets_": 48, "mark": [48, 49, 50, 73], "rarelabelencod": 48, "fetch_openml": [48, 54, 60], "dating_profil": 48, "body_typ": 48, "drink": [2, 48], "drug": 48, "educ": [48, 50], "essay0": 48, "essay1": 48, "essay2": 48, "essay3": 48, "essay4": 48, "offspr": 48, "pet": [15, 48, 62], "religion": 48, "sex": [48, 60], "sign": [48, 60], "smoke": 48, "speak": [48, 50], "littl": [48, 50, 73], "strictli": [48, 59], "anyth": 48, "social": 48, "never": [48, 51, 54, 68], "colleg": 48, "univers": [48, 50], "me": [48, 50, 57, 58, 60, 62], "lt": [24, 48, 67], "br": 48, "gt": [24, 48, 63, 65, 67], "ni": [48, 50, 54], "think": [48, 53, 59], "intern": [48, 57, 68], "agent": 48, "fo": 48, "peopl": [48, 49, 54], "laugh": 48, "nrant": 48, "six": [48, 67], "foot": 48, "half": 48, "asian": 48, "nabsurdistan": 48, "republ": 48, "mi": [48, 63], "san": [48, 60], "francisco": 48, "california": [48, 52, 57, 60], "amp": 48, "rsquo": 48, "kid": 48, "straight": 48, "agnostic": 48, "seriou": 48, "gemini": 48, "english": [2, 48, 60], "mostli": 48, "camp": [48, 50], "chef": 48, "n1": [48, 58, 59, 68], "dedic": 48, "everydai": 48, "unbeliev": 48, "silli": 48, "ridicul": 48, "amont": 48, "die": [48, 50], "hard": [2, 48, 50, 57], "christoph": 48, "moor": 48, "fan": [48, 67], "oakland": 48, "cancer": 48, "fluentli": 48, "poorli": [48, 52], "french": 48, "thin": [48, 50], "graduat": 48, "asham": 48, "public": [48, 60, 67], "te": 48, "nerdi": 48, "softwar": [48, 52], "musician": 48, "artist": [24, 48, 50], "improvis": 48, "jaw": 48, "glass": 48, "physica": 48, "okai": 48, "cultur": [48, 59], "matrix": [48, 52], "pisc": 48, "vegetarian": 48, "dead": 48, "plai": [48, 50, 54, 60], "synthes": 48, "acco": 48, "awkward": 48, "batail": 48, "celin": 48, "beckett": 48, "nlynch": 48, "berkelei": 48, "german": 48, "athlet": 48, "hei": [48, 51], "pro": [48, 50, 54], "imageri": 48, "nhttp": [48, 50], "bag": [48, 54], "smile": 48, "inquisit": 48, "natur": [48, 51], "music": [48, 50], "band": [48, 50], "rapper": 48, "nat": [48, 50], "aquariu": 48, "australian": 48, "live": [48, 50, 60, 76], "awesom": [48, 50, 51], "im": 48, "shit": 48, "aforementio": 48, "big": [48, 50], "ask": 48, "kill": 48, "mockingbird": 48, "lord": 48, "ring": [48, 50], "atheism": 48, "tauru": 48, "chines": 48, "lau": 48, "dig": 48, "buri": 48, "treasur": 48, "frolick": 48, "nwitti": 48, "banter": 48, "nuse": 48, "unicorn": 48, "virgo": 48, "meet": [48, 51, 54, 59], "wit": 48, "birthdai": [48, 59], "send": [48, 52, 67], "card": [48, 60], "byproduct": 48, "alphabet": [48, 60, 64, 67], "aquarium": 48, "autobio": 48, "christian": 48, "sagittariu": 48, "oh": [48, 50], "moment": 48, "job": [6, 48, 50, 66], "freakishli": 48, "blond": 48, "willing": 48, "belveder": 48, "tiburon": 48, "jake": 48, "creativ": 48, "gui": 48, "explor": [48, 74], "che": 48, "prob": [48, 52, 54, 59], "tv": [48, 50], "summer": 48, "mateo": 48, "tol": [48, 52], "speci": [48, 60], "minimum": [48, 52, 58, 64], "replace_with": 48, "46107": 48, "45677": 48, "57928": 48, "53127": 48, "33300": 48, "33648": 48, "59701": 48, "57013": 48, "46428": 48, "57123": 48, "percentag": [48, 52, 58, 59], "observ": [48, 52, 59, 62, 68], "countfrequencyencod": 48, "sn": [48, 52, 54, 60], "load_dataset": [48, 60], "diamond": 48, "carat": 48, "cut": 48, "clariti": [48, 62, 67], "depth": [48, 52], "89": [48, 60], "premium": [15, 48], "si2": 48, "2815": 48, "76": [48, 49, 59, 60, 67, 68], "50332": 48, "si1": 48, "53": [48, 54, 57, 58, 59, 60], "2242": 48, "35652": 48, "ideal": [48, 52, 60], "vvs2": 48, "907": 48, "9439": 48, "vs1": 48, "4592": 48, "83": [48, 49], "15824": 48, "vs2": 48, "6332": 48, "45891": 48, "1720": 48, "52416": 48, "2512": 48, "42613": 48, "505": [48, 59], "68": [32, 48, 49, 52, 57, 59, 60, 63, 68], "43567": 48, "1431": 48, "2732": 48, "91": [48, 49, 68], "3246": 48, "40455": 48, "encoding_method": 48, "p_train": 48, "p_test": 48, "10176": 48, "152762": 48, "170436": 48, "4733": 48, "65": [48, 49, 50, 60, 68], "16083": 48, "29": [48, 49, 54, 58, 59, 60, 63, 68], "242022": 48, "56": [48, 50, 52, 57, 59, 73], "6424": 48, "13420": 48, "100531": 48, "5510": 48, "20407": 48, "179409": 48, "8770": 48, "8909": 48, "227314": 48, "4493": 48, "82": [48, 49, 54, 57, 59], "52283": 48, "182005": 48, "094401": 48, "2494": 48, "10789": 48, "fair": 48, "4861": 48, "1190": 48, "2932": 48, "3583": 48, "067384": 48, "3422": 48, "40845": 48, "1173": 48, "13485": 48, "standardscal": [48, 52, 60], "sklearntransformerwrapp": 48, "22474487": 48, "tranform": 48, "scaler": [48, 52, 58], "224745": 48, "captur": [48, 54, 58, 59, 66, 73], "among": [48, 50, 70], "similarityencod": 48, "employee_salari": 48, "fetch_employee_salari": 48, "assignment_categori": 48, "employee_position_titl": 48, "underfilled_job_titl": 48, "date_first_hir": 48, "year_first_hir": 48, "pol": 48, "polic": 48, "msb": 48, "mgmt": 48, "tech": 48, "fulltim": 48, "regular": [48, 50, 52, 58], "offic": [48, 68], "coordin": [48, 49, 50, 73], "1986": 48, "isb": 48, "major": [48, 52], "crime": 48, "fugit": 48, "1988": 48, "hh": [48, 67], "health": 48, "human": [48, 49, 51], "adult": 48, "protect": [46, 48, 50], "iv": 48, "1989": 48, "cor": 48, "rehabilit": 48, "prr": 48, "facil": 48, "secur": [48, 52, 53, 54], "resid": [21, 48], "supervisor": 48, "ii": [48, 49], "2014": [48, 59], "hca": 48, "hous": [48, 52, 57], "commun": [48, 74], "affair": 48, "afford": 48, "plan": [15, 47, 48, 50, 56], "specialist": 48, "iii": 48, "2007": [48, 55, 59], "psb": 48, "6th": 48, "district": [48, 60], "team": [48, 50, 52, 54, 56, 60, 68], "fr": [48, 50, 54], "fire": 48, "rescu": [48, 50], "em": 48, "bill": [48, 52], "account": [2, 48, 52, 59], "auditor": 48, "2016": [48, 50, 59], "administr": [48, 50], "recruit": 48, "firefight": 48, "rescuer": 48, "fsb": 48, "traffic": 48, "autom": [48, 52, 54, 64, 65], "aid": 48, "dirty_column": 48, "x_dirti": 48, "similaryencod": 48, "enc": 48, "ngram": [48, 54], "x_enc": 48, "reshap": [48, 52, 62], "05882353": 48, "03125": 48, "02739726": 48, "19008264": 48, "01351351": 48, "05555556": 48, "20535714": 48, "08088235": 48, "032": [48, 57], "008": 48, "02083333": 48, "056": [48, 49], "02325581": 48, "23076923": 48, "01574803": 48, "02777778": 48, "03738318": 48, "07317073": 48, "05405405": 48, "0733945": 48, "0625": 48, "06542056": 48, "11206897": 48, "07142857": 48, "09756098": 48, "08108108": 48, "04761905": 48, "3539823": 48, "06976744": 48, "09821429": 48, "05343511": 48, "14953271": 48, "26086957": 48, "06451613": 48, "01052632": 48, "03378378": 48, "02631579": 48, "heatmap": 48, "pylabtool": [48, 60], "figsiz": [48, 50, 52, 54, 59, 60], "plot_similar": 48, "normalized_featur": 48, "inner": [48, 56], "font_scal": 48, "xticklabel": 48, "yticklabel": 48, "vmin": 48, "vmax": 48, "ylorrd": 48, "annot_kw": 48, "set_xticklabel": [48, 60], "rotat": 48, "set_titl": 48, "encode_and_plot": 48, "somewhat": 48, "028": 48, "full": [48, 49, 50, 52, 58, 59, 62, 63, 64, 65, 68, 73], "git": [48, 53, 54, 68], "skrub": 48, "frequent": [48, 54, 67], "yemen": [48, 50], "rep": 48, "fuzzy_join": 48, "variat": [48, 58, 63], "happiness_report_2022": 48, "countri": [48, 50, 55, 59], "happi": [48, 58], "fetch_world_bank_ind": 48, "gdppc": 48, "indicator_id": 48, "gdp": 48, "pcap": 48, "cd": [48, 52, 60, 66, 68, 73], "107": 48, "venezuela": 48, "4925": 48, "vietnam": 48, "5485": 48, "131": [48, 68], "4197": 48, "zambia": 48, "3760": 48, "zimbabw": 48, "2995": 48, "146": [48, 57, 59, 68], "xx": [48, 50, 59], "capita": 48, "193": 48, "west": [48, 50, 60], "bank": [48, 63], "gaza": 48, "3789": 48, "327966": 48, "255": 48, "12647": 48, "480789": 48, "258": [48, 58], "701": [48, 59], "714878": 48, "260": 48, "1487": 48, "907764": 48, "261": [48, 57], "1266": 48, "996031": 48, "return_scor": 48, "matching_scor": 48, "merg": [48, 56, 59], "wb": [2, 48, 59], "madagascar": 48, "795045": 48, "egypt": 48, "arab": [48, 54], "654033": 48, "chad": 48, "683373": 48, "130": [48, 68], "ethiopia": 48, "653668": 48, "mauritania": 48, "810736": 48, "133": [48, 68], "jordan": 48, "134": [48, 68], "togo": 48, "india": 48, "137": 48, "malawi": 48, "138": [48, 57], "tanzania": 48, "139": [48, 68], "sierra": 48, "leon": 48, "140": [48, 59, 68], "lesotho": 48, "755238": 48, "141": 48, "botswana": 48, "795825": 48, "142": 48, "rwanda": 48, "754604": 48, "144": [48, 57, 62, 68], "lebanon": 48, "145": [48, 57, 68], "afghanistan": 48, "incom": [48, 68], "fake": [48, 54], "assumpt": [2, 48, 58, 68], "descript": [48, 50, 51, 52, 54, 55], "logo": 48, "simplefilt": [48, 52, 56, 60, 62], "train_df": 48, "blob": [48, 52, 54], "snorkel_exampl": 48, "train_fake_job": 48, "job_id": 48, "salary_rang": 48, "company_profil": 48, "telecommut": 48, "has_company_logo": 48, "has_quest": 48, "employment_typ": 48, "required_experi": 48, "required_educ": 48, "industri": 48, "fraudul": 48, "12276": 48, "12277": 48, "analyst": 48, "gb": [48, 50], "wsm": 48, "london": [45, 48], "product": [45, 48, 51, 56, 58, 59], "op": [48, 57, 58], "qubit": 48, "edg": [48, 54, 58, 60], "engineeringqubit": 48, "ll": [47, 48, 52, 59, 62, 63], "background": 48, "consult": 48, "plenti": 48, "perk": 48, "opportun": [48, 50], "associ": [48, 55, 59, 62], "bachelor": 48, "degre": [48, 68], "internet": 48, "14680": 48, "14681": 48, "advoc": 48, "ga": 48, "savannah": 48, "21st": 48, "centuri": 48, "center": [2, 48, 49, 50, 52, 60, 67], "16518": 48, "16519": 48, "fl": 48, "gainesvil": 48, "352": 48, "inc": [48, 49], "agenc": 48, "crea": 48, "partner": [48, 50], "great": [48, 52, 53, 54, 59], "client": [48, 54, 68], "smart": 48, "mvc": 48, "getfreedom": 48, "trust": [48, 52, 60], "mid": 48, "senior": 48, "technolog": [48, 49], "15478": 48, "15479": 48, "internship": 48, "IN": 48, "bangalor": 48, "pace": 48, "citi": [45, 48, 50, 60], "diver": 48, "deliv": 48, "qualiti": [48, 53, 58, 73], "16348": 48, "16349": 48, "web": [48, 52, 74], "backend": [32, 48, 54], "microservic": 48, "de": [48, 54, 60], "BE": 48, "10969": 48, "airfi": 48, "pr\u00e4gt": 48, "sicher": 48, "und": 48, "einfach": 48, "zu": 48, "bedienend": 48, "design": [48, 49, 52, 54, 59], "esp": 48, "flat": [48, 59], "hierarchi": 48, "fraud": 48, "labeling_funct": 48, "pandaslfappli": 48, "lfanalysi": 48, "abstain": 48, "no_company_profil": 48, "no_company_logo": 48, "conclus": [48, 58], "applier": 48, "l_train": 48, "13410": 48, "5849": 48, "25it": 48, "accuraci": [48, 49, 52, 59, 63], "lf_summari": 48, "polar": [48, 52, 54, 58], "coverag": [48, 52], "overlap": [30, 48], "conflict": [48, 52], "incorrect": [48, 58], "emp": 48, "acc": 48, "186204": 48, "459": [48, 59], "2038": 48, "183821": 48, "205742": 48, "2300": 48, "166365": 48, "244295": 48, "12741": 48, "669": 48, "950112": 48, "detail": [48, 51, 52, 59, 62], "agre": 48, "disagre": 48, "correctli": [48, 52, 58, 67], "incorrectli": 48, "empir": [48, 49], "insight": [48, 52, 54, 59], "taxi": [48, 60], "pickup": [48, 60], "dropoff": [48, 60], "distanc": [48, 49, 54, 59, 60, 63], "fare": [48, 60], "toll": [48, 60], "payment": [48, 60], "pickup_zon": [48, 60], "dropoff_zon": [48, 60], "pickup_borough": [48, 60], "dropoff_borough": [48, 60], "credit": [48, 50, 60], "lenox": [48, 60], "hill": [48, 49, 60], "un": [48, 60], "turtl": [48, 60], "bai": [48, 60], "manhattan": [48, 60], "cash": [48, 59, 60], "side": [48, 50, 52, 59, 60, 73], "villag": [48, 60], "hudson": [48, 60], "sq": [48, 60], "yorkvil": [48, 60], "midtown": [48, 60], "theatr": [48, 60], "batteri": [48, 60], "park": [48, 54, 60], "bridg": [48, 60], "seward": [48, 60], "murrai": [48, 60], "flatiron": [48, 60], "harlem": [48, 60], "lincoln": [48, 60], "friendli": [48, 59], "vehicl": 48, "zone": [48, 59], "borough": 48, "popular": [47, 48, 49, 50, 54, 63, 70, 74], "howto": 48, "pickup_hour": 48, "pickup_dai": 48, "weekday_nam": 48, "pickup_month": 48, "month_nam": 48, "weekdai": [48, 58, 67], "pickup_zone_count": 48, "pickup_zone_far": 48, "pickup_zone_dist": 48, "016667": 48, "857083": 48, "987778": 48, "031597": 48, "944444": 48, "796667": 48, "243830": 48, "198": [48, 67], "994949": 48, "239798": 48, "6428": 48, "72": [32, 48, 50, 52, 56, 59, 68], "550000": 48, "854306": 48, "6429": 48, "74": [48, 67, 68], "jamaica": 48, "concours": 48, "queen": [48, 50, 60], "bronx": [48, 60], "597500": 48, "261667": 48, "6430": 48, "crown": 48, "bushwick": 48, "brooklyn": [48, 60], "549167": 48, "665000": 48, "6431": 48, "york": [45, 48, 50, 60], "flatbush": 48, "remsen": 48, "409000": 48, "086000": 48, "6432": 48, "boerum": 48, "windsor": 48, "terrac": 48, "761905": 48, "812857": 48, "6433": 48, "dist": [49, 65], "norm": 49, "rss": 49, "0037316": 49, "018": [49, 62], "scale": [49, 56, 58, 60], "expon": 49, "1588997": 49, "019": 49, "dweibul": 49, "0079433": 49, "012": [49, 58], "0036884": 49, "873": [49, 68], "genextrem": 49, "0049831": 49, "037": 49, "gamma": 49, "0038504": 49, "101": 49, "098": 49, "089": 49, "lognorm": 49, "0037897": 49, "237": [49, 68], "099": 49, "uniform": [49, 60], "1145382": 49, "469": 49, "loggamma": 49, "0036960": 49, "239": [49, 67, 68], "858": 49, "44": [49, 59], "472": [49, 59], "confid": [49, 52, 59, 64], "parametr": [49, 56, 73], "1000x800": 49, "axessubplot": [49, 50, 52, 60], "nt": 49, "ndf": 49, "xlabel": [49, 50, 52, 59], "ylabel": [49, 52], "frequenc": [49, 52], "detect": [49, 54, 58, 67], "outlier": [49, 54, 58, 59, 67], "deviat": [49, 58, 59], "significantli": [49, 56, 57, 60], "globe": [49, 50], "geocod": 49, "nominatim": 49, "geoloc": 49, "user_ag": 49, "find_loc": 49, "drive": [49, 50, 54], "app": [49, 52, 60, 63, 65, 67, 68], "dogwood": 49, "acr": 49, "chapel": 49, "counti": 49, "carolina": 49, "27516": 49, "state": [2, 49, 50, 57, 59, 62, 66, 67, 68], "8796631": 49, "0770546": 49, "latitud": [49, 50, 52], "longitud": [49, 50, 52], "latitid": 49, "max_card": 49, "cont_nam": 49, "cat_nam": 49, "load_win": [49, 60], "alcohol": 49, "malic_acid": 49, "ash": 49, "alcalinity_of_ash": 49, "magnesium": 49, "total_phenol": 49, "flavanoid": 49, "nonflavanoid_phenol": 49, "proanthocyanin": 49, "color_intens": 49, "hue": [49, 60, 68], "od280": 49, "od315_of_diluted_win": 49, "prolin": 49, "28": [49, 50, 56, 58, 59, 60, 73], "1065": 49, "1050": 49, "67": [49, 58, 59, 68], "1185": 49, "86": [49, 52, 59, 60, 62], "1480": 49, "69": [49, 54, 59], "735": [49, 68], "97": [49, 50, 52, 58, 59], "1450": 49, "1290": 49, "1295": 49, "1045": 49, "dmatric": 49, "designmatrix": 49, "178": [49, 57, 59, 60, 68], "intercept": [49, 52, 59], "1510": 49, "1280": 49, "1320": 49, "1150": 49, "1547": 49, "1310": 49, "1130": 49, "1680": 49, "780": 49, "770": 49, "1035": 49, "1015": 49, "830": 49, "1195": 49, "1285": 49, "915": 49, "omit": [24, 49, 73], "asarrai": 49, "this_obj": 49, "scikit": [49, 60, 67], "linear_model": [48, 49, 52, 59], "linearregress": [49, 52, 59], "query_str": 49, "scheme": [49, 65], "fragment": 49, "with_queri": 49, "new_path": 49, "with_path": 49, "with_frag": 49, "unlabel": 49, "terribl": 49, "definit": [49, 50], "pp": 49, "mr": [49, 50, 58], "owen": 49, "harri": 49, "prefixmarit": 49, "givennam": 49, "surnam": 49, "suffixgener": 49, "kate": 49, "cume": 49, "And": [49, 50, 52, 54, 60, 63], "prefect": [49, 57, 64, 67], "corporationnam": 49, "corporationlegaltyp": 49, "beauti": [49, 50, 52, 54, 60], "screen": [49, 68], "font": [49, 63], "encod": [49, 54, 58, 65, 67, 73], "typic": [49, 54, 59], "pdfreader": 49, "reader": 49, "extract_text": 49, "color_nam": 50, "cornflowerblu": 50, "scott": 50, "881": [50, 59], "patricia": 50, "nsouth": 50, "jeremi": 50, "06087": 50, "date_of_birth": 50, "minimum_ag": 50, "1927": 50, "donald": 50, "teacher": 50, "secondari": 50, "sill": 50, "email": [50, 54], "her": [50, 74], "ringslap": 50, "boatbench": 50, "thirti": 50, "mighti": 50, "hors": [50, 54], "a_th": 50, "khaki": 50, "wad": 50, "tote": 50, "twenti": [50, 54], "four": [50, 73], "eighteen": 50, "garlic": 50, "arm": 50, "god": [50, 54], "himself": 50, "wait": [50, 52, 55, 58, 68], "hat": 50, "birmingpoop": 50, "paragraph": 50, "agustin": 50, "neutral": [50, 52], "jerk": 50, "concern": 50, "badli": 50, "agn": 50, "basil": 50, "box": [50, 60], "slate": 50, "assesford": 50, "testasia": 50, "fantasticheartsound": 50, "hurl": 50, "danc": [50, 54], "arztotzka": 50, "cape": 50, "bui": [50, 59], "tub": 50, "boot": 50, "assembl": [50, 52], "jean": 50, "seth": 50, "violetbag": 50, "laudabl": 50, "lampton": 50, "birmingobject": 50, "cybertron": 50, "urllib": 50, "request": [50, 52, 55, 58, 65, 73], "urlopen": 50, "randomus": 50, "ava": 50, "hansen": 50, "street": 50, "3526": [50, 67], "georg": 50, "worcest": 50, "merseysid": 50, "kingdom": [50, 54], "postcod": 50, "k7z": 50, "3wb": 50, "9627": 50, "6871": 50, "timezon": [50, 59, 67], "tokyo": [45, 50], "seoul": 50, "osaka": 50, "sapporo": 50, "yakutsk": 50, "login": [50, 52], "uuid": [50, 62, 68], "253e53f9": 50, "9553": 50, "4345": 50, "9047": 50, "fb18aec51cf": 50, "heavywolf743": 50, "cristina": 50, "salt": 50, "xwnpqwtd": 50, "md5": 50, "2b5037da7d78258f167d5a3f8dc24edb": 50, "sha1": 50, "fabbede0577b3fed686afd319d5ab794f1b35b02": 50, "sha256": [50, 67], "d42e2061f9c283c4548af6c617727215c79ecafc74b9f3a294e6cf09afc5906f": 50, "dob": 50, "1948": 50, "21t10": 50, "053z": 50, "73": [50, 59, 63, 67, 68], "2011": [50, 52, 60], "19t03": 50, "830z": 50, "phone": [50, 54, 60], "015242": 50, "07811": 50, "0700": 50, "326": 50, "155": [50, 68], "nino": 50, "ht": 50, "portrait": 50, "women": 50, "jpg": [50, 68], "med": 50, "thumbnail": 50, "thumb": 50, "aubin": 50, "martin": [50, 59], "8496": 50, "rue": 50, "du": 50, "b\u00e2t": 50, "argent": 50, "strasbourg": 50, "meurth": 50, "et": [50, 59], "mosel": 50, "franc": 50, "83374": 50, "3192": 50, "0062": 50, "eastern": 50, "australia": [50, 59, 63], "guam": 50, "vladivostok": 50, "54b9bfa9": 50, "5e86": 50, "4335": 50, "8ae3": 50, "164d85df98e7": 50, "heavyladybug837": 50, "kendra": 50, "lcemyr5": 50, "2fbd9e05d992eb74f7afcccec02581fc": 50, "530a1bc71a986415176606ea377961d2ce381e5d": 50, "f5ee7bc47f5615e89f1729dcb49632c6b76a90ba50eb42d782e2790398ebc539": 50, "12t05": 50, "463z": 50, "2006": [50, 59], "28t03": 50, "433z": 50, "inse": 50, "1nnan48231023": 50, "men": 50, "interest": [50, 59], "monk": 50, "attr1": 50, "attr2": 50, "attr3": 50, "attr4": 50, "attr5": 50, "attr6": 50, "websit": [50, 62, 66, 74], "soup": 50, "stackoverflow": 50, "2081586": 50, "wanted_list": 50, "scraper": [], "build": [50, 59, 60, 64, 65, 67], "command": [50, 52, 54, 59, 64, 65, 66], "metaclass": 50, "ternari": 50, "substr": [50, 56, 62, 67], "dataread": [50, 65], "pandas_read": 50, "snippet": [50, 66, 68, 73, 74], "daili": [50, 52, 59, 68, 74], "pandas_dataread": 50, "av": 50, "api_kei": [50, 51, 59], "gehid": 50, "outputtenv": 50, "alphavantage_api_kei": 50, "trendreq": 50, "hl": 50, "tz": [50, 67], "360": [50, 68], "build_payload": 50, "kw_list": 50, "interest_over_tim": 50, "twitter": [50, 54, 55], "reddit": [47, 50], "snsscrape": 50, "tweet": 50, "hashtag": [50, 54], "khuyentran16": 50, "khuyen_tweet": 50, "publicli": 50, "censu": 50, "gov": 50, "cdc": 50, "datacommons_panda": 50, "plotli": [50, 55, 60], "px": [50, 55, 60], "median_incom": 50, "build_time_seri": 50, "geoid": 50, "median_income_person": 50, "overtim": 50, "process_t": 50, "count_person": 50, "usa": [50, 59], "count_person_mal": 50, "count_person_femal": 50, "count_robberi": 50, "count_criminalactivities_robberi": 50, "googlenew": 50, "set_time_rang": 50, "hagan": 50, "nhra": 50, "car": [50, 59], "media": [50, 52], "espn": 50, "feb": 50, "desc": 50, "matt": 50, "quickest": 50, "ngive": 50, "toni": 50, "stewart": 50, "race": 50, "qualifi": 50, "nset": 50, "stori": 50, "33381149": 50, "img": 50, "gif": [50, 63], "base64": 50, "r0lgodlhaqabaiaaap": 50, "yh5baekaaealaaaaaabaaeaaaictaeaow": 50, "fuel": [50, 63], "stock": 50, "promis": [50, 52], "pit": 50, "auto": [2, 50, 52, 60], "club": 50, "racewai": 50, "pomona": 50, "pack": 50, "nworld": 50, "drag": 50, "luca": 50, "oil": 50, "wintern": 50, "cast": [45, 50, 68], "broadwai": 50, "reviv": 50, "girl": [50, 54], "star": [50, 68], "playbil": 50, "newli": 50, "peter": 50, "franci": 50, "jame": 50, "ephi": 50, "naardema": 50, "moran": 50, "benko": 50, "margaret": 50, "hall": 50, "beani": 50, "feldstein": 50, "ramin": 50, "karimloo": 50, "robert": 50, "hight": 50, "fridai": 50, "night": 50, "ncamp": 50, "nwintern": 50, "33324340": 50, "owner": [50, 60], "ron": 50, "capp": 50, "autoweek": 50, "defend": 50, "champion": 50, "enter": [48, 50], "automak": 50, "nlong": 50, "him": 50, "susan": 50, "wade": 50, "a39160639": 50, "dodgemopar": 50, "under": [50, 52, 58, 68], "bu": 50, "video": 50, "highli": [50, 73], "anticip": 50, "nperform": 50, "preview": 50, "naugust": 50, "wilson": [50, 56], "broadwayworld": 50, "rehears": 50, "20220309": 50, "watch": 50, "sitzprob": 50, "theatermania": 50, "nfirst": 50, "orchestra": 50, "nkarimloo": 50, "fe_93550": 50, "stephen": 50, "colbert": 50, "prep": 50, "primetim": 50, "picklebal": 50, "cb": [50, 57], "hollywood": 50, "nthe": 50, "pickl": [2, 50, 53, 59, 62, 68], "celebr": 50, "competitor": 50, "vie": 50, "ngherkin": 50, "hollywoodreport": 50, "1235111617": 50, "randi": 50, "meyer": 50, "debut": 50, "inject": [50, 55, 56], "nitro": 50, "chao": 50, "midwest": 50, "nit": 50, "ntake": 50, "lauri": 50, "zaleski": 50, "talk": [50, 59], "farm": 50, "washington": [50, 59], "entendr": 50, "nanim": 50, "lunat": 50, "joke": 50, "sanctuari": 50, "she": [50, 54, 74], "nbuilt": 50, "washingtonpost": 50, "get_related_quest": 50, "Is": [50, 51, 54, 58, 59, 66], "career": 50, "concept": [50, 54, 62, 67, 68], "get_answ": 50, "has_answ": 50, "related_quest": 50, "stress": 50, "answer": [50, 51, 52, 54, 59], "NO": 50, "primarili": 50, "misconcept": 50, "beginn": 50, "discov": [50, 54, 60, 66], "domain": [50, 62], "realis": 50, "studi": 50, "oct": 50, "projectpro": 50, "522": [50, 54], "20short": 50, "20answer": 50, "20to": 50, "20the": 50, "20learn": 50, "20by": 50, "20work": 50, "20hard": 50, "displayed_link": 50, "snippet_str": 50, "snippet_data": 50, "snippet_typ": 50, "snippet_str_bodi": 50, "raw_text": 50, "ndata": 50, "noct": 50, "facebook_scrap": 50, "get_profil": 50, "get_group_info": 50, "thedachshundown": 50, "2685753618191566": 50, "member": [50, 52, 67], "128635": 50, "welcom": [50, 63], "npost": 50, "advis": 50, "lover": 50, "nyou": 50, "pic": 50, "ve": 50, "viral": 50, "seen": [50, 63], "rule": 50, "AND": [50, 56], "guidelin": [50, 64], "Be": 50, "aggress": 50, "backyard": [50, 60], "breed": 50, "spam": 50, "unrel": 50, "sell": [50, 59], "prohibit": 50, "forward": 50, "risk": [46, 50, 52, 53, 55, 59], "promot": [2, 50], "fish": [50, 60], "buyer": 50, "everyon": 50, "scam": 50, "sir": 50, "ladi": 50, "nwe": 50, "appreci": 50, "approv": 50, "shirt": [50, 62], "mug": 50, "canva": 50, "campaign": [50, 59], "thank": 50, "pawown": 50, "collectio": 50, "zuck": 50, "friend_count": 50, "follower_count": 50, "following_count": 50, "cover_photo": 50, "scontent": 50, "ord5": 50, "fbcdn": 50, "net": 50, "t31": 50, "18172": 50, "19575079_10103832396388711_8894816584589808440_o": 50, "stp": 50, "cp0_dst": 50, "jpg_e15_fr_q65": 50, "_nc_cat": 50, "ccb": 50, "_nc_sid": 50, "ed5ff1": 50, "_nc_ohc": 50, "z5jceahnv3aax9ihcdv": 50, "_nc_ht": 50, "00_afctbrp26zwk0onprfkbpjlrlfdwwlmlv1_xlkevlke_yw": 50, "oe": 50, "63ca953d": 50, "profile_pictur": 50, "t39": 50, "30808": 50, "312257846_10114737758665291_6588360857015169674_n": 50, "jpg_e15_q65_s120x120": 50, "dbb9e7": 50, "x2_muzaxc2cax9w6lz6": 50, "00_afdikcbbddzcymhxd": 50, "yjp2stit_vgpqrm9oeibsydfg8ba": 50, "63a81f9": 50, "zuckerberg": 50, "chan": 50, "ndecemb": 50, "nmeta": 50, "nfounder": 50, "ceo": 50, "nfebruari": 50, "npalo": 50, "alto": 50, "nbring": 50, "togeth": [47, 48, 50, 51, 55, 58, 60, 62], "harvard": 50, "ncomput": 50, "psycholog": 50, "nphillip": 50, "exet": 50, "academi": 50, "nclassic": 50, "nclass": 50, "nardslei": 50, "nhigh": 50, "1998": [50, 59], "php": 50, "104022926303756": 50, "refid": 50, "palo": 50, "105506396148790": 50, "dobb": 50, "ferri": 50, "hometown": 50, "quot": [47, 50, 54], "fortun": 50, "favor": 50, "bold": 50, "virgil": 50, "aeneid": 50, "284": [48, 50], "grow": [50, 64], "pablo": 50, "picasso": 50, "albert": 50, "einstein": 50, "pycausalimpact": 52, "advertis": 52, "effect": [52, 54, 58, 59, 73], "intervent": [52, 59], "tsa": 52, "arima_process": 52, "armaprocess": 52, "r_": 52, "ma": [52, 59], "arma_process": 52, "generate_sampl": 52, "nsampl": [52, 54], "800": [52, 57], "pre_period": [52, 59], "799": [52, 59], "post_period": [52, 59], "ci": [52, 59], "summari": [52, 53, 54, 58, 59, 66, 73], "posterior": [52, 59], "cumul": [52, 59], "18006": 52, "15994": 52, "15871": 52, "16110": 52, "1896": [52, 57], "2135": 52, "approx": [52, 59], "absenc": [52, 59, 60], "counterfactu": [52, 59], "yield": [52, 59], "discuss": [51, 52, 59], "individu": [29, 48, 52, 59], "meaningfulli": [52, 59], "interpret": [52, 59, 65], "overal": [52, 59], "taken": [52, 59, 60], "unlik": [52, 59, 68], "due": [21, 52, 59, 62, 65], "fluctuat": [52, 59], "bear": [52, 59], "substant": [52, 59], "goal": [52, 54, 59, 74], "underli": [52, 54, 59], "bayesian": [52, 59], "advanc": [52, 57, 59], "languag": 52, "zeroshotgptclassifi": 52, "unseen": 52, "skllm": 52, "skllmconfig": 52, "set_openai_kei": 52, "your_kei": 52, "set_openai_org": 52, "your_organis": 52, "get_classification_dataset": 52, "demo": 52, "clf": [52, 59], "openai_model": 52, "gpt": [52, 54], "turbo": 52, "metric": [52, 54, 58, 60, 64, 67], "accuracy_scor": 52, "make_pipelin": [48, 52], "especi": [15, 29, 52, 57, 59, 60, 63, 65, 66, 67], "logisticregress": [48, 52], "logist": 52, "regress": [52, 59], "svm": [2, 52, 64], "svc": [2, 52], "make_pip": 52, "grid_param": 52, "svc__c": 52, "svc__gamma": 52, "hypertun": 52, "cv": 52, "y_pred": [52, 59, 67], "y_actual": 52, "y_predict": 52, "testabl": 52, "deploi": [52, 57, 58], "incorpor": [52, 54, 59, 74], "modellibrari": 52, "wordlist": [52, 54], "nltk": [52, 54], "punkt": [52, 54], "inherit": 52, "_predict": 52, "nounphraseextractor": 52, "noun_phrase_extractor": 52, "noun_phras": [52, 54], "noun_extractor": 52, "strategi": [2, 52, 58], "memory_byt": 52, "model_nam": 52, "microsecond": [52, 67], "time_": 52, "232699939166196e": 52, "test_cas": [52, 58], "3191997974645346e": 52, "sentimentanalyz": 52, "sentiment_analyz": 52, "nlp_model": 52, "assetsmanag": 52, "lazy_load": 52, "remot": [52, 53, 66], "asset": [52, 59], "988200114690699e": 52, "depend": [52, 56, 58], "00894871700074873": 52, "751099964370951e": 52, "006440052002290031": 52, "model_collect": 52, "subject": [52, 54], "techniqu": [52, 54, 59], "pca": [52, 54], "complic": [52, 60, 62], "lucikili": 52, "load_credit": 52, "defaut": 52, "princip": 52, "pc_1": 52, "pc_2": 52, "equival": [45, 47, 52, 54, 56, 58], "sensit": 52, "varianc": [52, 59], "elimin": [45, 48, 52, 53, 58, 63, 66, 73], "Then": [50, 52, 63, 68, 73], "featureimport": 52, "decisiontreeclassifi": [52, 60, 64], "load_occup": 52, "viz": 52, "seem": [52, 59], "light": [52, 60, 68], "co2": 52, "temperatur": [51, 52, 60, 62, 73], "hyperparamet": [52, 60], "neither": 52, "nor": 52, "loader": 52, "validation_curv": 52, "max_depth": [52, 60], "param_nam": 52, "param_rang": 52, "f1": 52, "higher": [52, 58, 59], "spot": 52, "decreas": [2, 52, 57, 63], "decid": [52, 65], "plot_decision_region": 52, "gridspec": 52, "ensembl": 52, "randomforestclassifi": [52, 58], "ensemblevoteclassifi": 52, "iris_data": 52, "clf1": 52, "clf2": 52, "clf3": 52, "eclf": 52, "vote": 52, "soft": [52, 54], "gs": 52, "fig": [52, 54, 59, 60], "lab": 52, "grd": 52, "forest": 52, "rbf": [2, 52, 59], "kernel": [2, 52, 64, 67], "subplot": [52, 59, 60], "legend": [52, 58, 59, 60], "wandb": 52, "monitor": [52, 53], "suit": 52, "eas": 52, "distribut": [59, 60, 67, 73], "label_col": 52, "to_fram": 52, "df_train": 52, "df_test": 52, "stratifi": 52, "rf_clf": 52, "ds_train": 52, "cat_featur": [52, 58], "ds_test": 52, "full_suit": 52, "suite_result": 52, "1mwandb": 52, "33mkhuyentran1401": 52, "relogin": 52, "forc": [52, 59, 65, 73], "to_wandb": 52, "local": [52, 54, 56, 57, 59, 65, 67, 68, 73], "chapter5": [52, 58], "20220314_094658": 52, "1yf63l3g": 52, "sync": [52, 68], "mud": 52, "mouss": 52, "ai": [52, 68], "1yf63l3gsync": 52, "109": 52, "artifact": 52, "minor": 52, "randomoversampl": 52, "linearsvc": 52, "n_inform": 52, "n_repeat": 52, "n_class": 52, "imblearn": 52, "over_sampl": 52, "ro": 52, "x_resampl": 52, "y_resampl": 52, "fit_resampl": 52, "ax0": 52, "ax1": 52, "nrow": [52, 59], "ncol": [52, 59], "sharei": 52, "xi": 52, "yi": 52, "resampl": 52, "mapieregressor": 52, "regressor": 52, "make_regress": 52, "nois": 52, "alpha": [52, 59, 67], "y_pi": 52, "regression_coverage_scor": 52, "coverage_scor": 52, "enumer": 52, "scatter": [52, 55, 60], "c1": [], "argsort": [52, 54], "ls": [52, 58, 60], "fill_between": [52, 59], "ravel": [52, 57], "forecast": 52, "massiv": 52, "distributedmlforecast": 52, "dask": 52, "lgb": 52, "dasklgbmforecast": 52, "target_transform": [52, 59], "series_ddf": 52, "fcst": [52, 59], "lag": [52, 59], "hash": 52, "diabet": 52, "load_diabet": 52, "linear": 52, "render": [52, 60], "nbviewer": 52, "linearregressionlinearregress": 52, "dump": [2, 52, 55, 59], "diabetes_model": 52, "sample_data": 52, "mlemmodel": 52, "rev": [52, 64, 73], "uri": 52, "project_uri": 52, "fs": 52, "fsspec": [52, 65], "localfilesystem": 52, "0x16b631430": 52, "localartifact": 52, "563": [52, 59], "c57e456e8a0768326655a8b52cde4f47": 52, "__root__": 52, "installablerequir": 52, "package_nam": 52, "extra_index": 52, "source_url": 52, "vc": 52, "vcs_commit": 52, "processors_cach": 52, "sklearnmodel": 52, "simplepickleio": 52, "signatur": [52, 55, 67], "numpyndarraytyp": 52, "kw_onli": 52, "vararg": 52, "varargs_typ": 52, "varkw": 52, "varkw_typ": 52, "call_ord": 52, "object_typ": 52, "ndarrai": [52, 62], "init": [53, 59, 65, 66], "gdrive": 53, "lynnbbt": 53, "4j0ida0ekyqqzzbc93juuuubvh": 53, "pull": [53, 68], "checkout": [53, 66], "characterist": [53, 58, 60], "graph": [53, 59, 60, 65, 67], "sv": [53, 58], "show_html": 53, "valuabl": [53, 66], "quantiti": [47, 53, 54, 56, 58], "prof_view": 53, "prof_df": 53, "est": 53, "lower_1": 53, "upper_1": 53, "inf": [53, 59], "frequent_item": 53, "frequent_str": 53, "boolean": [53, 54], "tensor": 52, "00015": 53, "frequentitem": 53, "summarytyp": 53, "q_01": 53, "q_05": 53, "q_10": 53, "q_25": 53, "q_75": 53, "q_90": 53, "q_95": 53, "q_99": 53, "stddev": [53, 58], "cloud": [53, 76], "boilerpl": [53, 58, 63], "ssh": 53, "iter": [52, 53, 58, 59, 62, 67, 74], "who": [53, 54, 57], "interact": [52, 53, 55, 58, 59, 67], "auth": 53, "remoteauth": 53, "awsauth": 53, "authent": 53, "rmt_auth": 53, "from_password": 53, "aw": [53, 54], "aws_auth": 53, "aws_access_key_id": 53, "aws_access_kei": 53, "aws_secret_access_kei": 53, "aws_secret_kei": 53, "remotedir": 53, "awss3dir": 53, "rmt_dir": 53, "bucket": 53, "create_if_miss": 53, "aws_dir": 53, "transfer_to": 53, "dst": [53, 67], "recurs": [53, 62], "noun": 54, "phrase": [51, 54], "spell": 54, "download_corpora": 54, "word_count": 54, "defaultdict": 54, "beuti": 54, "mlxtend": 54, "generalize_nam": 54, "tran": [54, 74], "firstname_output_lett": 54, "kh": 54, "dataquest": 54, "lex": 54, "rank": 54, "blog": 54, "kept": 54, "motiv": 54, "someth": [54, 58, 67, 68], "behind": [54, 56], "skill": [51, 54], "gain": [54, 59], "fundament": [54, 60, 68], "meetup": 54, "teach": 54, "learner": 54, "spaci": [54, 65], "streamlit": 54, "streamlit_app": 54, "en_core_web_sm": 54, "browser": [52, 54, 67, 68], "1mhttp": 54, "localhost": [54, 58], "8501": 54, "ic": [54, 62, 67], "frozen": [54, 57, 67], "sweeten": 54, "num2word": [], "nineteen": 54, "libari": [], "ordin": [54, 67], "nineteenth": 54, "ordinal_num": 54, "2019th": 54, "lang": 54, "vi": [54, 60, 68], "hai": 54, "ngh\u00ecn": 54, "l\u1ebb": 54, "m\u01b0\u1eddi": 54, "ch\u00edn": 54, "es": 54, "mil": 54, "diecinuev": 54, "punctuat": 54, "stopword": 54, "hero": 54, "duck": [54, 58, 67], "pond": 54, "nltk_data": 54, "unzip": 54, "corpora": 54, "pipelin": [2, 47, 54, 58, 59, 62, 68, 73], "chain": [54, 56, 62], "remove_punctu": 54, "remove_stopword": 54, "remove_whitespac": 54, "gdown": 54, "cnn": 54, "kaggl": 54, "uc": [54, 55], "1qpgcz8mud5ptt8qjr79xq6koqnjut": 54, "4d": 54, "small_cnn": 54, "tfidf": 54, "scatterplot": [54, 60], "1000x300": 54, "appear": 54, "word_frequ": 54, "eat": [54, 60], "000135": 54, "0537": 54, "barplot": 54, "_decor": 54, "valid": [2, 47, 54, 60, 63, 64, 67], "misinterpret": 54, "newspap": 54, "mathdatasimplifi": [54, 62, 68], "dbt": 54, "publish_d": 54, "top_imag": 54, "wp": 54, "upload": [54, 55], "con": 54, "png": [54, 60], "dbtyou": 54, "warehous": 54, "snapshot": [54, 59], "cleans": 54, "property_typ": 54, "ramsrigouthamg": 54, "boudinfl": 54, "pke": 54, "universal_tagset": 54, "explos": 54, "sense2vec": 54, "s2v_reddit_2015_md": 54, "tar": [54, 67], "gz": [54, 67], "xvf": 54, "pprint": 54, "payload": 54, "weather": 54, "went": 54, "walk": [54, 58, 59, 60], "chat": 54, "neighbor": [54, 59, 64], "labrador": 54, "qe": 54, "boolqgen": 54, "predict_boolq": 54, "neighborhood": 54, "faq": 54, "qg": 54, "predict_shortq": 54, "wordninja": 54, "surpris": 54, "honeyinthejar": 54, "honei": 54, "ihavetwoappl": 54, "aratherblusterdai": 54, "bluster": 54, "automated_readability_index": 54, "ari": 54, "grade": [6, 54], "10th": 54, "11th": 54, "consciou": 54, "psychologist": 54, "marvel": 54, "acquir": [54, 57], "perfect": [54, 68], "pronunci": 54, "recogn": 54, "face": 54, "reading_tim": 54, "ms_per_char": 54, "fuzz": 54, "indel": 54, "tomorrow": 54, "tommorrow": 54, "24561403508771": 54, "54545454545454": 54, "token_sort_ratio": 54, "torch": [53, 54, 59], "negat": 54, "templat": 54, "po": [54, 58], "war": 54, "window": 54, "facebook": 54, "closur": 54, "tpp": 54, "jointli": 54, "vector": [52, 54, 60], "wordcloud": 54, "to_list": 54, "293": 54, "pre": [52, 54, 62, 64, 67, 73], "285": 54, "joint": 54, "023": 54, "dens": [52, 54], "656": [54, 68], "get_num_top": 54, "topic_word": 54, "word_scor": 54, "topic_num": 54, "get_top": 54, "semant": [], "cosin": 54, "generate_topic_wordcloud": 54, "plural_noun": 54, "he": 54, "plural_verb": 54, "feminin": 54, "singular_noun": 54, "compare_verb": 54, "fruit1": 54, "fruit2": 54, "keywordprocessor": 54, "kw_processor": [], "kw_dict": [], "chief": [], "add_keywords_from_dict": [], "keyword_dict": [], "fluent": [], "extract_keyword": [], "preprocessor": [48, 52, 54], "textpreprocessor": 54, "socialtoken": 54, "emoticon": 54, "text_processor": 54, "allcap": 54, "elong": 54, "emphasi": 54, "censor": 54, "corpu": 54, "unpack_hashtag": 54, "unpack_contract": 54, "unpack": 54, "spell_correct_elong": 54, "lowercas": [54, 67], "emoji": 54, "coolyazzy94": 54, "retweeeet": 54, "suck": 54, "haha": 54, "7rdymcvpkx": 54, "pre_process_doc": 54, "1gram": 54, "2gram": 54, "retweet": 54, "tong": 54, "chromadb": 54, "reli": [54, 58], "sole": 54, "translat": [45, 54, 67], "get_or_create_collect": 54, "man": [51, 54], "noodl": 54, "carri": 54, "babi": 54, "ride": 54, "query_result": 54, "query_text": 54, "pasta": 54, "n_result": 54, "5690374970436096": 54, "5929027199745178": 54, "chart": [54, 55], "bokeh": 55, "altair": 55, "dp": 55, "gapmind": 55, "gdppercap": 55, "lifeexp": 55, "pop": 55, "hover_nam": 55, "log_x": 55, "size_max": 55, "datat": 55, "successfulli": [54, 55, 65, 67, 73], "yourfileid": 55, "1ji1cmxqnwsmc": 55, "vbl8dny6b4anbtbbky3": 55, "120mb": 55, "1mb": 55, "concis": [15, 31, 55, 56, 63], "transmiss": 55, "reconstruct": 55, "serd": 55, "from_json": 55, "to_json": [55, 63], "from_yaml": 55, "to_yaml": 55, "nname": [55, 63], "malici": [53, 55, 68], "safeti": 55, "verifi": [55, 56], "tamper": 55, "urlsafeseri": 55, "auth_": 55, "eyjpzci6nswibmftzsi6imtodxllbnryyw4ifq": 55, "3cqlkhp1myeus8jnqmgv_mbrxsq": 55, "secret": [55, 66], "int8": 57, "float32": 57, "20640": 57, "fetch_california_h": [52, 57, 60], "scipi": [52, 57], "boxcox1p": 57, "pandas_appli": 57, "averoom": [52, 57], "swifter_appli": 57, "num_experi": 57, "swifter_tim": 57, "pandas_vs_swift": 57, "cprofil": 57, "cprofilers_exampl": 57, "246355": 57, "240252": 57, "primit": 57, "311": 57, "ncall": 57, "tottim": 57, "percal": 57, "cumtim": 57, "lineno": [57, 67], "__array_function__": 57, "copyto": 57, "ndim": 57, "prod": 57, "importlib": 57, "_bootstrap": 57, "1002": [56, 57], "_gcd_import": 57, "610": [57, 68], "353": 57, "1017": 57, "_handle_fromlist": 57, "1208": 57, "002": [57, 59], "527": [54, 57, 59], "004": 57, "147": [57, 68], "__enter__": 57, "151": [57, 68], "__exit__": [57, 68], "003": 57, "157": [57, 68], "_get_module_lock": 57, "524": [57, 67], "681": [57, 59], "194": [57, 59], "_lock_unlock_modul": 57, "310": [57, 59], "211": 57, "_call_with_frames_remov": 57, "4196": 57, "_verbose_messag": 57, "232": 57, "_requires_builtin_wrapp": 57, "521": [57, 59], "342": 57, "406": [57, 63], "_new_modul": 57, "880": 57, "005": [57, 58], "376": 57, "cach": [57, 67], "727": 57, "389": [57, 68], "498": [57, 59], "397": 57, "has_loc": 57, "spec_from_load": 57, "009": 57, "477": 57, "_init_module_attr": 57, "495": [57, 59], "549": [57, 59, 67], "module_from_spec": 57, "650": 57, "_load_unlock": 57, "520": 57, "725": 57, "find_spec": 57, "746": [57, 59], "create_modul": 57, "754": 57, "exec_modul": 57, "771": 57, "is_packag": 57, "497": [57, 67], "1530": 57, "863": 57, "867": [57, 68], "890": [57, 59], "_find_spec": 57, "937": [57, 68], "_sanity_check": 57, "956": 57, "_find_and_load_unlock": 57, "986": 57, "_find_and_load": 57, "_bootstrap_extern": 57, "1004": [56, 57], "1029": 57, "get_filenam": 57, "011": 57, "1034": 57, "1075": 57, "path_stat": 57, "1153": 57, "021": 57, "1164": 57, "058": 57, "1172": 57, "3858": 57, "006": 57, "_path_join": 57, "listcomp": 57, "812": 57, "_path_split": 57, "1624": 57, "genexpr": 57, "1317": 57, "_path_hook": 57, "820": 57, "1330": 57, "_path_importer_cach": 57, "007": 57, "_path_stat": 57, "026": 57, "1367": 57, "_get_spec": 57, "1399": 57, "704": [57, 59], "_path_is_mode_typ": 57, "1459": 57, "1465": 57, "474": [57, 59], "1493": 57, "733": [57, 68], "022": [57, 68], "1498": 57, "651": 57, "154": [57, 68], "_path_isfil": 57, "1549": 57, "_fill_cach": 57, "159": 57, "_path_isdir": 57, "1590": 57, "path_hook_for_filefind": 57, "pyinstrument_exampl": 57, "__": [57, 63], "durat": [24, 57, 58, 59, 60], "v4": 57, "31m0": [57, 58], "24m": 57, "15m": 57, "2mpyinstrument_exampl": 57, "2mpanda": 57, "4416": 57, "346": 57, "15mis_even": 57, "new_method": 57, "mod": [57, 59], "2m": [57, 65], "225": 57, "265": 57, "897": 57, "runpi": [57, 67], "_run_cod": [57, 67], "2mrunpi": 57, "textwrap": 57, "prev": 57, "15t09": 57, "restaur": [51, 57], "cook": [50, 57], "waiter": 57, "stove": 57, "sequenti": 57, "shout": 57, "count_to": 57, "highest_numb": 57, "sy": [57, 58, 60], "wall": 57, "submit": [57, 62, 67, 76], "862": 57, "manul": 57, "flow_run": [57, 68], "58a68b34": 57, "713": 57, "776": 57, "781": 57, "824": 57, "829": 57, "837": 57, "848": 57, "850": 57, "task_run": [57, 68], "043": 57, "062": 57, "daunt": [56, 57], "hardwar": 57, "facilit": 57, "costli": 57, "resourc": [57, 64, 74], "forget": [58, 64], "describ": [58, 73], "intention": 58, "idea": 58, "calculate_averag": 58, "todo": [58, 64], "test_calculate_average_two_num": 58, "Will": 58, "test_calculate_average_empty_list": 58, "unclear": 58, "misunderstand": 58, "contain_word": 58, "test_contain_word_1": 58, "test_contain_word_2": 58, "cowork": 58, "test_contain_word_exact": 58, "test_contain_word_different_cas": 58, "pytest_benchmark_exampl": 58, "list_comprehens": 58, "len_list": 58, "test_concat": 58, "linux": [58, 68, 73], "pluggi": [58, 73], "timer": 58, "perf_count": 58, "disable_gc": 58, "min_round": 58, "min_tim": 58, "000005": 58, "max_tim": 58, "calibration_precis": 58, "warmup": 58, "warmup_iter": 58, "rootdir": [58, 73], "hydra": [58, 73], "faker": 58, "anyio": [58, 68, 73], "32m": [56, 58, 65, 67, 73], "iqr": 58, "mop": 58, "286": 58, "4501": 58, "745": [58, 59], "5498": 58, "3872": 58, "6583": 58, "297": 58, "5001": 58, "3500": 58, "2686": 58, "5843": 58, "2322": 58, "162101": 58, "interquartil": 58, "1st": 58, "quartil": 58, "3rd": 58, "1m1": [58, 65, 73], "pytest_parametr": 58, "text_contain_word": 58, "noth": [58, 62], "test_text_contain_word": 58, "darwin": [58, 73], "bin": [58, 60, 65], "cachedir": 58, "pytest_cach": 58, "32mpass": 58, "1m2": [58, 65], "n2": [58, 59], "perc_differ": 58, "test_is_float": 58, "pytest_combin": 58, "directorybasedexampledatabas": 58, "typeguard": [58, 73], "1m4": 58, "pytest_without_id": 58, "1m3": 58, "pytest_id": 58, "pytest_param": 58, "1mcollect": 58, "pytest_fixtur": 58, "extract_senti": 58, "sentimetn": 58, "example_data": 58, "test_extract_senti": 58, "my_data": 58, "test_divis": 58, "test_modulu": 58, "modulu": 58, "scope": 58, "pytest_scop": 58, "pytest_skip": 58, "add_two": 58, "version_info": 58, "reason": 58, "eequir": 58, "test_add_two": 58, "33mskip": 58, "marker": [58, 60], "pytest_mark_xfail": 58, "divide_two_num": [], "test_divide_by_zero": [], "33mx": 58, "caplog": 58, "test_log": 58, "getlogg": 58, "logger": [58, 67], "test_divide_by_0": 58, "rare": 58, "writfil": 58, "pytest_repeat_exampl": 58, "generate_numb": 58, "test_generate_numb": 58, "1m100": 58, "frustrat": 58, "pytest_sugar_exampl": 58, "test_benchmark_exampl": 58, "test_parametr": 58, "test_fixtur": 58, "test_repeat_exampl": 58, "1mtest": 58, "36mpytest_sugar_exampl": 58, "0mtest_benchmark_exampl": 58, "32m1": [58, 65, 73], "40m": 58, "0mtest_fixtur": 58, "32m2": [58, 65], "0mtest_parametr": 58, "32m4": 58, "0mtest_repeat_exampl": 58, "32m23": 58, "32m42": 58, "32m62": 58, "32m81": 58, "32m100": 58, "302": 58, "8003": 58, "328": 58, "2844": 58, "9087": 58, "321": [58, 62], "5999": 58, "2495": 58, "866": [58, 68], "2220": 58, "0461": 58, "90868": 58, "104": [58, 62], "pytest_step": 58, "sum_test": 58, "average_2_num": 58, "steps_data": 58, "test_step": 58, "perc_difference_test": 58, "test_calc_suit": 58, "test_pick": 58, "plus_on": [56, 58, 67], "test_plus_on": 58, "branch": [58, 63], "untrack": 58, "31mtest_pick": 58, "repetit": [58, 68], "get_dog": 58, "test_get_dog": 58, "unittest": [], "testdog": 58, "testcas": 58, "test_walk": 58, "test_bark": 58, "constantli": 58, "verif": 58, "test_freezegun": 58, "freeze_tim": 58, "get_day_of_week": 58, "test_get_day_of_week": 58, "succe": 58, "patch": [58, 60], "connectionerror": 58, "5432": 58, "test_get_data_fail": 58, "mock_get": 58, "side_effect": 58, "test_get_data_succe": 58, "return_valu": 58, "properli": 58, "save_result": 58, "test_pyfakef": [], "file_nam": 58, "test_save_result": 58, "my_fil": 58, "create_dir": [], "poor": [58, 59], "reliabl": [51, 58], "available_fruit": 58, "nearby_stor": 58, "pa": 58, "dataframeschema": 58, "isin": 58, "less_than": [24, 58], "schemaerror": 58, "wise": 58, "failure_cas": 58, "check_input": 58, "get_total_pric": 58, "abbrevi": [58, 67], "price1": 58, "values_chang": 58, "new_valu": 58, "old_valu": 58, "ignore_ord": 58, "experience1": 58, "experience2": 58, "exclude_path": 58, "cmpare": 58, "259": 58, "significant_digit": 58, "dirty_equ": 58, "isnow": 58, "ispartialdict": 58, "islist": 58, "isstr": 58, "istruelik": 58, "timedelta": [58, 59, 67], "shop": 58, "is_mal": 58, "check_ord": 58, "scenario": [15, 52, 58, 59], "against": [56, 58, 60, 65, 73], "commut": 58, "test_hypothesi": 58, "test_floats_are_commut": 58, "37m": [58, 73], "00m": [58, 73], "94mdef": [58, 73], "92mtest_floats_are_commut": 58, "31mtest_hypothesi": 58, "94massert": [58, 73], "31me": [58, 73], "falsifi": [], "saw": [58, 62], "signal": [58, 68], "36m": [58, 67], "0mtest_hypothesi": 58, "31m": [58, 67, 73], "31m100": 58, "31mtest_floats_are_commut": 58, "robust": 58, "categorymismatchtraintest": 58, "new_categori": 58, "train_d": 58, "test_d": 58, "testfind": 58, "percent": [58, 63], "mislabel": 58, "conflictinglabel": 58, "recommend": [54, 58], "categorical_list": 58, "were": [6, 54, 58, 68], "therefor": [48, 58], "heurist": 58, "establish": 58, "phish": 58, "load_data": 58, "load_fitted_model": 58, "train_dataset": 58, "test_dataset": 58, "columntransform": [48, 52, 58], "simpleimput": [48, 52, 58], "urllength": 58, "numdigit": 58, "numparam": 58, "num_": 58, "entropi": 58, "hashttp": 58, "dsr": 58, "dse": 58, "bodylength": 58, "numtitl": 58, "numimag": 58, "numlink": 58, "specialchar": 58, "scriptlength": 58, "sbr": 58, "bscr": 58, "sscr": 58, "imput": [48, 52, 58], "most_frequ": [48, 58], "onehotencod": [48, 52, 58], "ext": 58, "criterion": 58, "simplemodelcomparison": 58, "minmaxscal": 58, "feature_rang": 58, "scaled_data": 58, "invers": 58, "original_data": 58, "inverse_transform": 58, "restor": 58, "crucial": [58, 59, 60], "assess": 58, "launch": [51, 58, 76], "popul": [52, 58, 66], "rate": [58, 59, 60, 73], "ab_test": 58, "lesampl": 58, "conversion_r": 58, "min_detectable_effect": 58, "get_size_per_vari": 58, "20177": 58, "reach": [58, 68], "ledataset": 58, "samplelesuccess": 58, "lesuccess": 58, "confidence_level": 58, "get_verdict": 58, "cleanup": 58, "addition": [48, 56, 58], "isol": 58, "test_postgr": 58, "test_query_result": 58, "cur": 58, "test_tabl": 58, "serial": [2, 45, 58, 59], "varchar": [45, 58], "alic": [32, 45, 58], "fetchal": 58, "dash": 58, "obsolet": 58, "evolv": [58, 73], "formula": 58, "testmod": 58, "ok": [2, 58], "relev": [47, 58], "criteria": 58, "fact": [58, 63], "test_chatbot": 58, "factual_consist": 58, "factualconsistencymetr": 58, "llmtestcas": 58, "run_test": 58, "assert_test": 58, "shoe": 58, "elig": 58, "refund": 58, "actual_output": 58, "factual_consistency_metr": 58, "minimum_scor": 58, "2kdownload": 58, "factualconsistencymodel": 58, "th": 58, "1a": [58, 65], "2k": [58, 65], "0mrun": 58, "teardown": 58, "sessionfinish": 58, "slowest": 58, "vv": 58, "3m": 58, "1mpass": 58, "1mfailur": 58, "1msuccess": 58, "factual": 58, "9911543130874634": 58, "find_dat": 59, "17th": 59, "00am": 59, "hope": 59, "realli": 59, "dayofweek": 59, "dayofyear": 59, "is_month_end": 59, "is_month_start": 59, "is_quarter_end": 59, "is_quarter_start": 59, "is_year_end": 59, "is_year_start": 59, "date_str": 59, "quit": 59, "inconveni": [59, 63], "423992": 59, "tzinfo": [59, 67], "utc": [59, 67], "cst": 59, "to_timezon": 59, "dsttzinfo": 59, "forgot": 59, "working_hour": 59, "timeseri": 59, "histogram": [59, 60], "16666666666666666": 59, "3333333333333333": 59, "166666666666666": 59, "confirm": 59, "us_holidai": 59, "unitedst": 59, "whatev": 59, "abl": [59, 66], "independ": [59, 60], "japan": 59, "us_cal": 59, "luther": 59, "king": 59, "jr": 59, "labor": 59, "columbu": 59, "veteran": 59, "thanksgiv": 59, "christma": 59, "is_working_dai": 59, "get_working_days_delta": 59, "ja_cal": 59, "foundat": 59, "emperor": 59, "vernal": 59, "equinox": 59, "showa": 59, "constitut": 59, "greeneri": 59, "marin": 59, "mountain": 59, "respect": [48, 59, 68, 73], "autumn": 59, "sport": 59, "labour": 59, "load_wineind": 59, "train_siz": 59, "150": [47, 59, 68, 74], "auto_arima": 59, "blue": [59, 63], "sunspot": 59, "boxcoxendogtransform": 59, "load_sunspot": 59, "2700": 59, "boxcox": 59, "lmbda2": 59, "autoarima": 59, "suppress_warn": 59, "rb": [2, 59], "stepwis": 59, "minim": [59, 63], "aic": 59, "10383": 59, "210": [59, 62], "10020": 59, "218": 59, "9831": 59, "422": 59, "10381": 59, "212": 59, "9830": 59, "357": 59, "9817": 59, "480": 59, "508": 59, "413": 59, "996": 59, "9820": 59, "047": 59, "213": [59, 67], "896": 59, "9818": 59, "625": 59, "10385": 59, "9816": 59, "628": 59, "710": 59, "722": [52, 59], "9813": 59, "247": [59, 68], "9819": 59, "401": 59, "9834": 59, "327": 59, "9815": 59, "242": [54, 59, 68], "236": [59, 68], "564": 59, "9811": 59, "253": 59, "230": 59, "9814": 59, "636": 59, "409": 59, "9832": 59, "334": 59, "248": 59, "055": 59, "546": 59, "878": 59, "73630214": 59, "72738664": 59, "33806937": 59, "97670263": 59, "94336951": 59, "27600697": 59, "76335004": 59, "06207145": 59, "18910652": 59, "76778119": 59, "01474934": 59, "41947969": 59, "57286429": 59, "30950555": 59, "63971231": 59, "nicer": 60, "customiz": 60, "set_them": 60, "node": [56, 60], "ab": [56, 60], "bc": 60, "data_science_flowchart": 60, "5236": 60, "122": 60, "6750": 60, "tooltip": 60, "3288": 60, "6625": 60, "popup": 60, "mt": 60, "hood": 60, "meadow": 60, "add_to": 60, "repositori": 60, "wine": 60, "classifi": [48, 59, 60], "target_nam": 60, "wine_typ": 60, "feature_nam": 60, "tune": [52, 54, 60], "hip": 60, "lr": [52, 60], "r2": 60, "sgd": 60, "adam": 60, "from_iter": 60, "javascript": [60, 62, 68], "ipythonexperimentdisplai": 60, "0x10b683730": 60, "strongli": 60, "presenc": 60, "soybean": 60, "_openml": 60, "404": 60, "msno": 60, "dendrogram": 60, "hierarch": 60, "cluster": [2, 52, 54, 60], "nulliti": 60, "fulli": 60, "discolor": 60, "germin": 60, "draw": 60, "matplotlib_venn": 60, "venn2": 60, "set_label": 60, "healthi": [54, 60], "group1": 60, "group2": 60, "cicl": 60, "venn3": 60, "rectangl": 60, "ds": [54, 59, 60], "da": [54, 60], "off": [60, 67], "mass": 60, "inlin": 60, "rc": [], "read_tabl": 60, "susanli2016": 60, "fruit_data_with_color": 60, "fruit_label": 60, "fruit_nam": 60, "fruit_subtyp": 60, "color_scor": 60, "granny_smith": 60, "180": [59, 60], "mandarin": 60, "84": [60, 63], "braeburn": 60, "172": 60, "pairplot": 60, "axisgrid": [], "pairgrid": [], "0x7f30a3be1a30": [], "distinct": [59, 60], "pairwis": [54, 60], "scaled_featur": 60, "lastli": 60, "embed": 60, "color_palett": [], "gca": [], "set_aspect": [], "datalim": [], "fontsiz": [52, 59], "degrad": 60, "dashboard": 60, "tab": [60, 67], "datadrifttab": 60, "california_data_drift_report": 60, "column_map": 60, "classdiagram": 60, "is_mamm": 60, "is_pet": 60, "fur_color": 60, "scale_color": 60, "swim": 60, "logic": [6, 60, 64], "td": 60, "feel": [60, 76], "sick": 60, "doctor": 60, "dress": 60, "confusion_matrix": [60, 64], "prettier": 60, "pretty_confusion_matrix": 60, "pp_matrix_from_data": 60, "purd": 60, "dark": 60, "dracula": 60, "radii": 60, "aura": 60, "ayu": 60, "challenger_deep": 60, "duft": 60, "dufte_bar": 60, "duftifi": 60, "gruvbox": 60, "nord": 60, "onedark": 60, "pacoti": 60, "pitaya_smoothi": 60, "solar": 60, "tab10": [59, 60], "tab20": 60, "tab20r": 60, "tokyo_night": 60, "edece": 60, "edgecolor": 60, "facecolor": 60, "15141b": 60, "labelcolor": 60, "xtick": [52, 60], "ytick": [52, 60], "framealpha": 60, "savefig": 60, "boxplot": 60, "boxprop": 60, "capprop": 60, "flierprop": 60, "markeredgecolor": 60, "whiskerprop": 60, "prop_cycl": 60, "cycler": 60, "82e2ff": 60, "ffca85": 60, "61ffca": 60, "ff6767": 60, "a277ff": 60, "f694ff": 60, "6d6d6d": 60, "nbextens": 60, "prefix": [60, 67], "widgetsnbextens": 60, "32mok": 60, "js": [60, 68], "depict": 60, "sankeywidget": 60, "anna": 60, "chicago": 60, "jose": 60, "milwauke": 60, "bussi": 60, "trip": [59, 60], "famili": [52, 60], "visit": [24, 59, 60], "vacat": 60, "to_dict": 60, "auto_save_png": 60, "audienc": 60, "transit": [59, 60], "coupl": 60, "lai": 60, "egg": [60, 66], "airborn": 60, "zoo": 60, "data_id": 60, "965": [60, 68], "add_data_fram": 60, "640px": 60, "360px": 60, "penguin": 60, "adeli": 60, "ipyvizzustori": 60, "slide": 60, "slide1": 60, "add_slid": 60, "slide2": 60, "suggest": [52, 60, 73], "statannot": 60, "wonder": 60, "test_ind": 60, "apply_and_annot": 60, "00e": 60, "vs": [54, 60], "p_val": 60, "507e": 60, "643e": 60, "508e": 60, "874e": 60, "171": 60, "880e": 60, "adjusttext": 60, "plot_text": 60, "bo": 60, "va": 60, "adjust_text": 60, "chicken": [60, 62], "growth": 60, "chart_typ": 60, "progress": [60, 68], "paper": 60, "x_valu": 60, "y1_valu": 60, "randn": [60, 65], "y2_valu": 60, "y3_valu": 60, "colors10": 60, "colors5": 60, "timestamp": [60, 67], "378": 60, "dpi": 60, "set_xlim": 60, "set_ylim": 60, "set_xtick": 60, "set_ytick": 60, "strftime": [45, 58, 60, 67, 73], "set_yticklabel": 60, "n10": 60, "nhour": 60, "yellowbrick": 60, "countvector": 60, "freqdistvisu": 60, "fetch_20newsgroup": [54, 60], "newsgroups_train": 60, "feature_extract": 60, "stop_word": 60, "get_feature_nam": 60, "openstreetmap": 60, "stad": 60, "van": 60, "zon": 60, "heerhugowaard": 60, "netherland": 60, "vm": 60, "iri": 60, "scatter_chart": 60, "sepal_length": 60, "petal_width": 60, "hist_chart": 60, "sepal_width": 60, "dropdown": [60, 66], "necessarili": [61, 74], "food_box": 62, "time_func_complex": 62, "end_tim": 62, "test_func_complex": 62, "time_func_simpl": 62, "test_func_simpl": 62, "regex": [59, 62], "anybutwhitespac": 62, "quantifi": [54, 59, 62], "oneormor": 62, "any_but_spac": 62, "optional_schem": 62, "get_pattern": 62, "get_match": 62, "deer": 62, "varieti": [50, 59, 62], "fav_food": 62, "temp": 62, "temps_f": 62, "degc": 62, "degf": 62, "celsiu": 62, "fahrenheit": 62, "unyt_arrai": 62, "572": 62, "synchron": [62, 66, 68], "sync_map": 62, "async_map": 62, "copper": 62, "spong": 62, "async": [62, 68], "3c3112ef": 62, "191": 62, "208": 62, "362": [62, 68], "380": 62, "685": 62, "persistedresult": [62, 68], "serializer_typ": [62, 68], "storage_block_id": [62, 68], "45e1a1fc": 62, "bdc8": 62, "4f8d": 62, "8945": 62, "287d12b46d33": 62, "storage_kei": [62, 68], "ad7912161ab44a6d8359f8089a16202d": 62, "fe83574cd0df4fc5838ef902beb34f6b": 62, "ba18fe9c568845ecbad03c25df353655": 62, "orchestr": [62, 68], "tutori": [62, 63, 67, 68], "basic": [15, 62, 67, 68, 74], "delet": [63, 66], "symbol": [6, 63, 65], "strip_interact": 63, "run_interact": 63, "clean_cod": 63, "termcolor": 63, "cprint": 63, "figlet_format": 63, "___": 63, "slant": 63, "____": 63, "bell": [50, 63], "fire_exampl": 63, "get_mean": [58, 63, 64, 68], "get_modulo": 63, "typer_exampl": 63, "add_numb": [6, 63], "invalid": [2, 6, 15, 63, 68], "cyan": 63, "src": 63, "latexifi": 63, "with_latex": 63, "mathrm": 63, "triangleq": 63, "4ac": 63, "2a": [63, 65], "autoencod": 63, "manim": 63, "overwhelm": 64, "navig": [64, 66], "arrang": 64, "unsort": 64, "fl_score": 64, "classification_report": 64, "roc_curv": 64, "gridsearchcv": 64, "stratifiedkfold": 64, "naive_bay": 64, "gaussiannb": [52, 64], "multinomialnb": 64, "kneighborsclassifi": [52, 64], "timeseriessplit": 64, "name_of_your_fil": 64, "repo": [64, 66, 73], "timothycroslei": 64, "hook": [64, 73], "interrogate_exampl": 64, "plus_two": 64, "multiply_thre": 64, "mirror": [62, 64], "mypy_exampl": 64, "union": [64, 68], "get_name_pric": 64, "v0": [51, 64], "910": 64, "test_refurb": 64, "furb109": 64, "furb108": 64, "err": 64, "silenc": 64, "liter": [51, 64], "stick": 64, "dosisod": 64, "eradicate_test": 64, "wemak": 64, "validationerror": [24, 64], "basemodel": [24, 51, 64], "splitconfig": 64, "split_data": 64, "341": 64, "type_error": 64, "stack": [52, 64], "list_rang": 64, "setup": [52, 63, 64, 65, 67, 68], "n_rang": 64, "consumpt": 64, "memory_profiler_test": 64, "del": 64, "mprof": 64, "1s": [64, 65, 66], "202": 64, "152": [64, 68], "pose": [48, 52, 53, 59, 64], "difficulti": 64, "dead_cod": 64, "dataprocessor": 64, "clean_data": 64, "jendrikseipp": 64, "later": [52, 59, 64], "old_venv": 65, "new_venv": 65, "uninstal": 65, "jinja2": [65, 67], "redo": 65, "typer": 65, "htmlmin": 65, "phik": 65, "multimethod": 65, "tangl": 65, "unicod": 65, "vision": 65, "missingno": 65, "freez": [65, 73], "pyinstrument": 65, "pypi": [65, 73], "proxi": [65, 73], "http_proxi": [65, 73], "3128": [65, 73], "https_proxi": [65, 73], "1080": [65, 73], "charset": [65, 73], "savepath": [65, 73], "dynam": 65, "compat": [52, 59, 65, 67, 68], "pin": [65, 73], "flask": [65, 67], "top_github_scrap": 65, "scrape_repo": 65, "scrape_us": 65, "reqs1": 65, "datacommon": 65, "reqs2": 65, "cmpreq": 65, "suddenli": 65, "broke": 65, "36mpanda": 65, "36mnumpi": 65, "34mupdat": 65, "34mresolv": 65, "3s": 65, "34mwrite": 65, "lock": 65, "1mpackag": 65, "34m5": 65, "34m0": 65, "39minstal": 65, "36msix": 65, "39m": [65, 68], "34mpend": 65, "0j": 65, "34minstal": 65, "36mpython": 65, "dateutil": 65, "36mpytz": 65, "1m2021": 65, "3a": 65, "32m2021": 65, "pyproject": 65, "toml": 65, "earlier": 65, "1msolverproblemerror": 65, "1mbecaus": 65, "chapter6": 65, "puzzl": 65, "solver": 65, "1m241": 65, "36m_solv": 65, "2m237": 65, "39mresult": 65, "39mpackag": 65, "2m238": 65, "1mexcept": 65, "39moverrideneed": 65, "1ma": 65, "39me": 65, "2m239": 65, "1mreturn": 65, "1mself": [65, 67], "39msolve_in_compatibility_mod": 65, "39moverrid": 65, "39muse_latest": 65, "2m240": 65, "39msolvefailur": 65, "1mrais": 65, "39msolverproblemerror": 65, "2m242": 65, "2m243": 65, "1mdict": 65, "2m244": 65, "depth_first_search": 65, "2m245": 65, "packagenod": 65, "39m_packag": 65, "39maggregate_package_nod": 65, "34mname": 65, "34mversion": 65, "34mdescript": 65, "34mdepend": 65, "34m4": 65, "39mremov": 65, "34mremov": 65, "publish": 65, "onefil": 65, "spec": [52, 59, 65], "255826": 65, "038615": 65, "850358": 65, "318558": 65, "255311": 65, "618789": 65, "434642": 65, "474813": 65, "676099": 65, "662942": 65, "314174": 65, "142569": 65, "704812": 65, "095609": 65, "156275": 65, "999871": 65, "839902": 65, "366550": 65, "818387": 65, "512015": 65, "conveni": [47, 59, 65], "colleagu": 65, "your_local_fold": 66, "gh": 66, "fetch": [59, 66, 68], "mess": 66, "clone": 66, "highlight": [59, 66], "yournam": 66, "quick": 66, "hassl": 66, "compil": [50, 66, 73], "pr": 66, "outdat": 66, "pull_request": 66, "ubuntu": 66, "permiss": 66, "kanhari": 66, "env": [52, 66, 68, 73], "github_token": 66, "openai_api_kei": [51, 66, 73], "bytes_or_buff": 67, "capit": 67, "casefold": 67, "suitabl": 67, "caseless": 67, "fillchar": 67, "utf": 67, "strict": 67, "codec": 67, "endswith": 67, "suffix": 67, "expandtab": 67, "tabsiz": 67, "format_map": 67, "isalnum": 67, "isalpha": 67, "isascii": 67, "ascii": 67, "isdecim": 67, "isdigit": 67, "isidentifi": 67, "isnumer": 67, "isprint": 67, "printabl": 67, "isspac": 67, "istitl": 67, "ljust": 67, "justifi": 67, "lstrip": 67, "maketran": 67, "usabl": 67, "partit": [52, 56, 67], "rfind": 67, "rindex": 67, "rjust": 67, "rpartit": 67, "rsplit": 67, "maxsplit": 67, "delimit": 45, "rstrip": 67, "trail": 67, "splitlin": 67, "keepend": 67, "boundari": 67, "strip": [50, 67], "swapcas": 67, "titlecas": 67, "zfill": 67, "pad": 67, "edit_data": 67, "log_loc": 67, "1165738010": 67, "struggl": 67, "loguru_vs_log": 67, "logging_exampl": 67, "basicconfig": 67, "asctim": 67, "levelnam": 67, "funcnam": 67, "critic": 67, "802": [59, 67], "loguru_exampl": 67, "catch": [67, 68], "mean_squared_error": 67, "file_": 67, "evaluate_result": 67, "y_true": 67, "mean_square_err": 67, "root_mean_square_err": 67, "ipykernel_174022": 67, "1865479429": 67, "0x7f279588f430": 67, "0x7f27958bfca0": 67, "inner_f": 67, "0x7f27958bfb80": 67, "_regress": 67, "335": 67, "y_type": 67, "multioutput": 67, "_check_reg_target": 67, "0x7f27958b7af0": 67, "check_consistent_length": 67, "0x7f279676e040": 67, "319": 67, "icrecream": 67, "itself": [67, 73], "trace": 67, "alreadi": [54, 67, 68], "heat": [50, 67, 73], "headach": 67, "pyheat_exampl": 67, "ph": 67, "create_heatmap": 67, "show_heatmap": 67, "57aff36d5f6d": 67, "lego": 67, "sklego": 67, "pandas_util": 67, "log_step": 67, "print_fn": 67, "make_copi": 67, "drop_column": [29, 67], "encode_cat_vari": 67, "000239": 67, "n_ob": 67, "n_col": 67, "002117": 67, "003217": 67, "tqdm": [59, 60, 67], "arbitrari": [48, 53, 67], "example1": 67, "example2": 67, "task1": 67, "task2": 67, "my_flow": 67, "ui": 67, "wednesdai": 68, "get_incoming_data": 68, "train_model": 68, "retrain": 68, "run_pend": 68, "file_to_run": 68, "chime": 68, "listen": 68, "awai": [59, 68], "knock": 68, "email_send": 68, "recipient_email": 68, "your_email": 68, "your_second_email": 68, "adress": 68, "sender_email": 68, "grandma": 68, "s_email": 68, "gmail": 68, "train_your_nicest_model": 68, "your_nicest_paramet": 68, "slack": 68, "channel": [52, 68], "everybodi": 68, "sequenc": 68, "echo": 68, "virtual": [56, 68], "poetri": 68, "shell": [67, 68], "pull_data": 68, "dvc": [58, 68, 73], "install_al": 68, "customer_segment": 68, "md": [63, 68], "webbrows": 68, "open_new": 68, "explicitli": 68, "tediou": [67, 68], "star_script": 68, "square_root": 68, "deg_to_rad": 68, "radian": 68, "edit": 68, "earli": 68, "draft": 68, "effort": 68, "monkey_exampl": 68, "stub": 68, "meant": 68, "wifi": 68, "bulb": 68, "laptop": 68, "bedroom": 68, "bathroom": 68, "livingroom": 68, "run_process": 68, "cancel": [67, 68], "timeout_second": 68, "687": 68, "arrog": 68, "goshawk": 68, "979": 68, "e6feb297": 68, "982": 68, "561": 68, "exceed": 68, "timeout": 68, "1239": 68, "orchestrate_task_run": 68, "await": [67, 68], "run_sync": 68, "fn": [51, 68], "asyncutil": 68, "run_sync_in_interruptible_worker_thread": 68, "tg": 68, "start_soon": 68, "_backend": 68, "_asyncio": 68, "658": 68, "__aexit__": 68, "cancellederror": 68, "asyncio": [67, 68], "_core": 68, "_task": 68, "timeouterror": 68, "788": 68, "timedout": 68, "nasyncio": 68, "ndure": 68, "ntimeouterror": 68, "790": [59, 68], "orchestrate_flow_run": 68, "flow_cal": 68, "run_sync_in_worker_thread": 68, "to_thread": 68, "get_asynclib": 68, "3z": 68, "svlh9jv14ps3j6cc964tbjg40000gq": 68, "ipykernel_83306": 68, "3092424982": 68, "__call__": 68, "enter_task_run_engin": 68, "run_async_from_worker_thread": 68, "begin_run": 68, "from_thread": 68, "asynclib": 68, "run_async_from_thread": 68, "970": 68, "commandlinetool": 68, "framework": [48, 52, 53, 67, 68], "concurr": [47, 68], "_base": 68, "445": 68, "__get_result": 68, "390": 68, "_except": 68, "874": 68, "get_task_call_return_valu": 68, "_result": 68, "final_st": 68, "raise_on_failur": 68, "_get_state_result": 68, "get_state_except": 68, "wait_for": 68, "result_factori": 68, "interrupt": 68, "1234": 68, "1235": 68, "1236": 68, "timeout_scop": 68, "1237": 68, "1238": 68, "1241": 68, "exc": 68, "__fn": 68, "send_interrupt_to_thread": 68, "partial": 68, "capture_worker_thread_and_result": 68, "notset": 68, "taskgroup": 68, "exc_typ": 68, "exc_val": 68, "exc_tb": 68, "654": 68, "655": 68, "442": [59, 68], "return_st": 68, "438": 68, "get_call_paramet": 68, "440": 68, "return_typ": 68, "enter_flow_run_engine_from_flow_cal": 68, "443": 68, "444": [59, 68], "446": [54, 68], "447": 68, "in_async_main_thread": 68, "portal": 68, "153": 68, "start_blocking_port": 68, "156": 68, "283": 68, "blockingport": 68, "268": 68, "269": 68, "270": 68, "callabl": [48, 68], "coroutin": [67, 68], "t_retval": 68, "271": 68, "272": 68, "273": 68, "274": 68, "thread": [47, 67, 68], "275": 68, "281": 68, "start_task_soon": 68, "_state": 68, "388": 68, "391": 68, "392": 68, "cycl": [63, 68], "393": 68, "219": 68, "_call_func": 68, "216": [47, 68], "217": 68, "add_done_callback": 68, "callback": 68, "retval": 68, "220": 68, "_cancelled_exc_class": 68, "inject_cli": 68, "with_injected_cli": 68, "client_context": 68, "new_client": 68, "setdefault": 68, "create_then_begin_flow_run": 68, "235": 68, "238": 68, "get_state_result": 68, "backward": 68, "is_crash": 68, "is_fail": 68, "datadocu": 68, "result_from_state_with_data_docu": 68, "partial_flow_run_context": 68, "604": [59, 68], "605": [59, 68], "606": 68, "607": 68, "608": 68, "609": [59, 68], "612": [59, 68], "waited_for_task_run": 68, "wait_for_task_runs_and_report_crash": 68, "613": 68, "flow_run_context": 68, "task_run_futur": 68, "614": 68, "616": 68, "continu": [50, 68], "outcom": [59, 68], "capacitylimit": 68, "sniffio": 68, "current_async_library_cvar": 68, "936": 68, "queue": 68, "put_nowait": 68, "workerthread": 68, "865": 68, "baseexcept": 68, "868": 68, "869": 68, "356": 68, "358": 68, "363": 68, "364": 68, "task_runn": 68, "sequentialtaskrunn": 68, "365": 68, "366": 68, "367": 68, "731": 68, "732": 68, "isasync": 68, "736": 68, "737": [67, 68], "738": 68, "sync_port": 68, "runtimeerror": 68, "964": 68, "966": 68, "967": 68, "run_coroutine_threadsaf": 68, "968": [63, 68], "threadloc": 68, "969": 68, "extra_task_input": 68, "872": 68, "_wait": 68, "875": 68, "876": 68, "prefectfutur": 68, "1233": 68, "1242": 68, "failaftercontextmanag": 68, "116": 68, "_cancel_scop": 68, "117": 68, "cancel_cal": 68, "occasion": [50, 68], "retry_delay_second": 68, "flaky_funct": 68, "bald": 68, "caiman": 68, "906": 68, "8095224b": 68, "908": 68, "1449": 68, "ipykernel_36167": 68, "3817304312": 68, "awaitingretri": 68, "propos": 68, "569": [59, 68], "013": 68, "512": 68, "2c195477": 68, "a9d1": 68, "4b59": 68, "9a9e": 68, "80b00f96c464": 68, "84ff6378ce894b6fb1823e60b1d201b4": 68, "previou": [59, 62, 73], "icon": [73, 76], "corner": [73, 76], "latex": 73, "3x": 73, "papermil": 73, "tag": [59, 73], "parameter": 73, "magic": [], "load_ext": 73, "12t09": 73, "438535": 73, "cpython": 73, "gcc": 73, "x86_64": 73, "architectur": 73, "64bit": 73, "ivers": 73, "pipreqsnb": 73, "pipreq": 73, "scikit_learn": 73, "seppar": 73, "experiment": 73, "pytest": [24, 56, 73], "qq": [56, 73], "autoconfig": 73, "multiply_by_two": 73, "test_multiply_by_two": 73, "31mf": 73, "failur": 73, "1m_____________________________": 73, "sample1": 73, "expected1": 73, "______________________________": [58, 73], "33msampl": 73, "92mtest_multiply_by_two": 73, "56d7928444c9": 73, "tmpospmc1tm": 73, "isort": 73, "flake8": 73, "example_notebook": 73, "ipnb": 73, "reformat": [], "cell_1": 73, "f401": 73, "chapter7": 73, "rede": 73, "spread": 74, "awar": 74, "knowledg": 74, "bite": 74, "700": [59, 74], "mailbox": 74, "subscrib": 74, "wrote": 74, "100k": 74, "toward": 74, "500": [2, 56, 59, 63, 74], "mission": 74, "button": 76, "colab": 76, "subsequ": [45, 48, 59], "set_output": 48, "60000": 48, "70000": 48, "414214": 48, "neat": 51, "sk": 51, "dude": 51, "ness": 51, "dudeifi": 51, "bodi": [51, 67], "yo": 51, "functioncal": 51, "tea": [2, 51], "sweetness_percentag": 51, "create_milk_tea": 51, "boba": 51, "froth_milk": 51, "textur": 51, "foami": 51, "hot": [50, 51], "cold": 51, "froth": 51, "coffee_typ": 51, "configure_coffe": 51, "latt": 51, "pandas_on_spark": 56, "familiar": [47, 56], "ps": 56, "psdf": 56, "006482": [], "201401": [], "959126": [], "712733": [], "369599": [], "396453": [], "392501": [], "822455": [], "156499": [], "169058": [], "646378": [], "789393": [], "902216": [], "127352": [], "269125": [], "638909": [], "04922": [], "090836": [], "83575": [], "174097": [], "spark_data": 56, "numeric_featur": 48, "categorical_featur": 48, "numeric_transform": [48, 52], "categorical_transform": [48, 52], "sparse_output": 48, "verbose_feature_names_out": 48, "x_transform": 48, "cat1_a": 48, "cat1_b": 48, "cat1_c": 48, "cat2_x": 48, "cat2_i": 48, "cat2_z": 48, "791093": 48, "393167": 48, "707107": 48, "174741": 48, "266871": 48, "043685": 48, "wrong": 6, "calculate_grad": 6, "constraint": [24, 58], "test_processing_fn": 58, "in_rang": 58, "out_schema": 58, "add_column": 58, "val3": 58, "check_output": 58, "processing_fn": 58, "nullabl": 58, "spark": 52, "collabor": 52, "reduct": [52, 54], "linalg": 52, "maxit": 52, "regparam": 52, "model1": 52, "aggregationdepth": 52, "treeaggreg": 52, "elasticnetparam": 52, "elasticnet": 52, "penalti": 52, "binomi": 52, "multinomi": 52, "featurescol": 52, "fitintercept": 52, "labelcol": 52, "lowerboundsoncoeffici": 52, "coeffici": 52, "constrain": 52, "undefin": 52, "lowerboundsonintercept": 52, "beequal": 52, "oflass": 52, "maxblocksizeinmb": 52, "maximum": [52, 59], "predictioncol": 52, "probabilitycol": 52, "calibr": 52, "treat": [52, 56, 73], "rawpredictioncol": 52, "rawpredict": 52, "converg": 52, "toler": 52, "upperboundsoncoeffici": 52, "upperboundsonintercept": 52, "weightcol": 52, "0019392203169556147": 52, "9980607796830444": 52, "995731919571047": 52, "004268080428952992": 52, "01200463023637096": 52, "987995369763629": 52, "cond": 68, "time_of_week": 68, "file_exist": 68, "myfil": 68, "do_work": 68, "time_of_dai": 68, "do_hourly_at_night": 68, "weekli": 68, "mon": 68, "sat": 68, "do_twice_a_week": 68, "fill_dict": 29, "variant": 48, "skub": 48, "dedupl": 48, "duplic": [48, 56], "make_deduplication_data": 48, "duplicated_food": 48, "chocol": 48, "broccoli": 48, "jalapeno": 48, "zucchini": 48, "entries_per_exampl": 48, "300": [2, 47, 48, 52, 56], "prob_mistake_per_lett": 48, "letter": 48, "cgocol": 48, "chqcolat": 48, "chocoltt": 48, "most_common": 48, "195": [48, 67], "jalaoeno": 48, "chocdlat": 48, "ehocol": 48, "chocolatw": 48, "brocroli": 48, "brojcoli": 48, "broccsli": 48, "broccqli": 48, "bxoccoli": 48, "sroccoli": 48, "brzccoli": 48, "jylapeno": 48, "jalaponi": 48, "closest": 48, "deduplicated_data": 48, "translation_t": 48, "qalapeno": 48, "jalapenh": 48, "jalapeto": 48, "oalapeno": 48, "jalqceno": 48, "jzlapeno": 48, "dotenv": 46, "expos": 46, "codebas": 46, "unauthor": 46, "myusernam": 46, "playlist": 68, "resolut": [67, 68], "yt": 68, "youtu": 68, "ukctvrjsol0": 68, "thumbnail_url": 68, "ytimg": 68, "hq720": 68, "stream": 68, "itag": 68, "mime_typ": 68, "3gpp": 68, "144p": 68, "fp": 68, "8fp": 68, "vcodec": 68, "mp4v": 68, "acodec": 68, "mp4a": 68, "mp4": 68, "360p": 68, "30fp": 68, "avc1": 68, "42001e": 68, "720p": 68, "64001f": 68, "webm": 68, "vp9": 68, "480p": 68, "4d401f": 68, "244": 68, "4d401e": 68, "243": 68, "240p": 68, "4d4015": 68, "160": [59, 68], "4d400c": 68, "278": 68, "audio": 68, "abr": 68, "48kbp": 68, "128kbp": 68, "249": 68, "50kbp": 68, "opu": 68, "250": [2, 68], "70kbp": 68, "251": 68, "160kbp": 68, "mime": 68, "plnk6m_jbrvnopnqnvrwaytz2g4nftngz": 68, "si": 68, "bk4o05ihmgqsynk2": 68, "proper": 2, "current_statu": 2, "gate": 2, "statuscod": 2, "trend": 59, "trendforecast": 59, "fh": 59, "distance_bas": 59, "kneighborstimeseriesclassifi": 59, "dtw": 59, "_x": 30, "_y": 30, "merged_df": 30, "val_x": 30, "val_i": 30, "_df1": 30, "_df2": 30, "val_df1": 30, "val_df2": 30, "a3d9b1": 52, "06b1cf": 52, "f8d347": 52, "e48789": 52, "linewidth": [52, 59], "group_column": 58, "value_column": [58, 59], "test_cget_mean": 58, "thrown": 58, "pytest_to_fail": 58, "test_get_mean": 58, "u4": 59, "integer_column": 47, "select_dtyp": 47, "other_column": 47, "abi64str1": 47, "anomali": 59, "rpt": 59, "sigma": 59, "num_breakpoint": 59, "true_breakpoint": 59, "pw_constant": 59, "noise_std": 59, "algo": 59, "pelt": 59, "predicted_breakpoint": 59, "datapipelin": 2, "drop_missing_data": 2, "standardize_data": 2, "processed_data": 2, "encode_categorical_data": 2, "c_a": 2, "c_b": 2, "024695": 2, "161895": 2, "439155": 2, "387298": 2, "146385": 2, "317465": 2, "refactor": 2, "pluggabl": 2, "dataprocessingstrategi": 2, "dropmissingdatastrategi": 2, "standardizedatastrategi": 2, "add_strategi": 2, "extend": 2, "reorder": [2, 62], "encodedatastrategi": 2, "pickleablemodel": 2, "kmean": [2, 54], "make_blob": 2, "to_pickl": 2, "from_pickl": 2, "deseri": 2, "pickleablekmean": 2, "n_cluster": [2, 54], "pickleablesvm": 2, "n_init": 2, "kmeans_file_path": 2, "kmeans_model": 2, "pickleablemixin": 2, "safeguard": 56, "attack": 56, "item_price_panda": 56, "item_id": 56, "item_pric": 56, "id_val": 56, "heartbeatreceiv": [], "executor": [], "driver": [], "heartbeat": [], "976371": [], "exce": [], "120000": [], "sparkcontext": [], "schedul": [], "inbox": [], "sparkexcept": [], "awaitresult": [], "sparkthreadutil": [], "scala": [], "threadutil": [], "rpc": [], "rpctimeout": [], "rpcenv": [], "setupendpointrefbyuri": [], "102": 67, "setupendpointref": [], "rpcutil": [], "makedriverref": [], "blockmanagermasterendpoint": [], "driverendpoint": [], "lzycomput": [], "124": [], "isexecutoral": [], "688": 59, "anonfun": [], "receiveandrepli": [], "applyorels": [], "netti": [], "safelycal": [], "messageloop": [], "receiveloop": [], "anon": [], "threadpoolexecutor": [], "runwork": [], "1149": [], "624": [], "750": 56, "rpcendpointnotfoundexcept": [], "endpoint": [52, 59], "coarsegrainedschedul": [], "mbp": [], "62398": [], "nettyrpcenv": [], "asyncsetupendpointrefbyuri": [], "flatmap": [], "307": [], "impl": [], "transformwith": [], "callbackrunn": [], "executioncontextimpl": [], "executewithvalu": [], "defaultpromis": [], "trycomplet": [], "288": [], "187": [], "batchingexecutor": [], "batch": 47, "processbatch": [], "runtim": [], "java8": [], "jfunction0": [], "mcv": [], "sp": [], "blockcontext": [], "withblockcontext": [], "internalcallbackexecutor": [], "unbatchedexecut": [], "trysuccess": [], "onsuccess": [], "askabort": [], "localnettyrpccallcontext": [], "nettyrpccallcontext": [], "repli": [], "rpcendpointverifi": [], "rpcendpointref": [], "asksync": [], "blockmanagermast": [], "registerblockmanag": [], "blockmanag": [], "reregist": [], "642": [], "reportheartbeat": [], "1223": [], "295": [], "loguncaughtexcept": [], "1928": [], "runnableadapt": [], "511": 59, "futuretask": [], "runandreset": [], "308": [], "scheduledthreadpoolexecutor": [], "scheduledfuturetask": [], "301": [], "294": [], "dispatchoraddcallback": [], "316": [], "oncomplet": [], "306": [], "exit": [], "62413": [], "opt": 67, "homebrew": 67, "cellar": 67, "6_1": 67, "socketserv": [], "317": [], "_handle_request_noblock": [], "process_request": [], "client_address": [], "348": [], "finish_request": [], "requesthandlerclass": [], "755": [], "poll": [], "accum_upd": [], "267": [], "rfile": [], "num_upd": [], "read_int": [], "596": [], "eoferror": [], "jupyter_ai": 73, "your_api_key_her": 73, "chatgpt": 73, "spatial": 73, "laplacian": 73, "commonli": 73, "conduct": 73, "monthli": [59, 73], "yyyi": [67, 73], "mm": [67, 73], "monthly_d": 73, "unnot": 11, "unequ": 11, "mistralai": 51, "mistral": 51, "7b": 51, "assist": 51, "pyfakef": 58, "filesystem": 58, "test_tmp_path": 58, "lazypredict": 52, "supervis": 52, "lazyclassifi": 52, "load_breast_canc": 52, "ignore_warn": 52, "custom_metr": 52, "balanc": [2, 52, 59], "roc": 52, "auc": 52, "989474": 52, "987544": 52, "989462": 52, "0150008": 52, "sgdclassifi": 52, "0109992": 52, "mlpclassifi": 52, "985965": 52, "986904": 52, "985994": 52, "426": [52, 67], "perceptron": 52, "984797": 52, "0120046": 52, "98269": 52, "985934": 52, "0200036": 52, "logisticregressioncv": 52, "262997": 52, "982456": 52, "979942": 52, "982437": 52, "0140011": 52, "calibratedclassifiercv": 52, "975728": 52, "982357": 52, "0350015": 52, "passiveaggressiveclassifi": 52, "975439": 52, "974448": 52, "975464": 52, "0130005": 52, "labelpropag": 52, "0429988": 52, "labelspread": 52, "0310006": 52, "97193": 52, "969594": 52, "033": 52, "gradientboostingclassifi": 52, "967486": 52, "971869": 52, "166998": 52, "quadraticdiscriminantanalysi": 52, "964912": 52, "966206": 52, "965052": 52, "0119994": 52, "histgradientboostingclassifi": 52, "968421": 52, "964739": 52, "968387": 52, "682003": 52, "ridgeclassifiercv": 52, "963272": 52, "971736": 52, "0130029": 52, "ridgeclassifi": 52, "960525": 52, "968242": 52, "0119977": 52, "adaboostclassifi": 52, "961404": 52, "959245": 52, "961444": 52, "204998": 52, "extratreesclassifi": 52, "957138": 52, "961362": 52, "0270066": 52, "95503": 52, "961276": 52, "0560005": 52, "baggingclassifi": 52, "947368": 52, "954577": 52, "947882": 52, "0559971": 52, "bernoullinb": 52, "950877": 52, "951003": 52, "951072": 52, "0169988": 52, "lineardiscriminantanalysi": 52, "950816": 52, "961089": 52, "0199995": 52, "954386": 52, "949536": 52, "954337": 52, "0139935": 52, "nusvc": 52, "943215": 52, "954014": 52, "019989": 52, "936842": 52, "933693": 52, "936971": 52, "0170023": 52, "nearestcentroid": 52, "933506": 52, "946801": 52, "0160074": 52, "extratreeclassifi": 52, "922807": 52, "912168": 52, "922462": 52, "0109999": 52, "checkingclassifi": 52, "361404": 52, "191879": 52, "0170043": 52, "dummyclassifi": 52, "512281": 52, "489598": 52, "518924": 52, "0119965": 52, "add_constraint": 47, "salary_gt_0": 47, "deltaprotocolerror": 47, "invari": 47, "sql_metdata": 45, "sql_metadata": 45, "parser": [45, 63], "parsed_queri": 45, "alias1": 45, "columns_dict": 45, "alias": [45, 62], "columns_alias": 45, "limit_and_offset": 45, "unchang": 73, "themselv": 73, "example_notebook2": 73, "test_exampl": 73, "test_func": 73, "tb": 73, "hypothesi": 73, "pyenv": [58, 59, 73], "jupyter_cli": 73, "deprecationwarn": 73, "migrat": 73, "platformdir": 73, "jupyter_platform_dir": 73, "jupyter_cor": 73, "v6": 73, "jupyter_data_dir": 73, "jupyter_runtime_dir": 73, "secure_writ": 73, "advers": 59, "streamlin": [], "pandasdataset": 59, "deeparestim": 59, "aileennielsen": 59, "timeseriesanalysiswithpython": 59, "airpasseng": 59, "parse_d": [59, 60], "training_data": 59, "test_gen": 59, "generate_inst": 59, "prediction_length": 59, "trainer_kwarg": 59, "max_epoch": 59, "1954": 59, "ticket": 62, "_ticket": 62, "get_ticket": 62, "_price": 62, "discount": 62, "discount_amount": 62, "apply_discount": 62, "deepli": [54, 62], "unread": 62, "calculate_discounted_pric": 62, "concert": 62, "bind_opt": 62, "from_opt": 62, "bring": [50, 56], "56976095832509": [], "43383865728208": [], "68113195098398": [], "col_nam": 29, "market": [56, 59], "coincid": 59, "causalimpact": 59, "willianfuk": 59, "arma_data": 59, "125": [24, 59], "3756": 59, "3609": 59, "3592": 59, "3628": 59, "164": [24, 59], "galact": 54, "unstructur": 54, "galacticdataset": 54, "filter_func": 54, "from_hugging_face_stream": 54, "tiiuae": 54, "falcon": 54, "refinedweb": 54, "dedup_field": 54, "max_sampl": 54, "detect_languag": 54, "__languag": 54, "4975": 54, "ru": 54, "nl": 54, "pt": [53, 54], "sh": 54, "eo": 54, "ceb": 54, "detect_pii": 54, "__pii__email": 54, "__pii__phon": 54, "__pii__credenti": 54, "1443": 54, "pii": 54, "__pii__ani": 54, "blogspot": 54, "filter_str": 54, "107937": 54, "get_embed": 54, "input_field": 54, "get_cluster_info": 54, "__cluster": 54, "overwritten": 54, "fine": [50, 54], "4902": 54, "31476": 54, "1095": 54, "1125": 54, "709": 54, "1224": 54, "749": 54, "cluster_id": 54, "cluster_s": 54, "advantag": [32, 52], "superior": [32, 52], "data_s": 32, "s_numpi": 32, "s_pyarrow": 32, "numpy_memori": 32, "pyarrow_memori": 32, "helper": 56, "showcas": 56, "bob": [45, 56], "array_append": 56, "array_prepend": 56, "array_contain": 56, "array_distinct": 56, "withcolumn": 56, "has_": 56, "beforehand": 47, "maxim": 47, "glob": 47, "group_bi": 47, "collect_al": 47, "pytorch": 53, "upon": 53, "unpickl": 53, "guarante": 53, "therebi": 53, "safe_open": 53, "save_fil": 53, "weight1": 53, "weight2": 53, "devic": 53, "get_tensor": 53, "suffici": 59, "pytz": 59, "pari": [45, 59], "paris_tim": 59, "toronto": 59, "toronto_timezon": 59, "toronto_tim": 59, "astimezon": [59, 67], "future_datetim": 59, "843320": 59, "in_timezon": 59, "398059": 59, "qs": 59, "extend_panda": 59, "download_return": 59, "spy": 59, "peach": 15, "54095055783208": 56, "46593810642427": 56, "52092805080465": 56, "smith": 56, "johnson": 56, "temporari": [], "createorreplacetempview": 56, "modified_nam": 56, "encapsul": 56, "modify_nam": 56, "stringtyp": 56, "returntyp": 56, "simplefunctionregistri": 56, "py3": 67, "whl": 67, "kb": 67, "contourpi": [], "fonttool": [], "kiwisolv": [], "pillow": [], "pypars": [], "zipp": [], "49mnotic": [], "49m": [], "49m23": [], "49m24": [], "49mpip": [], "restart": [], "curvatur": 59, "far": 59, "datagener": 59, "kneeloc": 59, "figure2": 59, "kneedl": 59, "curv": 59, "concav": 59, "direct": [45, 58, 59], "plot_knee_norm": 59, "log1p": 48, "69314718": 48, "09861229": 48, "38629436": 48, "feature1": 48, "feature2": 48, "log_transform": 48, "result1": 56, "THEN": 56, "result2": 56, "assign_category_label": 56, "pytest_mark": 58, "test_long_running_funct": 58, "test_database_interact": 58, "test_function_1": 58, "test_function_2": 58, "deselect": 58, "32m3": 58, "subscriptionplan": 15, "get_plan_detail": 15, "subscript": 15, "basic_plan": 15, "premium_plan": 15, "great_tabl": 63, "appeal": 63, "footer": [54, 63], "island": [59, 63], "islands_mini": 63, "ascend": 63, "rowname_col": 63, "tab_head": 63, "landmass": 63, "subtitl": 63, "tab_source_not": 63, "source_not": 63, "almanac": 63, "1975": 63, "mcneil": 63, "1977": 63, "wilei": 63, "tab_stubhead": 63, "fmt_number": 63, "sep_mark": 63, "988": 63, "506": 63, "antarctica": 63, "borneo": 63, "280": 63, "baffin": 63, "184": 63, "britain": 63, "celeb": 63, "axel": 63, "heiberg": 63, "__pydantic_self__": 24, "162": 24, "__tracebackhide__": 24, "163": 24, "__pydantic_validator__": 24, "validate_python": 24, "self_inst": 24, "int_pars": 24, "input_valu": 24, "input_typ": 24, "feasibl": 21, "extrem": [21, 59], "large_log": 21, "log_entri": 21, "large_log_fil": 21, "process_log_entri": 21, "lazili": 21, "consolid": 50, "recipe_scrap": 50, "scrape_m": 50, "cookieandk": 50, "thai": 50, "curri": 50, "veget": [50, 51], "total_tim": 50, "ingredi": [50, 54], "\u00bc": 50, "cup": 50, "jasmin": 50, "rice": 50, "grain": 50, "rins": 50, "tablespoon": 50, "coconut": 50, "chop": 50, "pinch": 50, "grate": 50, "fresh": 50, "ginger": 50, "inch": 50, "nub": 50, "clove": 50, "press": 50, "minc": 50, "peel": 50, "diagon": 50, "thick": 50, "ounc": 50, "water": 50, "thinli": 50, "kale": 50, "tough": 50, "rib": 50, "tuscan": 50, "lacinato": 50, "dinosaur": 50, "teaspoon": 50, "turbinado": 50, "tamari": 50, "soi": 50, "sauc": [50, 54], "vinegar": 50, "lime": 50, "juic": 50, "garnish": 50, "cilantro": 50, "flake": 50, "sriracha": 50, "chili": 50, "pot": 50, "boil": 50, "overflow": 50, "drain": 50, "readi": 50, "fluff": 50, "fork": 50, "nto": 50, "warm": 50, "skillet": 50, "sprinkl": 50, "stir": 50, "soften": 50, "transluc": 50, "fragrant": 50, "nadd": 50, "tender": 50, "mixtur": 50, "simmer": 50, "gentl": 50, "nremov": 50, "punch": 50, "bowl": 50, "spici": 50, "nutrient": 50, "calori": 50, "340": 50, "sugarcont": 50, "sodiumcont": 50, "473": 50, "mg": 50, "fatcont": 50, "saturatedfatcont": 50, "transfatcont": 50, "carbohydratecont": 50, "fibercont": 50, "proteincont": 50, "cholesterolcont": 50, "computation": 59, "proven": 59, "classic": 59, "rnn": 59, "nbeat": 59, "airpassengersdf": 59, "nf": 59, "input_s": 59, "max_step": 59, "tqdmwarn": 60, "iprogress": 60, "ipywidget": 60, "readthedoc": 60, "user_instal": 60, "autonotebook": [59, 60], "notebook_tqdm": 60, "pytorch_lightn": [], "nn": [], "checkpoint": [], "save_hyperparamet": [], "gpu": [], "mp": 47, "tpu": [], "ipu": [], "hpu": [], "lightning_log": [], "mae": [], "padder_train": [], "constantpad1d": [], "temporalnorm": [], "modulelist": [], "trainabl": [], "900": [], "789": [], "saniti": [], "trainer": [], "connector": [], "data_connector": [], "val_dataload": [], "bottleneck": [], "num_work": [], "train_dataload": [], "fit_loop": [], "log_every_n_step": [], "epoch": [], "miscalcul": [], "autograd": [], "aten": [], "sgn": [], "fall": [], "implic": [], "runner": 67, "mpsfallback": [], "_execution_engin": [], "run_backward": [], "02it": [], "v_num": [], "train_loss_step": [], "460": 59, "train_loss_epoch": [], "78it": [], "tsdataset": [], "sourcetensor": [], "detach": [], "requires_grad_": [], "tempor": [], "predict_dataload": [], "81it": [], "nixtla_id_as_col": 59, "adopt": [], "suppress": [], "unique_id": 59, "1961": [], "607208": [], "421": [], "863037": [], "493": [], "197845": [], "499": [], "307739": [], "199921": [], "587": [], "497253": [], "091309": [], "662": [], "209167": [], "577": [], "726501": [], "089569": [], "432": [], "609131": [], "420624": [], "mirascop": [], "your_api_kei": 51, "openaiextractor": 51, "meetingdetail": 51, "topic": 51, "particip": 51, "meetingextractor": 51, "extract_schema": 51, "prompt_templ": 51, "upcom": 51, "15th": 51, "sarah": [51, 56], "meeting_detail": 51, "lack": 51, "ipytest": 56, "actual_df": 56, "expected_df": 56, "assertdataframeequ": 56, "test_query_return_correct_number_of_row": 56, "song": 24, "release_d": 24, "beats_per_minut": 24, "multiple_of": 24, "song1": 24, "believ": 24, "dragon": 24, "greater_than": 24, "charli": 45, "david": 45, "ev": 45, "berlin": 45, "predefin": 45, "with_column": 47, "to_uppercas": 47, "comment_karma": 47, "respond": 51, "helpfulli": 51, "wider": 51, "databas": [51, 63], "executemani": 51, "openaical": 51, "openaicallparam": 51, "get_item_info": 51, "item_nam": [], "fetchon": 51, "sorri": 51, "groceryitemqueri": 51, "call_param": 51, "query_tool": 51, "nixtla": 59, "financi": 59, "nixtlacli": 59, "nixtla_cli": 59, "my_api_key_provided_by_nixtla": 59, "time_column": 59, "jbrownle": 59, "6550": 59, "8728": 59, "12026": 59, "14395": 59, "14587": 59, "time_col": 59, "target_col": 59, "timegpt_fcst_df": 59, "1969": 59, "14672": 59, "101562": 59, "15793": 59, "253906": 59, "21517": 59, "191406": 59, "22996": 59, "332031": 59, "25959": 59, "019531": 59, "max_insample_length": 59, "first_nam": 56, "age_after_10_year": 56, "reusabl": 2, "volum": [2, 59], "smoothi": 2, "breakfast": 2, "tropic": 2, "blast": 2, "dark_background": 60, "72befa": 60, "e583b6": 60, "72fcdb": 60, "color_list": 60, "autoet": 59, "generate_seri": 59, "n_seri": 59, "horizon": 59, "spark_df": 59, "30138168803582194": 59, "2724415914984484": 59, "211827399669452": 59, "322947056533328": 59, "218793605631347": 59, "sf": 59, "season_length": 59, "485": [], "lo": [59, 67], "hi": 59, "261609": [], "0255513": [], "4976664": [], "1963573": [], "9603": [], "432415": [], "28230855": [], "04625102": [], "5183661": [], "2641948": [], "0281373": [], "5002524": [], "2624528": [], "0263953": [], "4985104": [], "resource_track": [], "leak": [], "semaphor": [], "shutdown": [], "executorenv": 59, "tqdmexperimentalwarn": 59, "consol": [59, 68], "overhead": 56, "pandas_plus_on": 56, "488073": [], "62014": [], "62028": [], "347": [], "747": 59, "keyword_processor": 54, "add_keyword": 54, "clean_nam": 54, "new_sent": 54, "replace_keyword": 54, "917809": [], "56356": [], "56367": [], "handle_unknown": 52, "numerical_column": 52, "categorical_column": 52, "param_grid": 52, "model__n_estim": 52, "model__max_depth": 52, "model__min_samples_split": 52, "grid_search": 52, "tabularpredictor": 52, "predictor": 52, "disguis": 68, "malwar": 68, "mislead": 68, "shutil": 68, "iterdir": 68, "is_dir": 68, "rmtree": 68, "unlink": 68, "plain_text": 68, "plain": 68, "xml": 68, "nsome": 68, "ini": 68, "yml": 68, "nage": 68, "34mexampl": 68, "37mexampl": 68, "bankaccount": 2, "initial_bal": 2, "_balanc": 2, "isnotnul": 56, "1l": [], "scan": 56, "existingrdd": 56, "301782": [], "60847": [], "60857": [], "former": 59, "unavoid": 59, "latter": 59, "robot_execution_failur": 59, "download_robot_execution_failur": 59, "load_robot_execution_failur": 59, "f_x": 59, "f_y": 59, "f_z": 59, "t_x": 59, "t_y": 59, "t_z": 59, "extract_relevant_featur": 59, "features_filt": 59, "column_id": 59, "column_sort": 59, "83it": 59, "dd": 47, "ddf": 47, "npartit": 47, "mlforecast": 59, "utilsforecast": 59, "uncertainti": 59, "plot_seri": 59, "s3": [59, 60], "amazonaw": [59, 60], "m4": 59, "h1": 59, "586": 59, "559": 59, "uid": 59, "forecasts_df": 59, "renam": 59, "palett": 59, "set_size_inch": 59, "predictioninterv": 59, "kneighborsregressor": 59, "mlf": 59, "prediction_interv": 59, "n_window": 59, "lag_featur": 59, "lag24": 59, "lag48": 59, "lag72": 59, "lag96": 59, "lag120": 59, "lag144": 59, "lag168": 59, "date_featur": 59, "num_thread": 59, "454151": 59, "615": 59, "597": 59, "550958": 59, "601": 59, "310692": 59, "037187": 59, "620": 59, "871115": 59, "623": 59, "597610": 59, "627": 59, "357344": 59, "599": 59, "090": 59, "603": 59, "631": 59, "702": 59, "538": 59, "415217": 59, "551": 59, "491": 59, "913415": 59, "094072": 59, "337321": 59, "493112": 59, "568": 59, "736361": 59, "584": 59, "917018": 59, "675": 59, "534": 59, "535": 59, "567": 59, "525": 59, "703": 59, "496": 59, "797892": 59, "509": 59, "458": 59, "432874": 59, "483280": 59, "481": 59, "705219": 59, "890565": 59, "112505": 59, "162911": 59, "475": 59, "020": 59, "488": 59, "492": 59, "526": 59, "530": 59, "544": 59, "462": 59, "689475": 59, "114933": 59, "435": 59, "849278": 59, "808787": 59, "482": 59, "570164": 59, "489": 59, "529672": 59, "264017": 59, "423": 59, "451": 59, "504": 59, "705": 59, "439": 59, "784731": 59, "384": 59, "182476": 59, "400": [56, 59], "101658": 59, "419": 59, "176045": 59, "393416": 59, "467803": 59, "386986": 59, "394": 59, "555": 59, "645": 59, "test_with_forecast": 59, "plot_random": 59, "80l": 56, "orders_df": 56, "1001": 56, "1003": 56, "lee": 56, "1005": 56, "tom": 56, "600": 56, "customer_nam": 56, "revenu": 56, "total_revenu": 56, "top_custom": [], "order_count": 56, "ntop": [], "nnumber": 56, "2550": 56, "985951": [], "52614": [], "52648": [], "strong": [54, 59], "sim_randomwalk": 59, "utils_func": 59, "smoother": 59, "lowesssmooth": 59, "timestep": 59, "process_nois": 59, "measure_nois": 59, "smooth_fract": 59, "get_interv": 59, "shade": 59, "smooth_data": 59, "polycollect": 59, "0x15b25a8e0": 59, "eda": 60, "pyg": 60, "graphic": [], "walker": [], "kanari": 60, "ap": 60, "northeast": 60, "bike_sharing_dc": 60, "holidai": 60, "feeling_temp": 60, "humid": 60, "winspe": 60, "casual": 60, "winter": 60, "0014": 60, "0000": 60, "9982": 60, "0016": 60, "0032": 60, "0010": 60, "0x137d39650": 60, "decis": 59, "histor": 59, "simul": 59, "goog": 59, "2013": 59, "808": 59, "2303900": 59, "795": 59, "2202500": 59, "794": 59, "804": 59, "791": 59, "2026100": 59, "801": 59, "806": 59, "2265800": 59, "797": 59, "807": 59, "796": 59, "2175400": 59, "sma": 59, "roll": 59, "crossov": 59, "smacross": 59, "precomput": 59, "sma1": 59, "sma2": 59, "invest": 59, "broker": 59, "commiss": 59, "realist": 59, "bt": 59, "stat": 59, "3116": 59, "exposur": 59, "067039": 59, "equiti": 59, "68221": 59, "96986": 59, "peak": 59, "68991": 59, "21986": 59, "582": 59, "219699": 59, "458242": 59, "ann": 59, "266427": 59, "volatil": 59, "383008": 59, "sharp": 59, "658271": 59, "sortino": 59, "288779": 59, "calmar": 59, "763748": 59, "drawdown": 59, "082172": 59, "581506": 59, "win": 59, "255319": 59, "11931": 59, "worst": 59, "629898": 59, "074326": 59, "profit": 59, "factor": 59, "190805": 59, "606294": 59, "sqn": 59, "990216": 59, "_strategi": 59, "_equity_curv": 59, "_trade": 59, "entryb": 59, "shuffl": [], "7000": 56, "joined_df": 56, "scene": 56, "competit": 59, "y_df": 59, "743": 59, "744": 59, "785": 59, "756": 59, "719": 59, "748": 59, "cross_valid": 59, "cross_validation_df": 59, "691": 59, "726797": 59, "678": 59, "618": 59, "559522": 59, "167938": 59, "680": 59, "930997": 59, "981893": 59, "plot_cv": 59, "df_cv": 59, "last_n": 59, "gridspec_kw": 59, "hspace": 59, "notic": 59, "said": 59, "opencv": 63, "pypdf2": 63, "read_pdf": 63, "tablelist": 63, "parsing_report": 63, "to_html": 63, "to_sqlit": 63, "ki": 63, "km": 63, "nspeed": 63, "naccel": 63, "nstop": 63, "nidl": 63, "2012_2": 63, "2145_1": 63, "4234_1": 63, "2032_2": 63, "4171_1": 63, "173": 63, "codecut": 74, "electron": 47, "cloth": 47, "pandas_df": 47, "polars_df": 47, "categorypricestri64": 47, "categoryquantitypricestri64i64": 47, "5200": 47, "1020": 47, "4300": 47, "666667": 47, "categoryquantitypricestri64f64": 47, "1225": 47, "12216": 47, "my_project": 73, "hierarchicalforecast": 59, "numba": 59, "reconcil": 59, "leisur": 59, "tourism": 59, "quarter": 59, "s_df": 59, "12251": 59, "wale": 59, "outback": 59, "nsw": 59, "780860": 59, "33131": 59, "western": 59, "648865": 59, "22034": 59, "fleurieu": 59, "peninsula": 59, "31119": 59, "victoria": 59, "phillip": 59, "2017": 59, "063034": 59, "7671": 59, "405": 59, "891206": 59, "18339": 59, "queensland": 59, "mackai": 59, "135284": 59, "23043": 59, "limeston": 59, "coast": 59, "visi": 59, "604546": 59, "22129": 59, "738053": 59, "11349": 59, "hunter": 59, "226040": 59, "16599": 59, "brisban": 59, "490809": 59, "y_test_df": 59, "y_train_df": 59, "act": 59, "canberra": 59, "perth": 59, "425": 59, "y_hat_df": 59, "y_fitted_df": 59, "zza": 59, "forecast_fitted_valu": 59, "coher": 59, "hierarchicalreconcili": 59, "bottomup": 59, "hrec": 59, "y_rec_df": 59, "25990": 59, "068359": 59, "24380": 59, "257812": 59, "24458": 59, "490234": 59, "22902": 59, "765625": 59, "23974": 59, "056641": 59, "22412": 59, "982422": 59, "24563": 59, "455078": 59, "23127": 59, "439453": 59, "24516": 59, "759766": 59, "abstract": 54, "contextu": 54, "newsgroup": 54, "18000": 54, "topic_model": 54, "993": [], "484": [], "huggingfac": [], "disabl": 67, "deadlock": [], "tokenizers_parallel": [], "980": [], "get_topic_info": 54, "representative_doc": 54, "6789": 54, "1_to_the_is_of": 54, "refus": 54, "1823": 54, "0_game_team_games_h": 54, "game": 54, "player": 54, "hock": 54, "rivalri": 54, "ahem": 54, "jokerit": 54, "630": 54, "1_key_clipper_chip_encrypt": 54, "clipper": 54, "chip": 54, "encrypt": 54, "escrow": 54, "expert": 54, "cryptographi": 54, "scie": 54, "2_idjits_ites_cheek_danc": 54, "idjit": 54, "ites": 54, "cheek": 54, "yep": 54, "nyep": 54, "ndanc": 54, "3_israel_israeli_jews_arab": 54, "israel": 54, "isra": 54, "jew": 54, "jewish": 54, "nthi": 54, "010318688564543007": 54, "008992489388365084": 54, "0071658097402482355": 54, "006986923839656088": 54, "00631255726099582": 54, "006207025740053": 54, "hockei": 54, "006108581738112714": 54, "0057638598847672895": 54, "005625421684874428": 54, "005577343029862753": 54, "topics_": 54, "visualize_top": 54, "tf": 54, "idf": 54, "visualize_barchart": 54, "top_n_top": 54, "perhap": [], "n_gram_rang": [], "update_top": [], "011119596146117955": [], "nasa": [], "0047697533973351915": [], "shuttl": [], "0044533985251824495": [], "orbit": [], "004129278694477752": [], "spacecraft": [], "004011023125258004": [], "satellit": [], "003783732360211832": [], "moon": [], "003639954930862572": [], "lunar": [], "0034753177228921146": [], "002821040122532999": [], "mar": [], "0028033947303940923": [], "afterward": [], "reduce_top": [], "nr_topic": [], "666": [], "berttop": 54, "modern": [52, 63], "argparse_exampl": 63, "argumentpars": 63, "add_argu": 63, "parse_arg": 63, "click_exampl": 63, "vbox": [], "322": [], "dedup": [], "floatprogress": [], "999393": [], "mlflow": [], "prone": [15, 52], "anyon": 52, "infer_signatur": 52, "start_run": 52, "model_info": 52, "log_model": 52, "sk_model": 52, "artifact_path": 52, "model_uri": 52, "f8b0fc900aa14cf0ade8d0165c5a9f11": 52, "1e20d72afccf450faa3b8a9806a97e83": 52, "sklearn_pyfunc": 52, "pyfunc": 52, "load_model": 52, "inspect": 52, "mlrun": 52, "mlmodel": 52, "conda": 52, "python_env": 52, "python_funct": 52, "virtualenv": 52, "loader_modul": 52, "model_path": 52, "predict_fn": 52, "python_vers": 52, "pickled_model": 52, "serialization_format": 52, "cloudpickl": 52, "sklearn_vers": 52, "post1": 52, "mlflow_vers": 52, "model_size_byt": 52, "model_uuid": 52, "e7487bc3c4ab417c965144efcecaca2f": 52, "run_id": 52, "utc_time_cr": 52, "516963": 52, "outlin": 52, "forg": 52, "psutil": 52, "build_depend": 52, "setuptool": 52, "wheel": [52, 67], "get_data_for_last_week": 58, "test_main": 58, "test_get_data_for_last_week": 58, "mock_datetim": 58, "assert_called_onc": 58, "behav": 58, "infix": 62, "travers": 62, "unfold": 62, "first_fiv": 62, "skip_first_two": 62, "pip3": 52, "fastapi": [], "unfamiliar": 52, "versatil": 52, "mobil": 52, "divers": 52, "mse": 52, "ml_app": 52, "medinc": 52, "houseag": 52, "avebedrm": 52, "aveoccup": 52, "curl": 52, "1400": 52, "discoveri": 54, "essenc": 54, "surpass": 54, "sentence_transform": 54, "sentencetransform": 54, "cosine_similar": 54, "oatmeal": 54, "cooki": 54, "bake": 54, "chia": 54, "pud": 54, "fri": 54, "oreo": 54, "sunda": 54, "caramel": 54, "bacon": 54, "cheeseburg": 54, "pizza": 54, "minilm": 54, "l6": 54, "recipe_embed": 54, "find_similar_recip": 54, "top_k": 54, "query_embed": 54, "top_indic": 54, "dessert": 54, "healthier": 54, "clearli": 54, "unhealthi": 54, "pygment": 67, "mdurl": 67, "removeprefix": 67, "removesuffix": 67, "32m2024": 67, "329": 67, "1merror": 67, "36m__main__": 67, "36m14": 67, "1man": 67, "caught": 67, "mainprocess": 67, "31530": 67, "mainthread": 67, "8332868224": 67, "1mtraceback": 67, "_run_module_as_main": 67, "ipykernel_launch": 67, "launch_new_inst": 67, "launch_inst": 67, "ipykernel": 67, "kernelapp": 67, "ipkernelapp": 67, "traitlet": 67, "1053": 67, "0x107d28860": 67, "0x104cdf1d0": 67, "io_loop": 67, "baseasyncioloop": 67, "0x107d29760": 67, "tornado": 67, "asynciomainloop": 67, "0x107d3fc90": 67, "asyncio_loop": 67, "run_forev": 67, "baseeventloop": 67, "0x105c9fb00": 67, "_unixselectoreventloop": 67, "1mbase_ev": 67, "33m607": 67, "35mrun_forev": 67, "35m": 67, "1m_run_onc": 67, "_run_onc": 67, "0x105ca1940": 67, "33m1922": 67, "35m_run_onc": 67, "1mhandl": 67, "1m_run": 67, "_run": 67, "0x105c32840": 67, "task_wakeup": 67, "fini": 67, "6d0": 67, "1mevent": 67, "33m80": 67, "35m_run": 67, "1m_context": 67, "1mrun": 67, "1m_callback": 67, "1m_arg": 67, "_arg": 67, "_callback": 67, "_context": 67, "kernelbas": 67, "dispatch_queu": 67, "process_on": 67, "0x1077f2fc0": 67, "ipkernel": 67, "ipythonkernel": 67, "0x107d40a50": 67, "513": 67, "dispatch": 67, "zmq": 67, "0x10848d250": 67, "0x10848d610": 67, "dispatch_shel": 67, "418": 67, "execute_request": 67, "0x107a77320": 67, "758": 67, "reply_cont": 67, "do_execut": 67, "0x107a71240": 67, "run_cel": 67, "zmqinteractiveshel": 67, "0x107d15c60": 67, "zmqshell": 67, "0x107d68490": 67, "store_histori": 67, "silent": 67, "cell_id": 67, "efficient_python_tricks_and_": 67, "nimport": 67, "nfrom": 67, "nlogger": 67, "interactiveshel": 67, "3024": 67, "_run_cel": 67, "0x106bc3ce0": 67, "3079": 67, "coro": 67, "run_cell_async": 67, "0x1086c18a0": 67, "_pseudo_sync_runn": 67, "0x106baae80": 67, "async_help": 67, "3284": 67, "has_rais": 67, "run_ast_nod": 67, "code_ast": 67, "cell_nam": 67, "ipykernel_31530": 67, "1455742643": 67, "ast": 67, "importfrom": 67, "0x10881c0d0": 67, "0x10881f310": 67, "0x10881fc10": 67, "exp": 67, "0x10881f5b0": 67, "0x106bc8040": 67, "3466": 67, "run_cod": 67, "async_": 67, "asi": 67, "executionresult": 67, "108825410": 67, "execution_count": 67, "error_before_exec": 67, "error_in_exec": 67, "executioninfo": 67, "0x17346b750": 67, "0x106bc80e0": 67, "exec": 67, "code_obj": 67, "user_global_n": 67, "user_n": 67, "__package__": 67, "0x106ba3830": 67, "1m1455742643": 67, "33m14": 67, "1mevaluate_result": 67, "1my_tru": 67, "1my_pr": 67, "1marrai": 67, "0x172e23e20": 67, "33m9": 67, "35mevaluate_result": 67, "1mmean_square_err": 67, "1mmean_squared_error": 67, "0x173478180": 67, "_param_valid": 67, "0x1734780e0": 67, "0x173457ba0": 67, "0x172e205e0": 67, "457": 67, "1mvalueerror": 67, "hide": 67, "dunder": 67, "nodoc": 67, "ret": 67, "grai": 67, "py2": 67, "colorama": 67, "asttoken": 67, "25ldone": 67, "25hrequir": 67, "werkzeug": 67, "itsdanger": 67, "blinker": 67, "markupsaf": 67, "25h": 67, "235994": 67, "23d469a3676f399435ed1581b0da936ef614a134749520be801eb96aadeb19b6": 67, "ce": 67, "bb": 67, "26835a451cc11eb8d362d2d2b2c322220c6d61edc825233820": 67, "25l": 67, "inspector": 67, "examin": 67, "prepend": 67, "949190": 67, "repr": 67, "fold": 67, "999999": 67, "0001": 67, "000001": 67, "nonetyp": 67, "ctime": 67, "fromisocalendar": 67, "iso": 67, "fromisoformat": 67, "8601": 67, "fromordin": 67, "prolept": 67, "gregorian": 67, "fromtimestamp": 67, "posix": 67, "isocalendar": 67, "isoformat": 67, "ddt": 67, "ss": [45, 67], "mmm": 67, "uuu": 67, "isoweekdai": 67, "timetupl": 67, "localtim": 67, "timetz": 67, "__class__": 67, "toordin": 67, "tzname": 67, "utcfromtimestamp": 67, "utcnow": 67, "utcoffset": 67, "utctimetupl": 67, "test_rm_fil": 58, "rm_file": 58, "test_with_unittest_mock": 58, "mock_remov": 58, "assert_called_once_with": 58, "test_unix_f": 58, "mocker": 58, "wherea": 58, "nest": 15, "vari": 45, "transpil": 45, "hive": 45, "date_format": 45, "yy": 45, "backtick": 45, "converted_pric": 45}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"pytest": [0, 43, 58, 69, 75], "cach": [0, 43, 69, 75], "directori": [0, 23, 43, 58, 69, 75], "python": [1, 2, 4, 5, 6, 7, 9, 11, 13, 14, 15, 16, 17, 18, 21, 25, 27, 45, 46, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68], "built": 1, "method": [1, 2, 7, 8, 11, 19, 20, 25, 27, 42, 52, 58], "class": [2, 19, 24, 27, 58, 60], "inherit": 2, "abstract": 2, "declar": [2, 27, 58], "without": [2, 50, 62], "implement": 2, "vs": [7, 19, 47, 52, 56, 58, 66], "composit": [], "choos": 58, "right": [], "design": 2, "approach": [59, 62], "distinguish": 2, "instanc": 2, "level": 2, "getattr": 2, "better": [2, 21, 47, 63, 73], "wai": [2, 21, 47, 53, 60], "get": [2, 5, 7, 8, 9, 14, 16, 22, 23, 25, 33, 35, 40, 42, 49, 50, 52, 73], "attribut": [2, 25], "__call__": 2, "call": [2, 20, 62, 68], "your": [2, 7, 16, 18, 19, 27, 29, 38, 40, 45, 47, 49, 52, 53, 54, 55, 57, 58, 60, 64, 66, 67, 68, 73], "like": [2, 59], "function": [2, 3, 6, 7, 8, 20, 21, 25, 26, 27, 29, 47, 58, 62, 63, 64, 67, 68], "comparison": [2, 4, 42, 47, 52, 58], "static": [2, 64, 68], "us": [2, 4, 5, 6, 7, 14, 16, 21, 24, 25, 27, 29, 30, 31, 32, 33, 34, 40, 42, 45, 46, 47, 48, 49, 50, 58, 60, 62, 66, 67, 68, 73], "ad": 2, "requir": [2, 65, 73], "new": [2, 15, 20, 23, 29, 50], "minim": 2, "data": [2, 11, 18, 19, 21, 24, 31, 32, 33, 37, 40, 44, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 64, 73], "risk": 2, "privat": 2, "variabl": [2, 14, 15, 32, 49, 52], "properti": [33, 58], "decor": [6, 51, 62], "A": [7, 18, 21, 45, 47, 53, 58, 59, 60, 62, 68], "getter": 2, "setter": 2, "__str__": 2, "__repr__": 2, "creat": [2, 7, 18, 23, 31, 40, 45, 46, 49, 50, 52, 54, 58, 60, 63, 65, 68], "string": [2, 7, 8, 11, 16, 29, 32, 37, 45, 49, 54, 59, 62], "represent": 2, "object": [2, 7, 25, 40, 55, 58, 63, 67], "__add__": 2, "add": [2, 19, 27, 33, 47, 57, 59, 60, 67], "two": [2, 5, 10, 11, 19, 23, 30, 39, 42, 52, 58, 62, 63, 65, 67], "optim": [2, 29, 32, 47, 56], "memori": [2, 32, 56, 57, 64], "usag": [2, 32, 57, 64], "slot": 2, "code": [2, 3, 6, 7, 15, 16, 29, 45, 46, 48, 49, 50, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64, 66, 67, 68, 73], "speed": [3, 47, 57, 67], "concurr": [3, 57], "execut": [3, 15, 25, 47, 58, 63, 65, 67, 68], "task": [3, 7], "separ": 3, "cpu": 3, "compar": [3, 19, 39, 53, 63, 65, 67], "The": [3, 7, 16, 18, 33, 35, 47, 49, 53, 54, 58, 59, 60, 73, 74], "time": [3, 25, 33, 48, 50, 52, 57, 58, 59, 67, 68], "between": [3, 10, 11, 19, 35, 39, 42, 53, 58, 60, 62], "2": [3, 10, 21, 31, 32, 35, 53, 54, 55], "save": 3, "disk": 3, "space": [3, 42, 59], "larg": [3, 14, 21, 31, 45, 47, 51, 57, 63], "dataset": [3, 45, 48, 50, 52, 53, 54], "parquet": [3, 31, 47], "datetim": [4, 31, 33, 59], "timedelta": 4, "calcul": [4, 16, 35, 54], "end": 4, "base": [4, 11, 20, 30, 32, 33, 34, 42, 49, 58, 65, 68, 73], "start": [4, 37, 68], "durat": 4, "date": [4, 16, 24, 33, 59], "month": 4, "featur": [4, 15, 48, 49, 52, 53, 59], "arithmet": 4, "oper": [4, 5, 7, 11, 15, 20, 22, 26, 29, 40, 42, 45, 47, 56], "dictionari": [5, 18, 22, 25, 29, 35, 62], "updat": [5, 30, 47, 56], "With": [5, 16, 21, 25, 30, 37, 47, 58], "item": [5, 8, 18, 20, 22, 25, 40], "from": [5, 9, 11, 22, 23, 31, 34, 35, 40, 42, 45, 47, 49, 50, 51, 52, 54, 55, 59, 63, 64, 66, 68, 74], "anoth": [5, 16, 20, 23, 30, 34, 66], "kei": [5, 18, 21, 50, 62], "paramet": [5, 7, 27, 58, 64], "max": [5, 9, 42], "find": [5, 9, 10, 16, 25, 33, 35, 37, 49, 50, 52, 58, 59, 62, 64], "largest": [5, 40], "valu": [5, 7, 9, 13, 18, 21, 25, 27, 29, 33, 34, 35, 38, 40, 42], "dict": 5, "default": [5, 18], "doesn": 5, "t": [5, 7, 46], "exist": 5, "doubl": [5, 14, 42], "nest": [5, 7, 21, 25, 62], "miss": [5, 29, 33, 60, 64], "fromkei": 5, "list": [5, 7, 8, 9, 10, 11, 12, 16, 18, 21, 22, 25, 32, 34, 37, 40, 42, 67], "revers": 5, "comprehens": [5, 8, 60, 67], "merg": [5, 30, 47], "union": [5, 10, 15, 27], "3": [5, 11, 15, 52, 54, 56], "9": 5, "iter": [5, 8, 11, 13, 20, 21, 29, 57], "omit": [6, 25], "els": [6, 7], "claus": 6, "improv": [2, 6], "readabl": [2, 6, 7, 15, 16, 30, 52, 57, 60, 62, 67], "when": [6, 7, 13, 18, 30, 31, 33, 39, 48, 52, 58, 68], "Not": [6, 7, 18, 27, 58], "lambda": 6, "how": [6, 48, 63, 76], "pass": [6, 7, 55], "an": [6, 7, 8, 11, 15, 16, 18, 21, 26, 27, 29, 42, 50, 52, 54, 60, 68], "arbitrari": [6, 49], "number": [6, 14, 16, 24, 33, 35, 42, 50, 54], "argument": [6, 7, 20, 21], "good": 7, "practic": [7, 46], "write": [7, 15, 27, 31, 45, 48, 58, 62, 73], "meaning": [7, 54], "name": [7, 34, 40, 49, 54, 58], "assign": [7, 15, 29, 40, 58], "complex": [7, 56], "condit": [7, 8, 15, 21, 42, 58], "make": [7, 19, 31, 57, 63], "more": [7, 21], "avoid": [7, 56], "duplic": 7, "underscor": [7, 14], "_": 7, "ignor": [7, 13, 39], "That": [7, 27, 48], "Will": 7, "Be": [7, 27], "index": [7, 16, 25, 33, 34, 39, 42], "For": [7, 21, 49, 54], "loop": [7, 21], "slice": [7, 54], "indic": 7, "statement": [7, 15, 45], "stop": [7, 67], "copi": [7, 31, 65], "instead": [7, 14, 46], "deepcopi": 7, "side": 7, "effect": [7, 40], "enumer": 7, "counter": [7, 18], "while": 7, "don": [7, 46], "multipl": [7, 9, 13, 14, 16, 18, 22, 29, 30, 40, 47, 56, 58], "OR": 7, "concaten": 7, "join": [7, 11, 48, 56], "should": [7, 27, 74], "onli": [6, 7, 19, 34, 58], "do": 7, "One": [7, 16, 18, 37, 42, 50, 52, 54, 57, 58, 59, 66, 67, 68], "have": 7, "fewer": [7, 20], "than": [7, 21], "four": 7, "flag": 7, "s": [7, 11, 20, 24, 25, 32, 34, 35, 37, 40, 42, 48, 49, 50, 51, 52, 57, 59, 67, 73], "condens": 7, "If": [7, 34], "line": [7, 46, 50, 52, 54, 55, 57, 59, 63, 64, 67, 68], "effici": [7, 21, 31, 32, 45, 47, 48, 54, 58], "check": [7, 8, 23, 42, 58, 62, 64], "type": [7, 15, 20, 27, 32, 64, 68], "try": 7, "except": [7, 29, 58], "never": [7, 67], "catch": 7, "all": [7, 8, 30, 34, 35, 42, 58], "clean": [7, 13, 54, 73], "error": [7, 56, 58], "handl": [7, 32, 45, 48, 59], "logic": [7, 56], "why": 7, "__name__": 7, "__main__": 7, "matter": 7, "script": [7, 63], "appli": [8, 20, 21, 29, 40, 47, 57], "element": [8, 9, 11, 21, 25, 29, 30, 35, 42, 49], "ani": [8, 42, 63, 65, 67], "true": [8, 11, 19], "inter": 8, "ar": [8, 18, 23, 39, 42, 68], "filter": [8, 21, 31, 34, 47, 62], "evalu": [8, 56, 58], "map": [8, 29, 60, 62], "each": [8, 29, 35, 40], "sort": [8, 36, 64], "tupl": 8, "first": 8, "second": [8, 66], "random": [9, 40, 50], "choic": 9, "randomli": 9, "select": [9, 33, 34, 35], "weight": [9, 52], "sampl": [9, 40], "heapq": 9, "n": [9, 25, 33, 40], "interact": [10, 45, 60, 63], "set": [10, 47, 58], "intersect": 10, "differ": [10, 11, 21, 35, 39, 40, 42, 53, 58, 62, 73], "turn": [11, 32, 35, 40, 42], "zip": [11, 21], "associ": 11, "order": [11, 18, 36, 39], "unzip": 11, "append": [11, 47], "extend": [11, 13], "unpack": 13, "perform": [14, 47, 58, 59, 64], "floor": 14, "divis": 14, "forward": [14, 29], "slash": 14, "fraction": 14, "numer": 14, "result": 14, "decim": [14, 16], "format": [14, 16, 38, 54], "confirm": 14, "whether": [14, 39], "Is": [14, 21, 52], "modulu": 14, "switch": [], "structur": [15, 18, 49, 51], "pattern": [15, 37, 62], "match": [15, 16, 25, 48, 54, 62], "10": [11, 15], "x": [15, 27], "y": [15, 27], "walru": 15, "express": [15, 16, 21, 34, 47, 62], "fine": 15, "grain": 15, "traceback": [15, 67], "11": 15, "control": [16, 53, 58, 73], "print": [16, 26, 38, 67], "f": 16, "pad": 16, "zero": 16, "enhanc": [2, 6, 15, 16, 30, 48, 56], "comma": 16, "debug": [16, 67, 73], "equal": [16, 35, 39, 42, 58], "sign": 16, "substr": [16, 37], "re": 16, "sub": 16, "replac": [16, 29, 33, 42, 54, 68], "regular": [16, 62], "split": [16, 25, 29, 48], "charact": 16, "multilin": 16, "difflib": 16, "sequencematch": 16, "detect": [16, 59, 60, 68], "almost": 16, "similar": [16, 39, 48, 53], "articl": [16, 54], "get_close_match": 16, "best": [16, 46, 47, 49], "certain": [16, 35, 42], "word": [16, 54, 57], "util": 17, "librari": [17, 45, 47, 58, 59, 68], "collect": 18, "count": [18, 34, 35], "occurr": 18, "namedtupl": 18, "lightweight": [18, 68], "mang": 18, "defaultdict": 18, "return": [6, 18, 32, 48], "avail": 18, "ordereddict": 18, "chainmap": 18, "combin": [18, 20, 21, 30, 58], "unit": [18, 56, 58, 62, 73], "normal": 19, "frozen": 19, "read": [19, 31, 33, 45, 66, 76], "post": 19, "init": 19, "functool": 20, "partial": 20, "gener": [20, 21, 50, 54, 58, 59, 60, 63, 65, 68, 73], "singledispatch": 20, "current": [20, 23, 29, 35], "reduc": [20, 32, 54], "cumul": [20, 35], "itertool": 21, "through": 21, "pair": 21, "product": [21, 52], "starmap": 21, "compress": 21, "boolean": [21, 34], "groupbi": [21, 40], "group": [21, 25, 33, 35, 40], "zip_longest": 21, "length": [21, 42], "dropwhil": 21, "drop": [21, 48, 60], "until": 21, "fals": [21, 52], "itemgett": 22, "pathlib": 23, "file": [23, 33, 46, 47, 55, 58, 64, 65, 66, 68, 73], "access": [23, 33, 35, 62], "home": 23, "parent": 23, "path": 23, "rel": 23, "same": [23, 58, 73], "pydash": 25, "work": [25, 33, 37, 45, 56, 58, 59], "flatten": [25, 42], "flatten_deep": 25, "deepli": 25, "chunk": [25, 31], "style": [25, 38, 60], "chain": [25, 29], "custom": [25, 30, 48], "plant": 25, "sympi": 26, "motiv": 26, "what": [26, 74], "basic": [26, 52], "symbol": 26, "equat": [26, 73], "expand": [26, 54], "factor": 26, "simplifi": [8, 15, 24, 26, 45, 47, 51, 52, 56, 58, 59, 62, 67], "solv": [26, 48], "substitut": 26, "trigonometr": 26, "deriv": 26, "integr": [2, 26, 45, 51, 52, 73], "limit": [26, 68], "special": 26, "latex": [26, 38, 42, 63], "callabl": 27, "specifi": [27, 30, 31], "input": [27, 58], "hint": 27, "annot": [27, 49, 60, 68], "metadata": [27, 45, 52], "typehint": 27, "final": 27, "overridden": 27, "liter": 27, "possibl": [27, 58], "typevar": 27, "flexibl": [27, 59], "context": 27, "depend": [27, 65], "panda": [28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 45, 47, 50, 56, 57, 58, 67], "chang": [29, 35, 42, 59, 68], "datafram": [29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 47, 48, 49, 50, 56, 57, 58], "pipe": [29, 62], "column": [29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 42, 56, 59], "elementwis": 29, "seri": [29, 33, 34, 35, 37, 40, 52, 59], "explod": 29, "transform": [29, 34, 40, 47, 48, 62], "row": [29, 30, 33, 34, 35, 36, 37, 40, 42], "fill": 29, "previou": [29, 33], "most": 29, "frequent": 29, "categori": [29, 40, 48, 58], "encod": [29, 48], "categor": [29, 32, 36, 48, 49], "rais": 29, "combine_first": 30, "null": [30, 62], "df": [30, 34, 35], "suffix": 30, "includ": [30, 32], "insert": 30, "Into": [30, 40, 49, 65], "locat": [30, 49, 50, 60], "leverag": [31, 56, 59], "pyarrow": [31, 32, 45], "fix": 31, "unnam": 31, "0": [31, 32, 33], "csv": [31, 33, 45, 47], "websit": [31, 68], "divid": 31, "html": 31, "tabl": [31, 40, 45, 47, 48, 63], "mode": [31, 47], "manipul": [32, 37, 40, 62], "select_dtyp": 32, "subset": [32, 34], "exclud": [32, 34], "Their": [32, 34, 49], "dtype": 32, "infer_object": 32, "sai": 32, "goodby": 32, "convers": 32, "parse_d": [31, 33], "convert": [33, 54, 59, 62], "dateoffset": 33, "interv": [33, 35, 42, 52, 59], "timestamp": 33, "roll": 33, "averag": 33, "datapoint": 33, "grouper": 33, "specif": [33, 36, 42, 58, 68], "frequenc": [33, 48, 54, 60], "dt": 33, "within": [33, 35, 73], "year": 33, "rang": 33, "reindex": 33, "befor": 33, "after": [33, 58, 68], "resampl": 33, "shift": [33, 35], "period": 33, "isin": 34, "contain": [34, 35, 37, 62], "queri": [34, 47, 54, 56], "nan": 34, "clip": 34, "outlier": 34, "loc": 35, "iloc": 35, "pd": 35, "pct_chang": 35, "percentag": 35, "prior": 35, "diff": 35, "take": [35, 42], "numpi": [35, 41, 42, 62], "arrai": [32, 35, 42, 56, 62], "to_dict": 35, "corrwith": 35, "comput": [35, 40, 59], "pairwis": 35, "correl": [35, 48, 60], "cut": 35, "bin": 35, "discret": 35, "qcut": 35, "size": [35, 40], "cumsum": 35, "sum": 35, "over": [2, 35, 40, 42, 50, 52, 58], "cummax": 35, "maximum": 35, "set_categori": 36, "str": 37, "text": [37, 38, 49, 52, 54, 60, 63], "startswith": 37, "highlight": 38, "easier": [38, 56], "analysi": [38, 52, 58, 59, 64], "color": 38, "background": 38, "gradient": 38, "displai": [38, 60, 73], "cell": 38, "to_markdown": 38, "markdown": [38, 68], "test": [39, 42, 50, 52, 54, 56, 58, 73], "assert_fram": 39, "agg": 40, "aggreg": 40, "pivot_t": 40, "pivot": 40, "melt": 40, "unpivot": 40, "crosstab": 40, "cross": [40, 59], "tabul": 40, "stack": 40, "align": 40, "ravel": 42, "np": 42, "squeez": 42, "remov": [42, 64, 65], "ax": 42, "posit": 42, "argsort": 42, "rank": 42, "where": [42, 68], "linspac": 42, "evenli": 42, "assert_almost_equ": 42, "up": [42, 47, 57], "precis": 42, "scienc": [44, 53], "tool": [44, 46, 47, 53, 54, 57, 59, 61, 63, 65, 67], "sql": [45, 53, 56], "dynam": [45, 58], "templat": 45, "fuguesql": 45, "spark": [45, 47, 56, 59], "dask": [45, 47], "sqlmodel": 45, "databas": [45, 58], "sqlfluff": 45, "linter": 45, "auto": [45, 59], "formatt": [45, 73], "postgresml": 45, "machin": [45, 52, 68], "learn": [45, 48, 52, 59, 68], "postgresql": [45, 58], "duckdb": 45, "sqlpars": [], "extract": [45, 49, 50, 51, 54, 59, 62, 63], "compon": [45, 49], "hard": 46, "hydra": 46, "dotenv": [], "load": 47, "secret": [], "inform": [46, 54, 73], "env": 46, "docopt": 46, "beauti": [46, 67], "command": [46, 63, 67, 68, 73], "interfac": [46, 59, 63], "document": 46, "tqdm": 47, "progress": [47, 58, 67], "bar": [47, 58, 67], "pandarallel": 47, "simpl": [47, 53, 58], "parallel": 47, "pandasai": 47, "gain": 47, "insight": 47, "ai": [47, 48, 54, 73], "fugu": 47, "engin": [47, 48, 54, 59], "version": [47, 53, 73], "delta": 47, "lake": 47, "partit": 47, "overwrit": 47, "scan": 47, "mismatch": [47, 48, 58], "polar": 47, "blaze": 47, "fast": [47, 52, 54, 59], "process": [21, 47, 54, 56], "12x": 47, "lazi": [47, 52, 56], "har": [47, 54, 59], "stratifi": 48, "fashion": 48, "scikit": [48, 52, 59], "strategi": [48, 59], "prevent": [11, 48, 52], "leakag": [48, 52], "rare": 48, "label": [48, 58], "dirti": [48, 58], "dirty_cat": 48, "fuzzi": 48, "snorkel": 48, "programmat": 48, "build": [48, 49, 52, 54, 63], "train": [48, 58, 59], "sketch": 48, "assist": 48, "understand": [48, 59], "content": [48, 68], "distfit": 49, "theoret": 49, "distribut": [49, 52, 53, 56], "geopi": 49, "fastai": [49, 57, 59], "cont_cat_split": 49, "continu": 49, "cardin": 49, "patsi": 49, "yarl": 49, "url": 49, "pigeon": 49, "quickli": [49, 57], "jupyt": [49, 60, 70, 73], "notebook": [49, 60, 68, 70, 73], "probablepeopl": 49, "pars": [49, 62], "unstructur": 49, "supercharg": [49, 52], "pdf": [49, 63], "pypdf": 49, "faker": 50, "fake": 50, "silli": 50, "produc": [50, 67], "user": 50, "fetch_openml": 50, "openml": 50, "autoscrap": 50, "autom": [50, 59, 66, 68], "web": [50, 54, 55], "scrape": 50, "reader": 50, "variou": 50, "internet": 50, "sourc": 50, "directli": 50, "pytrend": 50, "trend": 50, "keyword": [6, 50, 54], "googl": [50, 55], "search": [50, 54], "snscrape": 50, "social": [50, 54], "network": 50, "servic": [50, 58], "datacommon": 50, "statist": [50, 54, 60], "about": [50, 73, 74], "median": 50, "incom": 50, "california": 50, "peopl": 50, "u": 50, "robberi": 50, "people_also_ask": 50, "wrapper": 50, "also": 50, "ask": 50, "facebook": 50, "public": 50, "page": [50, 66], "api": [50, 56, 60], "languag": [51, 54], "model": [51, 52, 54, 57, 58, 59, 60], "llm": [51, 52, 58], "causalimpact": 52, "causal": [52, 59], "relat": [52, 58], "event": 52, "chatgpt": 52, "pipelin": [48, 52, 67], "gridsearchcv": 52, "scale": [52, 59], "squar": 52, "rmse": 52, "sklearn": [52, 59], "mean_squared_error": 52, "modelkit": 52, "ml": [52, 57, 58, 63], "system": 52, "decompos": 52, "high": [52, 60], "dimension": [52, 60], "three": 52, "dimens": [52, 54, 60], "visual": [52, 54, 60, 65, 67], "import": [52, 64, 65, 68, 73], "yellowbrick": 52, "valid": [24, 52, 58, 59], "curv": 52, "determin": 52, "estim": [52, 54, 59], "underfit": 52, "overfit": 52, "mlxtend": 52, "plot": [52, 60], "decis": [52, 60], "region": 52, "classifi": 52, "deepcheck": [52, 58], "bias": 52, "track": 52, "imbalanc": 52, "deal": 52, "predict": [52, 59, 68], "mapi": 52, "mlforecast": 52, "scalabl": 52, "mlem": 52, "captur": [52, 60], "manag": [45, 53, 65, 73], "dvc": 53, "project": [53, 65], "sweetviz": 53, "quadrat": 53, "speadsheet": 53, "whylog": 53, "log": [52, 53, 58, 67], "made": [52, 53, 56, 59], "easi": [52, 53, 59], "fluke": 53, "easiest": [53, 60], "move": 53, "around": 53, "natur": 54, "textblob": 54, "sumi": 54, "summar": [54, 66], "spacy_streamlit": 54, "app": 54, "textaci": 54, "contigu": 54, "sequenc": 54, "preprocess": [48, 54], "texthero": 54, "wordfreq": 54, "36": 54, "newspaper3k": 54, "questgen": 54, "question": 54, "ninja": 54, "lump": 54, "togeth": 54, "textstat": 54, "rapidfuzz": 54, "rapid": [52, 54], "checklist": 54, "nlp": 54, "top2vec": 54, "quick": 54, "topic": 54, "english": 54, "contract": 54, "inflect": 54, "plural": 54, "singular": 54, "indefinit": 54, "flashtext": 54, "sentenc": [], "ekphrasi": 54, "media": 54, "chroma": 54, "lightn": 54, "solut": [47, 54], "embed": 54, "share": [55, 58], "download": [55, 66, 68], "datapan": 55, "publish": 55, "gdown": 55, "drive": 55, "pyserd": 55, "effortless": 55, "serial": 55, "deseri": 55, "dataclass": [15, 55], "itsdanger": 55, "safe": [53, 55], "trust": 55, "untrust": 55, "environ": [55, 65], "back": 55, "df_shrink": 57, "shrink": 57, "swifter": 57, "23": 57, "faster": [47, 57], "pyinstrument": 57, "profil": [57, 67], "coval": 57, "resum": 58, "break": 58, "fail": 58, "descript": [58, 63], "short": 58, "benchmark": 58, "fixtur": 58, "mark": 58, "parametr": 58, "twice": 58, "id": 58, "case": 58, "onc": [45, 58], "per": 58, "session": 58, "skipif": 58, "skip": 58, "met": 58, "xfail": 58, "expect": [58, 74], "verifi": 58, "repeat": 58, "sugar": 58, "show": 58, "failur": [58, 68], "instantli": 58, "step": 58, "pick": 58, "run": [45, 58, 68, 73], "unstag": 58, "git": [58, 66], "setup": 58, "freezegun": 58, "freez": 58, "simul": 58, "extern": [51, 58], "mock": 58, "pyfakef": [], "pandera": 58, "deepdiff": 58, "deep": [58, 68], "assert": 58, "hypothesi": 58, "conflict": 58, "leab": 58, "ab": 58, "incorpor": 58, "suit": 58, "maintain": 58, "accuraci": [51, 58], "docstr": [58, 64], "exampl": 58, "doctest": 58, "deepev": 58, "datefind": 59, "automat": [59, 60, 64, 68], "add_datepart": 59, "relev": [51, 59], "maya": 59, "trace": 59, "unevenli": 59, "holidai": 59, "workalendar": 59, "dai": 59, "pmdarima": 59, "r": 59, "arima": 59, "power": 59, "seaborn": 60, "matplotlib": 60, "graphviz": 60, "flowchart": 60, "idea": 60, "folium": 60, "dtreeviz": 60, "interpret": [54, 60], "tree": [60, 63], "hiplot": 60, "missingno": 60, "dendogram": 60, "venn": 60, "diagram": 60, "squarifi": 60, "treemap": 60, "umap": 60, "reduct": 60, "evid": 60, "drift": 60, "mermaid": 60, "flow": 60, "chart": 60, "pretti": 60, "confus": 60, "matrix": 60, "matplotx": 60, "extens": [2, 60], "ipysankeywidget": 60, "ipython": [60, 68, 73], "sankei": 60, "widget": 60, "ipyvizzu": 60, "anim": [60, 63], "eas": [60, 66], "stori": 60, "present": 60, "lux": 60, "intellig": 60, "discoveri": 60, "signific": 60, "adjust": 60, "blox": 60, "attract": 60, "lovelyplot": 60, "nice": 60, "figur": 60, "gif": 60, "token": 60, "corpora": 60, "prettymap": 60, "paint": 60, "vizro": 60, "modular": [2, 56, 60], "applic": [60, 65], "cool": 61, "altern": 62, "box": 62, "dot": 62, "notat": 62, "modul": [62, 65], "shorter": 62, "inflix": [], "pregex": 62, "human": [62, 63], "bracket": 62, "pampi": 62, "dictdiff": 62, "unyt": 62, "asynchron": 62, "prefect": [62, 68], "output": [51, 63], "strip": 63, "pyfiglet": 63, "uniqu": 63, "letter": 63, "out": [56, 63], "ordinari": 63, "fire": 63, "cli": [63, 66], "typer": 63, "few": 63, "view": [56, 63, 67], "rich": [63, 67], "latexify_pi": 63, "math": [63, 73], "manimml": 63, "common": 63, "concept": 63, "review": 64, "isort": 64, "1": 64, "interrog": 64, "mypi": 64, "checker": [64, 73], "refurb": 64, "refurbish": 64, "modern": [64, 68], "codebas": 64, "erad": 64, "junk": 64, "comment": 64, "pydant": [24, 64], "enforc": [47, 64], "runtim": [64, 68], "perfplot": 64, "snippet": 64, "analyz": [54, 64], "vultur": 64, "dead": 64, "virtualenv": 65, "clone": 65, "virtual": 65, "pip": [65, 66], "autoremov": 65, "packag": [65, 73], "Its": 65, "unus": 65, "pipreq": 65, "txt": [65, 73], "pydep": 65, "poetri": 65, "pyinstal": 65, "bundl": 65, "singl": [6, 65], "github": 66, "bring": 66, "termin": 66, "pull": 66, "branch": 66, "wget": 66, "github1": 66, "browser": 66, "astral": 66, "organ": [58, 66, 68], "star": 66, "instal": 66, "e": 66, "fork": 66, "repositori": 66, "open": [2, 66, 68], "local": 66, "gpt": 66, "commit": 66, "request": 66, "inspect": 67, "report": 67, "consol": 67, "loguru": 67, "icecream": 67, "again": 67, "heartrat": 67, "program": 67, "real": [48, 67], "pyheat": 67, "heatmap": 67, "snoop": [67, 73], "smart": 67, "hyperfin": 67, "timelin": 67, "workflow": 68, "schedul": 68, "At": 68, "notifi": 68, "send": 68, "desktop": 68, "notif": 68, "finish": 68, "sound": 68, "knockknock": 68, "receiv": 68, "email": 68, "makefil": 68, "notedown": 68, "vice": 68, "versa": 68, "removestar": 68, "explicit": 68, "monkeytyp": 68, "whereami": 68, "you": [68, 74], "watchfil": 68, "rerun": 68, "retri": 68, "nbdime": 73, "reus": 73, "across": 73, "watermark": 73, "hardwar": 73, "Being": 73, "ipytest": 73, "nbqa": 73, "thi": [74, 76], "book": [74, 76], "author": 74, "support": 48, "magent": 51, "prompt": 51, "friendli": 56, "big": 56, "make_column_transform": 48, "point": [6, 59], "falsifi": 58, "mllib": 52, "rocketri": 68, "vector": [29, 56], "misspel": 48, "world": 48, "store": [46, 53], "sensit": 46, "secur": 46, "pytub": 68, "youtub": 68, "video": 68, "enum": 2, "aeon": 59, "ultim": 59, "forecast": 59, "classif": 59, "ruptur": 59, "non": 59, "stationari": 59, "signal": 59, "embrac": 2, "close": 2, "principl": 2, "mixin": 2, "pyspark": 56, "reusabl": 56, "parameter": 56, "seamless": 73, "creation": 73, "lab": 73, "strict": 11, "loss": 11, "outlin": 51, "ensur": [2, 51], "consist": 51, "tmp_path": 58, "temporari": [56, 58], "prototyp": 52, "qualiti": 47, "constraint": 47, "testbook": 73, "gluont": 59, "probabilist": 59, "mayb": 62, "tfcausalimpact": 59, "relationship": 59, "galat": 54, "massiv": 54, "5": 56, "safetensor": 53, "tensor": 53, "pendulum": 59, "quantstat": 59, "stock": 59, "udf": 56, "kneed": 59, "knee": 59, "functiontransform": 48, "robust": [48, 59], "great": 63, "scientif": 63, "look": 63, "islic": 21, "stream": [21, 47], "recip": [50, 54], "scraper": 50, "neuralforecast": 59, "streamlin": 59, "neural": 59, "familiar": 59, "syntax": [47, 59], "mirascop": 51, "field": 24, "maxim": 51, "pre": 59, "timegpt": 59, "num2word": 54, "later": 56, "statsforecast": 59, "pandas_udf": 56, "standard": 56, "autogluon": 52, "accur": 52, "magika": 68, "tsfresh": 59, "beyond": [54, 59], "tsmoothi": 59, "exponenti": 59, "smooth": 59, "drag": 60, "pygwalk": 60, "backtest": 59, "assess": 59, "trade": 59, "effortlessli": 59, "slide": 59, "window": 59, "shuffl": 56, "camelot": 63, "scientist": 47, "navig": 73, "top": 73, "magic": 73, "hierarch": 59, "bertop": 54, "bert": 54, "argpars": 63, "click": 63, "mlflow": 52, "pickl": 52, "eleg": 62, "fastapi": 52, "semant": 54, "wat": 67, "explor": 67, "unittest": 58, "sqlglot": 45, "anywher": 45}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinxcontrib.bibtex": 9, "sphinx": 56}}) \ No newline at end of file +Search.setIndex({"docnames": [".pytest_cache/README", "Chapter1/Chapter1", "Chapter1/class", "Chapter1/code_speed", "Chapter1/datetime", "Chapter1/dictionary", "Chapter1/function", "Chapter1/good_practices", "Chapter1/list/apply_functions_to_elements", "Chapter1/list/get_elements", "Chapter1/list/interaction_between_2_lists", "Chapter1/list/join_iterable", "Chapter1/list/list", "Chapter1/list/unpack_iterables", "Chapter1/number", "Chapter1/python_new_features", "Chapter1/string", "Chapter2/Chapter2", "Chapter2/collections", "Chapter2/dataclasses", "Chapter2/functools", "Chapter2/itertools", "Chapter2/operator", "Chapter2/pathlib", "Chapter2/pydantic", "Chapter2/pydash", "Chapter2/sympy", "Chapter2/typing", "Chapter3/Chapter3", "Chapter3/change_values", "Chapter3/combine_dataframes", "Chapter3/create_dataframe", "Chapter3/data_types", "Chapter3/date_time", "Chapter3/filter", "Chapter3/get_values", "Chapter3/sort_dataframe", "Chapter3/string", "Chapter3/style_dataframe", "Chapter3/testing", "Chapter3/transform_dataframe", "Chapter4/Chapter4", "Chapter4/Numpy", "Chapter5/.pytest_cache/README", "Chapter5/Chapter5", "Chapter5/SQL", "Chapter5/best_python_practice_tools", "Chapter5/better_pandas", "Chapter5/feature_engineer", "Chapter5/feature_extraction", "Chapter5/get_data", "Chapter5/llm", "Chapter5/machine_learning", "Chapter5/manage_data", "Chapter5/natural_language_processing", "Chapter5/sharing_downloading", "Chapter5/spark", "Chapter5/speed_up_code", "Chapter5/testing", "Chapter5/time_series", "Chapter5/visualization", "Chapter6/Chapter6", "Chapter6/alternative_approach", "Chapter6/better_outputs", "Chapter6/code_review", "Chapter6/env_management", "Chapter6/git_github", "Chapter6/logging_debugging", "Chapter6/workflow_automation", "Chapter7/.pytest_cache/README", "Chapter7/Chapter7", "Chapter7/example_notebook", "Chapter7/example_notebook2", "Chapter7/jupyter_notebook", "README", "gpt_scripts/.pytest_cache/README", "how_to_read"], "filenames": [".pytest_cache/README.md", "Chapter1/Chapter1.md", "Chapter1/class.ipynb", "Chapter1/code_speed.ipynb", "Chapter1/datetime.ipynb", "Chapter1/dictionary.ipynb", "Chapter1/function.ipynb", "Chapter1/good_practices.ipynb", "Chapter1/list/apply_functions_to_elements.ipynb", "Chapter1/list/get_elements.ipynb", "Chapter1/list/interaction_between_2_lists.ipynb", "Chapter1/list/join_iterable.ipynb", "Chapter1/list/list.md", "Chapter1/list/unpack_iterables.ipynb", "Chapter1/number.ipynb", "Chapter1/python_new_features.ipynb", "Chapter1/string.ipynb", "Chapter2/Chapter2.md", "Chapter2/collections.ipynb", "Chapter2/dataclasses.ipynb", "Chapter2/functools.ipynb", "Chapter2/itertools.ipynb", "Chapter2/operator.ipynb", "Chapter2/pathlib.ipynb", "Chapter2/pydantic.ipynb", "Chapter2/pydash.ipynb", "Chapter2/sympy.ipynb", "Chapter2/typing.ipynb", "Chapter3/Chapter3.md", "Chapter3/change_values.ipynb", "Chapter3/combine_dataframes.ipynb", "Chapter3/create_dataframe.ipynb", "Chapter3/data_types.ipynb", "Chapter3/date_time.ipynb", "Chapter3/filter.ipynb", "Chapter3/get_values.ipynb", "Chapter3/sort_dataframe.ipynb", "Chapter3/string.ipynb", "Chapter3/style_dataframe.ipynb", "Chapter3/testing.ipynb", "Chapter3/transform_dataframe.ipynb", "Chapter4/Chapter4.md", "Chapter4/Numpy.ipynb", "Chapter5/.pytest_cache/README.md", "Chapter5/Chapter5.md", "Chapter5/SQL.ipynb", "Chapter5/best_python_practice_tools.ipynb", "Chapter5/better_pandas.ipynb", "Chapter5/feature_engineer.ipynb", "Chapter5/feature_extraction.ipynb", "Chapter5/get_data.ipynb", "Chapter5/llm.ipynb", "Chapter5/machine_learning.ipynb", "Chapter5/manage_data.ipynb", "Chapter5/natural_language_processing.ipynb", "Chapter5/sharing_downloading.ipynb", "Chapter5/spark.ipynb", "Chapter5/speed_up_code.ipynb", "Chapter5/testing.ipynb", "Chapter5/time_series.ipynb", "Chapter5/visualization.ipynb", "Chapter6/Chapter6.md", "Chapter6/alternative_approach.md", "Chapter6/better_outputs.ipynb", "Chapter6/code_review.ipynb", "Chapter6/env_management.ipynb", "Chapter6/git_github.ipynb", "Chapter6/logging_debugging.ipynb", "Chapter6/workflow_automation.ipynb", "Chapter7/.pytest_cache/README.md", "Chapter7/Chapter7.md", "Chapter7/example_notebook.ipynb", "Chapter7/example_notebook2.ipynb", "Chapter7/jupyter_notebook.ipynb", "README.md", "gpt_scripts/.pytest_cache/README.md", "how_to_read.md"], "titles": ["pytest cache directory", "2. Python Built-in Methods", "2.6. Classes", "2.8. Code Speed", "2.7. Datetime", "2.4. Dictionary", "2.5. Function", "2.9. Good Python Practices", "2.3.5. Apply Functions to Elements in a List", "2.3.1. Get Elements", "2.3.4. Interaction Between 2 Lists", "2.3.3. Join Iterables", "2.3. List", "2.3.2. Unpack Iterables", "2.2. Number", "2.10. New Features in Python", "2.1. String", "3. Python Utility Libraries", "3.1. Collections", "3.7. Data Classes", "3.3. Functools", "3.2. Itertools", "3.6. Operator", "3.9. pathlib", "3.10. Pydantic", "3.4. Pydash", "3.5. SymPy", "3.8. Typing", "4. Pandas", "4.1. Change Values", "4.6. Combine Multiple DataFrames", "4.5. Create a DataFrame", "4.8. Manipulate a DataFrame Using Data Types", "4.3. Work with Datetime", "4.7. Filter Rows or Columns", "4.2. Get Certain Values From a DataFrame", "4.9. Sort Rows or Columns of a DataFrame", "4.10. Work with String", "4.11. Style a DataFrame", "4.12. Test", "4.4. Transform a DataFrame", "5. NumPy", "5.1. NumPy", "pytest cache directory", "6. Data Science Tools", "6.14. SQL Libraries", "6.11. Tools for Best Python Practices", "6.12. Better Pandas", "6.2. Feature Engineer", "6.1. Feature Extraction", "6.3. Get Data", "6.16. Large Language Model (LLM)", "6.5. Machine Learning", "6.4. Manage Data", "6.6. Natural Language Processing", "6.8. Sharing and Downloading", "6.15. PySpark", "6.9. Tools to Speed Up Code", "6.13. Testing", "6.7. Time Series", "6.10. Visualization", "7. Cool Tools", "7.1. Alternative Approach", "7.5. Better Outputs", "7.3. Code Review", "7.7. Environment Management", "7.6. Git and GitHub", "7.4. Logging and Debugging", "7.2. Workflow Automation", "pytest cache directory", "8. Jupyter Notebook", "<no title>", "<no title>", "8.1. Jupyter Notebook", "What Should You Expect From This Book?", "pytest cache directory", "1. How to Read This Book"], "terms": {"thi": [0, 1, 2, 3, 5, 6, 7, 9, 13, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 73, 75], "contain": [0, 27, 32, 43, 47, 48, 50, 54, 58, 59, 65, 67, 68, 69, 73, 75], "data": [0, 3, 4, 5, 7, 15, 20, 23, 28, 29, 34, 43, 46, 57, 61, 62, 63, 65, 66, 67, 68, 69, 70, 74, 75], "from": [0, 2, 3, 4, 7, 10, 13, 14, 15, 16, 18, 19, 20, 21, 24, 25, 26, 27, 29, 30, 32, 33, 39, 43, 46, 48, 53, 56, 57, 58, 60, 62, 65, 67, 69, 73, 75, 76], "s": [0, 2, 4, 15, 19, 23, 26, 29, 31, 33, 36, 38, 43, 45, 46, 53, 54, 55, 56, 58, 60, 62, 63, 65, 68, 69, 75], "plugin": [0, 43, 58, 69, 73, 75], "which": [0, 5, 7, 8, 16, 19, 25, 27, 29, 31, 32, 35, 42, 43, 45, 47, 48, 49, 51, 52, 53, 54, 56, 58, 59, 60, 62, 64, 65, 67, 69, 73, 75], "provid": [0, 2, 4, 6, 15, 16, 24, 26, 32, 34, 43, 45, 47, 50, 51, 52, 53, 54, 55, 58, 59, 60, 62, 63, 69, 73, 75], "lf": [0, 43, 48, 69, 75], "ff": [0, 43, 69, 75], "option": [0, 9, 18, 29, 31, 38, 43, 45, 46, 47, 49, 50, 52, 54, 57, 62, 63, 65, 68, 69, 73, 75], "well": [0, 2, 43, 48, 52, 54, 60, 66, 69, 75], "fixtur": [0, 43, 56, 59, 69, 75], "do": [0, 4, 9, 14, 15, 16, 22, 25, 26, 27, 29, 31, 34, 38, 43, 45, 47, 48, 50, 52, 54, 57, 58, 59, 60, 62, 63, 65, 67, 68, 69, 74, 75], "commit": [0, 43, 45, 48, 51, 53, 58, 64, 69, 73, 75], "version": [0, 26, 36, 43, 46, 48, 50, 52, 54, 58, 59, 60, 62, 64, 65, 67, 68, 69, 75], "control": [0, 2, 7, 43, 46, 51, 60, 69, 75], "see": [0, 3, 7, 16, 26, 29, 31, 43, 46, 47, 48, 50, 52, 54, 57, 58, 59, 60, 63, 65, 67, 68, 69, 73, 75], "doc": [0, 23, 29, 43, 46, 52, 54, 60, 68, 69, 73, 75], "more": [0, 2, 8, 9, 13, 15, 18, 20, 24, 32, 35, 38, 40, 42, 43, 45, 46, 47, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 66, 67, 68, 69, 73, 74, 75], "inform": [0, 7, 24, 25, 43, 47, 48, 49, 50, 51, 52, 60, 65, 67, 68, 69, 75], "chapter": [1, 17, 28, 41, 44, 61, 70], "cover": [1, 17, 28, 40, 44, 46, 47, 48, 50, 53, 54, 55, 57, 60, 61, 62, 64, 68, 70, 73], "some": [1, 2, 3, 7, 11, 15, 18, 20, 21, 22, 24, 25, 26, 27, 28, 29, 31, 35, 40, 41, 44, 46, 48, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 61, 62, 63, 64, 66, 68, 70, 73, 74], "us": [1, 3, 8, 9, 10, 11, 13, 15, 18, 19, 20, 22, 23, 26, 28, 35, 36, 37, 38, 39, 41, 44, 51, 52, 53, 54, 55, 56, 57, 59, 61, 63, 64, 65, 74, 76], "librari": [1, 18, 20, 21, 22, 23, 25, 26, 28, 48, 49, 50, 51, 52, 53, 54, 56, 57, 60, 62, 64, 65, 67, 70, 73, 74], "have": [2, 4, 5, 13, 15, 21, 25, 26, 27, 29, 31, 33, 38, 40, 47, 48, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "you": [2, 3, 4, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 73, 76], "ever": [2, 4, 7, 26, 31, 33, 38, 50, 57, 58, 60, 62, 63, 65, 67, 73], "had": [2, 32, 52, 54, 58, 59], "multipl": [2, 6, 15, 24, 27, 48, 50, 51, 52, 54, 59, 60, 62, 64, 67, 73, 74], "similar": [2, 20, 30, 47, 52, 54, 58, 59, 64, 67], "In": [2, 4, 5, 6, 7, 8, 9, 11, 14, 15, 16, 18, 19, 20, 21, 24, 27, 29, 30, 31, 32, 33, 34, 35, 39, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 64, 67, 68, 73], "code": [5, 8, 9, 11, 13, 14, 18, 19, 20, 25, 26, 27, 30, 31, 32, 33, 35, 37, 42, 47, 51, 53, 62, 65, 74, 76], "below": [2, 4, 5, 6, 7, 8, 9, 11, 14, 16, 18, 19, 20, 21, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 68, 73], "dachshund": [2, 19, 27, 50], "poodl": 2, "color": [2, 5, 19, 25, 48, 52, 53, 54, 55, 59, 60, 63, 67], "show_info": 2, "def": [2, 3, 6, 7, 8, 9, 14, 15, 18, 19, 20, 21, 25, 27, 29, 34, 38, 40, 46, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 72, 73], "__init__": [2, 19, 24, 27, 57, 58, 62, 64, 65], "self": [2, 19, 27, 34, 39, 52, 58, 59, 62, 64, 67, 68], "str": [2, 3, 7, 8, 15, 16, 19, 24, 27, 29, 38, 40, 45, 47, 48, 50, 51, 55, 58, 59, 60, 63, 64, 67], "print": [2, 3, 4, 6, 7, 9, 10, 11, 13, 14, 15, 18, 20, 21, 23, 27, 29, 30, 31, 32, 34, 35, 40, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 62, 63, 64, 65, 68, 73], "f": [2, 3, 4, 6, 7, 9, 11, 15, 19, 20, 23, 25, 31, 32, 39, 40, 42, 45, 46, 47, 48, 50, 51, 52, 53, 54, 57, 58, 59, 60, 62, 63, 65, 67, 68, 73], "bim": [2, 15, 19, 24, 27], "black": [2, 19, 54, 59, 73], "If": [2, 3, 5, 6, 8, 9, 11, 13, 14, 16, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74, 76], "so": [2, 7, 19, 21, 27, 42, 47, 48, 50, 52, 54, 60, 62, 63, 65, 66, 68], "organ": [2, 18, 48, 51, 52, 54], "allow": [2, 3, 6, 9, 11, 14, 15, 16, 18, 21, 25, 26, 27, 29, 31, 33, 38, 40, 45, 46, 47, 48, 49, 50, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73, 74], "defin": [2, 6, 15, 31, 45, 47, 48, 49, 52, 55, 56, 58, 59, 62, 63, 64, 68], "parent": [2, 27, 57, 67], "child": 2, "all": [2, 10, 15, 16, 18, 21, 25, 26, 33, 40, 45, 46, 47, 48, 49, 50, 52, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 76], "super": [2, 66, 67], "make": [2, 5, 6, 13, 15, 20, 23, 24, 26, 27, 45, 46, 47, 48, 49, 50, 51, 52, 54, 58, 59, 60, 62, 64, 66, 67, 68, 73, 74], "its": [2, 3, 7, 16, 19, 25, 26, 32, 38, 45, 49, 50, 52, 54, 60, 63, 65, 67, 73], "we": [2, 3, 7, 13, 14, 16, 20, 25, 26, 27, 31, 32, 34, 45, 46, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 60, 68, 73], "dog": [2, 19, 24, 27, 48, 50, 54, 58, 60, 62, 67], "With": [2, 19, 20, 26, 32, 45, 49, 50, 51, 52, 53, 54, 56, 59, 60, 63, 65, 66, 67, 73], "avoid": [2, 6, 15, 25, 31, 47, 48, 58, 64, 65], "repeat": [2, 6, 7, 15, 25, 52, 54], "same": [2, 6, 7, 11, 13, 15, 16, 21, 22, 25, 30, 31, 34, 35, 40, 42, 48, 52, 54, 56, 57, 60, 62, 65, 67, 68], "piec": [2, 6, 7, 54, 57, 60, 74], "time": [2, 4, 6, 7, 9, 18, 21, 31, 32, 45, 46, 47, 51, 54, 60, 62, 63, 65, 66, 73], "type_": [2, 52], "type": [2, 5, 19, 24, 26, 34, 40, 45, 46, 47, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 73], "coco": 2, "brown": [2, 47, 50, 52], "learn": [2, 24, 26, 47, 49, 50, 54, 56, 58, 60], "about": [2, 3, 7, 13, 24, 46, 47, 48, 49, 52, 53, 54, 55, 56, 58, 59, 62, 63, 65, 66, 67, 68], "here": [2, 16, 37, 47, 49, 50, 52, 53, 54, 55, 56, 58, 60, 62, 63, 64, 66, 67, 68, 73], "sometim": [14, 19, 25, 29, 31, 38, 42, 48, 49, 52, 58, 59, 60, 64, 65, 66, 67, 68], "might": [2, 7, 14, 19, 25, 29, 32, 34, 38, 42, 46, 48, 49, 52, 54, 57, 58, 59, 60, 63, 64, 65, 66, 67, 68], "want": [2, 3, 4, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "differ": [2, 6, 7, 15, 16, 18, 27, 29, 32, 45, 47, 48, 49, 52, 54, 55, 56, 57, 59, 60, 64, 65, 68], "But": [25, 26, 54, 59], "those": [7, 10, 42, 48, 50, 51, 53, 54, 59, 67, 68, 73], "can": [2, 3, 4, 5, 6, 7, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 23, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 38, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74, 76], "slightli": [], "each": [3, 7, 9, 11, 18, 21, 25, 31, 39, 45, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 65, 67, 68, 74], "good": [6, 18, 25, 46, 48, 50, 54, 58, 64], "an": [2, 4, 5, 13, 14, 19, 20, 24, 25, 31, 32, 34, 38, 40, 45, 46, 47, 48, 51, 53, 56, 57, 58, 59, 62, 63, 64, 66, 67, 76], "one": [6, 7, 15, 16, 18, 21, 25, 26, 27, 29, 30, 31, 33, 34, 35, 37, 40, 42, 45, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 66, 67, 68, 73, 74], "The": [2, 5, 14, 15, 23, 25, 26, 29, 31, 32, 36, 37, 38, 40, 42, 46, 48, 50, 51, 52, 55, 56, 62, 63, 65, 66, 67, 68], "subclass": [2, 27, 62], "abc": [2, 27], "import": [2, 3, 4, 6, 7, 9, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 67, 71], "abstractmethod": 2, "anim": [50, 62], "name": [2, 5, 6, 15, 18, 19, 24, 25, 30, 33, 35, 39, 42, 45, 46, 47, 48, 50, 51, 52, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73], "make_sound": [], "pass": [2, 8, 18, 29, 45, 46, 47, 50, 52, 54, 58, 64, 65, 73], "sai": 68, "woof": 27, "cat": [2, 29, 34, 36, 45, 47, 48, 52, 56, 58, 60, 64], "meow": 60, "pepper": [5, 15, 19, 50, 54], "bella": [], "when": [2, 4, 5, 8, 14, 15, 16, 19, 21, 24, 25, 26, 27, 29, 34, 38, 40, 45, 46, 47, 50, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 73], "special": [48, 50, 53, 57], "anoth": [2, 7, 11, 14, 25, 26, 40, 47, 48, 50, 54, 58, 59, 60, 65, 68], "follow": [2, 6, 7, 15, 23, 29, 31, 32, 45, 47, 51, 52, 54, 56, 58, 59, 63, 64, 65, 66, 67, 68, 73], "exampl": [2, 3, 7, 14, 15, 21, 27, 29, 31, 32, 34, 35, 38, 40, 42, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 68, 73], "wholemilk": [], "repres": [13, 26, 29, 47, 52, 54, 67, 73], "specif": [7, 9, 24, 35, 45, 46, 47, 48, 50, 52, 57, 59, 60, 62, 63, 65], "milk": [50, 51, 54], "fat_cont": [], "float": [2, 6, 7, 14, 15, 21, 24, 27, 32, 34, 45, 51, 52, 58, 59, 62, 63, 64, 67, 68, 72, 73], "prepar": [51, 52, 54, 60, 67], "serv": [2, 47, 50, 67], "whole": [], "3": [2, 3, 6, 7, 8, 9, 13, 14, 16, 18, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 53, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 71, 73], "5": [2, 3, 4, 6, 7, 8, 9, 11, 14, 15, 16, 19, 20, 21, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "cream": [54, 62], "On": [24, 46, 47, 50, 52, 54, 57, 58], "other": [2, 7, 15, 19, 24, 33, 37, 39, 46, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 66, 68, 73, 74], "hand": [24, 47, 50, 59, 73], "form": [26, 40, 54], "ha": [2, 6, 14, 27, 31, 32, 45, 47, 48, 50, 52, 54, 55, 59, 60, 63, 67, 74], "relationship": [40, 60], "milktea": 51, "By": [2, 7, 31, 32, 40, 48, 50, 52, 54, 56, 58, 59, 64, 65], "enabl": [15, 21, 45, 47, 48, 51, 52, 53, 54, 56, 60, 62, 65, 68], "substitut": 45, "impact": [52, 58, 59], "reus": [6, 56, 58], "cake": [], "sugar_percentag": [], "sugar": [50, 54, 67], "milk_tea": [], "10": [2, 3, 6, 7, 8, 9, 16, 19, 21, 24, 27, 31, 33, 35, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "instanti": [2, 47, 52, 54, 58, 59, 60], "oper": [2, 13, 14, 27, 31, 33, 50, 53, 58, 59, 62, 64, 65, 67], "while": [2, 3, 6, 25, 27, 29, 35, 40, 45, 47, 48, 50, 51, 53, 56, 57, 58, 59, 60, 62, 63, 68], "doesn": [2, 21, 29, 48, 51, 63, 68], "t": [2, 13, 19, 20, 21, 25, 26, 27, 29, 45, 47, 48, 49, 50, 51, 52, 54, 58, 60, 62, 63, 65, 67, 68, 73], "altern": [2, 5, 25, 48, 52], "construct": [2, 47, 48, 52, 67], "from_csv": 2, "read": [2, 6, 13, 21, 23, 42, 47, 48, 50, 51, 54, 56, 58, 59, 62, 63], "csv": [2, 3, 7, 48, 54, 59, 60, 63, 66, 68], "file": [2, 3, 15, 21, 24, 27, 31, 38, 39, 42, 45, 52, 53, 54, 59, 60, 63, 67], "panda": [2, 3, 6, 7, 10, 39, 48, 49, 52, 53, 54, 55, 59, 60, 63, 64, 65, 71, 73, 74], "pd": [2, 3, 6, 7, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 45, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 64, 65, 67, 71, 73], "dataanalyz": 2, "analyz": [2, 16, 40, 45, 47, 59], "shape": [2, 31, 42, 47, 49, 52, 59, 60, 73], "classmethod": 2, "cl": 2, "csv_path": 2, "read_csv": [2, 7, 31, 33, 47, 48, 54, 59, 60], "return": [2, 3, 5, 7, 8, 9, 14, 15, 16, 19, 20, 21, 25, 27, 29, 31, 34, 35, 36, 38, 40, 47, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 72, 73], "datafram": [2, 3, 6, 7, 52, 53, 54, 55, 59, 60, 63, 64, 65, 67, 73], "1": [2, 3, 4, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 68, 71, 73], "2": [2, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 19, 20, 24, 25, 26, 27, 29, 30, 33, 34, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 51, 52, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 71, 73], "b": [2, 6, 7, 8, 11, 13, 14, 16, 18, 20, 21, 25, 29, 30, 31, 32, 33, 34, 35, 38, 40, 42, 45, 47, 48, 49, 52, 54, 56, 58, 60, 62, 63, 64, 65, 67, 68, 73], "4": [2, 3, 6, 7, 8, 9, 11, 13, 14, 15, 16, 18, 20, 21, 25, 26, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 71, 73], "6": [2, 3, 6, 7, 8, 11, 14, 16, 19, 20, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 73], "csv_file_path": 2, "default": [2, 16, 30, 31, 40, 45, 46, 47, 48, 52, 53, 56, 58, 60, 65, 73], "valu": [2, 6, 15, 16, 19, 20, 30, 31, 32, 39, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 60, 62, 63, 64, 67], "attribute_nam": 2, "simpli": [2, 19, 26, 29, 33, 42, 47, 48, 49, 50, 55, 57, 58, 60, 66, 67, 73, 76], "howev": [2, 6, 7, 11, 19, 21, 25, 34, 35, 45, 46, 52, 53, 56, 58, 59, 60, 62, 68, 73], "found": [2, 7, 16, 27, 45, 47, 48, 58, 60, 63, 65, 67, 76], "food": [2, 15, 18, 48, 54, 57, 62], "appl": [2, 5, 6, 8, 11, 15, 16, 18, 21, 22, 25, 27, 29, 30, 34, 35, 37, 40, 45, 47, 51, 52, 53, 54, 56, 58, 60, 62, 64], "red": [2, 5, 25, 38, 50, 52, 53, 63], "yellow": [2, 5, 48, 50, 53, 54, 60], "flavor": [2, 50, 52, 54, 62], "sweet": [2, 5, 25, 52, 58, 62], "attributeerror": [2, 6, 68], "traceback": [2, 5, 6, 7, 11, 19, 21, 24, 25, 34, 39, 42, 64, 68], "most": [2, 5, 6, 7, 11, 15, 19, 21, 24, 25, 26, 34, 39, 42, 45, 48, 52, 54, 62, 64, 67, 68], "recent": [2, 5, 6, 7, 11, 15, 19, 21, 24, 25, 34, 39, 42, 54, 64, 67, 68], "last": [2, 5, 6, 7, 11, 15, 19, 21, 24, 25, 27, 34, 39, 42, 48, 50, 58, 64, 67, 68, 73], "tmp": [2, 21, 34, 47, 67], "ipykernel_337430": 2, "3178150741": 2, "py": [2, 7, 15, 21, 24, 27, 29, 34, 36, 39, 42, 46, 52, 54, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "modul": [2, 15, 18, 19, 21, 22, 25, 27, 34, 50, 52, 57, 67, 68, 73], "dataload": 2, "data_dir": [2, 46], "data_load": 2, "my_data_dir": 2, "even": [2, 7, 8, 32, 52, 54, 58, 68, 73], "thei": [2, 3, 7, 29, 34, 39, 46, 50, 51, 52, 54, 56, 58, 59, 60, 62, 67, 73, 74], "ar": [2, 3, 5, 6, 7, 11, 13, 14, 16, 21, 27, 29, 30, 32, 33, 34, 35, 37, 45, 46, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 73, 74], "equal": [2, 26, 52, 65], "becaus": [2, 3, 5, 6, 7, 16, 21, 23, 26, 34, 50, 54, 58, 65, 68, 74], "store": [2, 3, 11, 19, 25, 32, 40, 47, 50, 52, 58, 59, 60, 62, 67], "separ": [2, 7, 11, 14, 29, 35, 45, 46, 47, 53, 58, 65, 67, 73], "locat": [2, 5, 15, 40, 48, 52, 53, 54, 58, 68], "To": [2, 3, 5, 6, 7, 8, 10, 11, 14, 16, 19, 21, 22, 25, 26, 29, 30, 31, 33, 34, 35, 37, 40, 42, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73], "how": [2, 4, 7, 14, 16, 25, 27, 30, 33, 34, 37, 39, 45, 46, 47, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 64, 65, 66, 67, 73], "should": [2, 24, 45, 46, 52, 54, 57, 58, 59, 60, 63, 65, 66, 67, 68, 73], "compar": [2, 4, 18, 32, 38, 45, 47, 52, 54, 56, 57, 58, 59, 60, 62, 64, 68, 73], "__eq__": [2, 19], "dog1": 2, "dog2": 2, "fals": [2, 3, 7, 8, 18, 31, 33, 34, 42, 45, 47, 48, 54, 55, 56, 58, 59, 60, 63, 64, 67, 68], "true": [2, 6, 7, 9, 14, 15, 18, 23, 24, 31, 32, 34, 35, 36, 39, 40, 42, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 64, 67, 68, 73], "access": [2, 7, 18, 22, 31, 37, 46, 47, 52, 54, 58, 74], "ani": [2, 6, 7, 34, 47, 48, 50, 57, 58, 59, 60, 64, 66, 68, 74, 76], "fit": [2, 47, 48, 49, 50, 52, 54, 58, 59, 60], "find": [2, 4, 7, 8, 26, 29, 46, 48, 53, 54, 60, 66, 67], "redund": [2, 7], "That": [2, 16, 19, 25, 26, 38, 46, 50, 52, 54, 57, 58, 59, 60, 63, 65, 66, 67, 68, 73, 76], "turn": [2, 5, 10, 25, 29, 31, 38, 50, 54, 68], "need": [2, 6, 7, 11, 15, 16, 18, 19, 20, 21, 22, 25, 45, 47, 48, 49, 50, 52, 53, 54, 55, 58, 59, 60, 65, 66, 67, 73], "staticmethod": 2, "now": [2, 7, 19, 23, 26, 27, 29, 31, 32, 34, 37, 47, 48, 52, 54, 58, 59, 60, 65, 66, 67, 68, 73], "re": [2, 6, 14, 20, 26, 27, 36, 47, 50, 52, 58, 59, 62, 64, 67, 68], "processtext": 2, "text_column": 2, "remove_url": 2, "sampl": [2, 29, 45, 47, 48, 51, 52, 56, 57, 58, 59, 60, 64, 67, 68, 73], "replac": [2, 7, 15, 25, 27, 37, 48, 49, 52, 56, 58, 59, 64, 66, 67], "url": [2, 7, 50, 54, 55, 62, 65, 73], "empti": [2, 5, 52, 58, 64, 66, 68], "space": [2, 16, 45, 48, 54, 67, 73], "sub": [2, 26, 31, 60, 65, 67], "r": [2, 16, 23, 47, 48, 52, 55, 62, 63, 68], "http": [2, 24, 29, 31, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 58, 59, 60, 62, 64, 65, 66, 68, 73], "text": [2, 7, 8, 16, 23, 45, 50, 51, 55, 58, 59, 62, 67, 68], "my": [2, 18, 23, 29, 33, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 58, 60, 62, 63, 65, 66, 67, 68, 73, 74], "favorit": [2, 46, 50], "page": [2, 31, 49, 52, 60, 63], "www": [2, 50, 54], "googl": [2, 48, 54, 59, 68, 76], "com": [2, 31, 34, 45, 47, 48, 49, 50, 54, 55, 59, 60, 62, 64, 66, 68, 73], "restrict": [2, 59], "extern": [2, 24, 73], "modif": 2, "outsid": [2, 18], "doubl": [2, 50, 56], "underscor": 2, "help": [2, 6, 32, 42, 45, 46, 47, 52, 54, 56, 58, 59, 60, 63, 67, 68, 73], "chanc": [2, 52, 59], "unintend": [2, 7], "alter": [2, 6, 47], "groceri": [2, 11, 27, 51], "item": [2, 7, 9, 13, 29, 34, 38, 48, 50, 51, 52, 54, 56, 58, 62, 68, 73], "price": [2, 5, 6, 7, 8, 11, 15, 16, 21, 25, 31, 33, 34, 35, 37, 38, 40, 45, 47, 48, 51, 52, 56, 58, 62, 64], "__price": 2, "get_pric": [2, 15, 25, 27, 62], "grocery_item": [2, 51], "99": [2, 15, 59, 63], "directli": [2, 6, 52, 59, 67, 68, 73, 76], "cell": [2, 5, 6, 7, 11, 19, 24, 39, 42, 50, 52, 59, 63, 64, 67, 68, 73], "line": [2, 5, 6, 11, 15, 18, 19, 21, 24, 25, 26, 29, 31, 39, 42, 45, 47, 53, 60, 66], "18": [2, 26, 33, 47, 48, 49, 50, 57, 59, 60, 65, 67, 68], "15": [2, 14, 16, 26, 31, 33, 35, 42, 47, 48, 49, 50, 52, 56, 57, 58, 59, 60, 68], "17": [2, 4, 35, 47, 48, 49, 50, 56, 59, 60, 63, 64, 67, 68], "behavior": [5, 6, 30, 50, 58, 59], "execut": [6, 7, 31, 45, 50, 51, 53, 56, 57, 62, 64, 73, 76], "set": [2, 6, 15, 21, 22, 27, 29, 33, 48, 50, 51, 52, 53, 54, 56, 59, 60, 64, 65, 67, 68, 73], "onli": [2, 5, 8, 13, 14, 16, 20, 21, 25, 27, 29, 30, 37, 42, 45, 46, 47, 50, 51, 52, 54, 56, 57, 59, 62, 63, 64, 65, 67, 68, 73], "fruit": [5, 8, 11, 18, 21, 22, 25, 27, 34, 35, 37, 40, 45, 47, 51, 53, 56, 58, 60, 62, 64], "_color": [], "isinst": [7, 8, 14, 15, 19, 20, 51, 58, 68], "els": [2, 4, 5, 8, 15, 18, 20, 27, 29, 38, 48, 56, 57, 58, 59, 63, 67, 68], "rais": [2, 7, 11, 15, 19, 20, 27, 34, 39, 42, 58, 63, 64, 67, 68], "must": [7, 19, 21, 45, 47, 52, 68], "var": [7, 16, 29, 67, 68], "folder": [23, 29, 58, 65, 66, 67, 68, 73], "5w": [29, 67], "fg65_rp17lz39z89p0nkv8ch0000gn": [29, 67], "ipykernel_78260": [], "1033431134": [], "3888926808": [], "14": [7, 27, 31, 33, 35, 47, 48, 49, 50, 54, 56, 57, 58, 59, 60, 67, 68], "16": [2, 8, 14, 21, 31, 33, 47, 48, 49, 52, 57, 59, 60, 62, 63, 65, 67, 68, 73], "show": [2, 3, 7, 14, 15, 18, 20, 21, 22, 31, 33, 37, 39, 41, 42, 46, 47, 50, 52, 54, 55, 56, 59, 60, 63, 64, 65, 66, 67, 68, 73], "readabl": [5, 8, 20, 27, 29, 49, 54, 58, 68, 74], "output": [2, 7, 16, 26, 38, 42, 45, 46, 47, 48, 50, 52, 54, 55, 57, 58, 59, 60, 64, 65, 67, 68, 73], "displai": [2, 14, 16, 49, 56, 59, 62], "debug": [2, 15, 47, 52, 64, 65, 68], "str__": 2, "i": [2, 3, 7, 8, 9, 11, 14, 16, 18, 19, 20, 21, 25, 29, 30, 31, 32, 33, 35, 42, 45, 48, 49, 50, 52, 54, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "ag": [2, 15, 19, 24, 45, 48, 50, 55, 56, 58, 59, 60, 62, 68], "int": [2, 3, 6, 7, 9, 14, 15, 19, 24, 27, 45, 47, 51, 53, 54, 55, 57, 58, 60, 63, 64, 67, 68], "7": [2, 3, 6, 7, 16, 19, 20, 25, 29, 30, 31, 33, 34, 35, 38, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "pip": [2, 3, 24, 25, 26, 27, 29, 31, 32, 38, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 67, 68, 73], "instal": [2, 3, 24, 25, 26, 27, 29, 31, 32, 38, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "memory_profil": [2, 64], "flexibl": [2, 28, 56, 63], "dictionari": [2, 6, 40, 56, 59, 74], "structur": [2, 7, 23, 54, 56, 59, 63, 65, 68], "lot": [2, 25, 48, 50, 53, 58, 60, 65], "effici": [2, 13, 18, 20, 22, 53, 56, 59, 62, 63, 68, 73, 74], "reserv": 2, "ahead": 2, "signific": [2, 31, 32, 52, 58, 59], "reduc": [2, 15, 33, 46, 50, 56, 57, 58, 60], "writefil": [2, 7, 15, 27, 45, 46, 52, 54, 57, 58, 63, 64, 65, 67, 68, 73], "without_slot": 2, "random": [2, 3, 7, 18, 31, 32, 33, 47, 48, 49, 52, 57, 58, 59, 60, 65, 68, 73], "randint": [2, 3, 7, 18, 32, 33, 47, 57, 58, 73], "profil": [2, 47, 48, 50, 53, 58, 64, 65], "main": [2, 7, 24, 46, 47, 50, 54, 58, 59, 63, 64, 65, 67, 68], "0": [2, 3, 4, 6, 7, 8, 9, 13, 14, 15, 16, 18, 21, 24, 25, 26, 29, 30, 34, 35, 36, 37, 38, 39, 40, 42, 45, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "30": [2, 4, 16, 26, 31, 45, 47, 48, 49, 50, 52, 56, 57, 58, 59, 60, 62, 63, 67, 68, 73], "_": [2, 13, 15, 16, 18, 32, 50, 52, 57, 58, 60, 62, 63], "rang": [2, 3, 7, 9, 16, 18, 27, 31, 32, 47, 48, 51, 52, 57, 58, 59, 60, 64, 73], "100000": [2, 31, 58], "__name__": [2, 27, 46, 58, 63, 64, 67, 68], "__main__": [2, 27, 46, 58, 63, 64, 67, 68], "m": [2, 4, 16, 27, 32, 35, 40, 45, 48, 50, 53, 54, 57, 58, 59, 60, 64, 73], "filenam": [2, 57, 58, 64, 67, 68], "mem": [2, 64], "increment": [2, 47, 64], "occurr": [2, 16, 34, 48, 60, 64, 67], "content": [2, 18, 47, 49, 50, 52, 54, 64, 66, 73], "41": [2, 31, 45, 47, 48, 49, 59, 64, 67], "mib": [2, 64], "11": [2, 3, 4, 7, 16, 19, 20, 24, 27, 29, 31, 33, 35, 40, 45, 47, 48, 49, 50, 52, 54, 56, 58, 59, 60, 63, 64, 65, 67, 68, 73], "12": [2, 3, 14, 16, 19, 23, 27, 31, 32, 33, 35, 40, 47, 48, 49, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64, 65, 67, 68, 73], "57": [2, 48, 59, 60, 63, 68], "8": [2, 3, 6, 7, 8, 15, 16, 20, 21, 25, 27, 30, 31, 33, 34, 36, 38, 40, 42, 47, 48, 49, 50, 52, 53, 54, 56, 58, 59, 60, 63, 64, 65, 67, 68, 73], "100003": 2, "with_slot": 2, "__slots__": 2, "13": [2, 29, 31, 33, 35, 48, 49, 52, 54, 56, 58, 59, 60, 67, 68], "46": [2, 31, 47, 48, 50, 67, 68], "section": [3, 7, 15, 18, 20, 21, 22, 31, 35, 39, 40, 46, 47, 48, 50, 53, 54, 55, 57, 59, 60, 62, 64, 66, 68, 73, 74], "wai": [3, 5, 7, 13, 15, 18, 25, 29, 31, 33, 34, 48, 50, 52, 54, 57, 58, 59, 62, 63, 66, 67, 74], "up": [3, 7, 9, 16, 26, 35, 45, 48, 50, 51, 52, 54, 58, 59, 60, 62, 65, 66, 68, 73], "track": [3, 6, 7, 53, 54, 58, 68], "perform": [3, 7, 29, 31, 40, 52, 54, 56, 60], "your": [3, 4, 6, 15, 25, 26, 32, 33, 34, 35, 37, 42, 46, 48, 50, 51, 56, 59, 62, 63, 65, 74, 76], "python": [3, 8, 19, 20, 22, 23, 26, 35, 41, 51, 56, 73, 74], "run": [3, 7, 9, 25, 31, 46, 47, 50, 52, 54, 57, 59, 60, 62, 63, 64, 65, 66, 67, 74, 76], "faster": [3, 9, 15, 18, 31, 45, 58], "consid": [3, 6, 7, 15, 18, 47, 48, 49, 51, 52, 54, 57, 58, 59, 64, 73], "joblib": [2, 3, 52], "parallel": [3, 56, 60], "It": [2, 3, 7, 15, 16, 26, 34, 40, 46, 50, 52, 54, 58, 59, 60, 62, 63, 65, 66, 68, 73], "easili": [3, 16, 23, 49, 53, 54, 55, 60, 63, 66], "sever": [3, 7, 15, 25, 52, 58, 63], "onc": [3, 6, 7, 25, 50, 52, 54, 55, 59, 68], "own": [3, 25, 37, 50, 63, 67], "processor": [3, 52, 64, 73], "delai": [3, 47], "multiprocess": [3, 47], "add_thre": 3, "num": [3, 6, 7, 8, 9, 11, 14, 15, 16, 21, 35, 40, 42, 47, 52, 57, 58, 62, 64, 67, 68, 73], "num_cor": 3, "cpu_count": [3, 47], "result": [3, 7, 13, 20, 29, 31, 32, 34, 47, 48, 50, 51, 52, 54, 56, 57, 58, 59, 62, 63, 64, 65, 67, 68], "n_job": [3, 59], "9": [2, 3, 6, 7, 14, 15, 19, 24, 27, 29, 31, 33, 34, 35, 39, 40, 42, 45, 47, 48, 49, 50, 52, 54, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68, 73], "try": [3, 9, 26, 29, 39, 40, 42, 47, 48, 49, 50, 51, 52, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68], "timeit": [3, 7, 9, 18, 31, 45, 47, 57], "also": [3, 7, 9, 16, 24, 25, 26, 29, 31, 33, 38, 42, 46, 47, 48, 49, 51, 52, 53, 54, 56, 58, 59, 60, 62, 63, 64, 65, 66, 67, 73, 74], "specifi": [3, 6, 16, 19, 25, 38, 40, 42, 46, 47, 48, 55, 58, 59, 60, 62, 65, 67, 68, 73], "number": [3, 4, 7, 8, 9, 21, 26, 29, 31, 32, 47, 48, 52, 56, 57, 58, 59, 62, 63, 64, 67, 68], "rerun": [3, 52], "get": [3, 10, 11, 18, 21, 26, 31, 32, 34, 37, 46, 47, 48, 51, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 67, 68, 74], "better": [3, 5, 7, 29, 31, 52, 54, 58, 59], "estim": 3, "func": [3, 6, 47, 62, 64, 67, 68], "comprehens": [3, 22, 54, 64], "l": [3, 8, 9, 13, 25, 27, 32, 34, 35, 38, 40, 48, 64, 68], "10_000": [3, 59, 68], "func2": 3, "list": [3, 14, 15, 19, 20, 27, 29, 33, 35, 48, 51, 52, 58, 59, 60, 62, 63, 64, 65, 68, 73], "expsiz": [3, 9], "1000": [3, 6, 7, 9, 18, 31, 47, 48, 49, 52, 59, 60], "time1": 3, "time2": 3, "6299518653018685": 3, "than": [3, 9, 11, 18, 24, 31, 32, 34, 35, 42, 45, 47, 49, 52, 54, 56, 57, 58, 59, 60, 68, 74], "averag": [3, 6, 47, 48, 52, 57, 58, 59], "pyarrow": [3, 57], "instead": [2, 3, 5, 6, 8, 18, 21, 22, 25, 26, 27, 29, 31, 32, 33, 34, 35, 37, 40, 42, 47, 48, 52, 54, 57, 58, 59, 62, 64, 65, 66, 67, 73], "compress": 3, "take": [3, 4, 6, 18, 26, 32, 54, 57, 58, 59, 60, 62, 67, 68], "less": [3, 5, 24, 32, 42, 54, 58, 67], "memori": [3, 21, 31, 33, 45, 47, 52, 53, 54, 59], "uncompress": 3, "For": [2, 3, 14, 24, 31, 38, 40, 47, 48, 50, 52, 56, 57, 58, 59, 60, 62, 64, 65, 66, 68, 73], "million": [3, 31, 45, 47, 50, 54], "row": [3, 31, 32, 38, 45, 47, 48, 49, 51, 52, 53, 56, 57, 59], "column": [3, 7, 39, 45, 47, 48, 49, 52, 53, 54, 57, 58, 60, 63, 65, 73], "189": 3, "59": [3, 4, 32, 48, 49, 57, 60, 63, 67, 68], "mb": [3, 32, 52], "around": [3, 50, 60], "78": [3, 49, 57, 59, 67, 68], "96": [3, 48, 49, 52, 59, 60], "approxim": [3, 26, 31, 32, 45, 47, 54], "110": 3, "63": [3, 45, 48, 49, 58, 59, 60, 67], "storag": [3, 45, 47, 52, 53, 55], "numpi": [3, 10, 29, 31, 32, 33, 34, 38, 47, 48, 49, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64, 65, 66, 67, 71, 73, 74], "np": [3, 29, 31, 32, 34, 38, 47, 48, 49, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 67, 71, 73], "creat": [3, 6, 15, 19, 20, 21, 26, 27, 29, 32, 33, 37, 47, 48, 51, 53, 55, 56, 57, 59, 62, 66, 67, 73], "seed": [3, 9, 18, 32, 47, 48, 52, 54, 57, 59, 60], "123": [3, 46, 52, 57, 59], "size": [3, 32, 34, 47, 48, 49, 52, 54, 55, 56, 58, 59, 60, 63, 67, 74], "1000000": [3, 14, 32, 47], "df": [3, 6, 7, 29, 31, 32, 33, 36, 37, 38, 39, 40, 45, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 63, 65, 67, 73], "col": [3, 29, 36, 47, 54, 56], "write": [3, 23, 25, 38, 42, 46, 47, 54, 57, 59, 60, 63, 64, 65, 66, 67, 68], "to_parquet": [3, 31, 47], "to_csv": [3, 31, 33, 45, 60, 63], "index": [3, 9, 13, 21, 22, 29, 31, 32, 35, 40, 45, 48, 50, 52, 53, 54, 58, 59, 67, 73], "os": [3, 23, 46, 47, 50, 51, 58, 73], "path": [3, 45, 46, 47, 49, 52, 53, 54, 58, 65, 68, 73], "getsiz": 3, "82805080": 3, "198796161": 3, "event": [4, 50, 59, 62, 68], "certain": [4, 19, 25, 32, 48, 50, 54, 58, 62, 67, 68], "minut": [4, 50, 58, 67, 74], "finish": [4, 7, 45, 52, 54, 57, 62], "determin": [4, 48, 54], "sum": [4, 7, 8, 25, 29, 33, 40, 45, 47, 52, 54, 56, 58, 59, 63, 64], "trick": [4, 26, 66, 74], "begin": [4, 38, 42, 46, 47, 50, 52, 63, 73], "2020": [4, 33, 37, 54, 59, 60, 65], "01": [4, 7, 21, 33, 45, 47, 48, 49, 50, 52, 58, 59, 60, 67, 73], "03": [4, 16, 33, 47, 48, 49, 50, 52, 54, 56, 58, 59, 60, 67, 73], "23": [4, 33, 35, 47, 48, 49, 52, 54, 56, 59, 60, 63, 67, 68], "00": [4, 33, 40, 42, 47, 48, 49, 50, 52, 54, 55, 58, 59, 60, 67, 68, 73], "duration_in_minut": 4, "2500": 4, "strptime": [4, 59, 67], "y": [2, 4, 7, 21, 26, 30, 32, 40, 42, 45, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 63, 64, 65, 73], "d": [4, 7, 11, 16, 18, 33, 35, 40, 42, 47, 48, 49, 50, 52, 53, 54, 56, 58, 59, 60, 62, 63, 67], "h": [4, 40, 47, 48, 52, 59, 60], "dai": [4, 16, 31, 33, 47, 48, 50, 52, 54, 58, 60, 67, 68], "39": [4, 48, 49, 57, 58, 59, 65, 73], "seri": [4, 32, 39, 47, 48, 50, 56, 58, 65, 73], "calendar": [4, 59], "monthrang": 4, "year": [4, 15, 37, 47, 48, 50, 54, 55, 59, 60, 67, 73], "like": [4, 7, 9, 18, 25, 26, 32, 33, 34, 38, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 57, 58, 60, 62, 63, 64, 65, 66, 67, 68, 73], "subtract": [4, 52, 59], "date1": 4, "2022": [4, 16, 33, 50, 54, 59, 73], "date2": 4, "diff": [4, 10, 26, 39, 62, 64, 65, 66, 68, 73], "apart": [4, 48], "304": 4, "method": [5, 9, 10, 16, 18, 21, 22, 23, 26, 28, 29, 32, 33, 34, 35, 36, 37, 40, 41, 45, 47, 48, 49, 50, 54, 56, 57, 59, 62, 64, 67, 74], "birth_year": 5, "ben": [5, 40, 60, 62], "1997": 5, "new_birth_year": 5, "michael": [5, 32, 50], "1993": 5, "lauren": [5, 40], "1999": 5, "josh": [5, 40, 60, 62], "1990": [5, 31], "olivia": [5, 50], "1991": 5, "appli": [2, 5, 6, 7, 10, 25, 31, 32, 38, 42, 48, 56, 59, 60, 62, 67, 68], "alex": [5, 47, 56], "2000": [5, 31, 50, 59], "oliv": [5, 18, 50, 57], "1995": 5, "add": [5, 6, 7, 11, 20, 25, 26, 30, 31, 40, 45, 46, 48, 50, 51, 53, 54, 55, 58, 62, 63, 64, 65, 66, 68, 72, 73], "max_val": 5, "sinc": [5, 7, 27, 33, 34, 35, 47, 52, 54, 58, 59, 60, 63, 64, 65, 68], "meeting3": 5, "onlin": 5, "meeting1": 5, "room1": 5, "meeting2": 5, "room2": 5, "assum": [2, 5, 47, 48, 51, 58], "extract": [5, 9, 13, 15, 31, 46, 47, 52, 58, 66], "attr": [5, 18, 65], "tast": [5, 25, 27, 50], "orang": [5, 6, 8, 11, 15, 18, 21, 22, 25, 27, 30, 34, 35, 37, 40, 45, 47, 49, 50, 53, 56, 58, 64], "sour": [5, 27], "grape": [5, 8, 11, 15, 21, 22, 25, 27, 34, 35, 37, 64], "purpl": 5, "banana": [5, 8, 16, 21, 22, 45, 47, 51, 53, 54, 56, 58], "statement": [5, 6, 8, 20, 29, 34, 42, 47, 54, 56, 67, 68], "handl": [5, 15, 23, 46, 47, 52, 53, 56, 58, 67, 68], "lengthi": [5, 7, 21, 34, 54], "unknown": [5, 15], "A": [2, 5, 6, 13, 16, 29, 30, 31, 33, 34, 38, 40, 48, 52, 54, 56, 57, 63, 64, 65], "twice": [5, 7, 15, 42], "abov": [5, 14, 15, 16, 25, 27, 38, 42, 48, 50, 52, 54, 56, 58, 59, 60, 63, 64, 66, 68, 73], "first": [5, 16, 20, 21, 27, 29, 30, 31, 32, 35, 42, 47, 48, 50, 52, 54, 58, 59, 60, 68], "second": [5, 25, 27, 29, 42, 47, 48, 50, 54, 57, 58, 59, 62, 67, 68], "either": [5, 6, 16, 23, 27, 32, 34, 35, 42, 48, 54, 58, 62, 76], "furnitur": 5, "bed": 5, "tabl": [5, 38, 51, 55, 56, 58, 67], "chair": [5, 50], "loc1": 5, "ikea": 5, "furniture_loc": 5, "vice": 5, "versa": 5, "combin": [5, 11, 40, 45, 47, 48, 49, 50, 51, 56, 59, 60, 62, 67, 73], "green": [5, 25, 38, 48, 50, 51, 59, 63], "onion": [5, 50], "pair": [5, 11, 55, 60], "dict_item": [5, 18, 48], "switch": [5, 53, 67], "loop": [5, 8, 18, 25, 31, 45, 47, 67, 68], "v": [5, 24, 50, 58, 59], "k": [5, 9, 52, 54, 59, 64], "befor": [5, 15, 24, 27, 31, 38, 45, 47, 50, 52, 54, 56, 57, 58, 59, 64, 65, 66, 67, 68], "common": [5, 6, 10, 13, 15, 16, 26, 31, 37, 40, 48, 52, 57, 58, 59], "approach": [2, 5, 7, 15, 21, 26, 29, 47, 48, 52, 54, 58, 63], "modifi": [2, 5, 6, 29, 47, 56, 62, 66, 67], "origin": [5, 7, 26, 31, 32, 34, 40, 42, 46, 47, 48, 50, 52, 58, 59, 66, 68], "lead": [2, 5, 6, 7, 11, 15, 16, 29, 47, 48, 52, 56, 58, 59, 60, 62, 67, 73], "unexpect": [5, 29, 59, 60], "place": [5, 7, 50, 52, 54, 59, 67, 68], "accept": [2, 5, 6, 52, 63], "hashabl": 5, "give": [5, 7, 25, 27, 38, 42, 46, 48, 52, 58, 59, 63], "typeerror": [5, 6, 7, 21, 51, 63], "call": [5, 6, 7, 11, 14, 15, 18, 19, 21, 24, 25, 27, 34, 39, 42, 46, 47, 48, 49, 50, 51, 54, 56, 57, 58, 59, 60, 64, 67], "unhash": 5, "tupl": [5, 7, 18, 21, 34, 52, 62, 64, 67], "work": [5, 14, 20, 21, 24, 26, 29, 34, 46, 47, 48, 49, 50, 52, 53, 54, 57, 60, 62, 63, 64, 65, 66, 73, 74], "immut": 5, "ad": [6, 7, 26, 47, 50, 54, 56, 58, 59, 62, 64, 67, 68], "mai": [2, 6, 24, 47, 48, 50, 52, 58, 59, 60, 64, 68], "introduc": [6, 7, 45, 74], "unnecessari": [6, 47, 56, 64], "complex": [6, 15, 45, 48, 52, 58, 59, 62, 67], "condit": [6, 47, 48, 50, 52, 62], "simpler": [6, 22, 23, 50, 56], "easier": [6, 7, 13, 15, 23, 26, 31, 45, 48, 52, 58, 60, 62], "get_discount": 6, "100": [2, 6, 7, 9, 16, 18, 21, 29, 31, 32, 39, 47, 48, 49, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 73], "20": [2, 6, 7, 33, 35, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 64, 65, 68, 73], "50": [2, 6, 45, 48, 49, 51, 52, 54, 56, 58, 59, 60], "necessari": [6, 40, 50, 54, 57], "doe": [6, 7, 21, 47, 48, 50, 52, 56, 58, 59, 68], "requir": [6, 21, 24, 33, 45, 47, 48, 51, 52, 53, 56, 58, 63, 67], "even_numb": 6, "filter": [6, 7, 25, 45, 52, 54, 56, 60, 68], "variou": [6, 27, 45, 52, 56, 57, 58, 63, 65, 73], "part": [6, 47, 48, 57, 58, 67], "is_even": [6, 57], "arg": [6, 27, 36, 46, 51, 52, 54, 62, 63, 67, 68], "kwarg": [2, 6, 36, 62, 67, 68], "variabl": [6, 7, 13, 19, 26, 27, 40, 45, 46, 48, 54, 56, 58, 59, 60, 64, 67, 68, 73], "keyword": [11, 24, 45, 46], "multipli": [6, 8, 21, 27, 42], "add_to_ord": 6, "new_ord": 6, "cart": 6, "updat": [6, 7, 49, 60, 65, 66, 73, 74], "kiwi": 6, "keep": [6, 7, 30, 31, 40, 47, 48, 50, 51, 58, 66], "clean": [6, 48, 59, 60, 63, 64, 65], "without": [6, 7, 14, 15, 19, 21, 25, 31, 32, 34, 45, 47, 48, 52, 54, 56, 58, 59, 60, 65, 66, 67, 68, 73], "time_func": 6, "wrapper": [6, 48, 62, 67], "start": [6, 7, 8, 11, 16, 26, 32, 33, 35, 42, 47, 48, 50, 52, 54, 57, 58, 59, 60, 62, 63, 65, 67, 73], "end": [6, 7, 25, 33, 37, 38, 42, 50, 56, 57, 59, 60, 63, 67, 73], "elaps": [6, 59], "3f": [6, 52], "ms": [6, 31, 45, 47, 57, 59], "num1": [6, 7, 20, 34, 47, 48, 58, 63, 68, 72, 73], "num2": [6, 7, 20, 47, 48, 58, 63, 68, 72, 73], "006m": 6, "027m": 6, "includ": [7, 38, 40, 47, 48, 50, 51, 52, 54, 58, 59, 62, 64, 65, 67, 73, 74], "best": [7, 48, 51, 54, 59, 64], "bad": [7, 54, 58, 64, 68], "vagu": [7, 48], "x": [2, 7, 8, 20, 21, 26, 29, 30, 32, 40, 42, 45, 47, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 67, 73], "z": [7, 30, 40, 48, 64], "role": [7, 58, 60], "declar": [7, 15, 47, 63], "hint": [7, 19, 63, 64], "obviou": 7, "num_memb": 7, "num_guest": 7, "sum_": 7, "confus": [7, 58, 67], "understand": [6, 7, 13, 15, 23, 45, 46, 54, 57, 58, 60, 64, 65, 66, 67], "circle_area": 7, "thu": [7, 14, 26, 31, 47, 52, 56, 58, 65], "them": [7, 14, 16, 27, 29, 32, 46, 48, 49, 52, 54, 56, 57, 58, 59, 62, 64, 65, 66, 74], "pi": [7, 15, 26, 60], "radiu": [7, 15], "too": [7, 48, 54, 58], "improv": [7, 27, 30, 31, 56, 60, 62, 63, 64, 68, 70, 73], "both": [7, 9, 30, 34, 40, 45, 47, 51, 52, 54, 56, 57, 58, 59, 65, 67], "At": [7, 73], "least": [7, 42, 48, 52, 54, 68], "clearer": 7, "x_is_even_and_neg": 7, "y_is_odd_and_posit": 7, "chang": [2, 7, 16, 19, 31, 32, 33, 38, 45, 46, 47, 51, 52, 53, 54, 56, 57, 58, 60, 62, 64, 66, 73], "rememb": [7, 26, 48], "otherwis": [2, 7, 16, 58, 63, 67], "bug": [7, 11], "our": [7, 13, 26, 47, 48, 50, 52, 54, 58, 59, 60], "date": [7, 45, 47, 48, 50, 51, 54, 58, 60, 67, 73], "2021": [7, 16, 33, 37, 45, 48, 50, 52, 57, 59, 65, 73], "arrai": [7, 25, 34, 36, 45, 48, 52, 58, 59, 60, 63, 67, 73], "datetim": [7, 16, 24, 47, 48, 50, 58, 67], "val1": [7, 56, 58], "val2": [7, 56, 58], "iloc": [7, 29, 31, 32, 39, 53, 59, 60], "subset_x": 7, "subset_i": 7, "filt": 7, "futur": [7, 36, 47, 48, 59, 67, 68], "return_two": 7, "care": [7, 13, 14, 58], "hello": [7, 15, 23, 50, 51, 63, 67, 68], "difficult": [7, 14, 50, 52, 58, 59, 60, 62, 73], "hardcod": 7, "imposs": 7, "discern": 7, "mean": [2, 7, 15, 31, 32, 33, 40, 45, 47, 48, 52, 53, 54, 56, 58, 59, 60, 64, 76], "addit": [7, 24, 32, 45, 47, 57, 58, 65], "context": [2, 7, 48, 54, 58, 67, 68], "comment": [7, 66], "price_differ": 7, "transpar": 7, "maintain": [7, 45, 47, 50], "built": [7, 14, 18, 20, 21, 22, 24, 47, 52, 57, 58, 59, 60, 62, 63, 67], "instantli": 7, "januari": [7, 47, 67], "rest": [7, 31, 50, 66], "februari": [7, 47, 50], "len": [7, 15, 47, 54, 58, 59, 60, 63, 64, 68], "particular": [7, 33, 47, 58, 59], "thing": [7, 15, 22, 26, 48, 50, 54, 57, 58, 59, 62, 65], "know": [7, 26, 49, 50, 52, 54, 58, 59, 62, 67], "yet": [7, 59], "put": [7, 46, 55, 68], "high": [7, 26, 47, 48, 50, 54, 56, 57, 59], "level": [7, 47, 48, 54, 56, 57, 59, 67], "go": [2, 7, 26, 29, 48, 50, 51, 54, 60, 66], "back": [7, 14, 26, 50, 58], "prevent": [7, 31, 47, 50, 58], "thought": [7, 58], "being": [7, 16, 46, 48, 50, 67, 73], "disrupt": 7, "say_hello": 7, "ask_to_sign_in": 7, "is_us": 7, "bool": [7, 34, 67, 68], "new": [7, 31, 33, 36, 40, 42, 45, 47, 48, 49, 52, 53, 54, 56, 58, 59, 60, 64, 65, 66, 67, 68, 73, 74], "old": [7, 48, 67], "point": [7, 33, 48, 49, 50, 52, 54, 58, 60, 66, 68], "l1": [7, 52], "l2": [7, 52], "append": [2, 7, 18, 56, 57, 60, 64], "shallow": 7, "deep": [7, 32, 50, 54], "children": [7, 50, 54, 59], "becom": [6, 7, 45, 50, 56, 58, 59, 64], "l3": 7, "stai": [7, 9], "inadvert": 7, "append_four": 7, "nums1": 7, "produc": [7, 47, 51, 52, 59, 62], "much": [7, 39, 48, 52, 58, 59, 60, 63, 66, 73], "cleaner": [7, 15, 56, 58, 62, 73], "arr": [7, 42, 73], "c": [2, 6, 7, 8, 11, 13, 18, 29, 30, 32, 34, 35, 40, 45, 47, 48, 49, 52, 54, 56, 58, 59, 60, 63, 67], "e": [7, 37, 40, 49, 52, 55, 58, 59, 60, 65, 68], "val": [7, 29, 30, 32, 33, 56, 59], "shorten": [7, 34], "between": [7, 15, 30, 40, 45, 47, 48, 51, 52, 54, 55, 56, 57, 59, 64, 65, 67, 68], "two": [7, 9, 16, 18, 20, 21, 33, 35, 38, 40, 47, 48, 53, 54, 56, 59, 60, 68, 73], "char": [7, 18, 21, 67], "10000": [7, 9, 47, 57], "411": [7, 59], "\u00b5s": [7, 31, 45, 47], "98": [7, 47, 49, 54, 59], "per": [7, 15, 31, 45, 47, 48, 54, 59, 74], "std": [2, 7, 31, 45, 47, 59], "dev": [7, 24, 31, 45, 47, 52, 73], "000": [7, 16, 45, 47, 57, 59], "60": [7, 31, 48, 49, 50, 51, 52, 54, 55, 58, 59, 60, 64], "process_data": [7, 20, 63, 68, 73], "violat": [7, 47], "principl": 7, "featur": [7, 32, 46, 47, 50, 58, 60], "although": [7, 52], "explain": [7, 56, 60, 64], "block": [7, 52, 68], "test": [7, 47, 48, 53, 57, 59, 60, 64], "unit": [7, 15, 27, 49, 50, 59], "insid": [7, 16, 23, 58, 60, 62, 68, 73], "challeng": [7, 21, 45, 48, 49, 54, 56, 58, 59, 62, 64], "axi": [6, 7, 29, 32, 34, 35, 40, 42, 47, 49, 50, 52, 59, 60], "split": [7, 40, 52, 54, 59, 60, 67], "smaller": [7, 31, 35, 42, 49, 57, 58], "revis": [7, 64], "accomplish": 7, "These": [7, 52, 58, 62], "pipe": [2, 7, 47, 48, 54, 67], "order": [6, 7, 16, 21, 32, 40, 42, 52, 54, 56, 57, 58, 60, 62, 63], "achiev": [7, 13, 20, 47, 54, 58, 59], "desir": [7, 51, 58], "comprehend": [7, 45, 54, 56, 64], "create_a_copi": 7, "add_new_featur": 7, "add_on": [7, 62], "sum_all_column": 7, "As": [7, 32, 47, 48, 50, 52, 56, 64], "increas": [7, 16, 29, 33, 52, 59, 64], "purpos": [6, 7, 27, 47, 54, 59], "numer": [7, 24, 32, 47, 48, 54, 64, 66, 67, 68], "develop": [7, 15, 27, 48, 52, 64, 68, 74], "bundl": 7, "relat": [7, 50, 57, 59, 68], "cohes": 7, "dataclass": [7, 19, 24], "pydant": [7, 45, 51], "model": [2, 7, 38, 45, 48, 49, 53, 63, 68, 73], "zip_path": 7, "raw_train_path": 7, "raw_test_path": 7, "processed_train_path": 7, "processed_test_path": 7, "none": [2, 6, 7, 27, 30, 32, 34, 39, 45, 46, 48, 50, 52, 54, 57, 58, 60, 62, 64, 67, 68], "class": [7, 15, 18, 32, 33, 45, 47, 48, 51, 52, 54, 55, 56, 57, 59, 62, 64, 67, 74], "rawloc": 7, "path_train": 7, "path_test": 7, "processedloc": 7, "raw_loc": 7, "processed_loc": 7, "get_data": [7, 57, 58, 65, 68], "is_csv": 7, "read_pickl": [7, 48], "pkl": [2, 7, 48, 52, 59], "yourself": [7, 64], "get_csv_data": 7, "get_pickle_data": 7, "short": [7, 48, 50, 59, 62, 67, 68, 73], "purchas": 7, "shipping_fe": 7, "simplifi": [7, 54, 60, 68, 73], "group": [7, 14, 27, 45, 47, 48, 50, 52, 58, 59, 60, 64], "within": [2, 7, 47, 48, 49, 52, 54, 56, 58, 59, 66], "instanc": [7, 19, 48, 52, 54, 56, 58, 59], "is_numb": 7, "flow": [7, 57, 62, 67, 68], "program": [7, 48, 50, 52, 57, 64, 68], "base": [2, 7, 15, 27, 35, 38, 45, 51, 54, 56, 59, 60, 63, 64], "evalu": [7, 25, 34, 52, 59], "encount": [7, 34, 68], "actual": [7, 52, 53, 58, 59, 64, 68], "occur": [7, 29, 47, 54, 59, 60, 68], "possibl": [7, 9, 32, 47, 50, 51, 59], "low": [7, 31, 32, 47, 56, 59], "enhanc": [7, 47, 49, 51, 52, 59, 62], "speed": [7, 9, 31, 32, 54, 62], "divis": [7, 48, 58], "zero": [7, 53, 58, 60, 67], "zerodivisionerror": [7, 68], "explicit": [7, 45, 54, 63], "precis": [7, 32, 47, 50, 52, 68], "caus": [7, 29, 33, 54, 56], "consequ": 7, "messag": [7, 24, 39, 57, 58, 62, 63, 64, 67, 68], "cannot": [2, 7, 19, 21, 25, 26, 27], "divid": [7, 14, 26, 48, 50, 56, 58, 68], "though": [7, 32, 52], "accur": [7, 48, 54, 58, 59, 68], "22": [7, 18, 31, 33, 35, 47, 48, 49, 50, 52, 54, 59, 60, 65, 68, 73], "unsupport": 7, "operand": 7, "potenti": [2, 7, 11, 32, 47, 50, 52], "problemat": 7, "post": [7, 16, 31, 48, 50, 52, 54, 59], "success": [7, 52, 58, 68], "action": [7, 47, 48, 52, 56, 60, 66], "messi": [7, 66, 73], "harder": [7, 58, 68], "clear": [7, 15, 52, 58, 62], "sum_num": 7, "mean_num": 7, "unintention": 7, "trigger": 7, "process": [2, 7, 20, 31, 32, 37, 45, 46, 48, 50, 51, 52, 57, 58, 59, 60, 62, 64, 67, 68, 73], "overwrit": [7, 46, 52, 54, 58, 64, 65, 73], "if__name__": 7, "uppercas": [8, 56, 67], "abcd": [8, 11], "isupp": [8, 67], "satisfi": [8, 42, 48, 67], "given": [6, 8, 33, 51, 52, 54, 58, 59, 65, 67, 68, 73], "lambda": [8, 18, 21, 25, 29, 40, 47, 54, 57, 62, 64], "everi": [8, 21, 33, 47, 54, 58, 64, 66, 67, 68, 73, 74], "kei": [8, 30, 33, 34, 35, 45, 47, 48, 51, 53, 54, 55, 56, 58], "paramet": [8, 9, 21, 31, 32, 33, 36, 46, 49, 52, 56, 65, 68, 73], "by_lett": 8, "revers": [9, 40], "by_pric": 8, "whether": [23, 34, 42, 48, 52, 56, 58, 59, 67], "check_mention_fruit_1": 8, "got": [8, 14, 29, 33, 50, 54, 64], "check_mention_fruit_2": 8, "besid": [9, 49], "home": [9, 36, 47, 50, 52, 53, 54, 55, 58, 60, 65, 67, 73], "wa": [9, 32, 47, 54, 58, 66], "pick": [9, 54, 64], "to_do_tonight": 9, "attend": [9, 59], "parti": 9, "exercis": [9, 31, 60], "weigh": 9, "ten": [9, 19, 24, 63], "random_num": 9, "larg": [9, 16, 29, 36, 40, 48, 50, 52, 54, 56, 58, 59, 60], "sort": [9, 21, 32, 42, 48, 54, 56, 73], "get_n_max_sort": 9, "get_n_max_heapq": 9, "nlargest": [9, 40], "time_sort": 9, "global": [9, 18, 67], "time_heapq": 9, "ratio": [9, 16, 54, 57, 59], "round": [9, 47, 50, 52, 57, 58, 62], "experi": [9, 18, 21, 47, 48, 49, 52, 54, 57, 58, 59, 60, 70], "827": 9, "obtain": [10, 23, 35, 45, 48, 52, 59, 74], "uniqu": [10, 40, 48, 50, 54, 55, 59], "element": [10, 13, 27, 40, 50, 58, 60, 62, 63, 67], "convert": [10, 29, 31, 32, 37, 45, 48, 50, 53, 55, 56, 60, 63, 64, 67, 68, 73], "requirement1": 10, "statsmodel": [10, 52], "requirement2": 10, "matplotlib": [10, 42, 52, 54, 59], "fruits_str": 11, "todai": [11, 16, 24, 29, 52, 54, 58, 60, 67], "comb": [11, 21], "nums_2": 11, "chars_2": 11, "assign": [2, 13, 19, 48, 56, 57], "simultan": [13, 56, 57], "practic": [13, 51, 58, 68], "longer": [11, 13, 50, 58, 65, 68], "subset": [13, 31, 40, 47, 48, 54, 59, 60], "splat": 13, "don": [13, 19, 20, 26, 48, 58, 60, 65, 73], "normal": [14, 18, 20, 21, 22, 25, 26, 35, 48, 49, 52, 54], "6666666666666665": 14, "prefer": [14, 23, 35, 50, 56], "There": [14, 29, 52, 54, 58, 59, 68], "function": [14, 22, 24, 37, 45, 48, 51, 52, 54, 56, 57, 59, 60, 73, 74], "exactli": [14, 26, 47, 48, 50, 52, 54, 59, 60, 62, 67], "3752999689475413": 14, "2251799813685248": 14, "cool": [14, 25, 26, 48, 54, 60, 65], "limit": [14, 16, 21, 32, 45, 48, 51], "limit_denomin": 14, "object": [6, 14, 18, 26, 29, 31, 32, 33, 34, 35, 36, 37, 39, 45, 47, 48, 52, 53, 54, 59, 60, 62, 68, 73], "again": [14, 49, 68], "figur": [14, 26, 48, 49, 52, 54, 59, 67], "out": [14, 26, 31, 34, 47, 48, 50, 54, 59, 62, 64, 66, 67, 68], "mani": [14, 33, 50, 51, 52, 53, 60, 66, 67, 68], "digit": [14, 16, 45, 48, 54, 62, 67], "visual": [14, 49, 59, 63, 66, 73], "thousand": [14, 16, 48, 54], "large_num": 14, "1_000_000": [14, 32, 47], "integ": [14, 16, 19, 21, 24, 27, 32, 45, 49, 51, 64, 68], "check": [14, 15, 24, 27, 31, 47, 50, 52, 65, 66, 67, 68, 73], "remaind": 14, "n": [14, 21, 31, 39, 42, 47, 48, 50, 52, 53, 54, 55, 58, 59, 60, 63, 64, 65, 67, 68], "select": [14, 29, 31, 45, 47, 48, 50, 51, 52, 54, 56, 58, 59, 62], "whose": [14, 29, 33, 34, 35, 37, 42, 60], "get_multiples_of_n": 14, "elif": [2, 6, 15, 34, 56, 58, 59, 68], "case": [15, 21, 37, 38, 42, 45, 48, 52, 54, 56, 59, 67, 73, 74], "get_youngest_pet": 15, "pet_info": 15, "age1": 15, "age2": 15, "min": [15, 31, 32, 40, 45, 47, 53, 58, 67], "dict": [15, 20, 27, 45, 47, 51, 54, 59, 62], "pet_info1": 15, "pet_info2": 15, "compon": [15, 52, 54, 59, 60], "comput": [15, 25, 26, 32, 41, 47, 48, 49, 52, 54, 56, 57, 58, 68], "meaning": [2, 15, 48, 58, 59], "math": [15, 18, 26, 42, 64, 68], "diamet": 15, "circl": [15, 49], "area": [15, 52, 54, 59, 60, 66], "error": [2, 6, 15, 19, 24, 27, 29, 34, 42, 45, 47, 52, 54, 62, 63, 64, 67, 68, 76], "quickli": [15, 31, 47, 48, 50, 52, 54, 60, 67], "identifi": [15, 45, 52, 54, 58, 59, 64, 67, 68], "exact": [15, 48, 49, 52, 54, 58, 62], "illustr": [15, 59], "trackback_test": 15, "greet": 15, "greetng": 15, "typo": [15, 48], "khuyen": [15, 16, 18, 23, 36, 40, 42, 47, 52, 54, 55, 58, 60, 65, 67, 68, 73, 74], "user": [15, 23, 42, 45, 47, 48, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 63, 65, 67, 68, 73], "khuyentran": [15, 52, 54, 55, 58, 59, 60, 67, 73], "book": [15, 23, 24, 34, 36, 39, 42, 47, 48, 50, 52, 54, 55, 58, 60, 63, 64, 65, 67, 68, 73], "efficient_python_tricks_and_tools_for_data_scientist": [15, 23, 42, 52, 58, 73], "chapter1": 15, "nameerror": 15, "did": 15, "shown": [16, 42, 58], "3123": 16, "1f": [16, 38], "2f": [16, 32, 47, 52, 54, 67], "31": [16, 47, 48, 49, 50, 53, 58, 59, 60, 65, 67, 68, 73], "curli": 16, "bracket": [16, 25, 34, 63], "45": [16, 32, 45, 47, 48, 49, 56, 59, 60, 67, 68], "p": [16, 45, 49, 52, 54, 59, 60, 68, 73], "pm": [16, 51, 59, 60], "saturdai": [16, 50, 59], "02": [16, 33, 47, 48, 49, 50, 52, 58, 59, 60, 63, 73], "hour": [16, 33, 47, 48, 58, 59, 60, 67, 68], "am": [16, 48, 54, 58, 60], "wake": 16, "08": [16, 47, 48, 49, 52, 54, 58, 59, 60, 67, 68, 73], "09": [16, 33, 48, 49, 50, 52, 55, 56, 57, 58, 59, 60, 62, 68, 73], "100000000": 16, "total": [16, 32, 33, 45, 48, 56, 57, 58, 59, 60], "itertool": [16, 17, 52, 62], "permut": 16, "j": [16, 21, 48], "sentenc": [16, 50, 54, 58], "nice": [16, 19, 21, 25, 26, 46, 47, 48, 50, 54, 55, 58, 65, 67, 68, 73], "No": [16, 50, 51, 52, 54, 58, 60], "stop": [16, 42, 54, 57, 60], "posit": [6, 16, 21, 35, 38, 45, 47, 49, 51, 52, 54, 59, 73], "search": [16, 46, 49, 59, 64], "pattern": [16, 25, 40, 50, 59, 60], "swap": [2, 16, 62], "sundai": 16, "match_pattern": 16, "sent": [16, 54], "nice_dai": 16, "regrex": 16, "veri": [16, 19, 48, 50, 52, 54, 59, 61, 68], "long": [16, 40, 45, 47, 50, 54, 57, 58, 59, 63, 67], "break": [16, 45, 67, 68], "parenthes": 16, "backslash": 16, "made": [16, 50, 54, 63, 66], "ident": [16, 26, 56, 58], "mayb": 16, "grammar": 16, "three": [16, 50, 59, 60, 63, 67], "cross": [16, 50, 52], "drop": [16, 29, 40, 46, 52, 59], "come": [16, 19, 25, 26, 46, 48, 49, 50, 52, 54, 57, 58, 59, 60, 65, 66, 67, 68, 73], "handi": [16, 19, 25, 26, 46, 48, 50, 52, 54, 57, 58, 59, 60, 65, 66, 67, 68, 73], "text1": 16, "text2": 16, "khuen": 16, "9523809523809523": 16, "tool": [16, 24, 28, 50, 51, 52, 55, 60, 62, 64, 66, 68, 70, 73, 74], "pencil": 16, "pen": [16, 59], "erasor": 16, "ink": 16, "pencel": 16, "closer": [16, 50, 54], "argument": [11, 16, 24, 27, 35, 47, 52, 54, 58, 60, 63, 65, 67, 68], "cutoff": [16, 48, 59], "collect": [17, 40, 47, 48, 52, 54, 56, 58, 59, 60, 67, 68, 73], "functool": 17, "pydash": 17, "deal": [15, 18, 26, 31, 48, 50, 59, 66], "slow": [18, 58], "ineffici": [18, 21, 32, 47], "char_list": 18, "custom_count": 18, "list_": 18, "char_count": 18, "custom": [18, 33, 45, 47, 50, 54, 56, 58, 63, 65, 67, 68, 73], "num_list": [18, 21], "numexp": 18, "custom_tim": 18, "counter_tim": 18, "6199148843686806": 18, "small": [18, 36, 40, 47, 48, 50, 52, 57, 59], "manag": [18, 48, 50, 52, 54, 56, 58, 66], "project": [18, 44, 45, 50, 52, 54, 57, 58, 60, 63, 66, 68, 73, 74], "person": [18, 54], "attribut": [6, 15, 18, 19, 27, 67, 73], "gender": [18, 48, 50, 54, 60], "male": [18, 50, 60], "femal": [18, 50, 60], "just": [2, 18, 25, 50, 51, 52, 53, 54, 59, 60, 63, 65, 66, 68, 73], "obj": [2, 18, 34, 39], "b23": 18, "physic": [18, 47, 56, 73], "d24": 18, "spanish": [18, 48], "cleanest": 18, "food_pric": 18, "ignor": [18, 27, 31, 48, 52, 54, 56, 58, 60, 62, 65, 68, 73], "unordered1": 18, "unordered2": 18, "ordered1": 18, "ordered2": 18, "across": [2, 18, 45, 47, 48, 49, 52, 56, 59, 62, 67], "tomato": 18, "veggi": 18, "carrot": [18, 50, 51], "map": [18, 21, 25, 47, 48, 49, 54, 67, 68], "avail": [19, 27, 47, 48, 50, 52, 59, 65, 67], "represent": [19, 52, 54, 59], "few": [19, 47, 48, 50, 52, 53, 54, 55, 56, 57, 59, 60], "decor": [2, 19, 27, 48, 57, 58, 63, 67, 68], "top": [19, 47, 50, 51, 52, 54, 56, 59, 60, 63, 68, 76], "dataclassdog": 19, "appropri": [19, 20, 58, 73], "__repr__": 19, "present": [19, 47, 50, 54, 58, 59, 63, 67], "cumbersom": [19, 53, 58, 65], "anybodi": 19, "adjust": [19, 35, 47, 52, 56, 63], "throw": [19, 29, 50], "golden": [19, 50], "frozeninstanceerror": 19, "ipython": [19, 25, 48, 62, 67], "input": [15, 19, 24, 25, 45, 46, 51, 52, 56, 59, 60, 63, 67, 68, 73], "0d6f339835b8": 19, "string": [19, 24, 27, 33, 40, 46, 48, 50, 53, 57, 63, 67, 73], "__setattr__": 19, "field": [19, 45, 50, 54, 62, 67, 74], "implement": [19, 20, 24, 29, 47, 52, 54, 58, 59, 68, 73], "automat": [19, 24, 32, 45, 47, 50, 52, 54, 57, 58, 67, 73], "___init__": 19, "initi": [19, 25, 47, 48, 49, 50, 52, 53, 58, 59, 65], "__post_init__": 19, "info": [19, 32, 33, 47, 51, 52, 54, 57, 58, 59, 62, 65, 67, 68, 73], "zip": [19, 52, 54, 55, 59, 64], "fix": [20, 33, 45, 54, 58, 59, 68, 73], "linear_func": 20, "linear_func_parti": 20, "data2": 20, "process_dict": 20, "process_list": 20, "choos": [20, 32, 34, 52, 57], "right": [20, 26, 39, 40, 62, 63, 66, 67, 73, 76], "process_data2": 20, "notimplementederror": 20, "pleas": [20, 47, 50, 52, 55, 60], "regist": [20, 50, 56, 60, 67], "process_dict2": 20, "process_list2": 20, "left": [20, 26, 39, 40, 59, 62, 63, 67, 73], "singl": [20, 29, 45, 47, 48, 52, 56, 59, 63, 68], "add_num": 20, "matter": [21, 48], "naiv": [21, 67], "param": [21, 47, 52, 58], "learning_r": 21, "1e": [21, 52, 59], "batch_siz": 21, "32": [21, 45, 47, 48, 49, 50, 52, 59, 60, 62, 65, 68], "64": [21, 48, 49, 57, 59], "001": [21, 49, 57, 60, 62], "ipykernel_38110": 21, "240000324": 21, "miss": [21, 32, 38, 50, 54, 58], "lemon": 21, "chosen": 21, "ipykernel_40588": 21, "2755098589": 21, "indic": [8, 21, 22, 42, 50, 52, 54, 56, 58, 59], "slice": [21, 29, 50], "key_func": 21, "aggreg": [11, 21, 45, 56, 59], "fill": [21, 30, 54, 67], "fillvalu": 21, "word": [21, 34, 48, 58, 60, 62, 67], "abcnic": 21, "upper": [21, 34, 35, 45, 48, 52, 53, 54, 56, 59, 60, 67], "islow": [21, 67], "join": [21, 23, 37, 40, 42, 45, 47, 54, 67], "export": [22, 52, 60, 63, 65, 73], "correspond": [6, 22, 47, 48, 62, 67], "intrins": 22, "syntax": [15, 22, 49, 55, 56, 62, 63, 66], "easi": [23, 24, 28, 47, 48, 49, 50, 51, 54, 55, 57, 58, 60, 62, 63, 64, 66, 68], "choic": [23, 32, 47, 51, 56, 63, 68], "exist": [23, 45, 47, 51, 59, 60, 62, 65, 68, 73], "makedir": [23, 47], "new_fil": 23, "txt": [23, 46, 52, 58, 60], "open": [21, 23, 28, 48, 50, 52, 59, 62, 65, 67, 73, 74], "w": [23, 48, 52, 62], "world": [23, 31, 50, 51, 54, 59, 63, 68], "mkdir": [23, 58, 68, 73], "exist_ok": [23, 47, 68], "write_text": [23, 58, 68], "read_text": [23, 45, 58], "document": [23, 29, 49, 52, 54, 60, 67, 68], "pictur": [23, 48, 50], "manipul": [23, 28, 45, 47, 56, 60, 63], "touch": [23, 58], "tree": [23, 52, 58, 64], "grep": 23, "grandpar": 23, "cwd": 23, "chapter2": 23, "relative_to": 23, "nlp": 23, "scienc": [23, 47, 48, 49, 50, 52, 54, 60, 61, 66, 74], "root": [23, 26, 52, 54, 58, 67], "posixpath": [23, 58], "samefil": 23, "absolut": [23, 42, 52, 59], "ipynb": [23, 42, 60, 68, 73], "kitchen": [25, 68], "sink": 25, "util": [25, 42, 45, 47, 54, 58, 59, 63, 65, 67, 68], "stuff": [25, 48], "py_": 25, "ye": [25, 26, 60, 66], "could": [25, 26, 38, 47, 48, 49, 54, 60, 63, 65, 66, 67, 73], "done": [25, 26, 38, 52, 66, 73], "walmart": [25, 40, 58, 62], "season": [25, 50, 54, 59, 60], "in_season": 25, "aldi": [25, 40, 58, 62], "out_of_season": 25, "wouldn": [25, 26, 46, 47, 48, 54, 58, 60, 65, 67, 68, 73], "dot": [25, 60], "notat": 25, "filter_fruit": 25, "valueerror": [2, 11, 15, 19, 25, 42, 58, 67, 68], "b01bf8b7ae1a": 25, "0x7f9880491310": 25, "find_index": 25, "what": [25, 32, 47, 48, 50, 51, 52, 53, 54, 58, 60, 62, 65, 66, 67], "filter_": 25, "map_": 25, "bought": 25, "reject": [25, 47], "startswith": [25, 67], "0x7f027895d1f0": 25, "note": [25, 32, 52, 59], "final": [25, 56, 59, 68], "lazi": 25, "hold": [25, 55, 59], "express": [25, 26, 50, 54, 55, 60, 68], "until": [25, 47, 50, 54, 56, 58, 68], "total_pric": 25, "wish": [26, 62, 63, 67], "algebra": 26, "eq": 26, "bore": 26, "mathemat": 26, "let": [26, 47, 48, 50, 52, 54, 56, 57, 58, 59, 60, 63, 65, 68], "over": [21, 26, 29, 45, 54, 59, 73, 74], "amaz": 26, "squar": [26, 48, 60], "decim": [26, 42, 52, 58, 63, 67], "242640687119285": 26, "sqrt": [26, 51, 63, 68], "displaystyl": [26, 63, 73], "tri": [26, 31, 54, 73], "fraction": [26, 48, 53], "25": [26, 31, 33, 42, 45, 47, 48, 49, 50, 52, 54, 56, 57, 58, 59, 60, 62, 64, 68], "6666666666666667": 26, "frac": [26, 63], "ration": 26, "real": [26, 45, 51, 54, 58], "power": [26, 28, 45, 47, 51, 52, 58, 62, 65, 66, 68], "abil": [26, 54], "expr": 26, "term": [26, 49, 52, 54, 59, 63], "happen": [26, 47, 58, 67], "aha": 26, "remain": [11, 26, 50, 52, 58], "unevalu": 26, "why": [26, 50, 52, 53, 54, 63, 74], "would": [26, 32, 47, 48, 52, 54, 58, 59], "kind": [26, 31, 32], "school": [26, 48, 50], "life": [26, 48], "expans": 26, "pretti": [26, 45], "isn": 26, "One": [26, 32, 38], "question": [26, 48, 50, 52, 58, 59], "luckili": [26, 48, 60, 73], "6x": 26, "fun": [26, 48, 50], "look": [26, 48, 50, 52, 54, 58, 59, 60, 65, 67, 73], "trigsimp": 26, "sec": [26, 49, 59, 67], "co": [26, 54], "sin": [26, 60, 63], "tan": 26, "cot": 26, "calculu": 26, "worri": 26, "infin": 26, "oo": 26, "factori": [26, 67], "rewrit": [26, 45, 47, 56, 58], "past": [26, 38, 42, 47, 50, 59], "notebook": [26, 38, 42, 52, 59, 65, 67, 74, 76], "markdown": [26, 42, 55, 63, 65, 67, 73], "sure": [27, 52, 54, 58, 73], "correct": [27, 45, 48, 52, 54, 56, 58, 64, 68], "mypi": 27, "callable_exampl": 27, "multiply_then_divide_by_two": 27, "multiply_func": 27, "static": [27, 58], "checker": 27, "inde": 27, "1m": [27, 54, 58, 64, 65, 67, 73], "32msuccess": 27, "issu": [6, 27, 32, 33, 54, 56, 58, 64, 66, 76], "sourc": [24, 27, 28, 47, 48, 54, 59, 60, 62, 63, 64, 65, 66, 67, 68, 74, 76], "fruit_typ": 27, "make_fruit": 27, "type_example_wrong": 27, "31merror": [27, 64, 67], "33m": [27, 58, 67, 73], "incompat": [27, 64, 65], "expect": [27, 52, 59, 64, 68, 73], "31mfound": [27, 64], "type_example_right": 27, "measur": [27, 48, 54, 73], "typing_annot": 27, "get_height_in_feet": 27, "height": [27, 48, 60], "meter": 27, "28084": 27, "typecheck": 27, "safe": [27, 52], "shouldn": 27, "typing_fin": 27, "bark": [27, 58, 60], "ruff": 27, "overrid": 27, "previous": [27, 32, 56], "misc": 27, "typing_liter": 27, "share": [2, 27, 50, 52, 65, 66, 74], "scalabl": [27, 59], "last_int": 27, "last_str": 27, "gener": [27, 31, 32, 47, 48, 51, 52, 64, 66], "adapt": 27, "invok": [27, 56], "infer": [27, 32, 45, 52, 58, 59, 68], "typevar_exampl": 27, "dict_valu": 27, "fast": [28, 48, 50, 53, 68], "analysi": [28, 45, 47, 54, 63, 65, 67], "textblob": [29, 52, 58], "get_sum": 29, "get_diff": [], "col1": [29, 31, 32, 34, 36, 38, 39, 40, 47, 49, 57, 58, 67], "col2": [29, 31, 32, 34, 36, 38, 39, 40, 47, 49, 57, 58, 67], "along": [29, 40, 48, 49, 65], "applymap": 29, "fail": [2, 6, 29, 64, 65, 68, 73], "everyth": [29, 57], "col3": [29, 32, 40, 47, 49], "col4": 29, "103": [29, 57], "309": [29, 58], "204": 29, "816": 29, "dtype": [29, 31, 33, 34, 35, 37, 39, 40, 47, 48, 52, 53, 54, 57, 58, 59, 73], "int64": [29, 31, 32, 33, 34, 35, 40, 45, 47, 52, 57, 59, 73], "insert": [29, 40, 45, 47, 49, 51, 57, 58, 59, 67, 73], "format": [15, 29, 32, 40, 45, 47, 48, 50, 51, 55, 59, 60, 62, 63, 67, 68, 73], "berri": [29, 54], "cherri": [29, 50], "garden": 29, "comma": [29, 65, 73], "fillna": [29, 54], "ffill": 29, "stand": [29, 73], "nan": [29, 30, 33, 35, 38, 40, 47, 48, 53, 54, 58, 60, 73], "mode": [29, 59, 60, 65, 67], "astyp": [29, 32, 36, 60], "encoded_col1": 29, "involv": [29, 47, 52, 54, 56, 58], "intend": [29, 50, 56, 68], "copi": [29, 38, 42, 45, 48, 53, 67], "ipykernel_77093": 29, "431778579": 29, "settingwithcopywarn": 29, "loc": [29, 30, 33, 34, 37, 49, 59], "row_index": 29, "col_index": 29, "caveat": 29, "pydata": 29, "org": [29, 31, 47, 52, 62, 73], "stabl": [29, 60, 73], "user_guid": 29, "html": [29, 48, 50, 52, 59, 60, 63, 73], "view": [29, 31, 46, 47, 49, 53, 54, 55, 57, 60, 65, 66, 74], "versu": 29, "chained_assign": 29, "settingwithcopyerror": 29, "non": [30, 32, 33, 34, 47, 57, 58, 65, 67, 68], "store1": 30, "store2": 30, "df1": [30, 31, 35, 39, 40, 47, 48], "key1": 30, "df2": [30, 31, 35, 39, 40, 47], "key2": 30, "left_on": [30, 48], "right_on": [30, 48], "value_x": 30, "value_i": 30, "a_x": [], "a_i": [], "belong": [52, 60], "left_kei": [], "right_kei": [], "a_left": [], "a_right": [], "_left": [], "_right": [], "match": [24, 30, 34, 35, 47, 52, 56, 58, 59, 60, 63, 65, 68], "outer": [30, 40], "v1": [30, 45, 54, 64], "v2": [30, 54, 64], "tip": [31, 48, 60, 74], "load": [2, 21, 31, 45, 46, 50, 52, 54, 55, 56, 57, 59, 60, 68, 73], "queri": [31, 45, 49, 51, 55, 58, 59, 65, 73], "push": [31, 53], "down": [31, 50, 68], "filer": 31, "engin": [31, 45, 56, 57, 62, 68], "optim": [31, 45, 49, 50, 52, 57, 59, 60, 64], "dataset": [2, 21, 29, 31, 32, 34, 47, 49, 56, 57, 58, 59, 60], "113": [31, 49], "file_path": [2, 31], "num_row": [31, 47], "100_000_000": 31, "id": [30, 31, 45, 46, 47, 50, 51, 54, 55, 56, 59, 60, 64, 68, 73], "rand": [31, 47, 60], "row_group_s": 31, "2_000_000": 31, "read_parquet": [31, 45, 47], "50000": [31, 48], "106": [31, 58], "19": [31, 33, 45, 47, 48, 49, 59, 60, 65, 67, 68, 73], "414": [31, 59], "index_col": [31, 59], "download": [31, 45, 50, 52, 54, 60, 67, 76], "github": [31, 38, 45, 48, 49, 52, 54, 60, 62, 64, 73, 76], "click": [31, 49, 54, 55, 60, 67, 73, 76], "raw": [31, 47, 48, 50, 52, 59, 60, 66], "link": [31, 33, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 73, 74], "githubusercont": [31, 47, 48, 59, 60, 66], "mwaskom": [31, 47], "seaborn": [31, 47, 48, 52, 54, 65], "master": [31, 47, 48, 58, 59, 60, 66], "head": [31, 47, 48, 49, 50, 53, 54, 58, 59, 60, 62, 63, 68], "diet": [31, 48], "puls": 31, "fat": [31, 54], "85": [31, 48, 49, 54, 59], "88": [31, 47, 48, 49, 50, 57, 58, 67, 73], "90": [6, 31, 47, 48, 52, 54, 59, 64], "92": [31, 49, 54, 59, 60], "consum": [2, 31, 32, 47, 50, 52, 54, 58, 60, 63, 67], "amount": [31, 48, 52, 56, 59], "chunksiz": [31, 47], "5495": 31, "warn": [31, 47, 48, 52, 54, 56, 58, 60, 62, 67, 68, 73], "filterwarn": 31, "flight_data_2018_to_2022": 31, "33": [31, 42, 48, 49, 58, 59, 68], "58": [31, 47, 48, 49, 52, 56, 57, 59, 60, 63, 68, 73], "563737": 31, "120": [31, 48, 59, 67, 68], "424": [31, 57], "portion": [21, 31, 57], "df_chunk": 31, "df_": [31, 40, 57], "63737": 31, "read_html": 31, "wikipedia": 31, "en": [31, 50, 54, 60, 73], "wiki": 31, "poverti": 31, "region": [31, 59, 60], "94": [31, 47, 48, 49, 59], "95": [31, 34, 47, 48, 49, 52, 58, 59, 60, 62], "2002": [31, 50, 59], "2004": [31, 50, 59], "1981": 31, "2008": [31, 50], "2010": [31, 48, 59], "2015": [31, 50, 59], "2018": [31, 33, 50], "east": [31, 48, 50, 60], "asia": [31, 48, 59, 63], "pacif": [31, 48], "77": [31, 45, 59, 60, 62, 67, 68], "80": [6, 31, 48, 49, 52, 59, 60, 62, 64], "34": [31, 38, 48, 49, 56, 59, 60, 65, 68, 73], "europ": [31, 59], "central": [31, 48, 50, 59, 60], "latin": 31, "america": [31, 59], "caribbean": 31, "middl": 31, "north": [31, 48, 49, 50, 59], "africa": [31, 63], "south": [31, 48, 50, 59, 60], "35": [31, 35, 45, 48, 49, 52, 54, 56, 57, 59, 60, 62, 65], "61": [31, 48, 49, 59], "36": [31, 48, 49, 50, 52, 56, 57, 59, 60, 62], "49": [31, 42, 47, 48, 49, 56, 58, 59, 60, 62, 64, 68, 73], "26": [31, 48, 49, 50, 57, 58, 59, 60], "saharan": 31, "42": [2, 31, 32, 47, 48, 52, 60, 68], "51": [31, 48, 49, 52, 56, 60, 62], "47": [31, 48, 58, 59, 60, 68, 73], "54": [31, 50, 54, 56, 57, 59, 62], "40": [31, 47, 48, 49, 50, 52, 58, 59, 60, 62, 68], "52": [31, 39, 48, 49, 59, 60], "27": [31, 32, 33, 48, 49, 58, 59, 60, 73], "refer": [31, 54, 57, 62, 63, 68], "affect": [31, 59, 60], "df3": [31, 47], "been": [31, 52, 55, 59, 66, 67], "offer": [24, 31, 32, 47, 51, 53, 58, 59, 62, 63], "copy_on_writ": 31, "manual": [24, 32, 45, 48, 50, 52, 57, 63, 64, 66, 68], "data_typ": 32, "core": [32, 33, 34, 36, 46, 47, 48, 49, 57, 58, 59, 60, 62, 67, 73], "frame": [32, 33, 39, 42, 57, 60, 67], "rangeindex": [32, 33, 57], "entri": [21, 32, 33, 48, 57], "null": [32, 33, 35, 51, 52, 53, 57, 58], "count": [32, 33, 40, 45, 48, 53, 54, 56, 57, 60, 62, 67], "float64": [32, 35, 47, 52, 57, 58, 59], "200": [2, 32, 47, 48, 52, 57, 59], "byte": [32, 33, 50, 52, 57], "cardin": [32, 48, 53], "categori": [32, 34, 36, 47, 49, 51, 52, 54, 56, 59, 60], "sklearn": [2, 32, 48, 49, 50, 53, 54, 57, 58, 60, 64, 67, 73], "load_iri": [32, 48, 52, 53], "as_fram": [32, 49, 50, 52, 53, 57, 60], "return_x_i": [32, 48, 52, 53, 57], "concat": [32, 40, 47, 49, 50, 52, 56], "target": [32, 45, 47, 48, 49, 52, 59, 60, 68], "memory_usag": 32, "128": [32, 48, 59, 68], "sepal": 32, "length": [11, 32, 34, 52, 54, 59, 67], "cm": 32, "1200": 32, "width": [32, 60, 67], "petal": 32, "282": [32, 68], "almost": 32, "fifth": 32, "tell": [24, 32, 48, 52, 60], "smallest": [32, 42], "Or": 32, "sort_valu": [32, 36, 48, 56, 63], "mix": [32, 52, 63], "slower": 32, "still": [32, 58, 59, 68], "after": [31, 32, 48, 49, 50, 54, 57, 59, 64, 65, 67, 73], "remov": [32, 36, 47, 48, 50, 54, 58, 60, 62, 63, 67, 73], "save": [32, 45, 46, 47, 50, 52, 58, 60, 63, 65, 66, 68, 73], "random_numb": 32, "132": [32, 47, 48, 49, 59, 68], "35960884": 32, "inferred_df": 32, "8000000": 32, "loss": [32, 47, 60, 68], "s1": 32, "integr": [32, 47, 48, 50, 53, 58, 63], "apach": [32, 47, 52], "arrow": [32, 45], "solv": [32, 47, 53, 62, 63, 65], "s2": 32, "extra": [33, 47, 48, 65, 73], "step": [2, 33, 48, 52, 53, 54, 59, 60, 62, 66, 67], "date_column_1": 33, "date_column_2": 33, "datetime64": [31, 33], "ns": [31, 33, 58, 60], "usag": [33, 46, 51, 52, 56, 63, 65, 73], "176": [33, 57, 60], "month": [15, 33, 47, 48, 50, 59, 60, 66, 67, 74], "tseri": 33, "offset": [33, 50, 59], "bdai": 33, "ts": 33, "2024": [24, 33, 47, 52, 58, 59, 67], "busi": [33, 59], "simpl": [33, 45, 48, 49, 50, 52, 54, 55, 59, 60, 63], "move": [33, 50, 59], "time_period": 33, "21": [2, 33, 35, 45, 47, 48, 49, 50, 52, 57, 59, 60, 63, 65], "24": [33, 47, 48, 49, 50, 52, 56, 57, 59, 60, 63, 67], "set_index": [33, 59], "imagin": [2, 24, 33, 48, 52, 57, 73], "groupbi": [33, 34, 45, 47, 48, 56, 58, 59], "instruct": [33, 48, 50, 53], "freq": [33, 47, 52, 54, 59, 73], "1w": 33, "week": [33, 48, 58, 59, 60, 67, 68], "to_datetim": [31, 33, 48, 50, 59], "easiest": [33, 50], "05": [24, 33, 34, 47, 48, 49, 50, 52, 54, 58, 59, 60, 73], "exclud": [33, 48, 54, 58], "datetimeindex": 33, "2019": [33, 48, 54, 60], "problem": [33, 47, 50, 52, 53, 58], "date_rang": [33, 47, 60, 73], "07": [33, 47, 48, 49, 50, 56, 58, 59, 60, 63, 73], "new_index": 33, "conform": 33, "new_": 33, "fill_valu": 33, "comparison": [33, 38, 54, 63, 65, 67], "filtered_df": 33, "record": [33, 35, 47, 48, 57, 60], "04": [33, 47, 48, 49, 50, 52, 56, 57, 59, 60, 62, 73], "06": [33, 47, 48, 49, 50, 52, 56, 58, 59, 60, 68, 73], "2d": [33, 54, 60, 73], "dropna": [2, 33, 35, 48, 60, 64], "fastest": [34, 50], "attempt": [2, 34, 47, 64, 68], "o": [34, 47, 48, 59], "shorter": [11, 34], "indexingerror": 34, "ipykernel_791962": 34, "4076731999": 34, "venv": [24, 34, 36, 39, 42, 47, 54, 58, 60, 64, 65, 67, 68], "lib": [24, 34, 36, 39, 42, 47, 54, 59, 60, 64, 65, 67, 68, 73], "python3": [24, 34, 36, 39, 42, 47, 54, 58, 59, 60, 64, 65, 67, 68, 73], "site": [24, 34, 36, 39, 42, 47, 54, 59, 60, 64, 65, 67, 68, 73], "packag": [24, 34, 36, 39, 41, 42, 47, 54, 59, 60, 62, 63, 64, 66, 67, 68], "__getitem__": 34, "929": 34, "930": [34, 59], "maybe_cal": 34, "apply_if_cal": [34, 57], "931": 34, "_getitem_axi": 34, "932": 34, "933": 34, "_is_scalar_access": 34, "1142": 34, "_get_slice_axi": 34, "1143": 34, "is_bool_index": 34, "1144": 34, "_getbool_axi": 34, "1145": 34, "is_list_like_index": 34, "1146": 34, "946": 34, "caller": [6, 34], "respons": [34, 50, 52, 58, 59], "ensur": [34, 40, 45, 47, 48, 52, 53, 55, 56, 58, 59, 68], "947": 34, "label": [34, 35, 40, 45, 49, 51, 52, 54, 56, 59, 60, 63], "_get_axi": 34, "948": 34, "check_bool_index": 34, "949": [34, 68], "ind": 34, "nonzero": 34, "950": 34, "_take_with_is_copi": 34, "2386": 34, "mask": [34, 37, 54], "isna": [34, 58], "_valu": 34, "2387": 34, "2388": 34, "2389": 34, "unalign": 34, "2390": 34, "charact": [34, 49, 67], "cat1": [34, 47, 48], "cat2": [34, 47, 48], "user1": [34, 45, 55, 62], "user2": [34, 45, 62], "user3": [34, 45], "is_all_nan": 34, "unusu": 34, "distort": 34, "statist": [34, 40, 47, 48, 52, 53, 57, 58, 59, 65, 67], "analys": [34, 52], "col0": 34, "trim": [34, 56], "quantil": 34, "lower": [34, 35, 37, 52, 53, 54, 56, 59, 67], "threshold": [34, 48, 52, 54], "bound": [35, 52, 59, 67], "larger": [35, 45, 47], "75": [35, 40, 47, 48, 49, 50, 51, 58, 59, 60, 67], "71": [35, 48, 49, 50, 68], "750000": 35, "714286": 35, "period": [35, 52, 59, 68], "diff2": 35, "leav": [35, 47, 60], "processed_df": [35, 56], "orient": [35, 48], "value_count": 35, "500000": [35, 48], "333333": [35, 53], "166667": 35, "943880": 35, "845154": 35, "roughli": [35, 54], "q": [35, 45, 47, 49, 59, 60], "999": [35, 49, 52], "667": 35, "max": [35, 40, 45, 47, 50, 52, 53, 58, 59, 67], "medium": [36, 50, 56], "mini": 36, "ordered_s": 36, "inplac": [36, 64], "2630": 36, "futurewarn": [36, 48, 52, 54, 56, 60], "deprec": 36, "unus": [36, 64, 73], "alwai": [36, 48, 52, 68], "oranga": 37, "appla": 37, "grapa": 37, "pricel": 37, "price2": [37, 58], "bunni": 37, "monkei": 37, "funni": [37, 50], "flower": [37, 67], "sub_str": 37, "ny": [37, 48], "ey": [37, 50], "join_str": 37, "neg": [2, 38, 45, 47, 49, 51, 52, 54, 58], "ones": [38, 47, 48, 52, 65, 73], "highlight_numb": 38, "white": [38, 50, 60], "nbsp": [38, 58], "predict": [2, 38, 45, 48, 51, 54, 58, 60], "predictions_1": 38, "predictions_2": 38, "real_label": 38, "highlight_cel": 38, "background_gradi": 38, "cmap": [38, 48, 60], "plasma": 38, "excel": [6, 38, 53, 54, 63], "sheet": [38, 53], "titl": [24, 38, 48, 49, 50, 52, 54, 59, 60, 63, 67, 68], "na_rep": 38, "to_excel": [38, 63], "formatted_fil": 38, "xlsx": 38, "tabul": 38, "readm": 38, "jupyt": [38, 42, 52, 59, 68, 74, 76], "tablefmt": 38, "grid": [38, 52, 60], "to_latex": 38, "editor": [38, 54, 60], "tabular": [38, 47, 49, 52, 57, 58, 59], "lrr": 38, "set_table_styl": 38, "selector": [38, 60], "toprul": 38, "prop": 38, "hline": 38, "midrul": 38, "bottomrul": 38, "column_format": 38, "assert_frame_equ": 39, "coll": [39, 40], "assertionerror": [39, 42, 58, 73], "skip": [39, 42, 62, 67], "hidden": [39, 42, 57, 58], "_lib": 39, "pyx": 39, "assert_almost_equ": 39, "167": 39, "_test": 39, "assert": [39, 42, 51, 56, 68, 73], "679": [39, 59], "raise_assert_detail": 39, "index_valu": 39, "676": [39, 47, 59], "677": [39, 59], "msg": [39, 42], "66": [39, 48, 58, 68], "66667": 39, "check_lik": 39, "align": [39, 58, 59], "counter": [40, 48, 54], "count_two": 40, "median": [40, 48, 52, 53, 58, 59], "etc": [40, 45, 49, 50, 52, 58, 64, 68], "g": [40, 48, 50, 52, 55, 58, 59, 65], "reset_index": [40, 59], "agg_method": 40, "mean_pric": 40, "summar": [40, 60], "aggfunc": 40, "compos": [40, 48, 52], "wide": [32, 40, 58, 59, 74], "costco": 40, "id_var": 40, "value_var": 40, "var_nam": 40, "network": [40, 54, 58, 59], "thinh": 40, "friends1": 40, "person1": 40, "person2": 40, "friends2": 40, "symmetr": 40, "friend": 40, "multiindex": 40, "stacked_df": 40, "nstack": 40, "get_dummi": [2, 40], "sep": [40, 67], "often": [15, 40, 45, 48, 50, 52, 53, 54, 56, 58, 59, 67, 68], "ax": [40, 49, 52, 54, 59, 60], "scientif": [41, 60], "multi": [42, 52, 60], "dimension": [42, 54], "new_arr": 42, "new_row_posit": 42, "fewer": [42, 74], "mask_al": 42, "AT": 42, "mask_ani": 42, "largest": [42, 52, 63], "argmax": 42, "highest": [42, 47], "probabl": [42, 48, 52, 59], "array_to_latex": 42, "a2l": 42, "to_ltx": 42, "bmatrix": 42, "greater": [24, 42, 56], "pyplot": [42, 52, 54, 59, 60], "plt": [42, 52, 54, 59, 60], "22222222": 42, "44444444": 42, "66666667": 42, "88888889": 42, "11111111": 42, "33333333": 42, "55555556": 42, "77777778": 42, "arang": [42, 52, 59, 60], "plot": [42, 48, 49, 50, 55, 59, 64], "assert_array_equ": 42, "arr1": 42, "arr2": 42, "chapter4": [42, 55, 58], "48": [42, 48, 52, 57, 59, 60, 73], "href": 42, "vscode": [42, 67], "ch0000052": 42, "truth": 42, "ambigu": 42, "ch0000053": 42, "_privat": 42, "844": 42, "assert_array_compar": 42, "err_msg": 42, "verbos": [42, 52, 54, 63], "header": [42, 45, 54, 63], "equal_nan": 42, "equal_inf": 42, "839": 42, "840": [42, 57], "remark": 42, "841": 42, "build_err_msg": 42, "ox": 42, "oy": 42, "842": 42, "843": 42, "845": [42, 49], "except": [15, 42, 51, 52, 62, 68], "846": 42, "mismatch": [42, 52], "rel": [42, 52, 54, 59], "222": [42, 57, 59], "221": [42, 68], "support": [45, 50, 51, 52, 54, 59, 62, 63, 73], "my_tabl": 45, "where": [45, 47, 48, 51, 52, 56, 59, 60, 62, 64, 67, 73], "start_dat": [31, 45, 47, 58], "pathlib": [45, 58, 68], "placehold": 45, "preprocess": [45, 52, 58, 59, 60], "rich": 45, "connect": [45, 51, 53, 58, 60, 73], "sqlalchemi": 45, "read_sql": 45, "create_engin": 45, "usernam": [45, 46, 50, 53, 54, 66], "password": [45, 46, 50, 53, 54], "host": [45, 49, 50, 53], "port": [45, 47, 49], "database_nam": 45, "table_nam": 45, "fugu": 45, "interfac": [2, 45, 47], "fugue_sql": 45, "fsql": 45, "input_df": [45, 47], "pandasdatafram": 45, "sqlite3": [45, 51], "conn": [45, 51], "db": [45, 51, 58], "cursor": [45, 51, 58], "create_table_sql": 45, "IF": [45, 48, 51], "NOT": [45, 51], "membership": 45, "primari": [2, 45, 51, 58], "autoincr": [45, 51], "activ": [45, 60, 65, 68], "insert_rows_sql": 45, "INTO": [45, 51, 58], "john": [32, 45, 47, 49, 51, 56, 58, 68], "jane": [45, 47, 56, 58], "mike": [45, 51], "close": [45, 50, 51, 54, 59, 67], "har": 45, "leverag": [29, 45, 47, 54, 58, 66], "annot": [45, 48, 51, 54, 63], "intuit": [45, 56, 59, 62], "session": [45, 73, 76], "primary_kei": 45, "through": [2, 45, 53, 54, 56, 58, 59, 60, 62, 64, 68, 73], "coercion": 45, "sqlite": [45, 51, 63], "metadata": [47, 54, 67], "create_al": 45, "lint": 45, "consist": [2, 45, 47, 48, 49, 52, 54, 58, 59], "style": [45, 56, 67, 73], "convent": 45, "free": [45, 50, 54, 58, 59, 76], "focu": 45, "task": [45, 47, 50, 51, 52, 54, 57, 58, 59, 60, 62, 67, 68, 73], "dialect": 45, "ansi": 45, "mysql": 45, "bigqueri": 45, "databrick": 45, "oracl": 45, "teradata": 45, "sqlfluff_exampl": 45, "AS": [45, 56], "foo": [45, 56, 63], "bar": [45, 54, 56, 60], "postgr": [45, 58], "30m": 45, "1msqlfluff_exampl": 45, "0m": [45, 52, 54, 56, 57, 58, 60, 63, 64, 65, 67, 73], "31mfail": 45, "34ml": 45, "lt09": 45, "0mselect": 45, "unless": 45, "34m": [45, 52, 54, 63], "0monli": 45, "1mlayout": 45, "select_target": 45, "st06": 45, "wildcard": 45, "calcul": [45, 57, 59, 60], "0mand": 45, "1mstructur": 45, "column_ord": 45, "lt02": 45, "0mexpect": 45, "indent": 45, "lt01": 45, "whitespac": [45, 54, 63, 67], "nake": 45, "0mbinari": 45, "binari": [45, 52], "cp01": 45, "0mkeyword": 45, "1mcapitalis": 45, "seamlessli": [45, 48, 52, 58, 59], "sentiment": [45, 51, 52, 54, 58], "pgml": 45, "transform": [45, 49, 51, 52, 54, 56, 58, 59, 60, 67], "classif": [45, 52, 58], "love": [45, 48, 50, 54], "amazingli": 45, "ml": [45, 64], "hate": 45, "mundan": 45, "thankless": 45, "score": [6, 45, 48, 52, 54, 58, 60], "9995759129524232": 45, "9903519749641418": 45, "train": [45, 49, 52, 53, 54, 60, 68], "relation_nam": 45, "y_column_nam": 45, "algorithm": [45, 52, 54, 59, 60], "xgboost": 45, "hyperparam": 45, "n_estim": [45, 58], "imag": [45, 50, 60, 65, 73], "quiet": [45, 55, 64], "wget": [45, 47, 54], "cwida": 45, "releas": [45, 47, 54, 57, 73], "lineitemsf1": 45, "snappi": 45, "parquet": [45, 56], "empow": 45, "scientist": [45, 50, 52, 53, 54, 59, 68, 70, 74], "capabl": [2, 45, 54, 56, 68], "alongsid": 45, "tradit": [15, 45, 52, 58, 59], "system": [45, 46, 50, 51, 54, 57, 58, 73], "demand": [45, 59], "dbm": 45, "server": [45, 52, 53, 57, 65, 73], "workflow": [45, 48, 60, 66], "mydf": 45, "to_df": 45, "nearli": [45, 59], "l_returnflag": 45, "agg": [45, 47, 56, 58], "l_extendedpric": 45, "avg": [45, 47, 56, 58, 59], "226": 45, "BY": 45, "37": [45, 48, 49, 56, 60], "deltalak": [45, 47], "delta": [45, 58], "lake": 45, "2906": 45, "writer": [45, 47], "write_deltalak": [45, 47], "delta_lak": [45, 47], "deltat": [45, 47], "quack": 45, "to_panda": [45, 47, 53], "l_quantiti": 45, "108": 45, "to_pyarrow_dataset": 45, "954": 45, "downstream": 45, "sql_queri": [], "employee_nam": 47, "department_nam": 48, "employe": [47, 56, 57], "depart": [48, 56], "ON": 45, "department_id": [], "pars": [24, 54, 59, 63, 67], "token": [54, 55], "newlin": [], "0x10a13e4c0": [], "dml": [], "0x10a1ae040": [], "0x10a1ae100": [], "identifierlist": [], "empl": [], "0x10a198e40": [], "0x10a1ae580": [], "0x10a1ae5e0": [], "0x10a1ae640": [], "emploi": [], "0x10a198c10": [], "0x10a1ae7c0": [], "0x10a1ae820": [], "0x10a1ae880": [], "0x10a198cf0": [], "0x10a1aea00": [], "0x10a1aea60": [], "0x10a1aeac0": [], "depa": [], "0x10a198dd0": [], "0x10a1aee80": [], "get_real_nam": [], "get_identifi": [], "encourag": 46, "script": [46, 55, 65, 73], "wast": 46, "reproduc": [46, 47, 48, 52, 58], "config": [46, 47, 52, 59, 60, 64, 67, 73], "configur": [46, 47, 52, 60, 67], "yaml": [46, 52, 55, 64, 68, 73], "data1": [46, 73], "drop_featur": 46, "iid": 46, "idg": 46, "wave": 46, "categorical_var": 46, "undergra": 46, "zipcod": 46, "seper": 46, "config_nam": 46, "termin": [46, 52, 54, 57, 58, 63, 64, 65, 68, 73], "hydra_exampl": 46, "userwarn": [46, 52, 60, 62], "config_path": 46, "cc": 46, "next": [46, 47, 48, 52, 54, 56, 59, 60, 65], "upgrad": [46, 59], "0_to_1": 46, "changes_to_hydra_main_config_path": 46, "articl": [46, 48, 49, 50, 52, 53, 55, 58, 62, 63, 65, 67, 74], "environ": [48, 51, 52, 54, 57, 58, 67, 68, 73], "load_dotenv": 46, "getenv": 46, "spend": [46, 48, 59], "docstr": 46, "docopt_exampl": 46, "dir": [46, 53, 65, 73], "directori": [46, 47, 53, 63, 65, 66, 67, 68, 73], "input_text": [46, 54], "__doc__": [46, 67], "argv": 46, "input_path": 46, "litt": 47, "bit": 47, "sleep": [47, 54, 57, 58, 62, 67, 68], "progress_appli": 47, "cpu": [47, 53, 54, 57, 73], "progress_bar": 47, "parallel_appli": 47, "worker": [47, 48, 54, 56, 68], "standard": [47, 52, 57, 58, 59, 62, 65, 67, 73], "transfer": [47, 53, 59], "3025": 47, "324": 47, "441": [47, 48], "6561": 47, "5329": 47, "2025": 47, "4900": 47, "1024": [32, 47, 53, 54], "5776": 47, "8100": 47, "3364": 47, "9995": 47, "4761": 47, "9996": 47, "3721": 47, "6889": 47, "9997": 47, "4225": 47, "9025": 47, "1156": 47, "9998": 47, "361": [47, 68], "529": [47, 49, 59], "9999": [47, 67], "5041": 47, "81": [47, 48, 49, 50, 59, 60, 73], "Not": [47, 52], "flight": 47, "passeng": [47, 48, 59, 60], "1949": [47, 50], "112": [47, 49], "118": [47, 49, 68], "march": [47, 48], "april": [47, 50], "129": [47, 48, 57, 67, 68], "121": [47, 49, 57, 59, 60], "june": [47, 51], "135": [47, 48, 57, 68], "juli": [47, 50, 60], "148": [47, 49, 62, 68], "august": 47, "septemb": 47, "136": [47, 48, 68], "octob": 47, "119": [47, 52, 59], "to_markdown": [47, 63], "llm": 47, "openai": [47, 51], "api_token": 47, "your_api_token": 47, "pandas_ai": 47, "convers": [47, 58, 64], "prompt": 47, "five": [47, 50], "1960": [47, 59], "5714": 47, "1959": 47, "5140": 47, "1958": 47, "4572": 47, "1957": 47, "4421": 47, "1956": 47, "3939": 47, "span": [47, 73], "pyspark": [47, 52, 59], "workload": [47, 56], "fugue_spark": 47, "sparkexecutionengin": 47, "map_pric": 47, "map_price_to_fruit": 47, "schema": [45, 47, 52, 58], "hostnam": [47, 53], "7740": 47, "resolv": [47, 52], "loopback": 47, "address": [45, 47, 49, 50, 56, 58, 68], "127": [47, 48, 49, 52, 57, 68], "192": [47, 54, 60, 62], "168": [47, 54], "wlp111s0": 47, "spark_local_ip": 47, "bind": 47, "illeg": 47, "reflect": [47, 59], "unsaf": 47, "platform": [47, 48, 52, 56, 58, 67, 73], "jar": [47, 54], "unsafe_2": 47, "constructor": 47, "java": [47, 56], "nio": 47, "directbytebuff": 47, "report": [47, 50, 52, 53, 55, 57, 59, 60, 64], "further": [24, 47, 54, 58, 64, 74], "deni": 47, "nativecodeload": [47, 56], "unabl": [24, 47, 52, 56], "nativ": [47, 56, 59, 68], "hadoop": [47, 56], "builtin": [47, 56], "applic": [47, 48, 51, 52, 54, 56, 58, 63, 64, 67, 68, 73, 74], "log4j": 47, "properti": [2, 47, 67], "log": [21, 47, 56, 59, 68], "sc": [47, 56], "setloglevel": [47, 56], "newlevel": [47, 56], "sparkr": [47, 56], "servic": [47, 48, 49, 64], "sparkui": 47, "4040": 47, "4041": 47, "stage": [47, 56, 66], "essenti": [47, 52, 54], "undo": [47, 58], "mistak": 47, "review": [47, 51, 66], "audit": 47, "transact": [47, 48, 50], "travel": [47, 48], "4719861e": 47, "1d3a": 47, "49f8": 47, "8870": 47, "225e4e46e3a0": 47, "_delta_log": 47, "00000000000000000000": 47, "json": [47, 50, 52, 55, 58, 63, 68], "dt": [47, 48], "current": [2, 47, 48, 50, 52, 58, 59, 65, 66, 67, 68, 73, 74], "creation": [31, 45, 47], "get_add_act": 47, "flatten": [47, 62], "size_byt": 47, "a6738752": 47, "efca": 47, "4577": 47, "8cbf": 47, "9c69b404f2ee": 47, "1654": 47, "7a6df896": 47, "715a": 47, "4d4a": 47, "b210": 47, "b12e3fe57bc6": 47, "modification_tim": 47, "data_chang": 47, "num_record": 47, "null_count": 47, "2023": [47, 54, 58, 67], "479": [47, 59], "657": [47, 59, 68], "prior": [47, 56], "dt0": 47, "rs": [45, 47], "segment": [47, 54], "rather": [31, 47, 48, 49, 54, 56, 59], "entir": [21, 47, 48, 52, 56, 68], "retriev": [47, 53, 54, 56], "complet": [47, 57, 58, 59, 62, 65, 68], "hourli": [47, 59, 68], "sale": [47, 52, 56, 59], "end_dat": [31, 47, 58], "784": [47, 59], "659": [47, 59, 68], "729": 47, "292": 47, "935": [47, 68], "table_path": 47, "79": [47, 48, 49, 50, 52, 56, 60, 68], "62": [47, 48, 59, 67], "delta_lake2": 47, "partition_bi": 47, "181": 47, "yesterdai": 47, "workaround": 47, "solut": [48, 51, 52], "a6813d0c": 47, "157b": 47, "4ca6": 47, "8b3c": 47, "8d5afd51947c": 47, "untouch": 47, "partition_filt": 47, "00000000000000000001": 47, "b5c9640f": 47, "f386": 47, "4754": 47, "b28f": 47, "90e361ab4320": 47, "disk": [45, 47, 59], "intens": [47, 57], "5000": [47, 52, 54, 56, 58], "6000": [47, 56], "employee_id": 47, "salari": [47, 56], "8000": [47, 52], "existing_data": 47, "recreat": [47, 52], "retain": [47, 56], "columnar": 47, "benefit": [47, 48], "u": [47, 49, 51, 52, 55, 56, 57, 58, 59, 60, 62, 65, 68, 73], "ingest": 47, "accumul": 47, "surg": 47, "compact": 47, "expand": [47, 64, 67], "data_url": 47, "gist": [47, 66], "khuyentran1401": [47, 48, 49, 52, 62, 66], "458905fc5c630d7a1f7a510a04e5e0f9": 47, "5b2d760011c9255a68eb08b83b3b8759ffa25d5c": 47, "numfilesad": 47, "numfilesremov": 47, "filesad": 47, "278115": 47, "totalfil": 47, "totals": 47, "filesremov": 47, "5712": 47, "5717": 47, "5715": 47, "571580": 47, "partitionsoptim": 47, "numbatch": 47, "totalconsideredfil": 47, "totalfilesskip": 47, "preserveinsertionord": 47, "dure": [47, 50, 52, 53, 55, 58, 59, 68], "demonstr": [47, 48, 52, 54, 56, 58, 59], "last_talk": 47, "people_t": 47, "new_df": [47, 48, 56, 57], "older": 47, "statu": [2, 47, 48, 58], "builder": [47, 52, 56, 59], "sql": [52, 54, 59], "sparksess": [47, 52, 56, 59], "appnam": 47, "myapp": 47, "extens": [47, 48, 52, 68, 73], "io": [47, 50, 52, 54, 60], "deltasparksessionextens": 47, "catalog": 47, "spark_catalog": 47, "deltacatalog": 47, "configure_spark_with_delta_pip": 47, "getorcr": [47, 52, 56, 59], "interview": 47, "createdatafram": [47, 52, 56, 59], "todf": 47, "compani": [47, 48, 49, 50, 52], "repartit": 47, "forpath": 47, "new_data": [47, 48], "one_month_ago": 47, "current_d": 47, "interv": [47, 49, 50], "alia": [47, 56], "whenmatchedupd": 47, "whennotmatchedbysourceupd": 47, "concaten": [47, 57, 67], "expens": [47, 57, 58, 59], "inconsist": [47, 56, 59, 67], "datatyp": [31, 32, 47], "suppos": 47, "filepath": 47, "concat_df": 47, "effortlessli": [47, 51, 60, 73], "preserv": [47, 62], "mergeschema": 47, "pandas_api": 47, "api": [47, 52, 53, 58, 59, 68], "pl": 47, "pandas_df1": 47, "value1": [47, 58], "pandas_df2": 47, "value2": [47, 58], "polars_df1": 47, "from_panda": 47, "polars_df2": 47, "start_tim": [47, 62], "pandas_merg": 47, "pandas_tim": [47, 57], "polars_merg": 47, "polars_tim": 47, "6f": 47, "604390": 47, "079080": 47, "lightn": 47, "machin": [2, 47, 48, 49, 53, 58, 59, 60, 73], "eager": 47, "immedi": [47, 54, 62, 68], "contrast": [45, 47, 52, 53, 56, 59], "defer": 47, "10_000_000": 47, "categor": [47, 58], "7292": 47, "7849": 47, "93": [47, 48, 49, 52, 59], "6940": 47, "1265": 47, "2509": 47, "70": [6, 47, 48, 59, 60, 68], "706": [47, 57], "pl_df": 47, "428": [47, 59], "airport": 47, "datahub": 47, "unwant": 47, "scan_csv": 47, "acceler": 47, "particularli": [15, 24, 47, 48], "57k": 47, "heliport": 47, "contin": [47, 55], "eu": 47, "143": [47, 48, 57, 68], "594": 47, "written": [47, 48, 54, 76], "rust": 47, "acid": [47, 50], "enforc": 48, "exception": 47, "moreov": [47, 54], "seamless": [47, 59], "category_col1": 47, "numeric_col1": 47, "tail": [47, 48, 52, 59, 62], "9999995": 47, "9999996": 47, "9999997": 47, "9999998": 47, "87": [47, 49], "9999999": 47, "277": [47, 68], "55": [47, 48, 49, 50, 52, 54, 59, 60], "save_path": 47, "bear_delta_lak": 47, "latest": [47, 50, 59, 65, 66], "read_delta": 47, "i64": 47, "43": [47, 48, 49, 52, 54], "882": 47, "38": [45, 47, 48, 49, 52, 56, 57, 58, 59, 67], "train_test_split": [48, 52, 53, 59, 64], "proport": [48, 60], "model_select": [48, 52, 53, 59, 64], "bincount": [48, 57], "x_train": [48, 52, 53], "x_test": [48, 52, 53, 59], "y_train": [48, 52, 53], "y_test": [48, 52, 53, 59, 60], "random_st": [2, 48, 52, 58, 64], "randomli": [48, 52], "bias": [48, 58], "customer_id": [47, 48, 56], "train_data": [48, 52], "test_data": [47, 48, 52, 56, 59], "test_siz": [48, 52, 64], "cutoff_d": 48, "feature_engin": 48, "dropcorrelatedfeatur": 48, "make_classif": [48, 52], "n_sampl": [2, 48, 52, 59], "n_featur": [2, 48, 52, 59], "n_redund": [48, 52], "n_clusters_per_class": [48, 52], "class_sep": [48, 52], "trabsform": 48, "colnam": 48, "var_": 48, "var_0": 48, "var_1": [48, 67], "var_2": [48, 67], "var_3": [48, 67], "var_4": 48, "var_5": 48, "corr": 48, "000000": [47, 48, 53, 59], "938936": 48, "874845": 48, "654745": 48, "tr": 48, "pearson": 48, "xt": 48, "fit_transform": [48, 49, 52, 54, 58, 60], "correlated_feature_sets_": 48, "mark": [48, 49, 50, 73], "rarelabelencod": 48, "fetch_openml": [48, 54, 60], "dating_profil": 48, "body_typ": 48, "drink": [2, 48], "drug": 48, "educ": [48, 50], "essay0": 48, "essay1": 48, "essay2": 48, "essay3": 48, "essay4": 48, "offspr": 48, "pet": [15, 48, 62], "religion": 48, "sex": [48, 60], "sign": [48, 60], "smoke": 48, "speak": [48, 50], "littl": [48, 50, 73], "strictli": [48, 59], "anyth": 48, "social": 48, "never": [48, 51, 54, 68], "colleg": 48, "univers": [48, 50], "me": [48, 50, 57, 58, 60, 62], "lt": [24, 48, 67], "br": 48, "gt": [24, 48, 63, 65, 67], "ni": [48, 50, 54], "think": [48, 53, 59], "intern": [48, 57, 68], "agent": 48, "fo": 48, "peopl": [48, 49, 54], "laugh": 48, "nrant": 48, "six": [48, 67], "foot": 48, "half": 48, "asian": 48, "nabsurdistan": 48, "republ": 48, "mi": [48, 63], "san": [48, 60], "francisco": 48, "california": [48, 52, 57, 60], "amp": 48, "rsquo": 48, "kid": 48, "straight": 48, "agnostic": 48, "seriou": 48, "gemini": 48, "english": [2, 48, 60], "mostli": 48, "camp": [48, 50], "chef": 48, "n1": [48, 58, 59, 68], "dedic": 48, "everydai": 48, "unbeliev": 48, "silli": 48, "ridicul": 48, "amont": 48, "die": [48, 50], "hard": [2, 48, 50, 57], "christoph": 48, "moor": 48, "fan": [48, 67], "oakland": 48, "cancer": 48, "fluentli": 48, "poorli": [48, 52], "french": 48, "thin": [48, 50], "graduat": 48, "asham": 48, "public": [48, 60, 67], "te": 48, "nerdi": 48, "softwar": [48, 52], "musician": 48, "artist": [24, 48, 50], "improvis": 48, "jaw": 48, "glass": 48, "physica": 48, "okai": 48, "cultur": [48, 59], "matrix": [48, 52], "pisc": 48, "vegetarian": 48, "dead": 48, "plai": [48, 50, 54, 60], "synthes": 48, "acco": 48, "awkward": 48, "batail": 48, "celin": 48, "beckett": 48, "nlynch": 48, "berkelei": 48, "german": 48, "athlet": 48, "hei": [48, 51], "pro": [48, 50, 54], "imageri": 48, "nhttp": [48, 50], "bag": [48, 54], "smile": 48, "inquisit": 48, "natur": [48, 51], "music": [48, 50], "band": [48, 50], "rapper": 48, "nat": [48, 50], "aquariu": 48, "australian": 48, "live": [48, 50, 60, 76], "awesom": [48, 50, 51], "im": 48, "shit": 48, "aforementio": 48, "big": [48, 50], "ask": 48, "kill": 48, "mockingbird": 48, "lord": 48, "ring": [48, 50], "atheism": 48, "tauru": 48, "chines": 48, "lau": 48, "dig": 48, "buri": 48, "treasur": 48, "frolick": 48, "nwitti": 48, "banter": 48, "nuse": 48, "unicorn": 48, "virgo": 48, "meet": [48, 51, 54, 59], "wit": 48, "birthdai": [48, 59], "send": [48, 52, 67], "card": [48, 60], "byproduct": 48, "alphabet": [48, 60, 64, 67], "aquarium": 48, "autobio": 48, "christian": 48, "sagittariu": 48, "oh": [48, 50], "moment": 48, "job": [6, 48, 50, 66], "freakishli": 48, "blond": 48, "willing": 48, "belveder": 48, "tiburon": 48, "jake": 48, "creativ": 48, "gui": 48, "explor": [48, 74], "che": 48, "prob": [48, 52, 54, 59], "tv": [48, 50], "summer": 48, "mateo": 48, "tol": [48, 52], "speci": [48, 60], "minimum": [48, 52, 58, 64], "replace_with": 48, "46107": 48, "45677": 48, "57928": 48, "53127": 48, "33300": 48, "33648": 48, "59701": 48, "57013": 48, "46428": 48, "57123": 48, "percentag": [48, 52, 58, 59], "observ": [48, 52, 59, 62, 68], "countfrequencyencod": 48, "sn": [48, 52, 54, 60], "load_dataset": [48, 60], "diamond": 48, "carat": 48, "cut": 48, "clariti": [48, 62, 67], "depth": [48, 52], "89": [48, 60], "premium": [15, 48], "si2": 48, "2815": 48, "76": [48, 49, 59, 60, 67, 68], "50332": 48, "si1": 48, "53": [48, 54, 57, 58, 59, 60], "2242": 48, "35652": 48, "ideal": [48, 52, 60], "vvs2": 48, "907": 48, "9439": 48, "vs1": 48, "4592": 48, "83": [48, 49], "15824": 48, "vs2": 48, "6332": 48, "45891": 48, "1720": 48, "52416": 48, "2512": 48, "42613": 48, "505": [48, 59], "68": [32, 48, 49, 52, 57, 59, 60, 63, 68], "43567": 48, "1431": 48, "2732": 48, "91": [48, 49, 68], "3246": 48, "40455": 48, "encoding_method": 48, "p_train": 48, "p_test": 48, "10176": 48, "152762": 48, "170436": 48, "4733": 48, "65": [48, 49, 50, 60, 68], "16083": 48, "29": [48, 49, 54, 58, 59, 60, 63, 68], "242022": 48, "56": [48, 50, 52, 57, 59, 73], "6424": 48, "13420": 48, "100531": 48, "5510": 48, "20407": 48, "179409": 48, "8770": 48, "8909": 48, "227314": 48, "4493": 48, "82": [48, 49, 54, 57, 59], "52283": 48, "182005": 48, "094401": 48, "2494": 48, "10789": 48, "fair": 48, "4861": 48, "1190": 48, "2932": 48, "3583": 48, "067384": 48, "3422": 48, "40845": 48, "1173": 48, "13485": 48, "standardscal": [48, 52, 60], "sklearntransformerwrapp": 48, "22474487": 48, "tranform": 48, "scaler": [48, 52, 58], "224745": 48, "captur": [48, 54, 58, 59, 66, 73], "among": [48, 50, 70], "similarityencod": 48, "employee_salari": 48, "fetch_employee_salari": 48, "assignment_categori": 48, "employee_position_titl": 48, "underfilled_job_titl": 48, "date_first_hir": 48, "year_first_hir": 48, "pol": 48, "polic": 48, "msb": 48, "mgmt": 48, "tech": 48, "fulltim": 48, "regular": [48, 50, 52, 58], "offic": [48, 68], "coordin": [48, 49, 50, 73], "1986": 48, "isb": 48, "major": [48, 52], "crime": 48, "fugit": 48, "1988": 48, "hh": [48, 67], "health": 48, "human": [48, 49, 51], "adult": 48, "protect": [46, 48, 50], "iv": 48, "1989": 48, "cor": 48, "rehabilit": 48, "prr": 48, "facil": 48, "secur": [48, 52, 53, 54], "resid": [21, 48], "supervisor": 48, "ii": [48, 49], "2014": [48, 59], "hca": 48, "hous": [48, 52, 57], "commun": [48, 74], "affair": 48, "afford": 48, "plan": [15, 47, 48, 50, 56], "specialist": 48, "iii": 48, "2007": [48, 55, 59], "psb": 48, "6th": 48, "district": [48, 60], "team": [48, 50, 52, 54, 56, 60, 68], "fr": [48, 50, 54], "fire": 48, "rescu": [48, 50], "em": 48, "bill": [48, 52], "account": [2, 48, 52, 59], "auditor": 48, "2016": [48, 50, 59], "administr": [48, 50], "recruit": 48, "firefight": 48, "rescuer": 48, "fsb": 48, "traffic": 48, "autom": [48, 52, 54, 64, 65], "aid": 48, "dirty_column": 48, "x_dirti": 48, "similaryencod": 48, "enc": 48, "ngram": [48, 54], "x_enc": 48, "reshap": [48, 52, 62], "05882353": 48, "03125": 48, "02739726": 48, "19008264": 48, "01351351": 48, "05555556": 48, "20535714": 48, "08088235": 48, "032": [48, 57], "008": 48, "02083333": 48, "056": [48, 49], "02325581": 48, "23076923": 48, "01574803": 48, "02777778": 48, "03738318": 48, "07317073": 48, "05405405": 48, "0733945": 48, "0625": 48, "06542056": 48, "11206897": 48, "07142857": 48, "09756098": 48, "08108108": 48, "04761905": 48, "3539823": 48, "06976744": 48, "09821429": 48, "05343511": 48, "14953271": 48, "26086957": 48, "06451613": 48, "01052632": 48, "03378378": 48, "02631579": 48, "heatmap": 48, "pylabtool": [48, 60], "figsiz": [48, 50, 52, 54, 59, 60], "plot_similar": 48, "normalized_featur": 48, "inner": [48, 56], "font_scal": 48, "xticklabel": 48, "yticklabel": 48, "vmin": 48, "vmax": 48, "ylorrd": 48, "annot_kw": 48, "set_xticklabel": [48, 60], "rotat": 48, "set_titl": 48, "encode_and_plot": 48, "somewhat": 48, "028": 48, "full": [48, 49, 50, 52, 58, 59, 62, 63, 64, 65, 68, 73], "git": [48, 53, 54, 68], "skrub": 48, "frequent": [48, 54, 67], "yemen": [48, 50], "rep": 48, "fuzzy_join": 48, "variat": [48, 58, 63], "happiness_report_2022": 48, "countri": [48, 50, 55, 59], "happi": [48, 58], "fetch_world_bank_ind": 48, "gdppc": 48, "indicator_id": 48, "gdp": 48, "pcap": 48, "cd": [48, 52, 60, 66, 68, 73], "107": 48, "venezuela": 48, "4925": 48, "vietnam": 48, "5485": 48, "131": [48, 68], "4197": 48, "zambia": 48, "3760": 48, "zimbabw": 48, "2995": 48, "146": [48, 57, 59, 68], "xx": [48, 50, 59], "capita": 48, "193": 48, "west": [48, 50, 60], "bank": [48, 63], "gaza": 48, "3789": 48, "327966": 48, "255": 48, "12647": 48, "480789": 48, "258": [48, 58], "701": [48, 59], "714878": 48, "260": 48, "1487": 48, "907764": 48, "261": [48, 57], "1266": 48, "996031": 48, "return_scor": 48, "matching_scor": 48, "merg": [48, 56, 59], "wb": [2, 48, 59], "madagascar": 48, "795045": 48, "egypt": 48, "arab": [48, 54], "654033": 48, "chad": 48, "683373": 48, "130": [48, 68], "ethiopia": 48, "653668": 48, "mauritania": 48, "810736": 48, "133": [48, 68], "jordan": 48, "134": [48, 68], "togo": 48, "india": 48, "137": 48, "malawi": 48, "138": [48, 57], "tanzania": 48, "139": [48, 68], "sierra": 48, "leon": 48, "140": [48, 59, 68], "lesotho": 48, "755238": 48, "141": 48, "botswana": 48, "795825": 48, "142": 48, "rwanda": 48, "754604": 48, "144": [48, 57, 62, 68], "lebanon": 48, "145": [48, 57, 68], "afghanistan": 48, "incom": [48, 68], "fake": [48, 54], "assumpt": [2, 48, 58, 68], "descript": [48, 50, 51, 52, 54, 55], "logo": 48, "simplefilt": [48, 52, 56, 60, 62], "train_df": 48, "blob": [48, 52, 54], "snorkel_exampl": 48, "train_fake_job": 48, "job_id": 48, "salary_rang": 48, "company_profil": 48, "telecommut": 48, "has_company_logo": 48, "has_quest": 48, "employment_typ": 48, "required_experi": 48, "required_educ": 48, "industri": 48, "fraudul": 48, "12276": 48, "12277": 48, "analyst": 48, "gb": [48, 50], "wsm": 48, "london": [45, 48], "product": [45, 48, 51, 56, 58, 59], "op": [48, 57, 58], "qubit": 48, "edg": [48, 54, 58, 60], "engineeringqubit": 48, "ll": [47, 48, 52, 59, 62, 63], "background": 48, "consult": 48, "plenti": 48, "perk": 48, "opportun": [48, 50], "associ": [48, 55, 59, 62], "bachelor": 48, "degre": [48, 68], "internet": 48, "14680": 48, "14681": 48, "advoc": 48, "ga": 48, "savannah": 48, "21st": 48, "centuri": 48, "center": [2, 48, 49, 50, 52, 60, 67], "16518": 48, "16519": 48, "fl": 48, "gainesvil": 48, "352": 48, "inc": [48, 49], "agenc": 48, "crea": 48, "partner": [48, 50], "great": [48, 52, 53, 54, 59], "client": [48, 54, 68], "smart": 48, "mvc": 48, "getfreedom": 48, "trust": [48, 52, 60], "mid": 48, "senior": 48, "technolog": [48, 49], "15478": 48, "15479": 48, "internship": 48, "IN": 48, "bangalor": 48, "pace": 48, "citi": [45, 48, 50, 60], "diver": 48, "deliv": 48, "qualiti": [48, 53, 58, 73], "16348": 48, "16349": 48, "web": [48, 52, 74], "backend": [32, 48, 54], "microservic": 48, "de": [48, 54, 60], "BE": 48, "10969": 48, "airfi": 48, "pr\u00e4gt": 48, "sicher": 48, "und": 48, "einfach": 48, "zu": 48, "bedienend": 48, "design": [48, 49, 52, 54, 59], "esp": 48, "flat": [48, 59], "hierarchi": 48, "fraud": 48, "labeling_funct": 48, "pandaslfappli": 48, "lfanalysi": 48, "abstain": 48, "no_company_profil": 48, "no_company_logo": 48, "conclus": [48, 58], "applier": 48, "l_train": 48, "13410": 48, "5849": 48, "25it": 48, "accuraci": [48, 49, 52, 59, 63], "lf_summari": 48, "polar": [48, 52, 54, 58], "coverag": [48, 52], "overlap": [30, 48], "conflict": [48, 52], "incorrect": [48, 58], "emp": 48, "acc": 48, "186204": 48, "459": [48, 59], "2038": 48, "183821": 48, "205742": 48, "2300": 48, "166365": 48, "244295": 48, "12741": 48, "669": 48, "950112": 48, "detail": [48, 51, 52, 59, 62], "agre": 48, "disagre": 48, "correctli": [48, 52, 58, 67], "incorrectli": 48, "empir": [48, 49], "insight": [48, 52, 54, 59], "taxi": [48, 60], "pickup": [48, 60], "dropoff": [48, 60], "distanc": [48, 49, 54, 59, 60, 63], "fare": [48, 60], "toll": [48, 60], "payment": [48, 60], "pickup_zon": [48, 60], "dropoff_zon": [48, 60], "pickup_borough": [48, 60], "dropoff_borough": [48, 60], "credit": [48, 50, 60], "lenox": [48, 60], "hill": [48, 49, 60], "un": [48, 60], "turtl": [48, 60], "bai": [48, 60], "manhattan": [48, 60], "cash": [48, 59, 60], "side": [48, 50, 52, 59, 60, 73], "villag": [48, 60], "hudson": [48, 60], "sq": [48, 60], "yorkvil": [48, 60], "midtown": [48, 60], "theatr": [48, 60], "batteri": [48, 60], "park": [48, 54, 60], "bridg": [48, 60], "seward": [48, 60], "murrai": [48, 60], "flatiron": [48, 60], "harlem": [48, 60], "lincoln": [48, 60], "friendli": [48, 59], "vehicl": 48, "zone": [48, 59], "borough": 48, "popular": [47, 48, 49, 50, 54, 63, 70, 74], "howto": 48, "pickup_hour": 48, "pickup_dai": 48, "weekday_nam": 48, "pickup_month": 48, "month_nam": 48, "weekdai": [48, 58, 67], "pickup_zone_count": 48, "pickup_zone_far": 48, "pickup_zone_dist": 48, "016667": 48, "857083": 48, "987778": 48, "031597": 48, "944444": 48, "796667": 48, "243830": 48, "198": [48, 67], "994949": 48, "239798": 48, "6428": 48, "72": [32, 48, 50, 52, 56, 59, 68], "550000": 48, "854306": 48, "6429": 48, "74": [48, 67, 68], "jamaica": 48, "concours": 48, "queen": [48, 50, 60], "bronx": [48, 60], "597500": 48, "261667": 48, "6430": 48, "crown": 48, "bushwick": 48, "brooklyn": [48, 60], "549167": 48, "665000": 48, "6431": 48, "york": [45, 48, 50, 60], "flatbush": 48, "remsen": 48, "409000": 48, "086000": 48, "6432": 48, "boerum": 48, "windsor": 48, "terrac": 48, "761905": 48, "812857": 48, "6433": 48, "dist": [49, 65], "norm": 49, "rss": 49, "0037316": 49, "018": [49, 62], "scale": [49, 56, 58, 60], "expon": 49, "1588997": 49, "019": 49, "dweibul": 49, "0079433": 49, "012": [49, 58], "0036884": 49, "873": [49, 68], "genextrem": 49, "0049831": 49, "037": 49, "gamma": 49, "0038504": 49, "101": 49, "098": 49, "089": 49, "lognorm": 49, "0037897": 49, "237": [49, 68], "099": 49, "uniform": [49, 60], "1145382": 49, "469": 49, "loggamma": 49, "0036960": 49, "239": [49, 67, 68], "858": 49, "44": [49, 59], "472": [49, 59], "confid": [49, 52, 59, 64], "parametr": [49, 56, 73], "1000x800": 49, "axessubplot": [49, 50, 52, 60], "nt": 49, "ndf": 49, "xlabel": [49, 50, 52, 59], "ylabel": [49, 52], "frequenc": [49, 52], "detect": [49, 54, 58, 67], "outlier": [49, 54, 58, 59, 67], "deviat": [49, 58, 59], "significantli": [49, 56, 57, 60], "globe": [49, 50], "geocod": 49, "nominatim": 49, "geoloc": 49, "user_ag": 49, "find_loc": 49, "drive": [49, 50, 54], "app": [49, 52, 60, 63, 65, 67, 68], "dogwood": 49, "acr": 49, "chapel": 49, "counti": 49, "carolina": 49, "27516": 49, "state": [2, 49, 50, 57, 59, 62, 66, 67, 68], "8796631": 49, "0770546": 49, "latitud": [49, 50, 52], "longitud": [49, 50, 52], "latitid": 49, "max_card": 49, "cont_nam": 49, "cat_nam": 49, "load_win": [49, 60], "alcohol": 49, "malic_acid": 49, "ash": 49, "alcalinity_of_ash": 49, "magnesium": 49, "total_phenol": 49, "flavanoid": 49, "nonflavanoid_phenol": 49, "proanthocyanin": 49, "color_intens": 49, "hue": [49, 60, 68], "od280": 49, "od315_of_diluted_win": 49, "prolin": 49, "28": [49, 50, 56, 58, 59, 60, 73], "1065": 49, "1050": 49, "67": [49, 58, 59, 68], "1185": 49, "86": [49, 52, 59, 60, 62], "1480": 49, "69": [49, 54, 59], "735": [49, 68], "97": [49, 50, 52, 58, 59], "1450": 49, "1290": 49, "1295": 49, "1045": 49, "dmatric": 49, "designmatrix": 49, "178": [49, 57, 59, 60, 68], "intercept": [49, 52, 59], "1510": 49, "1280": 49, "1320": 49, "1150": 49, "1547": 49, "1310": 49, "1130": 49, "1680": 49, "780": 49, "770": 49, "1035": 49, "1015": 49, "830": 49, "1195": 49, "1285": 49, "915": 49, "omit": [24, 49, 73], "asarrai": 49, "this_obj": 49, "scikit": [49, 60, 67], "linear_model": [48, 49, 52, 59], "linearregress": [49, 52, 59], "query_str": 49, "scheme": [49, 65], "fragment": 49, "with_queri": 49, "new_path": 49, "with_path": 49, "with_frag": 49, "unlabel": 49, "terribl": 49, "definit": [49, 50], "pp": 49, "mr": [49, 50, 58], "owen": 49, "harri": 49, "prefixmarit": 49, "givennam": 49, "surnam": 49, "suffixgener": 49, "kate": 49, "cume": 49, "And": [49, 50, 52, 54, 60, 63], "prefect": [49, 57, 64, 67], "corporationnam": 49, "corporationlegaltyp": 49, "beauti": [49, 50, 52, 54, 60], "screen": [49, 68], "font": [49, 63], "encod": [49, 54, 58, 65, 67, 73], "typic": [49, 54, 59], "pdfreader": 49, "reader": 49, "extract_text": 49, "color_nam": 50, "cornflowerblu": 50, "scott": 50, "881": [50, 59], "patricia": 50, "nsouth": 50, "jeremi": 50, "06087": 50, "date_of_birth": 50, "minimum_ag": 50, "1927": 50, "donald": 50, "teacher": 50, "secondari": 50, "sill": 50, "email": [47, 50, 54], "her": [50, 74], "ringslap": 50, "boatbench": 50, "thirti": 50, "mighti": 50, "hors": [50, 54], "a_th": 50, "khaki": 50, "wad": 50, "tote": 50, "twenti": [50, 54], "four": [50, 73], "eighteen": 50, "garlic": 50, "arm": 50, "god": [50, 54], "himself": 50, "wait": [50, 52, 55, 58, 68], "hat": 50, "birmingpoop": 50, "paragraph": 50, "agustin": 50, "neutral": [50, 52], "jerk": 50, "concern": 50, "badli": 50, "agn": 50, "basil": 50, "box": [50, 60], "slate": 50, "assesford": 50, "testasia": 50, "fantasticheartsound": 50, "hurl": 50, "danc": [50, 54], "arztotzka": 50, "cape": 50, "bui": [50, 59], "tub": 50, "boot": 50, "assembl": [50, 52], "jean": 50, "seth": 50, "violetbag": 50, "laudabl": 50, "lampton": 50, "birmingobject": 50, "cybertron": 50, "urllib": 50, "request": [50, 52, 55, 58, 65, 73], "urlopen": 50, "randomus": 50, "ava": 50, "hansen": 50, "street": 50, "3526": [50, 67], "georg": 50, "worcest": 50, "merseysid": 50, "kingdom": [50, 54], "postcod": 50, "k7z": 50, "3wb": 50, "9627": 50, "6871": 50, "timezon": [50, 59, 67], "tokyo": [45, 50], "seoul": 50, "osaka": 50, "sapporo": 50, "yakutsk": 50, "login": [50, 52], "uuid": [50, 62, 68], "253e53f9": 50, "9553": 50, "4345": 50, "9047": 50, "fb18aec51cf": 50, "heavywolf743": 50, "cristina": 50, "salt": 50, "xwnpqwtd": 50, "md5": 50, "2b5037da7d78258f167d5a3f8dc24edb": 50, "sha1": 50, "fabbede0577b3fed686afd319d5ab794f1b35b02": 50, "sha256": [50, 67], "d42e2061f9c283c4548af6c617727215c79ecafc74b9f3a294e6cf09afc5906f": 50, "dob": 50, "1948": 50, "21t10": 50, "053z": 50, "73": [50, 59, 63, 67, 68], "2011": [50, 52, 60], "19t03": 50, "830z": 50, "phone": [50, 54, 60], "015242": 50, "07811": 50, "0700": 50, "326": 50, "155": [50, 68], "nino": 50, "ht": 50, "portrait": 50, "women": 50, "jpg": [50, 68], "med": 50, "thumbnail": 50, "thumb": 50, "aubin": 50, "martin": [50, 59], "8496": 50, "rue": 50, "du": 50, "b\u00e2t": 50, "argent": 50, "strasbourg": 50, "meurth": 50, "et": [50, 59], "mosel": 50, "franc": 50, "83374": 50, "3192": 50, "0062": 50, "eastern": 50, "australia": [50, 59, 63], "guam": 50, "vladivostok": 50, "54b9bfa9": 50, "5e86": 50, "4335": 50, "8ae3": 50, "164d85df98e7": 50, "heavyladybug837": 50, "kendra": 50, "lcemyr5": 50, "2fbd9e05d992eb74f7afcccec02581fc": 50, "530a1bc71a986415176606ea377961d2ce381e5d": 50, "f5ee7bc47f5615e89f1729dcb49632c6b76a90ba50eb42d782e2790398ebc539": 50, "12t05": 50, "463z": 50, "2006": [50, 59], "28t03": 50, "433z": 50, "inse": 50, "1nnan48231023": 50, "men": 50, "interest": [50, 59], "monk": 50, "attr1": 50, "attr2": 50, "attr3": 50, "attr4": 50, "attr5": 50, "attr6": 50, "websit": [50, 62, 66, 74], "soup": 50, "stackoverflow": 50, "2081586": 50, "wanted_list": 50, "scraper": [], "build": [50, 59, 60, 64, 65, 67], "command": [50, 52, 54, 59, 64, 65, 66], "metaclass": 50, "ternari": 50, "substr": [50, 56, 62, 67], "dataread": [50, 65], "pandas_read": 50, "snippet": [50, 66, 68, 73, 74], "daili": [50, 52, 59, 68, 74], "pandas_dataread": 50, "av": 50, "api_kei": [50, 51, 59], "gehid": 50, "outputtenv": 50, "alphavantage_api_kei": 50, "trendreq": 50, "hl": 50, "tz": [50, 67], "360": [50, 68], "build_payload": 50, "kw_list": 50, "interest_over_tim": 50, "twitter": [50, 54, 55], "reddit": [47, 50], "snsscrape": 50, "tweet": 50, "hashtag": [50, 54], "khuyentran16": 50, "khuyen_tweet": 50, "publicli": 50, "censu": 50, "gov": 50, "cdc": 50, "datacommons_panda": 50, "plotli": [50, 55, 60], "px": [50, 55, 60], "median_incom": 50, "build_time_seri": 50, "geoid": 50, "median_income_person": 50, "overtim": 50, "process_t": 50, "count_person": 50, "usa": [50, 59], "count_person_mal": 50, "count_person_femal": 50, "count_robberi": 50, "count_criminalactivities_robberi": 50, "googlenew": 50, "set_time_rang": 50, "hagan": 50, "nhra": 50, "car": [50, 59], "media": [50, 52], "espn": 50, "feb": 50, "desc": 50, "matt": 50, "quickest": 50, "ngive": 50, "toni": 50, "stewart": 50, "race": 50, "qualifi": 50, "nset": 50, "stori": 50, "33381149": 50, "img": 50, "gif": [50, 63], "base64": 50, "r0lgodlhaqabaiaaap": 50, "yh5baekaaealaaaaaabaaeaaaictaeaow": 50, "fuel": [50, 63], "stock": 50, "promis": [50, 52], "pit": 50, "auto": [2, 50, 52, 60], "club": 50, "racewai": 50, "pomona": 50, "pack": 50, "nworld": 50, "drag": 50, "luca": 50, "oil": 50, "wintern": 50, "cast": [45, 50, 68], "broadwai": 50, "reviv": 50, "girl": [50, 54], "star": [50, 68], "playbil": 50, "newli": 50, "peter": 50, "franci": 50, "jame": 50, "ephi": 50, "naardema": 50, "moran": 50, "benko": 50, "margaret": 50, "hall": 50, "beani": 50, "feldstein": 50, "ramin": 50, "karimloo": 50, "robert": 50, "hight": 50, "fridai": 50, "night": 50, "ncamp": 50, "nwintern": 50, "33324340": 50, "owner": [50, 60], "ron": 50, "capp": 50, "autoweek": 50, "defend": 50, "champion": 50, "enter": [48, 50], "automak": 50, "nlong": 50, "him": 50, "susan": 50, "wade": 50, "a39160639": 50, "dodgemopar": 50, "under": [50, 52, 58, 68], "bu": 50, "video": 50, "highli": [50, 73], "anticip": 50, "nperform": 50, "preview": 50, "naugust": 50, "wilson": [50, 56], "broadwayworld": 50, "rehears": 50, "20220309": 50, "watch": 50, "sitzprob": 50, "theatermania": 50, "nfirst": 50, "orchestra": 50, "nkarimloo": 50, "fe_93550": 50, "stephen": 50, "colbert": 50, "prep": 50, "primetim": 50, "picklebal": 50, "cb": [50, 57], "hollywood": 50, "nthe": 50, "pickl": [2, 50, 53, 59, 62, 68], "celebr": 50, "competitor": 50, "vie": 50, "ngherkin": 50, "hollywoodreport": 50, "1235111617": 50, "randi": 50, "meyer": 50, "debut": 50, "inject": [50, 55, 56], "nitro": 50, "chao": 50, "midwest": 50, "nit": 50, "ntake": 50, "lauri": 50, "zaleski": 50, "talk": [50, 59], "farm": 50, "washington": [50, 59], "entendr": 50, "nanim": 50, "lunat": 50, "joke": 50, "sanctuari": 50, "she": [50, 54, 74], "nbuilt": 50, "washingtonpost": 50, "get_related_quest": 50, "Is": [50, 51, 54, 58, 59, 66], "career": 50, "concept": [50, 54, 62, 67, 68], "get_answ": 50, "has_answ": 50, "related_quest": 50, "stress": 50, "answer": [50, 51, 52, 54, 59], "NO": 50, "primarili": 50, "misconcept": 50, "beginn": 50, "discov": [50, 54, 60, 66], "domain": [50, 62], "realis": 50, "studi": 50, "oct": 50, "projectpro": 50, "522": [50, 54], "20short": 50, "20answer": 50, "20to": 50, "20the": 50, "20learn": 50, "20by": 50, "20work": 50, "20hard": 50, "displayed_link": 50, "snippet_str": 50, "snippet_data": 50, "snippet_typ": 50, "snippet_str_bodi": 50, "raw_text": 50, "ndata": 50, "noct": 50, "facebook_scrap": 50, "get_profil": 50, "get_group_info": 50, "thedachshundown": 50, "2685753618191566": 50, "member": [50, 52, 67], "128635": 50, "welcom": [50, 63], "npost": 50, "advis": 50, "lover": 50, "nyou": 50, "pic": 50, "ve": 50, "viral": 50, "seen": [50, 63], "rule": 50, "AND": [50, 56], "guidelin": [50, 64], "Be": 50, "aggress": 50, "backyard": [50, 60], "breed": 50, "spam": 50, "unrel": 50, "sell": [50, 59], "prohibit": 50, "forward": 50, "risk": [46, 50, 52, 53, 55, 59], "promot": [2, 50], "fish": [50, 60], "buyer": 50, "everyon": 50, "scam": 50, "sir": 50, "ladi": 50, "nwe": 50, "appreci": 50, "approv": 50, "shirt": [50, 62], "mug": 50, "canva": 50, "campaign": [50, 59], "thank": 50, "pawown": 50, "collectio": 50, "zuck": 50, "friend_count": 50, "follower_count": 50, "following_count": 50, "cover_photo": 50, "scontent": 50, "ord5": 50, "fbcdn": 50, "net": 50, "t31": 50, "18172": 50, "19575079_10103832396388711_8894816584589808440_o": 50, "stp": 50, "cp0_dst": 50, "jpg_e15_fr_q65": 50, "_nc_cat": 50, "ccb": 50, "_nc_sid": 50, "ed5ff1": 50, "_nc_ohc": 50, "z5jceahnv3aax9ihcdv": 50, "_nc_ht": 50, "00_afctbrp26zwk0onprfkbpjlrlfdwwlmlv1_xlkevlke_yw": 50, "oe": 50, "63ca953d": 50, "profile_pictur": 50, "t39": 50, "30808": 50, "312257846_10114737758665291_6588360857015169674_n": 50, "jpg_e15_q65_s120x120": 50, "dbb9e7": 50, "x2_muzaxc2cax9w6lz6": 50, "00_afdikcbbddzcymhxd": 50, "yjp2stit_vgpqrm9oeibsydfg8ba": 50, "63a81f9": 50, "zuckerberg": 50, "chan": 50, "ndecemb": 50, "nmeta": 50, "nfounder": 50, "ceo": 50, "nfebruari": 50, "npalo": 50, "alto": 50, "nbring": 50, "togeth": [47, 48, 50, 51, 55, 58, 60, 62], "harvard": 50, "ncomput": 50, "psycholog": 50, "nphillip": 50, "exet": 50, "academi": 50, "nclassic": 50, "nclass": 50, "nardslei": 50, "nhigh": 50, "1998": [50, 59], "php": 50, "104022926303756": 50, "refid": 50, "palo": 50, "105506396148790": 50, "dobb": 50, "ferri": 50, "hometown": 50, "quot": [47, 50, 54], "fortun": 50, "favor": 50, "bold": 50, "virgil": 50, "aeneid": 50, "284": [48, 50], "grow": [50, 64], "pablo": 50, "picasso": 50, "albert": 50, "einstein": 50, "pycausalimpact": 52, "advertis": 52, "effect": [52, 54, 58, 59, 73], "intervent": [52, 59], "tsa": 52, "arima_process": 52, "armaprocess": 52, "r_": 52, "ma": [52, 59], "arma_process": 52, "generate_sampl": 52, "nsampl": [52, 54], "800": [52, 57], "pre_period": [52, 59], "799": [52, 59], "post_period": [52, 59], "ci": [52, 59], "summari": [52, 53, 54, 58, 59, 66, 73], "posterior": [52, 59], "cumul": [52, 59], "18006": 52, "15994": 52, "15871": 52, "16110": 52, "1896": [52, 57], "2135": 52, "approx": [52, 59], "absenc": [52, 59, 60], "counterfactu": [52, 59], "yield": [52, 59], "discuss": [51, 52, 59], "individu": [29, 48, 52, 59], "meaningfulli": [52, 59], "interpret": [52, 59, 65], "overal": [52, 59], "taken": [52, 59, 60], "unlik": [52, 59, 68], "due": [21, 52, 59, 62, 65], "fluctuat": [52, 59], "bear": [52, 59], "substant": [52, 59], "goal": [52, 54, 59, 74], "underli": [52, 54, 59], "bayesian": [52, 59], "advanc": [52, 57, 59], "languag": 52, "zeroshotgptclassifi": 52, "unseen": 52, "skllm": 52, "skllmconfig": 52, "set_openai_kei": 52, "your_kei": 52, "set_openai_org": 52, "your_organis": 52, "get_classification_dataset": 52, "demo": 52, "clf": [52, 59], "openai_model": 52, "gpt": [52, 54], "turbo": 52, "metric": [52, 54, 58, 60, 64, 67], "accuracy_scor": 52, "make_pipelin": [48, 52], "especi": [15, 29, 47, 52, 57, 59, 60, 63, 65, 66, 67], "logisticregress": [48, 52], "logist": 52, "regress": [52, 59], "svm": [2, 52, 64], "svc": [2, 52], "make_pip": 52, "grid_param": 52, "svc__c": 52, "svc__gamma": 52, "hypertun": 52, "cv": 52, "y_pred": [52, 59, 67], "y_actual": 52, "y_predict": 52, "testabl": 52, "deploi": [52, 57, 58], "incorpor": [52, 54, 59, 74], "modellibrari": 52, "wordlist": [52, 54], "nltk": [52, 54], "punkt": [52, 54], "inherit": 52, "_predict": 52, "nounphraseextractor": 52, "noun_phrase_extractor": 52, "noun_phras": [52, 54], "noun_extractor": 52, "strategi": [2, 52, 58], "memory_byt": 52, "model_nam": 52, "microsecond": [52, 67], "time_": 52, "232699939166196e": 52, "test_cas": [52, 58], "3191997974645346e": 52, "sentimentanalyz": 52, "sentiment_analyz": 52, "nlp_model": 52, "assetsmanag": 52, "lazy_load": 52, "remot": [52, 53, 66], "asset": [52, 59], "988200114690699e": 52, "depend": [52, 56, 58], "00894871700074873": 52, "751099964370951e": 52, "006440052002290031": 52, "model_collect": 52, "subject": [52, 54], "techniqu": [52, 54, 59], "pca": [52, 54], "complic": [52, 60, 62], "lucikili": 52, "load_credit": 52, "defaut": 52, "princip": 52, "pc_1": 52, "pc_2": 52, "equival": [45, 47, 52, 54, 56, 58], "sensit": 52, "varianc": [52, 59], "elimin": [45, 48, 52, 53, 58, 63, 66, 73], "Then": [50, 52, 63, 68, 73], "featureimport": 52, "decisiontreeclassifi": [52, 60, 64], "load_occup": 52, "viz": 52, "seem": [52, 59], "light": [52, 60, 68], "co2": 52, "temperatur": [51, 52, 60, 62, 73], "hyperparamet": [52, 60], "neither": 52, "nor": 52, "loader": 52, "validation_curv": 52, "max_depth": [52, 60], "param_nam": 52, "param_rang": 52, "f1": 52, "higher": [52, 58, 59], "spot": 52, "decreas": [2, 52, 57, 63], "decid": [52, 65], "plot_decision_region": 52, "gridspec": 52, "ensembl": 52, "randomforestclassifi": [52, 58], "ensemblevoteclassifi": 52, "iris_data": 52, "clf1": 52, "clf2": 52, "clf3": 52, "eclf": 52, "vote": 52, "soft": [52, 54], "gs": 52, "fig": [52, 54, 59, 60], "lab": 52, "grd": 52, "forest": 52, "rbf": [2, 52, 59], "kernel": [2, 52, 64, 67], "subplot": [52, 59, 60], "legend": [52, 58, 59, 60], "wandb": 52, "monitor": [52, 53], "suit": 52, "eas": 52, "distribut": [59, 60, 67, 73], "label_col": 52, "to_fram": 52, "df_train": 52, "df_test": 52, "stratifi": 52, "rf_clf": 52, "ds_train": 52, "cat_featur": [52, 58], "ds_test": 52, "full_suit": 52, "suite_result": 52, "1mwandb": 52, "33mkhuyentran1401": 52, "relogin": 52, "forc": [52, 59, 65, 73], "to_wandb": 52, "local": [52, 54, 56, 57, 59, 65, 67, 68, 73], "chapter5": [52, 58], "20220314_094658": 52, "1yf63l3g": 52, "sync": [52, 68], "mud": 52, "mouss": 52, "ai": [52, 68], "1yf63l3gsync": 52, "109": 52, "artifact": 52, "minor": 52, "randomoversampl": 52, "linearsvc": 52, "n_inform": 52, "n_repeat": 52, "n_class": 52, "imblearn": 52, "over_sampl": 52, "ro": 52, "x_resampl": 52, "y_resampl": 52, "fit_resampl": 52, "ax0": 52, "ax1": 52, "nrow": [52, 59], "ncol": [52, 59], "sharei": 52, "xi": 52, "yi": 52, "resampl": 52, "mapieregressor": 52, "regressor": 52, "make_regress": 52, "nois": 52, "alpha": [52, 59, 67], "y_pi": 52, "regression_coverage_scor": 52, "coverage_scor": 52, "enumer": 52, "scatter": [52, 55, 60], "c1": [], "argsort": [52, 54], "ls": [52, 58, 60], "fill_between": [52, 59], "ravel": [52, 57], "forecast": 52, "massiv": 52, "distributedmlforecast": 52, "dask": 52, "lgb": 52, "dasklgbmforecast": 52, "target_transform": [52, 59], "series_ddf": 52, "fcst": [52, 59], "lag": [52, 59], "hash": 52, "diabet": 52, "load_diabet": 52, "linear": 52, "render": [52, 60], "nbviewer": 52, "linearregressionlinearregress": 52, "dump": [2, 52, 55, 59], "diabetes_model": 52, "sample_data": 52, "mlemmodel": 52, "rev": [52, 64, 73], "uri": 52, "project_uri": 52, "fs": 52, "fsspec": [52, 65], "localfilesystem": 52, "0x16b631430": 52, "localartifact": 52, "563": [52, 59], "c57e456e8a0768326655a8b52cde4f47": 52, "__root__": 52, "installablerequir": 52, "package_nam": 52, "extra_index": 52, "source_url": 52, "vc": 52, "vcs_commit": 52, "processors_cach": 52, "sklearnmodel": 52, "simplepickleio": 52, "signatur": [52, 55, 67], "numpyndarraytyp": 52, "kw_onli": 52, "vararg": 52, "varargs_typ": 52, "varkw": 52, "varkw_typ": 52, "call_ord": 52, "object_typ": 52, "ndarrai": [52, 62], "init": [53, 59, 65, 66], "gdrive": 53, "lynnbbt": 53, "4j0ida0ekyqqzzbc93juuuubvh": 53, "pull": [53, 68], "checkout": [53, 66], "characterist": [53, 58, 60], "graph": [53, 59, 60, 65, 67], "sv": [53, 58], "show_html": 53, "valuabl": [53, 66], "quantiti": [47, 53, 54, 56, 58], "prof_view": 53, "prof_df": 53, "est": 53, "lower_1": 53, "upper_1": 53, "inf": [53, 59], "frequent_item": 53, "frequent_str": 53, "boolean": [53, 54], "tensor": 52, "00015": 53, "frequentitem": 53, "summarytyp": 53, "q_01": 53, "q_05": 53, "q_10": 53, "q_25": 53, "q_75": 53, "q_90": 53, "q_95": 53, "q_99": 53, "stddev": [53, 58], "cloud": [53, 76], "boilerpl": [53, 58, 63], "ssh": 53, "iter": [52, 53, 58, 59, 62, 67, 74], "who": [53, 54, 57], "interact": [52, 53, 55, 58, 59, 67], "auth": 53, "remoteauth": 53, "awsauth": 53, "authent": 53, "rmt_auth": 53, "from_password": 53, "aw": [53, 54], "aws_auth": 53, "aws_access_key_id": 53, "aws_access_kei": 53, "aws_secret_access_kei": 53, "aws_secret_kei": 53, "remotedir": 53, "awss3dir": 53, "rmt_dir": 53, "bucket": 53, "create_if_miss": 53, "aws_dir": 53, "transfer_to": 53, "dst": [53, 67], "recurs": [53, 62], "noun": 54, "phrase": [51, 54], "spell": 54, "download_corpora": 54, "word_count": 54, "defaultdict": 54, "beuti": 54, "mlxtend": 54, "generalize_nam": 54, "tran": [54, 74], "firstname_output_lett": 54, "kh": 54, "dataquest": 54, "lex": 54, "rank": 54, "blog": 54, "kept": 54, "motiv": 54, "someth": [54, 58, 67, 68], "behind": [54, 56], "skill": [51, 54], "gain": [54, 59], "fundament": [54, 60, 68], "meetup": 54, "teach": 54, "learner": 54, "spaci": [54, 65], "streamlit": 54, "streamlit_app": 54, "en_core_web_sm": 54, "browser": [52, 54, 67, 68], "1mhttp": 54, "localhost": [54, 58], "8501": 54, "ic": [54, 62, 67], "frozen": [54, 57, 67], "sweeten": 54, "num2word": [], "nineteen": 54, "libari": [], "ordin": [54, 67], "nineteenth": 54, "ordinal_num": 54, "2019th": 54, "lang": 54, "vi": [54, 60, 68], "hai": 54, "ngh\u00ecn": 54, "l\u1ebb": 54, "m\u01b0\u1eddi": 54, "ch\u00edn": 54, "es": 54, "mil": 54, "diecinuev": 54, "punctuat": 54, "stopword": 54, "hero": 54, "duck": [54, 58, 67], "pond": 54, "nltk_data": 54, "unzip": 54, "corpora": 54, "pipelin": [2, 47, 54, 58, 59, 62, 68, 73], "chain": [54, 56, 62], "remove_punctu": 54, "remove_stopword": 54, "remove_whitespac": 54, "gdown": 54, "cnn": 54, "kaggl": 54, "uc": [54, 55], "1qpgcz8mud5ptt8qjr79xq6koqnjut": 54, "4d": 54, "small_cnn": 54, "tfidf": 54, "scatterplot": [54, 60], "1000x300": 54, "appear": 54, "word_frequ": 54, "eat": [54, 60], "000135": 54, "0537": 54, "barplot": 54, "_decor": 54, "valid": [2, 47, 54, 60, 63, 64, 67], "misinterpret": 54, "newspap": 54, "mathdatasimplifi": [54, 62, 68], "dbt": 54, "publish_d": 54, "top_imag": 54, "wp": 54, "upload": [54, 55], "con": 54, "png": [54, 60], "dbtyou": 54, "warehous": 54, "snapshot": [54, 59], "cleans": 54, "property_typ": 54, "ramsrigouthamg": 54, "boudinfl": 54, "pke": 54, "universal_tagset": 54, "explos": 54, "sense2vec": 54, "s2v_reddit_2015_md": 54, "tar": [54, 67], "gz": [54, 67], "xvf": 54, "pprint": 54, "payload": 54, "weather": 54, "went": 54, "walk": [54, 58, 59, 60], "chat": 54, "neighbor": [54, 59, 64], "labrador": 54, "qe": 54, "boolqgen": 54, "predict_boolq": 54, "neighborhood": 54, "faq": 54, "qg": 54, "predict_shortq": 54, "wordninja": 54, "surpris": 54, "honeyinthejar": 54, "honei": 54, "ihavetwoappl": 54, "aratherblusterdai": 54, "bluster": 54, "automated_readability_index": 54, "ari": 54, "grade": [6, 54], "10th": 54, "11th": 54, "consciou": 54, "psychologist": 54, "marvel": 54, "acquir": [54, 57], "perfect": [54, 68], "pronunci": 54, "recogn": 54, "face": 54, "reading_tim": 54, "ms_per_char": 54, "fuzz": 54, "indel": 54, "tomorrow": 54, "tommorrow": 54, "24561403508771": 54, "54545454545454": 54, "token_sort_ratio": 54, "torch": [53, 54, 59], "negat": 54, "templat": 54, "po": [54, 58], "war": 54, "window": 54, "facebook": 54, "closur": 54, "tpp": 54, "jointli": 54, "vector": [52, 54, 60], "wordcloud": 54, "to_list": 54, "293": 54, "pre": [52, 54, 62, 64, 67, 73], "285": 54, "joint": 54, "023": 54, "dens": [52, 54], "656": [54, 68], "get_num_top": 54, "topic_word": 54, "word_scor": 54, "topic_num": 54, "get_top": 54, "semant": [], "cosin": 54, "generate_topic_wordcloud": 54, "plural_noun": 54, "he": 54, "plural_verb": 54, "feminin": 54, "singular_noun": 54, "compare_verb": 54, "fruit1": 54, "fruit2": 54, "keywordprocessor": 54, "kw_processor": [], "kw_dict": [], "chief": [], "add_keywords_from_dict": [], "keyword_dict": [], "fluent": [], "extract_keyword": [], "preprocessor": [48, 52, 54], "textpreprocessor": 54, "socialtoken": 54, "emoticon": 54, "text_processor": 54, "allcap": 54, "elong": 54, "emphasi": 54, "censor": 54, "corpu": 54, "unpack_hashtag": 54, "unpack_contract": 54, "unpack": 54, "spell_correct_elong": 54, "lowercas": [54, 67], "emoji": 54, "coolyazzy94": 54, "retweeeet": 54, "suck": 54, "haha": 54, "7rdymcvpkx": 54, "pre_process_doc": 54, "1gram": 54, "2gram": 54, "retweet": 54, "tong": 54, "chromadb": 54, "reli": [54, 58], "sole": 54, "translat": [45, 54, 67], "get_or_create_collect": 54, "man": [51, 54], "noodl": 54, "carri": 54, "babi": 54, "ride": 54, "query_result": 54, "query_text": 54, "pasta": 54, "n_result": 54, "5690374970436096": 54, "5929027199745178": 54, "chart": [54, 55], "bokeh": 55, "altair": 55, "dp": 55, "gapmind": 55, "gdppercap": 55, "lifeexp": 55, "pop": 55, "hover_nam": 55, "log_x": 55, "size_max": 55, "datat": 55, "successfulli": [47, 54, 55, 65, 67, 73], "yourfileid": 55, "1ji1cmxqnwsmc": 55, "vbl8dny6b4anbtbbky3": 55, "120mb": 55, "1mb": 55, "concis": [15, 31, 55, 56, 63], "transmiss": 55, "reconstruct": 55, "serd": 55, "from_json": 55, "to_json": [55, 63], "from_yaml": 55, "to_yaml": 55, "nname": [55, 63], "malici": [53, 55, 68], "safeti": 55, "verifi": [47, 55, 56], "tamper": 55, "urlsafeseri": 55, "auth_": 55, "eyjpzci6nswibmftzsi6imtodxllbnryyw4ifq": 55, "3cqlkhp1myeus8jnqmgv_mbrxsq": 55, "secret": [55, 66], "int8": 57, "float32": 57, "20640": 57, "fetch_california_h": [52, 57, 60], "scipi": [52, 57], "boxcox1p": 57, "pandas_appli": 57, "averoom": [52, 57], "swifter_appli": 57, "num_experi": 57, "swifter_tim": 57, "pandas_vs_swift": 57, "cprofil": 57, "cprofilers_exampl": 57, "246355": 57, "240252": 57, "primit": 57, "311": 57, "ncall": 57, "tottim": 57, "percal": 57, "cumtim": 57, "lineno": [57, 67], "__array_function__": 57, "copyto": 57, "ndim": 57, "prod": 57, "importlib": 57, "_bootstrap": 57, "1002": [56, 57], "_gcd_import": 57, "610": [57, 68], "353": 57, "1017": 57, "_handle_fromlist": 57, "1208": 57, "002": [57, 59], "527": [54, 57, 59], "004": 57, "147": [57, 68], "__enter__": 57, "151": [57, 68], "__exit__": [57, 68], "003": 57, "157": [57, 68], "_get_module_lock": 57, "524": [57, 67], "681": [57, 59], "194": [57, 59], "_lock_unlock_modul": 57, "310": [57, 59], "211": 57, "_call_with_frames_remov": 57, "4196": 57, "_verbose_messag": 57, "232": 57, "_requires_builtin_wrapp": 57, "521": [57, 59], "342": 57, "406": [57, 63], "_new_modul": 57, "880": 57, "005": [57, 58], "376": 57, "cach": [57, 67], "727": 57, "389": [57, 68], "498": [57, 59], "397": 57, "has_loc": 57, "spec_from_load": 57, "009": 57, "477": 57, "_init_module_attr": 57, "495": [57, 59], "549": [57, 59, 67], "module_from_spec": 57, "650": 57, "_load_unlock": 57, "520": 57, "725": 57, "find_spec": 57, "746": [57, 59], "create_modul": 57, "754": 57, "exec_modul": 57, "771": 57, "is_packag": 57, "497": [57, 67], "1530": 57, "863": 57, "867": [57, 68], "890": [57, 59], "_find_spec": 57, "937": [57, 68], "_sanity_check": 57, "956": 57, "_find_and_load_unlock": 57, "986": 57, "_find_and_load": 57, "_bootstrap_extern": 57, "1004": [56, 57], "1029": 57, "get_filenam": 57, "011": 57, "1034": 57, "1075": 57, "path_stat": 57, "1153": 57, "021": 57, "1164": 57, "058": 57, "1172": 57, "3858": 57, "006": 57, "_path_join": 57, "listcomp": 57, "812": 57, "_path_split": 57, "1624": 57, "genexpr": 57, "1317": 57, "_path_hook": 57, "820": 57, "1330": 57, "_path_importer_cach": 57, "007": 57, "_path_stat": 57, "026": 57, "1367": 57, "_get_spec": 57, "1399": 57, "704": [57, 59], "_path_is_mode_typ": 57, "1459": 57, "1465": 57, "474": [57, 59], "1493": 57, "733": [57, 68], "022": [57, 68], "1498": 57, "651": 57, "154": [57, 68], "_path_isfil": 57, "1549": 57, "_fill_cach": 57, "159": 57, "_path_isdir": 57, "1590": 57, "path_hook_for_filefind": 57, "pyinstrument_exampl": 57, "__": [57, 63], "durat": [24, 57, 58, 59, 60], "v4": 57, "31m0": [57, 58], "24m": 57, "15m": 57, "2mpyinstrument_exampl": 57, "2mpanda": 57, "4416": 57, "346": 57, "15mis_even": 57, "new_method": 57, "mod": [57, 59], "2m": [57, 65], "225": 57, "265": 57, "897": 57, "runpi": [57, 67], "_run_cod": [57, 67], "2mrunpi": 57, "textwrap": 57, "prev": 57, "15t09": 57, "restaur": [51, 57], "cook": [50, 57], "waiter": 57, "stove": 57, "sequenti": 57, "shout": 57, "count_to": 57, "highest_numb": 57, "sy": [57, 58, 60], "wall": 57, "submit": [57, 62, 67, 76], "862": 57, "manul": 57, "flow_run": [57, 68], "58a68b34": 57, "713": 57, "776": 57, "781": 57, "824": 57, "829": 57, "837": 57, "848": 57, "850": 57, "task_run": [57, 68], "043": 57, "062": 57, "daunt": [56, 57], "hardwar": 57, "facilit": 57, "costli": 57, "resourc": [57, 64, 74], "forget": [58, 64], "describ": [58, 73], "intention": 58, "idea": 58, "calculate_averag": 58, "todo": [58, 64], "test_calculate_average_two_num": 58, "Will": 58, "test_calculate_average_empty_list": 58, "unclear": 58, "misunderstand": 58, "contain_word": 58, "test_contain_word_1": 58, "test_contain_word_2": 58, "cowork": 58, "test_contain_word_exact": 58, "test_contain_word_different_cas": 58, "pytest_benchmark_exampl": 58, "list_comprehens": 58, "len_list": 58, "test_concat": 58, "linux": [58, 68, 73], "pluggi": [58, 73], "timer": 58, "perf_count": 58, "disable_gc": 58, "min_round": 58, "min_tim": 58, "000005": 58, "max_tim": 58, "calibration_precis": 58, "warmup": 58, "warmup_iter": 58, "rootdir": [58, 73], "hydra": [58, 73], "faker": 58, "anyio": [58, 68, 73], "32m": [56, 58, 65, 67, 73], "iqr": 58, "mop": 58, "286": 58, "4501": 58, "745": [58, 59], "5498": 58, "3872": 58, "6583": 58, "297": 58, "5001": 58, "3500": 58, "2686": 58, "5843": 58, "2322": 58, "162101": 58, "interquartil": 58, "1st": 58, "quartil": 58, "3rd": 58, "1m1": [58, 65, 73], "pytest_parametr": 58, "text_contain_word": 58, "noth": [58, 62], "test_text_contain_word": 58, "darwin": [58, 73], "bin": [58, 60, 65], "cachedir": 58, "pytest_cach": 58, "32mpass": 58, "1m2": [58, 65], "n2": [58, 59], "perc_differ": 58, "test_is_float": 58, "pytest_combin": 58, "directorybasedexampledatabas": 58, "typeguard": [58, 73], "1m4": 58, "pytest_without_id": 58, "1m3": 58, "pytest_id": 58, "pytest_param": 58, "1mcollect": 58, "pytest_fixtur": 58, "extract_senti": 58, "sentimetn": 58, "example_data": 58, "test_extract_senti": 58, "my_data": 58, "test_divis": 58, "test_modulu": 58, "modulu": 58, "scope": 58, "pytest_scop": 58, "pytest_skip": 58, "add_two": 58, "version_info": 58, "reason": 58, "eequir": 58, "test_add_two": 58, "33mskip": 58, "marker": [58, 60], "pytest_mark_xfail": 58, "divide_two_num": [], "test_divide_by_zero": [], "33mx": 58, "caplog": 58, "test_log": 58, "getlogg": 58, "logger": [58, 67], "test_divide_by_0": 58, "rare": 58, "writfil": 58, "pytest_repeat_exampl": 58, "generate_numb": 58, "test_generate_numb": 58, "1m100": 58, "frustrat": 58, "pytest_sugar_exampl": 58, "test_benchmark_exampl": 58, "test_parametr": 58, "test_fixtur": 58, "test_repeat_exampl": 58, "1mtest": 58, "36mpytest_sugar_exampl": 58, "0mtest_benchmark_exampl": 58, "32m1": [58, 65, 73], "40m": 58, "0mtest_fixtur": 58, "32m2": [58, 65], "0mtest_parametr": 58, "32m4": 58, "0mtest_repeat_exampl": 58, "32m23": 58, "32m42": 58, "32m62": 58, "32m81": 58, "32m100": 58, "302": 58, "8003": 58, "328": 58, "2844": 58, "9087": 58, "321": [58, 62], "5999": 58, "2495": 58, "866": [58, 68], "2220": 58, "0461": 58, "90868": 58, "104": [58, 62], "pytest_step": 58, "sum_test": 58, "average_2_num": 58, "steps_data": 58, "test_step": 58, "perc_difference_test": 58, "test_calc_suit": 58, "test_pick": 58, "plus_on": [56, 58, 67], "test_plus_on": 58, "branch": [58, 63], "untrack": 58, "31mtest_pick": 58, "repetit": [58, 68], "get_dog": 58, "test_get_dog": 58, "unittest": [], "testdog": 58, "testcas": 58, "test_walk": 58, "test_bark": 58, "constantli": 58, "verif": 58, "test_freezegun": 58, "freeze_tim": 58, "get_day_of_week": 58, "test_get_day_of_week": 58, "succe": 58, "patch": [58, 60], "connectionerror": 58, "5432": 58, "test_get_data_fail": 58, "mock_get": 58, "side_effect": 58, "test_get_data_succe": 58, "return_valu": 58, "properli": 58, "save_result": 58, "test_pyfakef": [], "file_nam": 58, "test_save_result": 58, "my_fil": 58, "create_dir": [], "poor": [58, 59], "reliabl": [51, 58], "available_fruit": 58, "nearby_stor": 58, "pa": 58, "dataframeschema": 58, "isin": 58, "less_than": [24, 58], "schemaerror": 58, "wise": 58, "failure_cas": 58, "check_input": 58, "get_total_pric": 58, "abbrevi": [58, 67], "price1": 58, "values_chang": 58, "new_valu": 58, "old_valu": 58, "ignore_ord": 58, "experience1": 58, "experience2": 58, "exclude_path": 58, "cmpare": 58, "259": 58, "significant_digit": 58, "dirty_equ": 58, "isnow": 58, "ispartialdict": 58, "islist": 58, "isstr": 58, "istruelik": 58, "timedelta": [58, 59, 67], "shop": 58, "is_mal": 58, "check_ord": 58, "scenario": [15, 52, 58, 59], "against": [56, 58, 60, 65, 73], "commut": 58, "test_hypothesi": 58, "test_floats_are_commut": 58, "37m": [58, 73], "00m": [58, 73], "94mdef": [58, 73], "92mtest_floats_are_commut": 58, "31mtest_hypothesi": 58, "94massert": [58, 73], "31me": [58, 73], "falsifi": [], "saw": [58, 62], "signal": [58, 68], "36m": [58, 67], "0mtest_hypothesi": 58, "31m": [58, 67, 73], "31m100": 58, "31mtest_floats_are_commut": 58, "robust": 58, "categorymismatchtraintest": 58, "new_categori": 58, "train_d": 58, "test_d": 58, "testfind": 58, "percent": [58, 63], "mislabel": 58, "conflictinglabel": 58, "recommend": [54, 58], "categorical_list": 58, "were": [6, 54, 58, 68], "therefor": [48, 58], "heurist": 58, "establish": 58, "phish": 58, "load_data": 58, "load_fitted_model": 58, "train_dataset": 58, "test_dataset": 58, "columntransform": [48, 52, 58], "simpleimput": [48, 52, 58], "urllength": 58, "numdigit": 58, "numparam": 58, "num_": 58, "entropi": 58, "hashttp": 58, "dsr": 58, "dse": 58, "bodylength": 58, "numtitl": 58, "numimag": 58, "numlink": 58, "specialchar": 58, "scriptlength": 58, "sbr": 58, "bscr": 58, "sscr": 58, "imput": [48, 52, 58], "most_frequ": [48, 58], "onehotencod": [48, 52, 58], "ext": 58, "criterion": 58, "simplemodelcomparison": 58, "minmaxscal": 58, "feature_rang": 58, "scaled_data": 58, "invers": 58, "original_data": 58, "inverse_transform": 58, "restor": 58, "crucial": [58, 59, 60], "assess": 58, "launch": [51, 58, 76], "popul": [52, 58, 66], "rate": [58, 59, 60, 73], "ab_test": 58, "lesampl": 58, "conversion_r": 58, "min_detectable_effect": 58, "get_size_per_vari": 58, "20177": 58, "reach": [58, 68], "ledataset": 58, "samplelesuccess": 58, "lesuccess": 58, "confidence_level": 58, "get_verdict": 58, "cleanup": 58, "addition": [48, 56, 58], "isol": 58, "test_postgr": 58, "test_query_result": 58, "cur": 58, "test_tabl": 58, "serial": [2, 45, 58, 59], "varchar": [45, 58], "alic": [32, 45, 47, 58], "fetchal": 58, "dash": 58, "obsolet": 58, "evolv": [58, 73], "formula": 58, "testmod": 58, "ok": [2, 58], "relev": [47, 58], "criteria": 58, "fact": [58, 63], "test_chatbot": 58, "factual_consist": 58, "factualconsistencymetr": 58, "llmtestcas": 58, "run_test": 58, "assert_test": 58, "shoe": 58, "elig": 58, "refund": 58, "actual_output": 58, "factual_consistency_metr": 58, "minimum_scor": 58, "2kdownload": 58, "factualconsistencymodel": 58, "th": 58, "1a": [58, 65], "2k": [58, 65], "0mrun": 58, "teardown": 58, "sessionfinish": 58, "slowest": 58, "vv": 58, "3m": 58, "1mpass": 58, "1mfailur": 58, "1msuccess": 58, "factual": 58, "9911543130874634": 58, "find_dat": 59, "17th": 59, "00am": 59, "hope": 59, "realli": 59, "dayofweek": 59, "dayofyear": 59, "is_month_end": 59, "is_month_start": 59, "is_quarter_end": 59, "is_quarter_start": 59, "is_year_end": 59, "is_year_start": 59, "date_str": 59, "quit": 59, "inconveni": [59, 63], "423992": 59, "tzinfo": [59, 67], "utc": [59, 67], "cst": 59, "to_timezon": 59, "dsttzinfo": 59, "forgot": 59, "working_hour": 59, "timeseri": 59, "histogram": [59, 60], "16666666666666666": 59, "3333333333333333": 59, "166666666666666": 59, "confirm": 59, "us_holidai": 59, "unitedst": 59, "whatev": 59, "abl": [59, 66], "independ": [59, 60], "japan": 59, "us_cal": 59, "luther": 59, "king": 59, "jr": 59, "labor": 59, "columbu": 59, "veteran": 59, "thanksgiv": 59, "christma": 59, "is_working_dai": 59, "get_working_days_delta": 59, "ja_cal": 59, "foundat": 59, "emperor": 59, "vernal": 59, "equinox": 59, "showa": 59, "constitut": 59, "greeneri": 59, "marin": 59, "mountain": 59, "respect": [48, 59, 68, 73], "autumn": 59, "sport": 59, "labour": 59, "load_wineind": 59, "train_siz": 59, "150": [47, 59, 68, 74], "auto_arima": 59, "blue": [59, 63], "sunspot": 59, "boxcoxendogtransform": 59, "load_sunspot": 59, "2700": 59, "boxcox": 59, "lmbda2": 59, "autoarima": 59, "suppress_warn": 59, "rb": [2, 59], "stepwis": 59, "minim": [59, 63], "aic": 59, "10383": 59, "210": [59, 62], "10020": 59, "218": 59, "9831": 59, "422": 59, "10381": 59, "212": 59, "9830": 59, "357": 59, "9817": 59, "480": 59, "508": 59, "413": 59, "996": 59, "9820": 59, "047": 59, "213": [59, 67], "896": 59, "9818": 59, "625": 59, "10385": 59, "9816": 59, "628": 59, "710": 59, "722": [52, 59], "9813": 59, "247": [59, 68], "9819": 59, "401": 59, "9834": 59, "327": 59, "9815": 59, "242": [54, 59, 68], "236": [59, 68], "564": 59, "9811": 59, "253": 59, "230": 59, "9814": 59, "636": 59, "409": 59, "9832": 59, "334": 59, "248": 59, "055": 59, "546": 59, "878": 59, "73630214": 59, "72738664": 59, "33806937": 59, "97670263": 59, "94336951": 59, "27600697": 59, "76335004": 59, "06207145": 59, "18910652": 59, "76778119": 59, "01474934": 59, "41947969": 59, "57286429": 59, "30950555": 59, "63971231": 59, "nicer": 60, "customiz": 60, "set_them": 60, "node": [56, 60], "ab": [56, 60], "bc": 60, "data_science_flowchart": 60, "5236": 60, "122": 60, "6750": 60, "tooltip": 60, "3288": 60, "6625": 60, "popup": 60, "mt": 60, "hood": 60, "meadow": 60, "add_to": 60, "repositori": 60, "wine": 60, "classifi": [48, 59, 60], "target_nam": 60, "wine_typ": 60, "feature_nam": 60, "tune": [52, 54, 60], "hip": 60, "lr": [52, 60], "r2": 60, "sgd": 60, "adam": 60, "from_iter": 60, "javascript": [60, 62, 68], "ipythonexperimentdisplai": 60, "0x10b683730": 60, "strongli": 60, "presenc": 60, "soybean": 60, "_openml": 60, "404": 60, "msno": 60, "dendrogram": 60, "hierarch": 60, "cluster": [2, 52, 54, 60], "nulliti": 60, "fulli": 60, "discolor": 60, "germin": 60, "draw": 60, "matplotlib_venn": 60, "venn2": 60, "set_label": 60, "healthi": [54, 60], "group1": 60, "group2": 60, "cicl": 60, "venn3": 60, "rectangl": 60, "ds": [54, 59, 60], "da": [54, 60], "off": [60, 67], "mass": 60, "inlin": 60, "rc": [], "read_tabl": 60, "susanli2016": 60, "fruit_data_with_color": 60, "fruit_label": 60, "fruit_nam": 60, "fruit_subtyp": 60, "color_scor": 60, "granny_smith": 60, "180": [59, 60], "mandarin": 60, "84": [60, 63], "braeburn": 60, "172": 60, "pairplot": 60, "axisgrid": [], "pairgrid": [], "0x7f30a3be1a30": [], "distinct": [59, 60], "pairwis": [54, 60], "scaled_featur": 60, "lastli": 60, "embed": 60, "color_palett": [], "gca": [], "set_aspect": [], "datalim": [], "fontsiz": [52, 59], "degrad": 60, "dashboard": 60, "tab": [60, 67], "datadrifttab": 60, "california_data_drift_report": 60, "column_map": 60, "classdiagram": 60, "is_mamm": 60, "is_pet": 60, "fur_color": 60, "scale_color": 60, "swim": 60, "logic": [6, 47, 60, 64], "td": 60, "feel": [60, 76], "sick": 60, "doctor": 60, "dress": 60, "confusion_matrix": [60, 64], "prettier": 60, "pretty_confusion_matrix": 60, "pp_matrix_from_data": 60, "purd": 60, "dark": 60, "dracula": 60, "radii": 60, "aura": 60, "ayu": 60, "challenger_deep": 60, "duft": 60, "dufte_bar": 60, "duftifi": 60, "gruvbox": 60, "nord": 60, "onedark": 60, "pacoti": 60, "pitaya_smoothi": 60, "solar": 60, "tab10": [59, 60], "tab20": 60, "tab20r": 60, "tokyo_night": 60, "edece": 60, "edgecolor": 60, "facecolor": 60, "15141b": 60, "labelcolor": 60, "xtick": [52, 60], "ytick": [52, 60], "framealpha": 60, "savefig": 60, "boxplot": 60, "boxprop": 60, "capprop": 60, "flierprop": 60, "markeredgecolor": 60, "whiskerprop": 60, "prop_cycl": 60, "cycler": 60, "82e2ff": 60, "ffca85": 60, "61ffca": 60, "ff6767": 60, "a277ff": 60, "f694ff": 60, "6d6d6d": 60, "nbextens": 60, "prefix": [60, 67], "widgetsnbextens": 60, "32mok": 60, "js": [60, 68], "depict": 60, "sankeywidget": 60, "anna": 60, "chicago": 60, "jose": 60, "milwauke": 60, "bussi": 60, "trip": [59, 60], "famili": [52, 60], "visit": [24, 59, 60], "vacat": 60, "to_dict": 60, "auto_save_png": 60, "audienc": 60, "transit": [59, 60], "coupl": 60, "lai": 60, "egg": [60, 66], "airborn": 60, "zoo": 60, "data_id": 60, "965": [60, 68], "add_data_fram": 60, "640px": 60, "360px": 60, "penguin": 60, "adeli": 60, "ipyvizzustori": 60, "slide": 60, "slide1": 60, "add_slid": 60, "slide2": 60, "suggest": [52, 60, 73], "statannot": 60, "wonder": 60, "test_ind": 60, "apply_and_annot": 60, "00e": 60, "vs": [54, 60], "p_val": 60, "507e": 60, "643e": 60, "508e": 60, "874e": 60, "171": 60, "880e": 60, "adjusttext": 60, "plot_text": 60, "bo": 60, "va": 60, "adjust_text": 60, "chicken": [60, 62], "growth": 60, "chart_typ": 60, "progress": [60, 68], "paper": 60, "x_valu": 60, "y1_valu": 60, "randn": [60, 65], "y2_valu": 60, "y3_valu": 60, "colors10": 60, "colors5": 60, "timestamp": [60, 67], "378": 60, "dpi": 60, "set_xlim": 60, "set_ylim": 60, "set_xtick": 60, "set_ytick": 60, "strftime": [45, 58, 60, 67, 73], "set_yticklabel": 60, "n10": 60, "nhour": 60, "yellowbrick": 60, "countvector": 60, "freqdistvisu": 60, "fetch_20newsgroup": [54, 60], "newsgroups_train": 60, "feature_extract": 60, "stop_word": 60, "get_feature_nam": 60, "openstreetmap": 60, "stad": 60, "van": 60, "zon": 60, "heerhugowaard": 60, "netherland": 60, "vm": 60, "iri": 60, "scatter_chart": 60, "sepal_length": 60, "petal_width": 60, "hist_chart": 60, "sepal_width": 60, "dropdown": [60, 66], "necessarili": [61, 74], "food_box": 62, "time_func_complex": 62, "end_tim": 62, "test_func_complex": 62, "time_func_simpl": 62, "test_func_simpl": 62, "regex": [59, 62], "anybutwhitespac": 62, "quantifi": [54, 59, 62], "oneormor": 62, "any_but_spac": 62, "optional_schem": 62, "get_pattern": 62, "get_match": 62, "deer": 62, "varieti": [50, 59, 62], "fav_food": 62, "temp": 62, "temps_f": 62, "degc": 62, "degf": 62, "celsiu": 62, "fahrenheit": 62, "unyt_arrai": 62, "572": 62, "synchron": [62, 66, 68], "sync_map": 62, "async_map": 62, "copper": 62, "spong": 62, "async": [62, 68], "3c3112ef": 62, "191": 62, "208": 62, "362": [62, 68], "380": 62, "685": 62, "persistedresult": [62, 68], "serializer_typ": [62, 68], "storage_block_id": [62, 68], "45e1a1fc": 62, "bdc8": 62, "4f8d": 62, "8945": 62, "287d12b46d33": 62, "storage_kei": [62, 68], "ad7912161ab44a6d8359f8089a16202d": 62, "fe83574cd0df4fc5838ef902beb34f6b": 62, "ba18fe9c568845ecbad03c25df353655": 62, "orchestr": [62, 68], "tutori": [62, 63, 67, 68], "basic": [15, 62, 67, 68, 74], "delet": [63, 66], "symbol": [6, 63, 65], "strip_interact": 63, "run_interact": 63, "clean_cod": 63, "termcolor": 63, "cprint": 63, "figlet_format": 63, "___": 63, "slant": 63, "____": 63, "bell": [50, 63], "fire_exampl": 63, "get_mean": [58, 63, 64, 68], "get_modulo": 63, "typer_exampl": 63, "add_numb": [6, 63], "invalid": [2, 6, 15, 63, 68], "cyan": 63, "src": 63, "latexifi": 63, "with_latex": 63, "mathrm": 63, "triangleq": 63, "4ac": 63, "2a": [63, 65], "autoencod": 63, "manim": 63, "overwhelm": 64, "navig": [64, 66], "arrang": 64, "unsort": 64, "fl_score": 64, "classification_report": 64, "roc_curv": 64, "gridsearchcv": 64, "stratifiedkfold": 64, "naive_bay": 64, "gaussiannb": [52, 64], "multinomialnb": 64, "kneighborsclassifi": [52, 64], "timeseriessplit": 64, "name_of_your_fil": 64, "repo": [64, 66, 73], "timothycroslei": 64, "hook": [64, 73], "interrogate_exampl": 64, "plus_two": 64, "multiply_thre": 64, "mirror": [62, 64], "mypy_exampl": 64, "union": [64, 68], "get_name_pric": 64, "v0": [51, 64], "910": 64, "test_refurb": 64, "furb109": 64, "furb108": 64, "err": 64, "silenc": 64, "liter": [51, 64], "stick": 64, "dosisod": 64, "eradicate_test": 64, "wemak": 64, "validationerror": [24, 64], "basemodel": [24, 51, 64], "splitconfig": 64, "split_data": 64, "341": 64, "type_error": 64, "stack": [52, 64], "list_rang": 64, "setup": [52, 63, 64, 65, 67, 68], "n_rang": 64, "consumpt": 64, "memory_profiler_test": 64, "del": 64, "mprof": 64, "1s": [64, 65, 66], "202": 64, "152": [64, 68], "pose": [48, 52, 53, 59, 64], "difficulti": 64, "dead_cod": 64, "dataprocessor": 64, "clean_data": 64, "jendrikseipp": 64, "later": [52, 59, 64], "old_venv": 65, "new_venv": 65, "uninstal": 65, "jinja2": [65, 67], "redo": 65, "typer": 65, "htmlmin": 65, "phik": 65, "multimethod": 65, "tangl": 65, "unicod": 65, "vision": 65, "missingno": 65, "freez": [65, 73], "pyinstrument": 65, "pypi": [65, 73], "proxi": [65, 73], "http_proxi": [65, 73], "3128": [65, 73], "https_proxi": [65, 73], "1080": [65, 73], "charset": [65, 73], "savepath": [65, 73], "dynam": 65, "compat": [52, 59, 65, 67, 68], "pin": [65, 73], "flask": [65, 67], "top_github_scrap": 65, "scrape_repo": 65, "scrape_us": 65, "reqs1": 65, "datacommon": 65, "reqs2": 65, "cmpreq": 65, "suddenli": 65, "broke": 65, "36mpanda": 65, "36mnumpi": 65, "34mupdat": 65, "34mresolv": 65, "3s": 65, "34mwrite": 65, "lock": 65, "1mpackag": 65, "34m5": 65, "34m0": 65, "39minstal": 65, "36msix": 65, "39m": [65, 68], "34mpend": 65, "0j": 65, "34minstal": 65, "36mpython": 65, "dateutil": 65, "36mpytz": 65, "1m2021": 65, "3a": 65, "32m2021": 65, "pyproject": 65, "toml": 65, "earlier": 65, "1msolverproblemerror": 65, "1mbecaus": 65, "chapter6": 65, "puzzl": 65, "solver": 65, "1m241": 65, "36m_solv": 65, "2m237": 65, "39mresult": 65, "39mpackag": 65, "2m238": 65, "1mexcept": 65, "39moverrideneed": 65, "1ma": 65, "39me": 65, "2m239": 65, "1mreturn": 65, "1mself": [65, 67], "39msolve_in_compatibility_mod": 65, "39moverrid": 65, "39muse_latest": 65, "2m240": 65, "39msolvefailur": 65, "1mrais": 65, "39msolverproblemerror": 65, "2m242": 65, "2m243": 65, "1mdict": 65, "2m244": 65, "depth_first_search": 65, "2m245": 65, "packagenod": 65, "39m_packag": 65, "39maggregate_package_nod": 65, "34mname": 65, "34mversion": 65, "34mdescript": 65, "34mdepend": 65, "34m4": 65, "39mremov": 65, "34mremov": 65, "publish": 65, "onefil": 65, "spec": [52, 59, 65], "255826": 65, "038615": 65, "850358": 65, "318558": 65, "255311": 65, "618789": 65, "434642": 65, "474813": 65, "676099": 65, "662942": 65, "314174": 65, "142569": 65, "704812": 65, "095609": 65, "156275": 65, "999871": 65, "839902": 65, "366550": 65, "818387": 65, "512015": 65, "conveni": [47, 59, 65], "colleagu": 65, "your_local_fold": 66, "gh": 66, "fetch": [59, 66, 68], "mess": 66, "clone": 66, "highlight": [59, 66], "yournam": 66, "quick": 66, "hassl": 66, "compil": [50, 66, 73], "pr": 66, "outdat": 66, "pull_request": 66, "ubuntu": 66, "permiss": 66, "kanhari": 66, "env": [52, 66, 68, 73], "github_token": 66, "openai_api_kei": [51, 66, 73], "bytes_or_buff": 67, "capit": 67, "casefold": 67, "suitabl": 67, "caseless": 67, "fillchar": 67, "utf": 67, "strict": 67, "codec": 67, "endswith": 67, "suffix": 67, "expandtab": 67, "tabsiz": 67, "format_map": 67, "isalnum": 67, "isalpha": 67, "isascii": 67, "ascii": 67, "isdecim": 67, "isdigit": 67, "isidentifi": 67, "isnumer": 67, "isprint": 67, "printabl": 67, "isspac": 67, "istitl": 67, "ljust": 67, "justifi": 67, "lstrip": 67, "maketran": 67, "usabl": 67, "partit": [52, 56, 67], "rfind": 67, "rindex": 67, "rjust": 67, "rpartit": 67, "rsplit": 67, "maxsplit": 67, "delimit": 45, "rstrip": 67, "trail": 67, "splitlin": 67, "keepend": 67, "boundari": 67, "strip": [50, 67], "swapcas": 67, "titlecas": 67, "zfill": 67, "pad": 67, "edit_data": 67, "log_loc": 67, "1165738010": 67, "struggl": 67, "loguru_vs_log": 67, "logging_exampl": 67, "basicconfig": 67, "asctim": 67, "levelnam": 67, "funcnam": 67, "critic": 67, "802": [59, 67], "loguru_exampl": 67, "catch": [67, 68], "mean_squared_error": 67, "file_": 67, "evaluate_result": 67, "y_true": 67, "mean_square_err": 67, "root_mean_square_err": 67, "ipykernel_174022": 67, "1865479429": 67, "0x7f279588f430": 67, "0x7f27958bfca0": 67, "inner_f": 67, "0x7f27958bfb80": 67, "_regress": 67, "335": 67, "y_type": 67, "multioutput": 67, "_check_reg_target": 67, "0x7f27958b7af0": 67, "check_consistent_length": 67, "0x7f279676e040": 67, "319": 67, "icrecream": 67, "itself": [67, 73], "trace": 67, "alreadi": [54, 67, 68], "heat": [50, 67, 73], "headach": 67, "pyheat_exampl": 67, "ph": 67, "create_heatmap": 67, "show_heatmap": 67, "57aff36d5f6d": 67, "lego": 67, "sklego": 67, "pandas_util": 67, "log_step": 67, "print_fn": 67, "make_copi": 67, "drop_column": [29, 67], "encode_cat_vari": 67, "000239": 67, "n_ob": 67, "n_col": 67, "002117": 67, "003217": 67, "tqdm": [59, 60, 67], "arbitrari": [48, 53, 67], "example1": 67, "example2": 67, "task1": 67, "task2": 67, "my_flow": 67, "ui": 67, "wednesdai": 68, "get_incoming_data": 68, "train_model": 68, "retrain": 68, "run_pend": 68, "file_to_run": 68, "chime": 68, "listen": 68, "awai": [59, 68], "knock": 68, "email_send": 68, "recipient_email": 68, "your_email": 68, "your_second_email": 68, "adress": 68, "sender_email": 68, "grandma": 68, "s_email": 68, "gmail": 68, "train_your_nicest_model": 68, "your_nicest_paramet": 68, "slack": 68, "channel": [52, 68], "everybodi": 68, "sequenc": 68, "echo": 68, "virtual": [56, 68], "poetri": 68, "shell": [67, 68], "pull_data": 68, "dvc": [58, 68, 73], "install_al": 68, "customer_segment": 68, "md": [63, 68], "webbrows": 68, "open_new": 68, "explicitli": 68, "tediou": [67, 68], "star_script": 68, "square_root": 68, "deg_to_rad": 68, "radian": 68, "edit": 68, "earli": 68, "draft": 68, "effort": 68, "monkey_exampl": 68, "stub": 68, "meant": 68, "wifi": 68, "bulb": 68, "laptop": 68, "bedroom": 68, "bathroom": 68, "livingroom": 68, "run_process": 68, "cancel": [67, 68], "timeout_second": 68, "687": 68, "arrog": 68, "goshawk": 68, "979": 68, "e6feb297": 68, "982": 68, "561": 68, "exceed": 68, "timeout": 68, "1239": 68, "orchestrate_task_run": 68, "await": [67, 68], "run_sync": 68, "fn": [51, 68], "asyncutil": 68, "run_sync_in_interruptible_worker_thread": 68, "tg": 68, "start_soon": 68, "_backend": 68, "_asyncio": 68, "658": 68, "__aexit__": 68, "cancellederror": 68, "asyncio": [67, 68], "_core": 68, "_task": 68, "timeouterror": 68, "788": 68, "timedout": 68, "nasyncio": 68, "ndure": 68, "ntimeouterror": 68, "790": [59, 68], "orchestrate_flow_run": 68, "flow_cal": 68, "run_sync_in_worker_thread": 68, "to_thread": 68, "get_asynclib": 68, "3z": 68, "svlh9jv14ps3j6cc964tbjg40000gq": 68, "ipykernel_83306": 68, "3092424982": 68, "__call__": 68, "enter_task_run_engin": 68, "run_async_from_worker_thread": 68, "begin_run": 68, "from_thread": 68, "asynclib": 68, "run_async_from_thread": 68, "970": 68, "commandlinetool": 68, "framework": [48, 52, 53, 67, 68], "concurr": [47, 68], "_base": 68, "445": 68, "__get_result": 68, "390": 68, "_except": 68, "874": 68, "get_task_call_return_valu": 68, "_result": 68, "final_st": 68, "raise_on_failur": 68, "_get_state_result": 68, "get_state_except": 68, "wait_for": 68, "result_factori": 68, "interrupt": 68, "1234": 68, "1235": 68, "1236": 68, "timeout_scop": 68, "1237": 68, "1238": 68, "1241": 68, "exc": 68, "__fn": 68, "send_interrupt_to_thread": 68, "partial": 68, "capture_worker_thread_and_result": 68, "notset": 68, "taskgroup": 68, "exc_typ": 68, "exc_val": 68, "exc_tb": 68, "654": 68, "655": 68, "442": [59, 68], "return_st": 68, "438": 68, "get_call_paramet": 68, "440": 68, "return_typ": 68, "enter_flow_run_engine_from_flow_cal": 68, "443": 68, "444": [59, 68], "446": [54, 68], "447": 68, "in_async_main_thread": 68, "portal": 68, "153": 68, "start_blocking_port": 68, "156": 68, "283": 68, "blockingport": 68, "268": 68, "269": 68, "270": 68, "callabl": [48, 68], "coroutin": [67, 68], "t_retval": 68, "271": 68, "272": 68, "273": 68, "274": 68, "thread": [47, 67, 68], "275": 68, "281": 68, "start_task_soon": 68, "_state": 68, "388": 68, "391": 68, "392": 68, "cycl": [63, 68], "393": 68, "219": 68, "_call_func": 68, "216": [47, 68], "217": 68, "add_done_callback": 68, "callback": 68, "retval": 68, "220": 68, "_cancelled_exc_class": 68, "inject_cli": 68, "with_injected_cli": 68, "client_context": 68, "new_client": 68, "setdefault": 68, "create_then_begin_flow_run": 68, "235": 68, "238": 68, "get_state_result": 68, "backward": 68, "is_crash": 68, "is_fail": 68, "datadocu": 68, "result_from_state_with_data_docu": 68, "partial_flow_run_context": 68, "604": [59, 68], "605": [59, 68], "606": 68, "607": 68, "608": 68, "609": [59, 68], "612": [59, 68], "waited_for_task_run": 68, "wait_for_task_runs_and_report_crash": 68, "613": 68, "flow_run_context": 68, "task_run_futur": 68, "614": 68, "616": 68, "continu": [50, 68], "outcom": [59, 68], "capacitylimit": 68, "sniffio": 68, "current_async_library_cvar": 68, "936": 68, "queue": 68, "put_nowait": 68, "workerthread": 68, "865": 68, "baseexcept": 68, "868": 68, "869": 68, "356": 68, "358": 68, "363": 68, "364": 68, "task_runn": 68, "sequentialtaskrunn": 68, "365": 68, "366": 68, "367": 68, "731": 68, "732": 68, "isasync": 68, "736": 68, "737": [67, 68], "738": 68, "sync_port": 68, "runtimeerror": 68, "964": 68, "966": 68, "967": 68, "run_coroutine_threadsaf": 68, "968": [63, 68], "threadloc": 68, "969": 68, "extra_task_input": 68, "872": 68, "_wait": 68, "875": 68, "876": 68, "prefectfutur": 68, "1233": 68, "1242": 68, "failaftercontextmanag": 68, "116": 68, "_cancel_scop": 68, "117": 68, "cancel_cal": 68, "occasion": [50, 68], "retry_delay_second": 68, "flaky_funct": 68, "bald": 68, "caiman": 68, "906": 68, "8095224b": 68, "908": 68, "1449": 68, "ipykernel_36167": 68, "3817304312": 68, "awaitingretri": 68, "propos": 68, "569": [59, 68], "013": 68, "512": 68, "2c195477": 68, "a9d1": 68, "4b59": 68, "9a9e": 68, "80b00f96c464": 68, "84ff6378ce894b6fb1823e60b1d201b4": 68, "previou": [59, 62, 73], "icon": [73, 76], "corner": [73, 76], "latex": 73, "3x": 73, "papermil": 73, "tag": [59, 73], "parameter": 73, "magic": [], "load_ext": 73, "12t09": 73, "438535": 73, "cpython": 73, "gcc": 73, "x86_64": 73, "architectur": 73, "64bit": 73, "ivers": 73, "pipreqsnb": 73, "pipreq": 73, "scikit_learn": 73, "seppar": 73, "experiment": 73, "pytest": [24, 56, 73], "qq": [56, 73], "autoconfig": 73, "multiply_by_two": 73, "test_multiply_by_two": 73, "31mf": 73, "failur": 73, "1m_____________________________": 73, "sample1": 73, "expected1": 73, "______________________________": [58, 73], "33msampl": 73, "92mtest_multiply_by_two": 73, "56d7928444c9": 73, "tmpospmc1tm": 73, "isort": 73, "flake8": 73, "example_notebook": 73, "ipnb": 73, "reformat": [], "cell_1": 73, "f401": 73, "chapter7": 73, "rede": 73, "spread": 74, "awar": 74, "knowledg": 74, "bite": 74, "700": [59, 74], "mailbox": 74, "subscrib": 74, "wrote": 74, "100k": 74, "toward": 74, "500": [2, 56, 59, 63, 74], "mission": 74, "button": 76, "colab": 76, "subsequ": [45, 48, 59], "set_output": 48, "60000": 48, "70000": 48, "414214": 48, "neat": 51, "sk": 51, "dude": 51, "ness": 51, "dudeifi": 51, "bodi": [51, 67], "yo": 51, "functioncal": 51, "tea": [2, 51], "sweetness_percentag": 51, "create_milk_tea": 51, "boba": 51, "froth_milk": 51, "textur": 51, "foami": 51, "hot": [50, 51], "cold": 51, "froth": 51, "coffee_typ": 51, "configure_coffe": 51, "latt": 51, "pandas_on_spark": 56, "familiar": [47, 56], "ps": 56, "psdf": 56, "006482": [], "201401": [], "959126": [], "712733": [], "369599": [], "396453": [], "392501": [], "822455": [], "156499": [], "169058": [], "646378": [], "789393": [], "902216": [], "127352": [], "269125": [], "638909": [], "04922": [], "090836": [], "83575": [], "174097": [], "spark_data": 56, "numeric_featur": 48, "categorical_featur": 48, "numeric_transform": [48, 52], "categorical_transform": [48, 52], "sparse_output": 48, "verbose_feature_names_out": 48, "x_transform": 48, "cat1_a": 48, "cat1_b": 48, "cat1_c": 48, "cat2_x": 48, "cat2_i": 48, "cat2_z": 48, "791093": 48, "393167": 48, "707107": 48, "174741": 48, "266871": 48, "043685": 48, "wrong": 6, "calculate_grad": 6, "constraint": [24, 58], "test_processing_fn": 58, "in_rang": 58, "out_schema": 58, "add_column": 58, "val3": 58, "check_output": 58, "processing_fn": 58, "nullabl": 58, "spark": 52, "collabor": 52, "reduct": [52, 54], "linalg": 52, "maxit": 52, "regparam": 52, "model1": 52, "aggregationdepth": 52, "treeaggreg": 52, "elasticnetparam": 52, "elasticnet": 52, "penalti": 52, "binomi": 52, "multinomi": 52, "featurescol": 52, "fitintercept": 52, "labelcol": 52, "lowerboundsoncoeffici": 52, "coeffici": 52, "constrain": 52, "undefin": 52, "lowerboundsonintercept": 52, "beequal": 52, "oflass": 52, "maxblocksizeinmb": 52, "maximum": [52, 59], "predictioncol": 52, "probabilitycol": 52, "calibr": 52, "treat": [52, 56, 73], "rawpredictioncol": 52, "rawpredict": 52, "converg": 52, "toler": 52, "upperboundsoncoeffici": 52, "upperboundsonintercept": 52, "weightcol": 52, "0019392203169556147": 52, "9980607796830444": 52, "995731919571047": 52, "004268080428952992": 52, "01200463023637096": 52, "987995369763629": 52, "cond": 68, "time_of_week": 68, "file_exist": 68, "myfil": 68, "do_work": 68, "time_of_dai": 68, "do_hourly_at_night": 68, "weekli": 68, "mon": 68, "sat": 68, "do_twice_a_week": 68, "fill_dict": 29, "variant": 48, "skub": 48, "dedupl": 48, "duplic": [48, 56], "make_deduplication_data": 48, "duplicated_food": 48, "chocol": 48, "broccoli": 48, "jalapeno": 48, "zucchini": 48, "entries_per_exampl": 48, "300": [2, 47, 48, 52, 56], "prob_mistake_per_lett": 48, "letter": 48, "cgocol": 48, "chqcolat": 48, "chocoltt": 48, "most_common": 48, "195": [48, 67], "jalaoeno": 48, "chocdlat": 48, "ehocol": 48, "chocolatw": 48, "brocroli": 48, "brojcoli": 48, "broccsli": 48, "broccqli": 48, "bxoccoli": 48, "sroccoli": 48, "brzccoli": 48, "jylapeno": 48, "jalaponi": 48, "closest": 48, "deduplicated_data": 48, "translation_t": 48, "qalapeno": 48, "jalapenh": 48, "jalapeto": 48, "oalapeno": 48, "jalqceno": 48, "jzlapeno": 48, "dotenv": 46, "expos": 46, "codebas": 46, "unauthor": 46, "myusernam": 46, "playlist": 68, "resolut": [67, 68], "yt": 68, "youtu": 68, "ukctvrjsol0": 68, "thumbnail_url": 68, "ytimg": 68, "hq720": 68, "stream": 68, "itag": 68, "mime_typ": 68, "3gpp": 68, "144p": 68, "fp": 68, "8fp": 68, "vcodec": 68, "mp4v": 68, "acodec": 68, "mp4a": 68, "mp4": 68, "360p": 68, "30fp": 68, "avc1": 68, "42001e": 68, "720p": 68, "64001f": 68, "webm": 68, "vp9": 68, "480p": 68, "4d401f": 68, "244": 68, "4d401e": 68, "243": 68, "240p": 68, "4d4015": 68, "160": [59, 68], "4d400c": 68, "278": 68, "audio": 68, "abr": 68, "48kbp": 68, "128kbp": 68, "249": 68, "50kbp": 68, "opu": 68, "250": [2, 68], "70kbp": 68, "251": 68, "160kbp": 68, "mime": 68, "plnk6m_jbrvnopnqnvrwaytz2g4nftngz": 68, "si": 68, "bk4o05ihmgqsynk2": 68, "proper": 2, "current_statu": 2, "gate": 2, "statuscod": 2, "trend": 59, "trendforecast": 59, "fh": 59, "distance_bas": 59, "kneighborstimeseriesclassifi": 59, "dtw": 59, "_x": 30, "_y": 30, "merged_df": 30, "val_x": 30, "val_i": 30, "_df1": 30, "_df2": 30, "val_df1": 30, "val_df2": 30, "a3d9b1": 52, "06b1cf": 52, "f8d347": 52, "e48789": 52, "linewidth": [52, 59], "group_column": 58, "value_column": [58, 59], "test_cget_mean": 58, "thrown": 58, "pytest_to_fail": 58, "test_get_mean": 58, "u4": 59, "integer_column": 47, "select_dtyp": 47, "other_column": 47, "abi64str1": 47, "anomali": 59, "rpt": 59, "sigma": 59, "num_breakpoint": 59, "true_breakpoint": 59, "pw_constant": 59, "noise_std": 59, "algo": 59, "pelt": 59, "predicted_breakpoint": 59, "datapipelin": 2, "drop_missing_data": 2, "standardize_data": 2, "processed_data": 2, "encode_categorical_data": 2, "c_a": 2, "c_b": 2, "024695": 2, "161895": 2, "439155": 2, "387298": 2, "146385": 2, "317465": 2, "refactor": 2, "pluggabl": 2, "dataprocessingstrategi": 2, "dropmissingdatastrategi": 2, "standardizedatastrategi": 2, "add_strategi": 2, "extend": 2, "reorder": [2, 62], "encodedatastrategi": 2, "pickleablemodel": 2, "kmean": [2, 54], "make_blob": 2, "to_pickl": 2, "from_pickl": 2, "deseri": 2, "pickleablekmean": 2, "n_cluster": [2, 54], "pickleablesvm": 2, "n_init": 2, "kmeans_file_path": 2, "kmeans_model": 2, "pickleablemixin": 2, "safeguard": 56, "attack": 56, "item_price_panda": 56, "item_id": 56, "item_pric": 56, "id_val": 56, "heartbeatreceiv": [], "executor": [], "driver": [], "heartbeat": [], "976371": [], "exce": [], "120000": [], "sparkcontext": [], "schedul": [], "inbox": [], "sparkexcept": [], "awaitresult": [], "sparkthreadutil": [], "scala": [], "threadutil": [], "rpc": [], "rpctimeout": [], "rpcenv": [], "setupendpointrefbyuri": [], "102": 67, "setupendpointref": [], "rpcutil": [], "makedriverref": [], "blockmanagermasterendpoint": [], "driverendpoint": [], "lzycomput": [], "124": [], "isexecutoral": [], "688": 59, "anonfun": [], "receiveandrepli": [], "applyorels": [], "netti": [], "safelycal": [], "messageloop": [], "receiveloop": [], "anon": [], "threadpoolexecutor": [], "runwork": [], "1149": [], "624": [], "750": 56, "rpcendpointnotfoundexcept": [], "endpoint": [52, 59], "coarsegrainedschedul": [], "mbp": [], "62398": [], "nettyrpcenv": [], "asyncsetupendpointrefbyuri": [], "flatmap": [], "307": [], "impl": [], "transformwith": [], "callbackrunn": [], "executioncontextimpl": [], "executewithvalu": [], "defaultpromis": [], "trycomplet": [], "288": [], "187": [], "batchingexecutor": [], "batch": 47, "processbatch": [], "runtim": [], "java8": [], "jfunction0": [], "mcv": [], "sp": [], "blockcontext": [], "withblockcontext": [], "internalcallbackexecutor": [], "unbatchedexecut": [], "trysuccess": [], "onsuccess": [], "askabort": [], "localnettyrpccallcontext": [], "nettyrpccallcontext": [], "repli": [], "rpcendpointverifi": [], "rpcendpointref": [], "asksync": [], "blockmanagermast": [], "registerblockmanag": [], "blockmanag": [], "reregist": [], "642": [], "reportheartbeat": [], "1223": [], "295": [], "loguncaughtexcept": [], "1928": [], "runnableadapt": [], "511": 59, "futuretask": [], "runandreset": [], "308": [], "scheduledthreadpoolexecutor": [], "scheduledfuturetask": [], "301": [], "294": [], "dispatchoraddcallback": [], "316": [], "oncomplet": [], "306": [], "exit": [], "62413": [], "opt": 67, "homebrew": 67, "cellar": 67, "6_1": 67, "socketserv": [], "317": [], "_handle_request_noblock": [], "process_request": [], "client_address": [], "348": [], "finish_request": [], "requesthandlerclass": [], "755": [], "poll": [], "accum_upd": [], "267": [], "rfile": [], "num_upd": [], "read_int": [], "596": [], "eoferror": [], "jupyter_ai": 73, "your_api_key_her": 73, "chatgpt": 73, "spatial": 73, "laplacian": 73, "commonli": 73, "conduct": 73, "monthli": [59, 73], "yyyi": [67, 73], "mm": [67, 73], "monthly_d": 73, "unnot": 11, "unequ": 11, "mistralai": 51, "mistral": 51, "7b": 51, "assist": 51, "pyfakef": 58, "filesystem": 58, "test_tmp_path": 58, "lazypredict": 52, "supervis": 52, "lazyclassifi": 52, "load_breast_canc": 52, "ignore_warn": 52, "custom_metr": 52, "balanc": [2, 52, 59], "roc": 52, "auc": 52, "989474": 52, "987544": 52, "989462": 52, "0150008": 52, "sgdclassifi": 52, "0109992": 52, "mlpclassifi": 52, "985965": 52, "986904": 52, "985994": 52, "426": [52, 67], "perceptron": 52, "984797": 52, "0120046": 52, "98269": 52, "985934": 52, "0200036": 52, "logisticregressioncv": 52, "262997": 52, "982456": 52, "979942": 52, "982437": 52, "0140011": 52, "calibratedclassifiercv": 52, "975728": 52, "982357": 52, "0350015": 52, "passiveaggressiveclassifi": 52, "975439": 52, "974448": 52, "975464": 52, "0130005": 52, "labelpropag": 52, "0429988": 52, "labelspread": 52, "0310006": 52, "97193": 52, "969594": 52, "033": 52, "gradientboostingclassifi": 52, "967486": 52, "971869": 52, "166998": 52, "quadraticdiscriminantanalysi": 52, "964912": 52, "966206": 52, "965052": 52, "0119994": 52, "histgradientboostingclassifi": 52, "968421": 52, "964739": 52, "968387": 52, "682003": 52, "ridgeclassifiercv": 52, "963272": 52, "971736": 52, "0130029": 52, "ridgeclassifi": 52, "960525": 52, "968242": 52, "0119977": 52, "adaboostclassifi": 52, "961404": 52, "959245": 52, "961444": 52, "204998": 52, "extratreesclassifi": 52, "957138": 52, "961362": 52, "0270066": 52, "95503": 52, "961276": 52, "0560005": 52, "baggingclassifi": 52, "947368": 52, "954577": 52, "947882": 52, "0559971": 52, "bernoullinb": 52, "950877": 52, "951003": 52, "951072": 52, "0169988": 52, "lineardiscriminantanalysi": 52, "950816": 52, "961089": 52, "0199995": 52, "954386": 52, "949536": 52, "954337": 52, "0139935": 52, "nusvc": 52, "943215": 52, "954014": 52, "019989": 52, "936842": 52, "933693": 52, "936971": 52, "0170023": 52, "nearestcentroid": 52, "933506": 52, "946801": 52, "0160074": 52, "extratreeclassifi": 52, "922807": 52, "912168": 52, "922462": 52, "0109999": 52, "checkingclassifi": 52, "361404": 52, "191879": 52, "0170043": 52, "dummyclassifi": 52, "512281": 52, "489598": 52, "518924": 52, "0119965": 52, "add_constraint": 47, "salary_gt_0": 47, "deltaprotocolerror": 47, "invari": 47, "sql_metdata": 45, "sql_metadata": 45, "parser": [45, 63], "parsed_queri": 45, "alias1": 45, "columns_dict": 45, "alias": [45, 62], "columns_alias": 45, "limit_and_offset": 45, "unchang": 73, "themselv": 73, "example_notebook2": 73, "test_exampl": 73, "test_func": 73, "tb": 73, "hypothesi": 73, "pyenv": [58, 59, 73], "jupyter_cli": 73, "deprecationwarn": 73, "migrat": 73, "platformdir": 73, "jupyter_platform_dir": 73, "jupyter_cor": 73, "v6": 73, "jupyter_data_dir": 73, "jupyter_runtime_dir": 73, "secure_writ": 73, "advers": 59, "streamlin": [], "pandasdataset": 59, "deeparestim": 59, "aileennielsen": 59, "timeseriesanalysiswithpython": 59, "airpasseng": 59, "parse_d": [59, 60], "training_data": 59, "test_gen": 59, "generate_inst": 59, "prediction_length": 59, "trainer_kwarg": 59, "max_epoch": 59, "1954": 59, "ticket": 62, "_ticket": 62, "get_ticket": 62, "_price": 62, "discount": 62, "discount_amount": 62, "apply_discount": 62, "deepli": [54, 62], "unread": 62, "calculate_discounted_pric": 62, "concert": 62, "bind_opt": 62, "from_opt": 62, "bring": [50, 56], "56976095832509": [], "43383865728208": [], "68113195098398": [], "col_nam": 29, "market": [56, 59], "coincid": 59, "causalimpact": 59, "willianfuk": 59, "arma_data": 59, "125": [24, 59], "3756": 59, "3609": 59, "3592": 59, "3628": 59, "164": [24, 59], "galact": 54, "unstructur": 54, "galacticdataset": 54, "filter_func": 54, "from_hugging_face_stream": 54, "tiiuae": 54, "falcon": 54, "refinedweb": 54, "dedup_field": 54, "max_sampl": 54, "detect_languag": 54, "__languag": 54, "4975": 54, "ru": 54, "nl": 54, "pt": [53, 54], "sh": 54, "eo": 54, "ceb": 54, "detect_pii": 54, "__pii__email": 54, "__pii__phon": 54, "__pii__credenti": 54, "1443": 54, "pii": 54, "__pii__ani": 54, "blogspot": 54, "filter_str": 54, "107937": 54, "get_embed": 54, "input_field": 54, "get_cluster_info": 54, "__cluster": 54, "overwritten": 54, "fine": [50, 54], "4902": 54, "31476": 54, "1095": 54, "1125": 54, "709": 54, "1224": 54, "749": 54, "cluster_id": 54, "cluster_s": 54, "advantag": [32, 52], "superior": [32, 52], "data_s": 32, "s_numpi": 32, "s_pyarrow": 32, "numpy_memori": 32, "pyarrow_memori": 32, "helper": 56, "showcas": 56, "bob": [45, 47, 56], "array_append": 56, "array_prepend": 56, "array_contain": 56, "array_distinct": 56, "withcolumn": 56, "has_": 56, "beforehand": 47, "maxim": 47, "glob": 47, "group_bi": 47, "collect_al": 47, "pytorch": 53, "upon": 53, "unpickl": 53, "guarante": 53, "therebi": 53, "safe_open": 53, "save_fil": 53, "weight1": 53, "weight2": 53, "devic": 53, "get_tensor": 53, "suffici": 59, "pytz": 59, "pari": [45, 59], "paris_tim": 59, "toronto": 59, "toronto_timezon": 59, "toronto_tim": 59, "astimezon": [59, 67], "future_datetim": 59, "843320": 59, "in_timezon": 59, "398059": 59, "qs": 59, "extend_panda": 59, "download_return": 59, "spy": 59, "peach": 15, "54095055783208": 56, "46593810642427": 56, "52092805080465": 56, "smith": [47, 56], "johnson": [47, 56], "temporari": [], "createorreplacetempview": 56, "modified_nam": 56, "encapsul": 56, "modify_nam": 56, "stringtyp": 56, "returntyp": 56, "simplefunctionregistri": 56, "py3": 67, "whl": 67, "kb": 67, "contourpi": [], "fonttool": [], "kiwisolv": [], "pillow": [], "pypars": [], "zipp": [], "49mnotic": [], "49m": [], "49m23": [], "49m24": [], "49mpip": [], "restart": [], "curvatur": 59, "far": 59, "datagener": 59, "kneeloc": 59, "figure2": 59, "kneedl": 59, "curv": 59, "concav": 59, "direct": [45, 58, 59], "plot_knee_norm": 59, "log1p": 48, "69314718": 48, "09861229": 48, "38629436": 48, "feature1": 48, "feature2": 48, "log_transform": 48, "result1": 56, "THEN": 56, "result2": 56, "assign_category_label": 56, "pytest_mark": 58, "test_long_running_funct": 58, "test_database_interact": 58, "test_function_1": 58, "test_function_2": 58, "deselect": 58, "32m3": 58, "subscriptionplan": 15, "get_plan_detail": 15, "subscript": 15, "basic_plan": 15, "premium_plan": 15, "great_tabl": 63, "appeal": 63, "footer": [54, 63], "island": [59, 63], "islands_mini": 63, "ascend": 63, "rowname_col": 63, "tab_head": 63, "landmass": 63, "subtitl": 63, "tab_source_not": 63, "source_not": 63, "almanac": 63, "1975": 63, "mcneil": 63, "1977": 63, "wilei": 63, "tab_stubhead": 63, "fmt_number": 63, "sep_mark": 63, "988": 63, "506": 63, "antarctica": 63, "borneo": 63, "280": 63, "baffin": 63, "184": 63, "britain": 63, "celeb": 63, "axel": 63, "heiberg": 63, "__pydantic_self__": 24, "162": 24, "__tracebackhide__": 24, "163": 24, "__pydantic_validator__": 24, "validate_python": 24, "self_inst": 24, "int_pars": 24, "input_valu": 24, "input_typ": 24, "feasibl": 21, "extrem": [21, 59], "large_log": 21, "log_entri": 21, "large_log_fil": 21, "process_log_entri": 21, "lazili": 21, "consolid": 50, "recipe_scrap": 50, "scrape_m": 50, "cookieandk": 50, "thai": 50, "curri": 50, "veget": [50, 51], "total_tim": 50, "ingredi": [50, 54], "\u00bc": 50, "cup": 50, "jasmin": 50, "rice": 50, "grain": 50, "rins": 50, "tablespoon": 50, "coconut": 50, "chop": 50, "pinch": 50, "grate": 50, "fresh": 50, "ginger": 50, "inch": 50, "nub": 50, "clove": 50, "press": 50, "minc": 50, "peel": 50, "diagon": 50, "thick": 50, "ounc": 50, "water": 50, "thinli": 50, "kale": 50, "tough": 50, "rib": 50, "tuscan": 50, "lacinato": 50, "dinosaur": 50, "teaspoon": 50, "turbinado": 50, "tamari": 50, "soi": 50, "sauc": [50, 54], "vinegar": 50, "lime": 50, "juic": 50, "garnish": 50, "cilantro": 50, "flake": 50, "sriracha": 50, "chili": 50, "pot": 50, "boil": 50, "overflow": 50, "drain": 50, "readi": 50, "fluff": 50, "fork": 50, "nto": 50, "warm": 50, "skillet": 50, "sprinkl": 50, "stir": 50, "soften": 50, "transluc": 50, "fragrant": 50, "nadd": 50, "tender": 50, "mixtur": 50, "simmer": 50, "gentl": 50, "nremov": 50, "punch": 50, "bowl": 50, "spici": 50, "nutrient": 50, "calori": 50, "340": 50, "sugarcont": 50, "sodiumcont": 50, "473": 50, "mg": 50, "fatcont": 50, "saturatedfatcont": 50, "transfatcont": 50, "carbohydratecont": 50, "fibercont": 50, "proteincont": 50, "cholesterolcont": 50, "computation": 59, "proven": 59, "classic": 59, "rnn": 59, "nbeat": 59, "airpassengersdf": 59, "nf": 59, "input_s": 59, "max_step": 59, "tqdmwarn": 60, "iprogress": 60, "ipywidget": 60, "readthedoc": 60, "user_instal": 60, "autonotebook": [59, 60], "notebook_tqdm": 60, "pytorch_lightn": [], "nn": [], "checkpoint": [], "save_hyperparamet": [], "gpu": [], "mp": 47, "tpu": [], "ipu": [], "hpu": [], "lightning_log": [], "mae": [], "padder_train": [], "constantpad1d": [], "temporalnorm": [], "modulelist": [], "trainabl": [], "900": [], "789": [], "saniti": [], "trainer": [], "connector": [], "data_connector": [], "val_dataload": [], "bottleneck": [], "num_work": [], "train_dataload": [], "fit_loop": [], "log_every_n_step": [], "epoch": [], "miscalcul": [], "autograd": [], "aten": [], "sgn": [], "fall": [], "implic": [], "runner": 67, "mpsfallback": [], "_execution_engin": [], "run_backward": [], "02it": [], "v_num": [], "train_loss_step": [], "460": 59, "train_loss_epoch": [], "78it": [], "tsdataset": [], "sourcetensor": [], "detach": [], "requires_grad_": [], "tempor": [], "predict_dataload": [], "81it": [], "nixtla_id_as_col": 59, "adopt": [], "suppress": [], "unique_id": 59, "1961": [], "607208": [], "421": [], "863037": [], "493": [], "197845": [], "499": [], "307739": [], "199921": [], "587": [], "497253": [], "091309": [], "662": [], "209167": [], "577": [], "726501": [], "089569": [], "432": [], "609131": [], "420624": [], "mirascop": [], "your_api_kei": 51, "openaiextractor": 51, "meetingdetail": 51, "topic": 51, "particip": 51, "meetingextractor": 51, "extract_schema": 51, "prompt_templ": 51, "upcom": 51, "15th": 51, "sarah": [51, 56], "meeting_detail": 51, "lack": 51, "ipytest": 56, "actual_df": 56, "expected_df": 56, "assertdataframeequ": 56, "test_query_return_correct_number_of_row": 56, "song": 24, "release_d": 24, "beats_per_minut": 24, "multiple_of": 24, "song1": 24, "believ": 24, "dragon": 24, "greater_than": 24, "charli": 45, "david": 45, "ev": 45, "berlin": 45, "predefin": 45, "with_column": 47, "to_uppercas": 47, "comment_karma": 47, "respond": 51, "helpfulli": 51, "wider": 51, "databas": [51, 63], "executemani": 51, "openaical": 51, "openaicallparam": 51, "get_item_info": 51, "item_nam": [], "fetchon": 51, "sorri": 51, "groceryitemqueri": 51, "call_param": 51, "query_tool": 51, "nixtla": 59, "financi": 59, "nixtlacli": 59, "nixtla_cli": 59, "my_api_key_provided_by_nixtla": 59, "time_column": 59, "jbrownle": 59, "6550": 59, "8728": 59, "12026": 59, "14395": 59, "14587": 59, "time_col": 59, "target_col": 59, "timegpt_fcst_df": 59, "1969": 59, "14672": 59, "101562": 59, "15793": 59, "253906": 59, "21517": 59, "191406": 59, "22996": 59, "332031": 59, "25959": 59, "019531": 59, "max_insample_length": 59, "first_nam": 56, "age_after_10_year": 56, "reusabl": 2, "volum": [2, 59], "smoothi": 2, "breakfast": 2, "tropic": 2, "blast": 2, "dark_background": 60, "72befa": 60, "e583b6": 60, "72fcdb": 60, "color_list": 60, "autoet": 59, "generate_seri": 59, "n_seri": 59, "horizon": 59, "spark_df": 59, "30138168803582194": 59, "2724415914984484": 59, "211827399669452": 59, "322947056533328": 59, "218793605631347": 59, "sf": 59, "season_length": 59, "485": [], "lo": [59, 67], "hi": 59, "261609": [], "0255513": [], "4976664": [], "1963573": [], "9603": [], "432415": [], "28230855": [], "04625102": [], "5183661": [], "2641948": [], "0281373": [], "5002524": [], "2624528": [], "0263953": [], "4985104": [], "resource_track": [], "leak": [], "semaphor": [], "shutdown": [], "executorenv": 59, "tqdmexperimentalwarn": 59, "consol": [59, 68], "overhead": 56, "pandas_plus_on": 56, "488073": [], "62014": [], "62028": [], "347": [], "747": 59, "keyword_processor": 54, "add_keyword": 54, "clean_nam": 54, "new_sent": 54, "replace_keyword": 54, "917809": [], "56356": [], "56367": [], "handle_unknown": 52, "numerical_column": 52, "categorical_column": 52, "param_grid": 52, "model__n_estim": 52, "model__max_depth": 52, "model__min_samples_split": 52, "grid_search": 52, "tabularpredictor": 52, "predictor": 52, "disguis": 68, "malwar": 68, "mislead": 68, "shutil": 68, "iterdir": 68, "is_dir": 68, "rmtree": 68, "unlink": 68, "plain_text": 68, "plain": 68, "xml": 68, "nsome": 68, "ini": 68, "yml": 68, "nage": 68, "34mexampl": 68, "37mexampl": 68, "bankaccount": 2, "initial_bal": 2, "_balanc": 2, "isnotnul": 56, "1l": [], "scan": 56, "existingrdd": 56, "301782": [], "60847": [], "60857": [], "former": 59, "unavoid": 59, "latter": 59, "robot_execution_failur": 59, "download_robot_execution_failur": 59, "load_robot_execution_failur": 59, "f_x": 59, "f_y": 59, "f_z": 59, "t_x": 59, "t_y": 59, "t_z": 59, "extract_relevant_featur": 59, "features_filt": 59, "column_id": 59, "column_sort": 59, "83it": 59, "dd": 47, "ddf": 47, "npartit": 47, "mlforecast": 59, "utilsforecast": 59, "uncertainti": 59, "plot_seri": 59, "s3": [59, 60], "amazonaw": [59, 60], "m4": 59, "h1": 59, "586": 59, "559": 59, "uid": 59, "forecasts_df": 59, "renam": 59, "palett": 59, "set_size_inch": 59, "predictioninterv": 59, "kneighborsregressor": 59, "mlf": 59, "prediction_interv": 59, "n_window": 59, "lag_featur": 59, "lag24": 59, "lag48": 59, "lag72": 59, "lag96": 59, "lag120": 59, "lag144": 59, "lag168": 59, "date_featur": 59, "num_thread": 59, "454151": 59, "615": 59, "597": 59, "550958": 59, "601": 59, "310692": 59, "037187": 59, "620": 59, "871115": 59, "623": 59, "597610": 59, "627": 59, "357344": 59, "599": 59, "090": 59, "603": 59, "631": 59, "702": 59, "538": 59, "415217": 59, "551": 59, "491": 59, "913415": 59, "094072": 59, "337321": 59, "493112": 59, "568": 59, "736361": 59, "584": 59, "917018": 59, "675": 59, "534": 59, "535": 59, "567": 59, "525": 59, "703": 59, "496": 59, "797892": 59, "509": 59, "458": 59, "432874": 59, "483280": 59, "481": 59, "705219": 59, "890565": 59, "112505": 59, "162911": 59, "475": 59, "020": 59, "488": 59, "492": 59, "526": 59, "530": 59, "544": 59, "462": 59, "689475": 59, "114933": 59, "435": 59, "849278": 59, "808787": 59, "482": 59, "570164": 59, "489": 59, "529672": 59, "264017": 59, "423": 59, "451": 59, "504": 59, "705": 59, "439": 59, "784731": 59, "384": 59, "182476": 59, "400": [56, 59], "101658": 59, "419": 59, "176045": 59, "393416": 59, "467803": 59, "386986": 59, "394": 59, "555": 59, "645": 59, "test_with_forecast": 59, "plot_random": 59, "80l": 56, "orders_df": 56, "1001": 56, "1003": 56, "lee": 56, "1005": 56, "tom": 56, "600": 56, "customer_nam": 56, "revenu": 56, "total_revenu": 56, "top_custom": [], "order_count": 56, "ntop": [], "nnumber": 56, "2550": 56, "985951": [], "52614": [], "52648": [], "strong": [54, 59], "sim_randomwalk": 59, "utils_func": 59, "smoother": 59, "lowesssmooth": 59, "timestep": 59, "process_nois": 59, "measure_nois": 59, "smooth_fract": 59, "get_interv": 59, "shade": 59, "smooth_data": 59, "polycollect": 59, "0x15b25a8e0": 59, "eda": 60, "pyg": 60, "graphic": [], "walker": [], "kanari": 60, "ap": 60, "northeast": 60, "bike_sharing_dc": 60, "holidai": 60, "feeling_temp": 60, "humid": 60, "winspe": 60, "casual": 60, "winter": 60, "0014": 60, "0000": 60, "9982": 60, "0016": 60, "0032": 60, "0010": 60, "0x137d39650": 60, "decis": 59, "histor": 59, "simul": 59, "goog": 59, "2013": 59, "808": 59, "2303900": 59, "795": 59, "2202500": 59, "794": 59, "804": 59, "791": 59, "2026100": 59, "801": 59, "806": 59, "2265800": 59, "797": 59, "807": 59, "796": 59, "2175400": 59, "sma": 59, "roll": 59, "crossov": 59, "smacross": 59, "precomput": 59, "sma1": 59, "sma2": 59, "invest": 59, "broker": 59, "commiss": 59, "realist": 59, "bt": 59, "stat": 59, "3116": 59, "exposur": 59, "067039": 59, "equiti": 59, "68221": 59, "96986": 59, "peak": 59, "68991": 59, "21986": 59, "582": 59, "219699": 59, "458242": 59, "ann": 59, "266427": 59, "volatil": 59, "383008": 59, "sharp": 59, "658271": 59, "sortino": 59, "288779": 59, "calmar": 59, "763748": 59, "drawdown": 59, "082172": 59, "581506": 59, "win": 59, "255319": 59, "11931": 59, "worst": 59, "629898": 59, "074326": 59, "profit": 59, "factor": 59, "190805": 59, "606294": 59, "sqn": 59, "990216": 59, "_strategi": 59, "_equity_curv": 59, "_trade": 59, "entryb": 59, "shuffl": [], "7000": 56, "joined_df": 56, "scene": 56, "competit": 59, "y_df": 59, "743": 59, "744": 59, "785": 59, "756": 59, "719": 59, "748": 59, "cross_valid": 59, "cross_validation_df": 59, "691": 59, "726797": 59, "678": 59, "618": 59, "559522": 59, "167938": 59, "680": 59, "930997": 59, "981893": 59, "plot_cv": 59, "df_cv": 59, "last_n": 59, "gridspec_kw": 59, "hspace": 59, "notic": 59, "said": 59, "opencv": 63, "pypdf2": 63, "read_pdf": 63, "tablelist": 63, "parsing_report": 63, "to_html": 63, "to_sqlit": 63, "ki": 63, "km": 63, "nspeed": 63, "naccel": 63, "nstop": 63, "nidl": 63, "2012_2": 63, "2145_1": 63, "4234_1": 63, "2032_2": 63, "4171_1": 63, "173": 63, "codecut": 74, "electron": 47, "cloth": 47, "pandas_df": 47, "polars_df": 47, "categorypricestri64": 47, "categoryquantitypricestri64i64": 47, "5200": 47, "1020": 47, "4300": 47, "666667": 47, "categoryquantitypricestri64f64": 47, "1225": 47, "12216": 47, "my_project": 73, "hierarchicalforecast": 59, "numba": 59, "reconcil": 59, "leisur": 59, "tourism": 59, "quarter": 59, "s_df": 59, "12251": 59, "wale": 59, "outback": 59, "nsw": 59, "780860": 59, "33131": 59, "western": 59, "648865": 59, "22034": 59, "fleurieu": 59, "peninsula": 59, "31119": 59, "victoria": 59, "phillip": 59, "2017": 59, "063034": 59, "7671": 59, "405": 59, "891206": 59, "18339": 59, "queensland": 59, "mackai": 59, "135284": 59, "23043": 59, "limeston": 59, "coast": 59, "visi": 59, "604546": 59, "22129": 59, "738053": 59, "11349": 59, "hunter": 59, "226040": 59, "16599": 59, "brisban": 59, "490809": 59, "y_test_df": 59, "y_train_df": 59, "act": 59, "canberra": 59, "perth": 59, "425": 59, "y_hat_df": 59, "y_fitted_df": 59, "zza": 59, "forecast_fitted_valu": 59, "coher": 59, "hierarchicalreconcili": 59, "bottomup": 59, "hrec": 59, "y_rec_df": 59, "25990": 59, "068359": 59, "24380": 59, "257812": 59, "24458": 59, "490234": 59, "22902": 59, "765625": 59, "23974": 59, "056641": 59, "22412": 59, "982422": 59, "24563": 59, "455078": 59, "23127": 59, "439453": 59, "24516": 59, "759766": 59, "abstract": 54, "contextu": 54, "newsgroup": 54, "18000": 54, "topic_model": 54, "993": [], "484": [], "huggingfac": [], "disabl": 67, "deadlock": [], "tokenizers_parallel": [], "980": [], "get_topic_info": 54, "representative_doc": 54, "6789": 54, "1_to_the_is_of": 54, "refus": 54, "1823": 54, "0_game_team_games_h": 54, "game": 54, "player": 54, "hock": 54, "rivalri": 54, "ahem": 54, "jokerit": 54, "630": 54, "1_key_clipper_chip_encrypt": 54, "clipper": 54, "chip": 54, "encrypt": 54, "escrow": 54, "expert": 54, "cryptographi": 54, "scie": 54, "2_idjits_ites_cheek_danc": 54, "idjit": 54, "ites": 54, "cheek": 54, "yep": 54, "nyep": 54, "ndanc": 54, "3_israel_israeli_jews_arab": 54, "israel": 54, "isra": 54, "jew": 54, "jewish": 54, "nthi": 54, "010318688564543007": 54, "008992489388365084": 54, "0071658097402482355": 54, "006986923839656088": 54, "00631255726099582": 54, "006207025740053": 54, "hockei": 54, "006108581738112714": 54, "0057638598847672895": 54, "005625421684874428": 54, "005577343029862753": 54, "topics_": 54, "visualize_top": 54, "tf": 54, "idf": 54, "visualize_barchart": 54, "top_n_top": 54, "perhap": [], "n_gram_rang": [], "update_top": [], "011119596146117955": [], "nasa": [], "0047697533973351915": [], "shuttl": [], "0044533985251824495": [], "orbit": [], "004129278694477752": [], "spacecraft": [], "004011023125258004": [], "satellit": [], "003783732360211832": [], "moon": [], "003639954930862572": [], "lunar": [], "0034753177228921146": [], "002821040122532999": [], "mar": [], "0028033947303940923": [], "afterward": [], "reduce_top": [], "nr_topic": [], "666": [], "berttop": 54, "modern": [52, 63], "argparse_exampl": 63, "argumentpars": 63, "add_argu": 63, "parse_arg": 63, "click_exampl": 63, "vbox": [], "322": [], "dedup": [], "floatprogress": [], "999393": [], "mlflow": [], "prone": [15, 47, 52], "anyon": 52, "infer_signatur": 52, "start_run": 52, "model_info": 52, "log_model": 52, "sk_model": 52, "artifact_path": 52, "model_uri": 52, "f8b0fc900aa14cf0ade8d0165c5a9f11": 52, "1e20d72afccf450faa3b8a9806a97e83": 52, "sklearn_pyfunc": 52, "pyfunc": 52, "load_model": 52, "inspect": 52, "mlrun": 52, "mlmodel": 52, "conda": 52, "python_env": 52, "python_funct": 52, "virtualenv": 52, "loader_modul": 52, "model_path": 52, "predict_fn": 52, "python_vers": 52, "pickled_model": 52, "serialization_format": 52, "cloudpickl": 52, "sklearn_vers": 52, "post1": 52, "mlflow_vers": 52, "model_size_byt": 52, "model_uuid": 52, "e7487bc3c4ab417c965144efcecaca2f": 52, "run_id": 52, "utc_time_cr": 52, "516963": 52, "outlin": 52, "forg": 52, "psutil": 52, "build_depend": 52, "setuptool": 52, "wheel": [52, 67], "get_data_for_last_week": 58, "test_main": 58, "test_get_data_for_last_week": 58, "mock_datetim": 58, "assert_called_onc": 58, "behav": 58, "infix": 62, "travers": 62, "unfold": 62, "first_fiv": 62, "skip_first_two": 62, "pip3": 52, "fastapi": [], "unfamiliar": 52, "versatil": 52, "mobil": 52, "divers": 52, "mse": 52, "ml_app": 52, "medinc": 52, "houseag": 52, "avebedrm": 52, "aveoccup": 52, "curl": 52, "1400": 52, "discoveri": 54, "essenc": 54, "surpass": 54, "sentence_transform": 54, "sentencetransform": 54, "cosine_similar": 54, "oatmeal": 54, "cooki": 54, "bake": 54, "chia": 54, "pud": 54, "fri": 54, "oreo": 54, "sunda": 54, "caramel": 54, "bacon": 54, "cheeseburg": 54, "pizza": 54, "minilm": 54, "l6": 54, "recipe_embed": 54, "find_similar_recip": 54, "top_k": 54, "query_embed": 54, "top_indic": 54, "dessert": 54, "healthier": 54, "clearli": 54, "unhealthi": 54, "pygment": 67, "mdurl": 67, "removeprefix": 67, "removesuffix": 67, "32m2024": 67, "329": 67, "1merror": 67, "36m__main__": 67, "36m14": 67, "1man": 67, "caught": 67, "mainprocess": 67, "31530": 67, "mainthread": 67, "8332868224": 67, "1mtraceback": 67, "_run_module_as_main": 67, "ipykernel_launch": 67, "launch_new_inst": 67, "launch_inst": 67, "ipykernel": 67, "kernelapp": 67, "ipkernelapp": 67, "traitlet": 67, "1053": 67, "0x107d28860": 67, "0x104cdf1d0": 67, "io_loop": 67, "baseasyncioloop": 67, "0x107d29760": 67, "tornado": 67, "asynciomainloop": 67, "0x107d3fc90": 67, "asyncio_loop": 67, "run_forev": 67, "baseeventloop": 67, "0x105c9fb00": 67, "_unixselectoreventloop": 67, "1mbase_ev": 67, "33m607": 67, "35mrun_forev": 67, "35m": 67, "1m_run_onc": 67, "_run_onc": 67, "0x105ca1940": 67, "33m1922": 67, "35m_run_onc": 67, "1mhandl": 67, "1m_run": 67, "_run": 67, "0x105c32840": 67, "task_wakeup": 67, "fini": 67, "6d0": 67, "1mevent": 67, "33m80": 67, "35m_run": 67, "1m_context": 67, "1mrun": 67, "1m_callback": 67, "1m_arg": 67, "_arg": 67, "_callback": 67, "_context": 67, "kernelbas": 67, "dispatch_queu": 67, "process_on": 67, "0x1077f2fc0": 67, "ipkernel": 67, "ipythonkernel": 67, "0x107d40a50": 67, "513": 67, "dispatch": 67, "zmq": 67, "0x10848d250": 67, "0x10848d610": 67, "dispatch_shel": 67, "418": 67, "execute_request": 67, "0x107a77320": 67, "758": 67, "reply_cont": 67, "do_execut": 67, "0x107a71240": 67, "run_cel": 67, "zmqinteractiveshel": 67, "0x107d15c60": 67, "zmqshell": 67, "0x107d68490": 67, "store_histori": 67, "silent": 67, "cell_id": 67, "efficient_python_tricks_and_": 67, "nimport": 67, "nfrom": 67, "nlogger": 67, "interactiveshel": 67, "3024": 67, "_run_cel": 67, "0x106bc3ce0": 67, "3079": 67, "coro": 67, "run_cell_async": 67, "0x1086c18a0": 67, "_pseudo_sync_runn": 67, "0x106baae80": 67, "async_help": 67, "3284": 67, "has_rais": 67, "run_ast_nod": 67, "code_ast": 67, "cell_nam": 67, "ipykernel_31530": 67, "1455742643": 67, "ast": 67, "importfrom": 67, "0x10881c0d0": 67, "0x10881f310": 67, "0x10881fc10": 67, "exp": 67, "0x10881f5b0": 67, "0x106bc8040": 67, "3466": 67, "run_cod": 67, "async_": 67, "asi": 67, "executionresult": 67, "108825410": 67, "execution_count": 67, "error_before_exec": 67, "error_in_exec": 67, "executioninfo": 67, "0x17346b750": 67, "0x106bc80e0": 67, "exec": 67, "code_obj": 67, "user_global_n": 67, "user_n": 67, "__package__": 67, "0x106ba3830": 67, "1m1455742643": 67, "33m14": 67, "1mevaluate_result": 67, "1my_tru": 67, "1my_pr": 67, "1marrai": 67, "0x172e23e20": 67, "33m9": 67, "35mevaluate_result": 67, "1mmean_square_err": 67, "1mmean_squared_error": 67, "0x173478180": 67, "_param_valid": 67, "0x1734780e0": 67, "0x173457ba0": 67, "0x172e205e0": 67, "457": 67, "1mvalueerror": 67, "hide": 67, "dunder": 67, "nodoc": 67, "ret": 67, "grai": 67, "py2": 67, "colorama": 67, "asttoken": 67, "25ldone": 67, "25hrequir": 67, "werkzeug": 67, "itsdanger": 67, "blinker": 67, "markupsaf": 67, "25h": 67, "235994": 67, "23d469a3676f399435ed1581b0da936ef614a134749520be801eb96aadeb19b6": 67, "ce": 67, "bb": 67, "26835a451cc11eb8d362d2d2b2c322220c6d61edc825233820": 67, "25l": 67, "inspector": 67, "examin": 67, "prepend": 67, "949190": 67, "repr": 67, "fold": 67, "999999": 67, "0001": 67, "000001": 67, "nonetyp": 67, "ctime": 67, "fromisocalendar": 67, "iso": 67, "fromisoformat": 67, "8601": 67, "fromordin": 67, "prolept": 67, "gregorian": 67, "fromtimestamp": 67, "posix": 67, "isocalendar": 67, "isoformat": 67, "ddt": 67, "ss": [45, 67], "mmm": 67, "uuu": 67, "isoweekdai": 67, "timetupl": 67, "localtim": 67, "timetz": 67, "__class__": 67, "toordin": 67, "tzname": 67, "utcfromtimestamp": 67, "utcnow": 67, "utcoffset": 67, "utctimetupl": 67, "test_rm_fil": 58, "rm_file": 58, "test_with_unittest_mock": 58, "mock_remov": 58, "assert_called_once_with": 58, "test_unix_f": 58, "mocker": 58, "wherea": 58, "nest": 15, "vari": 45, "transpil": 45, "hive": 45, "date_format": 45, "yy": 45, "backtick": 45, "converted_pric": 45, "tradition": 47, "simplic": 47, "customers_data": 47, "last_upd": 47, "updates_data": 47, "delta_table_path": 47, "customers_delta": 47, "current_timestamp": 47, "whennotmatchedinsert": 47}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"pytest": [0, 43, 58, 69, 75], "cach": [0, 43, 69, 75], "directori": [0, 23, 43, 58, 69, 75], "python": [1, 2, 4, 5, 6, 7, 9, 11, 13, 14, 15, 16, 17, 18, 21, 25, 27, 45, 46, 48, 49, 50, 52, 53, 54, 55, 57, 58, 59, 60, 62, 63, 64, 65, 67, 68], "built": 1, "method": [1, 2, 7, 8, 11, 19, 20, 25, 27, 42, 52, 58], "class": [2, 19, 24, 27, 58, 60], "inherit": 2, "abstract": 2, "declar": [2, 27, 58], "without": [2, 50, 62], "implement": 2, "vs": [7, 19, 47, 52, 56, 58, 66], "composit": [], "choos": 58, "right": [], "design": 2, "approach": [59, 62], "distinguish": 2, "instanc": 2, "level": 2, "getattr": 2, "better": [2, 21, 47, 63, 73], "wai": [2, 21, 47, 53, 60], "get": [2, 5, 7, 8, 9, 14, 16, 22, 23, 25, 33, 35, 40, 42, 49, 50, 52, 73], "attribut": [2, 25], "__call__": 2, "call": [2, 20, 62, 68], "your": [2, 7, 16, 18, 19, 27, 29, 38, 40, 45, 47, 49, 52, 53, 54, 55, 57, 58, 60, 64, 66, 67, 68, 73], "like": [2, 59], "function": [2, 3, 6, 7, 8, 20, 21, 25, 26, 27, 29, 47, 58, 62, 63, 64, 67, 68], "comparison": [2, 4, 42, 47, 52, 58], "static": [2, 64, 68], "us": [2, 4, 5, 6, 7, 14, 16, 21, 24, 25, 27, 29, 30, 31, 32, 33, 34, 40, 42, 45, 46, 47, 48, 49, 50, 58, 60, 62, 66, 67, 68, 73], "ad": 2, "requir": [2, 65, 73], "new": [2, 15, 20, 23, 29, 50], "minim": 2, "data": [2, 11, 18, 19, 21, 24, 31, 32, 33, 37, 40, 44, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 64, 73], "risk": 2, "privat": 2, "variabl": [2, 14, 15, 32, 49, 52], "properti": [33, 58], "decor": [6, 51, 62], "A": [7, 18, 21, 45, 47, 53, 58, 59, 60, 62, 68], "getter": 2, "setter": 2, "__str__": 2, "__repr__": 2, "creat": [2, 7, 18, 23, 31, 40, 45, 46, 49, 50, 52, 54, 58, 60, 63, 65, 68], "string": [2, 7, 8, 11, 16, 29, 32, 37, 45, 49, 54, 59, 62], "represent": 2, "object": [2, 7, 25, 40, 55, 58, 63, 67], "__add__": 2, "add": [2, 19, 27, 33, 47, 57, 59, 60, 67], "two": [2, 5, 10, 11, 19, 23, 30, 39, 42, 52, 58, 62, 63, 65, 67], "optim": [2, 29, 32, 47, 56], "memori": [2, 32, 56, 57, 64], "usag": [2, 32, 57, 64], "slot": 2, "code": [2, 3, 6, 7, 15, 16, 29, 45, 46, 48, 49, 50, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64, 66, 67, 68, 73], "speed": [3, 47, 57, 67], "concurr": [3, 57], "execut": [3, 15, 25, 47, 58, 63, 65, 67, 68], "task": [3, 7], "separ": 3, "cpu": 3, "compar": [3, 19, 39, 53, 63, 65, 67], "The": [3, 7, 16, 18, 33, 35, 47, 49, 53, 54, 58, 59, 60, 73, 74], "time": [3, 25, 33, 48, 50, 52, 57, 58, 59, 67, 68], "between": [3, 10, 11, 19, 35, 39, 42, 53, 58, 60, 62], "2": [3, 10, 21, 31, 32, 35, 53, 54, 55], "save": 3, "disk": 3, "space": [3, 42, 59], "larg": [3, 14, 21, 31, 45, 47, 51, 57, 63], "dataset": [3, 45, 48, 50, 52, 53, 54], "parquet": [3, 31, 47], "datetim": [4, 31, 33, 59], "timedelta": 4, "calcul": [4, 16, 35, 54], "end": 4, "base": [4, 11, 20, 30, 32, 33, 34, 42, 49, 58, 65, 68, 73], "start": [4, 37, 68], "durat": 4, "date": [4, 16, 24, 33, 59], "month": 4, "featur": [4, 15, 48, 49, 52, 53, 59], "arithmet": 4, "oper": [4, 5, 7, 11, 15, 20, 22, 26, 29, 40, 42, 45, 47, 56], "dictionari": [5, 18, 22, 25, 29, 35, 62], "updat": [5, 30, 47, 56], "With": [5, 16, 21, 25, 30, 37, 47, 58], "item": [5, 8, 18, 20, 22, 25, 40], "from": [5, 9, 11, 22, 23, 31, 34, 35, 40, 42, 45, 47, 49, 50, 51, 52, 54, 55, 59, 63, 64, 66, 68, 74], "anoth": [5, 16, 20, 23, 30, 34, 66], "kei": [5, 18, 21, 50, 62], "paramet": [5, 7, 27, 58, 64], "max": [5, 9, 42], "find": [5, 9, 10, 16, 25, 33, 35, 37, 49, 50, 52, 58, 59, 62, 64], "largest": [5, 40], "valu": [5, 7, 9, 13, 18, 21, 25, 27, 29, 33, 34, 35, 38, 40, 42], "dict": 5, "default": [5, 18], "doesn": 5, "t": [5, 7, 46], "exist": 5, "doubl": [5, 14, 42], "nest": [5, 7, 21, 25, 62], "miss": [5, 29, 33, 60, 64], "fromkei": 5, "list": [5, 7, 8, 9, 10, 11, 12, 16, 18, 21, 22, 25, 32, 34, 37, 40, 42, 67], "revers": 5, "comprehens": [5, 8, 60, 67], "merg": [5, 30, 47], "union": [5, 10, 15, 27], "3": [5, 11, 15, 52, 54, 56], "9": 5, "iter": [5, 8, 11, 13, 20, 21, 29, 57], "omit": [6, 25], "els": [6, 7], "claus": 6, "improv": [2, 6], "readabl": [2, 6, 7, 15, 16, 30, 52, 57, 60, 62, 67], "when": [6, 7, 13, 18, 30, 31, 33, 39, 48, 52, 58, 68], "Not": [6, 7, 18, 27, 58], "lambda": 6, "how": [6, 48, 63, 76], "pass": [6, 7, 55], "an": [6, 7, 8, 11, 15, 16, 18, 21, 26, 27, 29, 42, 50, 52, 54, 60, 68], "arbitrari": [6, 49], "number": [6, 14, 16, 24, 33, 35, 42, 50, 54], "argument": [6, 7, 20, 21], "good": 7, "practic": [7, 46], "write": [7, 15, 27, 31, 45, 48, 58, 62, 73], "meaning": [7, 54], "name": [7, 34, 40, 49, 54, 58], "assign": [7, 15, 29, 40, 58], "complex": [7, 47, 56], "condit": [7, 8, 15, 21, 42, 58], "make": [7, 19, 31, 57, 63], "more": [7, 21], "avoid": [7, 56], "duplic": 7, "underscor": [7, 14], "_": 7, "ignor": [7, 13, 39], "That": [7, 27, 48], "Will": 7, "Be": [7, 27], "index": [7, 16, 25, 33, 34, 39, 42], "For": [7, 21, 49, 54], "loop": [7, 21], "slice": [7, 54], "indic": 7, "statement": [7, 15, 45], "stop": [7, 67], "copi": [7, 31, 65], "instead": [7, 14, 46], "deepcopi": 7, "side": 7, "effect": [7, 40], "enumer": 7, "counter": [7, 18], "while": 7, "don": [7, 46], "multipl": [7, 9, 13, 14, 16, 18, 22, 29, 30, 40, 47, 56, 58], "OR": 7, "concaten": 7, "join": [7, 11, 48, 56], "should": [7, 27, 74], "onli": [6, 7, 19, 34, 58], "do": 7, "One": [7, 16, 18, 37, 42, 50, 52, 54, 57, 58, 59, 66, 67, 68], "have": 7, "fewer": [7, 20], "than": [7, 21], "four": 7, "flag": 7, "s": [7, 11, 20, 24, 25, 32, 34, 35, 37, 40, 42, 47, 48, 49, 50, 51, 52, 57, 59, 67, 73], "condens": 7, "If": [7, 34], "line": [7, 46, 50, 52, 54, 55, 57, 59, 63, 64, 67, 68], "effici": [7, 21, 31, 32, 45, 47, 48, 54, 58], "check": [7, 8, 23, 42, 58, 62, 64], "type": [7, 15, 20, 27, 32, 64, 68], "try": 7, "except": [7, 29, 58], "never": [7, 67], "catch": 7, "all": [7, 8, 30, 34, 35, 42, 58], "clean": [7, 13, 54, 73], "error": [7, 56, 58], "handl": [7, 32, 45, 48, 59], "logic": [7, 56], "why": 7, "__name__": 7, "__main__": 7, "matter": 7, "script": [7, 63], "appli": [8, 20, 21, 29, 40, 47, 57], "element": [8, 9, 11, 21, 25, 29, 30, 35, 42, 49], "ani": [8, 42, 63, 65, 67], "true": [8, 11, 19], "inter": 8, "ar": [8, 18, 23, 39, 42, 68], "filter": [8, 21, 31, 34, 47, 62], "evalu": [8, 56, 58], "map": [8, 29, 60, 62], "each": [8, 29, 35, 40], "sort": [8, 36, 64], "tupl": 8, "first": 8, "second": [8, 66], "random": [9, 40, 50], "choic": 9, "randomli": 9, "select": [9, 33, 34, 35], "weight": [9, 52], "sampl": [9, 40], "heapq": 9, "n": [9, 25, 33, 40], "interact": [10, 45, 60, 63], "set": [10, 47, 58], "intersect": 10, "differ": [10, 11, 21, 35, 39, 40, 42, 53, 58, 62, 73], "turn": [11, 32, 35, 40, 42], "zip": [11, 21], "associ": 11, "order": [11, 18, 36, 39], "unzip": 11, "append": [11, 47], "extend": [11, 13], "unpack": 13, "perform": [14, 47, 58, 59, 64], "floor": 14, "divis": 14, "forward": [14, 29], "slash": 14, "fraction": 14, "numer": 14, "result": 14, "decim": [14, 16], "format": [14, 16, 38, 54], "confirm": 14, "whether": [14, 39], "Is": [14, 21, 52], "modulu": 14, "switch": [], "structur": [15, 18, 49, 51], "pattern": [15, 37, 62], "match": [15, 16, 25, 48, 54, 62], "10": [11, 15], "x": [15, 27], "y": [15, 27], "walru": 15, "express": [15, 16, 21, 34, 47, 62], "fine": 15, "grain": 15, "traceback": [15, 67], "11": 15, "control": [16, 53, 58, 73], "print": [16, 26, 38, 67], "f": 16, "pad": 16, "zero": 16, "enhanc": [2, 6, 15, 16, 30, 48, 56], "comma": 16, "debug": [16, 67, 73], "equal": [16, 35, 39, 42, 58], "sign": 16, "substr": [16, 37], "re": 16, "sub": 16, "replac": [16, 29, 33, 42, 54, 68], "regular": [16, 62], "split": [16, 25, 29, 48], "charact": 16, "multilin": 16, "difflib": 16, "sequencematch": 16, "detect": [16, 59, 60, 68], "almost": 16, "similar": [16, 39, 48, 53], "articl": [16, 54], "get_close_match": 16, "best": [16, 46, 47, 49], "certain": [16, 35, 42], "word": [16, 54, 57], "util": 17, "librari": [17, 45, 47, 58, 59, 68], "collect": 18, "count": [18, 34, 35], "occurr": 18, "namedtupl": 18, "lightweight": [18, 68], "mang": 18, "defaultdict": 18, "return": [6, 18, 32, 48], "avail": 18, "ordereddict": 18, "chainmap": 18, "combin": [18, 20, 21, 30, 58], "unit": [18, 56, 58, 62, 73], "normal": 19, "frozen": 19, "read": [19, 31, 33, 45, 66, 76], "post": 19, "init": 19, "functool": 20, "partial": 20, "gener": [20, 21, 50, 54, 58, 59, 60, 63, 65, 68, 73], "singledispatch": 20, "current": [20, 23, 29, 35], "reduc": [20, 32, 54], "cumul": [20, 35], "itertool": 21, "through": 21, "pair": 21, "product": [21, 52], "starmap": 21, "compress": 21, "boolean": [21, 34], "groupbi": [21, 40], "group": [21, 25, 33, 35, 40], "zip_longest": 21, "length": [21, 42], "dropwhil": 21, "drop": [21, 48, 60], "until": 21, "fals": [21, 52], "itemgett": 22, "pathlib": 23, "file": [23, 33, 46, 47, 55, 58, 64, 65, 66, 68, 73], "access": [23, 33, 35, 62], "home": 23, "parent": 23, "path": 23, "rel": 23, "same": [23, 58, 73], "pydash": 25, "work": [25, 33, 37, 45, 56, 58, 59], "flatten": [25, 42], "flatten_deep": 25, "deepli": 25, "chunk": [25, 31], "style": [25, 38, 60], "chain": [25, 29], "custom": [25, 30, 48], "plant": 25, "sympi": 26, "motiv": 26, "what": [26, 74], "basic": [26, 52], "symbol": 26, "equat": [26, 73], "expand": [26, 54], "factor": 26, "simplifi": [8, 15, 24, 26, 45, 47, 51, 52, 56, 58, 59, 62, 67], "solv": [26, 48], "substitut": 26, "trigonometr": 26, "deriv": 26, "integr": [2, 26, 45, 51, 52, 73], "limit": [26, 68], "special": 26, "latex": [26, 38, 42, 63], "callabl": 27, "specifi": [27, 30, 31], "input": [27, 58], "hint": 27, "annot": [27, 49, 60, 68], "metadata": [27, 45, 52], "typehint": 27, "final": 27, "overridden": 27, "liter": 27, "possibl": [27, 58], "typevar": 27, "flexibl": [27, 59], "context": 27, "depend": [27, 65], "panda": [28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 45, 47, 50, 56, 57, 58, 67], "chang": [29, 35, 42, 59, 68], "datafram": [29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 47, 48, 49, 50, 56, 57, 58], "pipe": [29, 62], "column": [29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 42, 56, 59], "elementwis": 29, "seri": [29, 33, 34, 35, 37, 40, 52, 59], "explod": 29, "transform": [29, 34, 40, 47, 48, 62], "row": [29, 30, 33, 34, 35, 36, 37, 40, 42], "fill": 29, "previou": [29, 33], "most": 29, "frequent": 29, "categori": [29, 40, 48, 58], "encod": [29, 48], "categor": [29, 32, 36, 48, 49], "rais": 29, "combine_first": 30, "null": [30, 62], "df": [30, 34, 35], "suffix": 30, "includ": [30, 32], "insert": 30, "Into": [30, 40, 49, 65], "locat": [30, 49, 50, 60], "leverag": [31, 56, 59], "pyarrow": [31, 32, 45], "fix": 31, "unnam": 31, "0": [31, 32, 33], "csv": [31, 33, 45, 47], "websit": [31, 68], "divid": 31, "html": 31, "tabl": [31, 40, 45, 47, 48, 63], "mode": [31, 47], "manipul": [32, 37, 40, 62], "select_dtyp": 32, "subset": [32, 34], "exclud": [32, 34], "Their": [32, 34, 49], "dtype": 32, "infer_object": 32, "sai": 32, "goodby": 32, "convers": 32, "parse_d": [31, 33], "convert": [33, 54, 59, 62], "dateoffset": 33, "interv": [33, 35, 42, 52, 59], "timestamp": 33, "roll": 33, "averag": 33, "datapoint": 33, "grouper": 33, "specif": [33, 36, 42, 58, 68], "frequenc": [33, 48, 54, 60], "dt": 33, "within": [33, 35, 73], "year": 33, "rang": 33, "reindex": 33, "befor": 33, "after": [33, 58, 68], "resampl": 33, "shift": [33, 35], "period": 33, "isin": 34, "contain": [34, 35, 37, 62], "queri": [34, 47, 54, 56], "nan": 34, "clip": 34, "outlier": 34, "loc": 35, "iloc": 35, "pd": 35, "pct_chang": 35, "percentag": 35, "prior": 35, "diff": 35, "take": [35, 42], "numpi": [35, 41, 42, 62], "arrai": [32, 35, 42, 56, 62], "to_dict": 35, "corrwith": 35, "comput": [35, 40, 59], "pairwis": 35, "correl": [35, 48, 60], "cut": 35, "bin": 35, "discret": 35, "qcut": 35, "size": [35, 40], "cumsum": 35, "sum": 35, "over": [2, 35, 40, 42, 50, 52, 58], "cummax": 35, "maximum": 35, "set_categori": 36, "str": 37, "text": [37, 38, 49, 52, 54, 60, 63], "startswith": 37, "highlight": 38, "easier": [38, 56], "analysi": [38, 52, 58, 59, 64], "color": 38, "background": 38, "gradient": 38, "displai": [38, 60, 73], "cell": 38, "to_markdown": 38, "markdown": [38, 68], "test": [39, 42, 50, 52, 54, 56, 58, 73], "assert_fram": 39, "agg": 40, "aggreg": 40, "pivot_t": 40, "pivot": 40, "melt": 40, "unpivot": 40, "crosstab": 40, "cross": [40, 59], "tabul": 40, "stack": 40, "align": 40, "ravel": 42, "np": 42, "squeez": 42, "remov": [42, 64, 65], "ax": 42, "posit": 42, "argsort": 42, "rank": 42, "where": [42, 68], "linspac": 42, "evenli": 42, "assert_almost_equ": 42, "up": [42, 47, 57], "precis": 42, "scienc": [44, 53], "tool": [44, 46, 47, 53, 54, 57, 59, 61, 63, 65, 67], "sql": [45, 47, 53, 56], "dynam": [45, 58], "templat": 45, "fuguesql": 45, "spark": [45, 47, 56, 59], "dask": [45, 47], "sqlmodel": 45, "databas": [45, 58], "sqlfluff": 45, "linter": 45, "auto": [45, 59], "formatt": [45, 73], "postgresml": 45, "machin": [45, 52, 68], "learn": [45, 48, 52, 59, 68], "postgresql": [45, 58], "duckdb": 45, "sqlpars": [], "extract": [45, 49, 50, 51, 54, 59, 62, 63], "compon": [45, 49], "hard": 46, "hydra": 46, "dotenv": [], "load": 47, "secret": [], "inform": [46, 54, 73], "env": 46, "docopt": 46, "beauti": [46, 67], "command": [46, 63, 67, 68, 73], "interfac": [46, 59, 63], "document": 46, "tqdm": 47, "progress": [47, 58, 67], "bar": [47, 58, 67], "pandarallel": 47, "simpl": [47, 53, 58], "parallel": 47, "pandasai": 47, "gain": 47, "insight": 47, "ai": [47, 48, 54, 73], "fugu": 47, "engin": [47, 48, 54, 59], "version": [47, 53, 73], "delta": 47, "lake": 47, "partit": 47, "overwrit": 47, "scan": 47, "mismatch": [47, 48, 58], "polar": 47, "blaze": 47, "fast": [47, 52, 54, 59], "process": [21, 47, 54, 56], "12x": 47, "lazi": [47, 52, 56], "har": [47, 54, 59], "stratifi": 48, "fashion": 48, "scikit": [48, 52, 59], "strategi": [48, 59], "prevent": [11, 48, 52], "leakag": [48, 52], "rare": 48, "label": [48, 58], "dirti": [48, 58], "dirty_cat": 48, "fuzzi": 48, "snorkel": 48, "programmat": 48, "build": [48, 49, 52, 54, 63], "train": [48, 58, 59], "sketch": 48, "assist": 48, "understand": [48, 59], "content": [48, 68], "distfit": 49, "theoret": 49, "distribut": [49, 52, 53, 56], "geopi": 49, "fastai": [49, 57, 59], "cont_cat_split": 49, "continu": 49, "cardin": 49, "patsi": 49, "yarl": 49, "url": 49, "pigeon": 49, "quickli": [49, 57], "jupyt": [49, 60, 70, 73], "notebook": [49, 60, 68, 70, 73], "probablepeopl": 49, "pars": [49, 62], "unstructur": 49, "supercharg": [49, 52], "pdf": [49, 63], "pypdf": 49, "faker": 50, "fake": 50, "silli": 50, "produc": [50, 67], "user": 50, "fetch_openml": 50, "openml": 50, "autoscrap": 50, "autom": [50, 59, 66, 68], "web": [50, 54, 55], "scrape": 50, "reader": 50, "variou": 50, "internet": 50, "sourc": 50, "directli": 50, "pytrend": 50, "trend": 50, "keyword": [6, 50, 54], "googl": [50, 55], "search": [50, 54], "snscrape": 50, "social": [50, 54], "network": 50, "servic": [50, 58], "datacommon": 50, "statist": [50, 54, 60], "about": [50, 73, 74], "median": 50, "incom": 50, "california": 50, "peopl": 50, "u": 50, "robberi": 50, "people_also_ask": 50, "wrapper": 50, "also": 50, "ask": 50, "facebook": 50, "public": 50, "page": [50, 66], "api": [50, 56, 60], "languag": [51, 54], "model": [51, 52, 54, 57, 58, 59, 60], "llm": [51, 52, 58], "causalimpact": 52, "causal": [52, 59], "relat": [52, 58], "event": 52, "chatgpt": 52, "pipelin": [48, 52, 67], "gridsearchcv": 52, "scale": [52, 59], "squar": 52, "rmse": 52, "sklearn": [52, 59], "mean_squared_error": 52, "modelkit": 52, "ml": [52, 57, 58, 63], "system": 52, "decompos": 52, "high": [52, 60], "dimension": [52, 60], "three": 52, "dimens": [52, 54, 60], "visual": [52, 54, 60, 65, 67], "import": [52, 64, 65, 68, 73], "yellowbrick": 52, "valid": [24, 52, 58, 59], "curv": 52, "determin": 52, "estim": [52, 54, 59], "underfit": 52, "overfit": 52, "mlxtend": 52, "plot": [52, 60], "decis": [52, 60], "region": 52, "classifi": 52, "deepcheck": [52, 58], "bias": 52, "track": 52, "imbalanc": 52, "deal": 52, "predict": [52, 59, 68], "mapi": 52, "mlforecast": 52, "scalabl": 52, "mlem": 52, "captur": [52, 60], "manag": [45, 53, 65, 73], "dvc": 53, "project": [53, 65], "sweetviz": 53, "quadrat": 53, "speadsheet": 53, "whylog": 53, "log": [52, 53, 58, 67], "made": [52, 53, 56, 59], "easi": [52, 53, 59], "fluke": 53, "easiest": [53, 60], "move": 53, "around": 53, "natur": 54, "textblob": 54, "sumi": 54, "summar": [54, 66], "spacy_streamlit": 54, "app": 54, "textaci": 54, "contigu": 54, "sequenc": 54, "preprocess": [48, 54], "texthero": 54, "wordfreq": 54, "36": 54, "newspaper3k": 54, "questgen": 54, "question": 54, "ninja": 54, "lump": 54, "togeth": 54, "textstat": 54, "rapidfuzz": 54, "rapid": [52, 54], "checklist": 54, "nlp": 54, "top2vec": 54, "quick": 54, "topic": 54, "english": 54, "contract": 54, "inflect": 54, "plural": 54, "singular": 54, "indefinit": 54, "flashtext": 54, "sentenc": [], "ekphrasi": 54, "media": 54, "chroma": 54, "lightn": 54, "solut": [47, 54], "embed": 54, "share": [55, 58], "download": [55, 66, 68], "datapan": 55, "publish": 55, "gdown": 55, "drive": 55, "pyserd": 55, "effortless": 55, "serial": 55, "deseri": 55, "dataclass": [15, 55], "itsdanger": 55, "safe": [53, 55], "trust": 55, "untrust": 55, "environ": [55, 65], "back": 55, "df_shrink": 57, "shrink": 57, "swifter": 57, "23": 57, "faster": [47, 57], "pyinstrument": 57, "profil": [57, 67], "coval": 57, "resum": 58, "break": 58, "fail": 58, "descript": [58, 63], "short": 58, "benchmark": 58, "fixtur": 58, "mark": 58, "parametr": 58, "twice": 58, "id": 58, "case": 58, "onc": [45, 58], "per": 58, "session": 58, "skipif": 58, "skip": 58, "met": 58, "xfail": 58, "expect": [58, 74], "verifi": 58, "repeat": 58, "sugar": 58, "show": 58, "failur": [58, 68], "instantli": 58, "step": 58, "pick": 58, "run": [45, 58, 68, 73], "unstag": 58, "git": [58, 66], "setup": 58, "freezegun": 58, "freez": 58, "simul": 58, "extern": [51, 58], "mock": 58, "pyfakef": [], "pandera": 58, "deepdiff": 58, "deep": [58, 68], "assert": 58, "hypothesi": 58, "conflict": 58, "leab": 58, "ab": 58, "incorpor": 58, "suit": 58, "maintain": 58, "accuraci": [51, 58], "docstr": [58, 64], "exampl": 58, "doctest": 58, "deepev": 58, "datefind": 59, "automat": [59, 60, 64, 68], "add_datepart": 59, "relev": [51, 59], "maya": 59, "trace": 59, "unevenli": 59, "holidai": 59, "workalendar": 59, "dai": 59, "pmdarima": 59, "r": 59, "arima": 59, "power": 59, "seaborn": 60, "matplotlib": 60, "graphviz": 60, "flowchart": 60, "idea": 60, "folium": 60, "dtreeviz": 60, "interpret": [54, 60], "tree": [60, 63], "hiplot": 60, "missingno": 60, "dendogram": 60, "venn": 60, "diagram": 60, "squarifi": 60, "treemap": 60, "umap": 60, "reduct": 60, "evid": 60, "drift": 60, "mermaid": 60, "flow": 60, "chart": 60, "pretti": 60, "confus": 60, "matrix": 60, "matplotx": 60, "extens": [2, 60], "ipysankeywidget": 60, "ipython": [60, 68, 73], "sankei": 60, "widget": 60, "ipyvizzu": 60, "anim": [60, 63], "eas": [60, 66], "stori": 60, "present": 60, "lux": 60, "intellig": 60, "discoveri": 60, "signific": 60, "adjust": 60, "blox": 60, "attract": 60, "lovelyplot": 60, "nice": 60, "figur": 60, "gif": 60, "token": 60, "corpora": 60, "prettymap": 60, "paint": 60, "vizro": 60, "modular": [2, 56, 60], "applic": [60, 65], "cool": 61, "altern": 62, "box": 62, "dot": 62, "notat": 62, "modul": [62, 65], "shorter": 62, "inflix": [], "pregex": 62, "human": [62, 63], "bracket": 62, "pampi": 62, "dictdiff": 62, "unyt": 62, "asynchron": 62, "prefect": [62, 68], "output": [51, 63], "strip": 63, "pyfiglet": 63, "uniqu": 63, "letter": 63, "out": [56, 63], "ordinari": 63, "fire": 63, "cli": [63, 66], "typer": 63, "few": 63, "view": [56, 63, 67], "rich": [63, 67], "latexify_pi": 63, "math": [63, 73], "manimml": 63, "common": 63, "concept": 63, "review": 64, "isort": 64, "1": 64, "interrog": 64, "mypi": 64, "checker": [64, 73], "refurb": 64, "refurbish": 64, "modern": [64, 68], "codebas": 64, "erad": 64, "junk": 64, "comment": 64, "pydant": [24, 64], "enforc": [47, 64], "runtim": [64, 68], "perfplot": 64, "snippet": 64, "analyz": [54, 64], "vultur": 64, "dead": 64, "virtualenv": 65, "clone": 65, "virtual": 65, "pip": [65, 66], "autoremov": 65, "packag": [65, 73], "Its": 65, "unus": 65, "pipreq": 65, "txt": [65, 73], "pydep": 65, "poetri": 65, "pyinstal": 65, "bundl": 65, "singl": [6, 65], "github": 66, "bring": 66, "termin": 66, "pull": 66, "branch": 66, "wget": 66, "github1": 66, "browser": 66, "astral": 66, "organ": [58, 66, 68], "star": 66, "instal": 66, "e": 66, "fork": 66, "repositori": 66, "open": [2, 66, 68], "local": 66, "gpt": 66, "commit": 66, "request": 66, "inspect": 67, "report": 67, "consol": 67, "loguru": 67, "icecream": 67, "again": 67, "heartrat": 67, "program": 67, "real": [48, 67], "pyheat": 67, "heatmap": 67, "snoop": [67, 73], "smart": 67, "hyperfin": 67, "timelin": 67, "workflow": 68, "schedul": 68, "At": 68, "notifi": 68, "send": 68, "desktop": 68, "notif": 68, "finish": 68, "sound": 68, "knockknock": 68, "receiv": 68, "email": 68, "makefil": 68, "notedown": 68, "vice": 68, "versa": 68, "removestar": 68, "explicit": 68, "monkeytyp": 68, "whereami": 68, "you": [68, 74], "watchfil": 68, "rerun": 68, "retri": 68, "nbdime": 73, "reus": 73, "across": 73, "watermark": 73, "hardwar": 73, "Being": 73, "ipytest": 73, "nbqa": 73, "thi": [74, 76], "book": [74, 76], "author": 74, "support": 48, "magent": 51, "prompt": 51, "friendli": 56, "big": 56, "make_column_transform": 48, "point": [6, 59], "falsifi": 58, "mllib": 52, "rocketri": 68, "vector": [29, 56], "misspel": 48, "world": 48, "store": [46, 53], "sensit": 46, "secur": 46, "pytub": 68, "youtub": 68, "video": 68, "enum": 2, "aeon": 59, "ultim": 59, "forecast": 59, "classif": 59, "ruptur": 59, "non": 59, "stationari": 59, "signal": 59, "embrac": 2, "close": 2, "principl": 2, "mixin": 2, "pyspark": 56, "reusabl": 56, "parameter": 56, "seamless": 73, "creation": 73, "lab": 73, "strict": 11, "loss": 11, "outlin": 51, "ensur": [2, 51], "consist": 51, "tmp_path": 58, "temporari": [56, 58], "prototyp": 52, "qualiti": 47, "constraint": 47, "testbook": 73, "gluont": 59, "probabilist": 59, "mayb": 62, "tfcausalimpact": 59, "relationship": 59, "galat": 54, "massiv": 54, "5": 56, "safetensor": 53, "tensor": 53, "pendulum": 59, "quantstat": 59, "stock": 59, "udf": 56, "kneed": 59, "knee": 59, "functiontransform": 48, "robust": [48, 59], "great": 63, "scientif": 63, "look": 63, "islic": 21, "stream": [21, 47], "recip": [50, 54], "scraper": 50, "neuralforecast": 59, "streamlin": 59, "neural": 59, "familiar": 59, "syntax": [47, 59], "mirascop": 51, "field": 24, "maxim": 51, "pre": 59, "timegpt": 59, "num2word": 54, "later": 56, "statsforecast": 59, "pandas_udf": 56, "standard": 56, "autogluon": 52, "accur": 52, "magika": 68, "tsfresh": 59, "beyond": [54, 59], "tsmoothi": 59, "exponenti": 59, "smooth": 59, "drag": 60, "pygwalk": 60, "backtest": 59, "assess": 59, "trade": 59, "effortlessli": 59, "slide": 59, "window": 59, "shuffl": 56, "camelot": 63, "scientist": 47, "navig": 73, "top": 73, "magic": 73, "hierarch": 59, "bertop": 54, "bert": 54, "argpars": 63, "click": 63, "mlflow": 52, "pickl": 52, "eleg": 62, "fastapi": 52, "semant": 54, "wat": 67, "explor": 67, "unittest": 58, "sqlglot": 45, "anywher": 45, "upsert": 47}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinxcontrib.bibtex": 9, "sphinx": 56}}) \ No newline at end of file