From 8f4939765bc8a120fde9a4d266f9d2c422e2609b Mon Sep 17 00:00:00 2001
From: xzdandy <xzdandy@gmail.com>
Date: Wed, 13 Sep 2023 03:02:57 -0400
Subject: [PATCH 01/23] Set the write output column type for forecast functions

---
 evadb/binder/statement_binder.py           | 56 ++++++++++++++++------
 evadb/executor/create_function_executor.py | 11 +++--
 evadb/functions/forecast.py                | 10 ++--
 3 files changed, 57 insertions(+), 20 deletions(-)

diff --git a/evadb/binder/statement_binder.py b/evadb/binder/statement_binder.py
index a90995b43..d4c684ce6 100644
--- a/evadb/binder/statement_binder.py
+++ b/evadb/binder/statement_binder.py
@@ -29,7 +29,12 @@
     resolve_alias_table_value_expression,
 )
 from evadb.binder.statement_binder_context import StatementBinderContext
-from evadb.catalog.catalog_type import NdArrayType, TableType, VideoColumnName
+from evadb.catalog.catalog_type import (
+    ColumnType,
+    NdArrayType,
+    TableType,
+    VideoColumnName,
+)
 from evadb.catalog.catalog_utils import get_metadata_properties, is_document_table
 from evadb.configuration.constants import EvaDB_INSTALLATION_DIR
 from evadb.expression.abstract_expression import AbstractExpression, ExpressionType
@@ -37,7 +42,7 @@
 from evadb.expression.tuple_value_expression import TupleValueExpression
 from evadb.parser.create_function_statement import CreateFunctionStatement
 from evadb.parser.create_index_statement import CreateIndexStatement
-from evadb.parser.create_statement import CreateTableStatement
+from evadb.parser.create_statement import ColumnDefinition, CreateTableStatement
 from evadb.parser.delete_statement import DeleteTableStatement
 from evadb.parser.explain_statement import ExplainStatement
 from evadb.parser.rename_statement import RenameTableStatement
@@ -87,21 +92,44 @@ def _bind_create_function_statement(self, node: CreateFunctionStatement):
                 node.query.target_list
             )
             arg_map = {key: value for key, value in node.metadata}
-            assert (
-                "predict" in arg_map
-            ), f"Creating {node.function_type} functions expects 'predict' metadata."
-            # We only support a single predict column for now
-            predict_columns = set([arg_map["predict"]])
             inputs, outputs = [], []
-            for column in all_column_list:
-                if column.name in predict_columns:
-                    if node.function_type != "Forecasting":
+            if string_comparison_case_insensitive(node.function_type, "ludwig"):
+                assert (
+                    "predict" in arg_map
+                ), f"Creating {node.function_type} functions expects 'predict' metadata."
+                # We only support a single predict column for now
+                predict_columns = set([arg_map["predict"]])
+                for column in all_column_list:
+                    if column.name in predict_columns:
                         column.name = column.name + "_predictions"
+                        outputs.append(column)
                     else:
-                        column.name = column.name
-                    outputs.append(column)
-                else:
-                    inputs.append(column)
+                        inputs.append(column)
+            elif string_comparison_case_insensitive(node.function_type, "forecasting"):
+                # Forecasting models have only one input column which is horizon
+                inputs = [ColumnDefinition("horizon", ColumnType.INTEGER, None, None)]
+                # Currently, we only support univariate forecast which should have three output columns, unique_id, ds, and y.
+                # The y column is required. unique_id and ds will be auto generated if not found.
+                required_columns = set([arg_map.get("predict", "y")])
+                for column in all_column_list:
+                    if column.name == arg_map.get("id", "unique_id"):
+                        outputs.append(column)
+                    elif column.name == arg_map.get("time", "ds"):
+                        outputs.append(column)
+                    elif column.name == arg_map.get("predict", "y"):
+                        outputs.append(column)
+                        required_columns.remove(column.name)
+                    else:
+                        raise BinderError(
+                            f"Unexpected column {column.name} found for forecasting function."
+                        )
+                assert (
+                    len(required_columns) == 0
+                ), f"Missing required {required_columns} columns for forecasting function."
+            else:
+                raise BinderError(
+                    f"Unsupported type of function: {node.function_type}."
+                )
             assert (
                 len(node.inputs) == 0 and len(node.outputs) == 0
             ), f"{node.function_type} functions' input and output are auto assigned"
diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index 4abfa3906..69d266d25 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -171,7 +171,7 @@ def handle_forecasting_function(self):
 
         data = aggregated_batch.frames
         if "unique_id" not in list(data.columns):
-            data["unique_id"] = ["test" for x in range(len(data))]
+            data["unique_id"] = [1 for x in range(len(data))]
 
         if "ds" not in list(data.columns):
             data["ds"] = [x + 1 for x in range(len(data))]
@@ -233,9 +233,14 @@ def handle_forecasting_function(self):
         metadata_here = [
             FunctionMetadataCatalogEntry("model_name", model_name),
             FunctionMetadataCatalogEntry("model_path", model_path),
-            FunctionMetadataCatalogEntry("output_column_rename", arg_map["predict"]),
             FunctionMetadataCatalogEntry(
-                "time_column_rename", arg_map["time"] if "time" in arg_map else "ds"
+                "predict_column_rename", arg_map.get("predict", "y")
+            ),
+            FunctionMetadataCatalogEntry(
+                "time_column_rename", arg_map.get("time", "ds")
+            ),
+            FunctionMetadataCatalogEntry(
+                "id_column_rename", arg_map.get("id", "unique_id")
             ),
         ]
 
diff --git a/evadb/functions/forecast.py b/evadb/functions/forecast.py
index 782930891..f7cfb72f9 100644
--- a/evadb/functions/forecast.py
+++ b/evadb/functions/forecast.py
@@ -32,16 +32,18 @@ def setup(
         self,
         model_name: str,
         model_path: str,
-        output_column_rename: str,
+        predict_column_rename: str,
         time_column_rename: str,
+        id_column_rename: str,
     ):
         f = open(model_path, "rb")
         loaded_model = pickle.load(f)
         f.close()
         self.model = loaded_model
         self.model_name = model_name
-        self.output_column_rename = output_column_rename
+        self.predict_column_rename = predict_column_rename
         self.time_column_rename = time_column_rename
+        self.id_column_rename = id_column_rename
 
     def forward(self, data) -> pd.DataFrame:
         horizon = list(data.iloc[:, -1])[0]
@@ -49,10 +51,12 @@ def forward(self, data) -> pd.DataFrame:
             type(horizon) is int
         ), "Forecast UDF expects integral horizon in parameter."
         forecast_df = self.model.predict(h=horizon)
+        forecast_df.reset_index(inplace=True)
         forecast_df = forecast_df.rename(
             columns={
-                self.model_name: self.output_column_rename,
+                "unique_id": self.id_column_rename,
                 "ds": self.time_column_rename,
+                self.model_name: self.predict_column_rename,
             }
         )
         return forecast_df

From 043d67158baa300cbbacc385db5c7eb508397fb7 Mon Sep 17 00:00:00 2001
From: xzdandy <xzdandy@gmail.com>
Date: Wed, 13 Sep 2023 03:28:19 -0400
Subject: [PATCH 02/23] Fix forecast integration test

---
 evadb/executor/create_function_executor.py    |  4 ++++
 .../long/test_model_forecasting.py            | 19 +++++++++++++------
 2 files changed, 17 insertions(+), 6 deletions(-)

diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index 69d266d25..ef31e7082 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -179,6 +179,10 @@ def handle_forecasting_function(self):
         if "frequency" not in arg_map.keys():
             arg_map["frequency"] = pd.infer_freq(data["ds"])
         frequency = arg_map["frequency"]
+        if frequency is None:
+            raise RuntimeError(
+                f"Can not infer the frequency for {self.node.name}. Please explictly set it."
+            )
 
         try_to_import_forecast()
         from statsforecast import StatsForecast
diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index 766d0af95..b7778bba6 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -79,19 +79,23 @@ def test_forecast(self):
         """
         result = execute_query_fetch_all(self.evadb, predict_query)
         self.assertEqual(len(result), 12)
-        self.assertEqual(result.columns, ["airforecast.y"])
+        self.assertEqual(
+            result.columns, ["airforecast.unique_id", "airforecast.ds", "airforecast.y"]
+        )
 
     @forecast_skip_marker
     def test_forecast_with_column_rename(self):
         create_predict_udf = """
             CREATE FUNCTION HomeForecast FROM
             (
-                SELECT saledate, ma FROM HomeData
-                WHERE type = "house" AND bedrooms = 2
+                SELECT type, saledate, ma FROM HomeData
+                WHERE bedrooms = 2
             )
             TYPE Forecasting
             PREDICT 'ma'
-            TIME 'saledate';
+            ID 'type'
+            TIME 'saledate'
+            FREQUENCY 'M';
         """
         execute_query_fetch_all(self.evadb, create_predict_udf)
 
@@ -99,8 +103,11 @@ def test_forecast_with_column_rename(self):
             SELECT HomeForecast(12);
         """
         result = execute_query_fetch_all(self.evadb, predict_query)
-        self.assertEqual(len(result), 12)
-        self.assertEqual(result.columns, ["homeforecast.ma"])
+        self.assertEqual(len(result), 24)
+        self.assertEqual(
+            result.columns,
+            ["homeforecast.type", "homeforecast.saledate", "homeforecast.ma"],
+        )
 
 
 if __name__ == "__main__":

From 0977c1fd3994ccae26bf2527aa02fb9623aa8640 Mon Sep 17 00:00:00 2001
From: xzdandy <xzdandy@gmail.com>
Date: Wed, 13 Sep 2023 03:55:53 -0400
Subject: [PATCH 03/23] Move the generic utils test

---
 test/unit_tests/utils/test_generic_utils.py | 46 +++++++++++++++++++++
 1 file changed, 46 insertions(+)
 create mode 100644 test/unit_tests/utils/test_generic_utils.py

diff --git a/test/unit_tests/utils/test_generic_utils.py b/test/unit_tests/utils/test_generic_utils.py
new file mode 100644
index 000000000..a46305f96
--- /dev/null
+++ b/test/unit_tests/utils/test_generic_utils.py
@@ -0,0 +1,46 @@
+# coding=utf-8
+# Copyright 2018-2023 EvaDB
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import unittest
+
+from evadb.utils.generic_utils import string_comparison_case_insensitive
+
+
+class GenericUtilsTests(unittest.TestCase):
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+
+    def test_string_matching_case_insensitive(self):
+        """
+        A simple test for string_matching_case_insensitve in generic_utils
+        used by statement_binder
+        """
+
+        test_string_exact_match = string_comparison_case_insensitive(
+            "HuggingFace", "HuggingFace"
+        )
+        test_string_case_insensitive_match = string_comparison_case_insensitive(
+            "HuggingFace", "hugGingFaCe"
+        )
+        test_string_no_match = string_comparison_case_insensitive(
+            "HuggingFace", "HuggingFae"
+        )
+        test_one_string_null = string_comparison_case_insensitive(None, "HuggingFace")
+        test_both_strings_null = string_comparison_case_insensitive(None, None)
+
+        self.assertTrue(test_string_exact_match)
+        self.assertTrue(test_string_case_insensitive_match)
+        self.assertFalse(test_string_no_match)
+        self.assertFalse(test_one_string_null)
+        self.assertFalse(test_both_strings_null)

From 092c03f1926daa5ba08d80cefeaebebf358c8bfb Mon Sep 17 00:00:00 2001
From: xzdandy <xzdandy@gmail.com>
Date: Wed, 13 Sep 2023 04:07:52 -0400
Subject: [PATCH 04/23] Fix ludwig unittest cases and add unittestcase for
 normal forecasting cases

---
 .../binder/test_statement_binder.py           | 86 +++++++++++++------
 1 file changed, 61 insertions(+), 25 deletions(-)

diff --git a/test/unit_tests/binder/test_statement_binder.py b/test/unit_tests/binder/test_statement_binder.py
index 16c4842bc..184ec1e36 100644
--- a/test/unit_tests/binder/test_statement_binder.py
+++ b/test/unit_tests/binder/test_statement_binder.py
@@ -24,7 +24,6 @@
 from evadb.expression.tuple_value_expression import TupleValueExpression
 from evadb.parser.alias import Alias
 from evadb.parser.create_statement import ColumnDefinition
-from evadb.utils.generic_utils import string_comparison_case_insensitive
 
 
 def assert_not_called_with(self, *args, **kwargs):
@@ -367,18 +366,20 @@ def test_bind_create_index(self):
             col.array_dimensions = [1, 10]
             binder._bind_create_index_statement(create_index_statement)
 
-    def test_bind_create_function_should_raise(self):
+    def test_bind_create_function_should_raise_without_predict_for_ludwig(self):
         with patch.object(StatementBinder, "bind"):
             create_function_statement = MagicMock()
+            create_function_statement.function_type = "ludwig"
             create_function_statement.query.target_list = []
             create_function_statement.metadata = []
             binder = StatementBinder(StatementBinderContext(MagicMock()))
             with self.assertRaises(AssertionError):
                 binder._bind_create_function_statement(create_function_statement)
 
-    def test_bind_create_function_should_drop_row_id(self):
+    def test_bind_create_function_should_drop_row_id_for_select_star(self):
         with patch.object(StatementBinder, "bind"):
             create_function_statement = MagicMock()
+            create_function_statement.function_type = "ludwig"
             row_id_col_obj = ColumnCatalogEntry(
                 name=IDENTIFIER_COLUMN,
                 type=MagicMock(),
@@ -445,26 +446,61 @@ def test_bind_create_function_should_drop_row_id(self):
             self.assertEqual(create_function_statement.inputs, expected_inputs)
             self.assertEqual(create_function_statement.outputs, expected_outputs)
 
-    def test_string_matching_case_insensitive(self):
-        """
-        A simple test for string_matching_case_insensitve in generic_utils
-        used by statement_binder
-        """
+    def test_bind_create_function_should_bind_forecast(self):
+        with patch.object(StatementBinder, "bind"):
+            create_function_statement = MagicMock()
+            create_function_statement.function_type = "forecasting"
+            id_col_obj = ColumnCatalogEntry(
+                name="unique_id",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            ds_col_obj = ColumnCatalogEntry(
+                name="ds",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            y_col_obj = ColumnCatalogEntry(
+                name="y",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            create_function_statement.query.target_list = [
+                TupleValueExpression(
+                    name=id_col_obj.name, table_alias="a", col_object=id_col_obj
+                ),
+                TupleValueExpression(
+                    name=ds_col_obj.name, table_alias="a", col_object=ds_col_obj
+                ),
+                TupleValueExpression(
+                    name=y_col_obj.name, table_alias="a", col_object=y_col_obj
+                ),
+            ]
+            create_function_statement.metadata = []
+            binder = StatementBinder(StatementBinderContext(MagicMock()))
+            binder._bind_create_function_statement(create_function_statement)
 
-        test_string_exact_match = string_comparison_case_insensitive(
-            "HuggingFace", "HuggingFace"
-        )
-        test_string_case_insensitive_match = string_comparison_case_insensitive(
-            "HuggingFace", "hugGingFaCe"
-        )
-        test_string_no_match = string_comparison_case_insensitive(
-            "HuggingFace", "HuggingFae"
-        )
-        test_one_string_null = string_comparison_case_insensitive(None, "HuggingFace")
-        test_both_strings_null = string_comparison_case_insensitive(None, None)
-
-        assert test_string_exact_match is True
-        assert test_string_case_insensitive_match is True
-        assert test_string_no_match is False
-        assert test_one_string_null is False
-        assert test_both_strings_null is False
+            expected_inputs = [
+                ColumnDefinition(
+                    "horizon",
+                    ColumnType.INTEGER,
+                    None,
+                    None,
+                )
+            ]
+            expected_outputs = list(
+                [
+                    ColumnDefinition(
+                        col_obj.name,
+                        col_obj.type,
+                        col_obj.array_type,
+                        col_obj.array_dimensions,
+                    )
+                    for col_obj in (id_col_obj, ds_col_obj, y_col_obj)
+                ]
+            )
+            self.assertEqual(create_function_statement.inputs, expected_inputs)
+            self.assertEqual(create_function_statement.outputs, expected_outputs)

From 96e40db916342852a666380e2c16a548651a5932 Mon Sep 17 00:00:00 2001
From: xzdandy <xzdandy@gmail.com>
Date: Wed, 13 Sep 2023 04:10:24 -0400
Subject: [PATCH 05/23] Add unittest cases for forecast with rename in binder.

---
 .../binder/test_statement_binder.py           | 65 ++++++++++++++++++-
 1 file changed, 64 insertions(+), 1 deletion(-)

diff --git a/test/unit_tests/binder/test_statement_binder.py b/test/unit_tests/binder/test_statement_binder.py
index 184ec1e36..cf26f8c2b 100644
--- a/test/unit_tests/binder/test_statement_binder.py
+++ b/test/unit_tests/binder/test_statement_binder.py
@@ -446,7 +446,7 @@ def test_bind_create_function_should_drop_row_id_for_select_star(self):
             self.assertEqual(create_function_statement.inputs, expected_inputs)
             self.assertEqual(create_function_statement.outputs, expected_outputs)
 
-    def test_bind_create_function_should_bind_forecast(self):
+    def test_bind_create_function_should_bind_forecast_with_default_columns(self):
         with patch.object(StatementBinder, "bind"):
             create_function_statement = MagicMock()
             create_function_statement.function_type = "forecasting"
@@ -504,3 +504,66 @@ def test_bind_create_function_should_bind_forecast(self):
             )
             self.assertEqual(create_function_statement.inputs, expected_inputs)
             self.assertEqual(create_function_statement.outputs, expected_outputs)
+
+    def test_bind_create_function_should_bind_forecast_with_renaming_columns(self):
+        with patch.object(StatementBinder, "bind"):
+            create_function_statement = MagicMock()
+            create_function_statement.function_type = "forecasting"
+            id_col_obj = ColumnCatalogEntry(
+                name="type",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            ds_col_obj = ColumnCatalogEntry(
+                name="saledate",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            y_col_obj = ColumnCatalogEntry(
+                name="ma",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            create_function_statement.query.target_list = [
+                TupleValueExpression(
+                    name=id_col_obj.name, table_alias="a", col_object=id_col_obj
+                ),
+                TupleValueExpression(
+                    name=ds_col_obj.name, table_alias="a", col_object=ds_col_obj
+                ),
+                TupleValueExpression(
+                    name=y_col_obj.name, table_alias="a", col_object=y_col_obj
+                ),
+            ]
+            create_function_statement.metadata = [
+                ("predict", "ma"),
+                ("id", "type"),
+                ("time", "saledate"),
+            ]
+            binder = StatementBinder(StatementBinderContext(MagicMock()))
+            binder._bind_create_function_statement(create_function_statement)
+
+            expected_inputs = [
+                ColumnDefinition(
+                    "horizon",
+                    ColumnType.INTEGER,
+                    None,
+                    None,
+                )
+            ]
+            expected_outputs = list(
+                [
+                    ColumnDefinition(
+                        col_obj.name,
+                        col_obj.type,
+                        col_obj.array_type,
+                        col_obj.array_dimensions,
+                    )
+                    for col_obj in (id_col_obj, ds_col_obj, y_col_obj)
+                ]
+            )
+            self.assertEqual(create_function_statement.inputs, expected_inputs)
+            self.assertEqual(create_function_statement.outputs, expected_outputs)

From 564837104bad0180c3da34343860d68f7e912be2 Mon Sep 17 00:00:00 2001
From: xzdandy <xzdandy@gmail.com>
Date: Wed, 13 Sep 2023 04:18:19 -0400
Subject: [PATCH 06/23] Add unittest when an unexpected column is passed to
 forecasting

---
 .../binder/test_statement_binder.py           | 45 +++++++++++++++++++
 1 file changed, 45 insertions(+)

diff --git a/test/unit_tests/binder/test_statement_binder.py b/test/unit_tests/binder/test_statement_binder.py
index cf26f8c2b..877e04cc6 100644
--- a/test/unit_tests/binder/test_statement_binder.py
+++ b/test/unit_tests/binder/test_statement_binder.py
@@ -567,3 +567,48 @@ def test_bind_create_function_should_bind_forecast_with_renaming_columns(self):
             )
             self.assertEqual(create_function_statement.inputs, expected_inputs)
             self.assertEqual(create_function_statement.outputs, expected_outputs)
+
+    def test_bind_create_function_should_raise_forecast_with_unexpected_columns(self):
+        with patch.object(StatementBinder, "bind"):
+            create_function_statement = MagicMock()
+            create_function_statement.function_type = "forecasting"
+            id_col_obj = ColumnCatalogEntry(
+                name="type",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            ds_col_obj = ColumnCatalogEntry(
+                name="saledate",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            y_col_obj = ColumnCatalogEntry(
+                name="ma",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            create_function_statement.query.target_list = [
+                TupleValueExpression(
+                    name=id_col_obj.name, table_alias="a", col_object=id_col_obj
+                ),
+                TupleValueExpression(
+                    name=ds_col_obj.name, table_alias="a", col_object=ds_col_obj
+                ),
+                TupleValueExpression(
+                    name=y_col_obj.name, table_alias="a", col_object=y_col_obj
+                ),
+            ]
+            create_function_statement.metadata = [
+                ("predict", "ma"),
+                ("time", "saledate"),
+            ]
+            binder = StatementBinder(StatementBinderContext(MagicMock()))
+
+            with self.assertRaises(BinderError) as cm:
+                binder._bind_create_function_statement(create_function_statement)
+
+            err_msg = "Unexpected column type found for forecasting function."
+            self.assertEqual(str(cm.exception), err_msg)

From 8692ff1d41396132b37b08b06ecb25afb01721b1 Mon Sep 17 00:00:00 2001
From: xzdandy <xzdandy@gmail.com>
Date: Wed, 13 Sep 2023 04:21:27 -0400
Subject: [PATCH 07/23] Add unittest when required columns are missing in
 binder

---
 .../binder/test_statement_binder.py           | 37 +++++++++++++++++++
 1 file changed, 37 insertions(+)

diff --git a/test/unit_tests/binder/test_statement_binder.py b/test/unit_tests/binder/test_statement_binder.py
index 877e04cc6..6a4ee08de 100644
--- a/test/unit_tests/binder/test_statement_binder.py
+++ b/test/unit_tests/binder/test_statement_binder.py
@@ -612,3 +612,40 @@ def test_bind_create_function_should_raise_forecast_with_unexpected_columns(self
 
             err_msg = "Unexpected column type found for forecasting function."
             self.assertEqual(str(cm.exception), err_msg)
+
+    def test_bind_create_function_should_raise_forecast_missing_required_columns(self):
+        with patch.object(StatementBinder, "bind"):
+            create_function_statement = MagicMock()
+            create_function_statement.function_type = "forecasting"
+            id_col_obj = ColumnCatalogEntry(
+                name="type",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            ds_col_obj = ColumnCatalogEntry(
+                name="saledate",
+                type=MagicMock(),
+                array_type=MagicMock(),
+                array_dimensions=MagicMock(),
+            )
+            create_function_statement.query.target_list = [
+                TupleValueExpression(
+                    name=id_col_obj.name, table_alias="a", col_object=id_col_obj
+                ),
+                TupleValueExpression(
+                    name=ds_col_obj.name, table_alias="a", col_object=ds_col_obj
+                ),
+            ]
+            create_function_statement.metadata = [
+                ("id", "type"),
+                ("time", "saledate"),
+                ("predict", "ma"),
+            ]
+            binder = StatementBinder(StatementBinderContext(MagicMock()))
+
+            with self.assertRaises(AssertionError) as cm:
+                binder._bind_create_function_statement(create_function_statement)
+
+            err_msg = "Missing required {'ma'} columns for forecasting function."
+            self.assertEqual(str(cm.exception), err_msg)

From 1fd3c02ea5ff26153a83e0f21d87388f124ab418 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Wed, 13 Sep 2023 20:59:33 -0400
Subject: [PATCH 08/23] Add neuralforecast support

---
 evadb/executor/create_function_executor.py | 118 +++++++++++++++++----
 evadb/functions/forecast.py                |  14 +--
 evadb/utils/generic_utils.py               |   7 ++
 3 files changed, 112 insertions(+), 27 deletions(-)

diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index ef31e7082..d9b3f0d80 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -150,14 +150,32 @@ def handle_forecasting_function(self):
             impl_path = Path(f"{self.function_dir}/forecast.py").absolute().as_posix()
         else:
             impl_path = self.node.impl_path.absolute().as_posix()
+        library = "statsforecast"
+        supported_libraries = ["statsforecast", "neuralforecast"]
+        
+        if "horizon" not in arg_map.keys():
+            raise ValueError(
+                "Horizon must be provided while creating function of type FORECASTING"
+            )
+        try:
+            horizon = int(arg_map["horizon"])
+        except:
+            raise ValueError(
+                    "Parameter horizon must be integral."
+                )
 
-        if "model" not in arg_map.keys():
-            arg_map["model"] = "AutoARIMA"
-
-        model_name = arg_map["model"]
+        if "library" in arg_map.keys():
+            try:
+                assert arg_map["library"].lower() in supported_libraries
+            except:
+                raise ValueError(
+                    "EvaDB currently supports "+str(supported_libraries)+" only."
+                )
+            library = arg_map["library"].lower()
 
+        
         """
-        The following rename is needed for statsforecast, which requires the column name to be the following:
+        The following rename is needed for statsforecast/neuralforecast, which requires the column name to be the following:
         - The unique_id (string, int or category) represents an identifier for the series.
         - The ds (datestamp) column should be of a format expected by Pandas, ideally YYYY-MM-DD for a date or YYYY-MM-DD HH:MM:SS for a timestamp.
         - The y (numeric) represents the measurement we wish to forecast.
@@ -176,6 +194,10 @@ def handle_forecasting_function(self):
         if "ds" not in list(data.columns):
             data["ds"] = [x + 1 for x in range(len(data))]
 
+        """
+            Set or infer data frequency
+        """ 
+
         if "frequency" not in arg_map.keys():
             arg_map["frequency"] = pd.infer_freq(data["ds"])
         frequency = arg_map["frequency"]
@@ -184,17 +206,6 @@ def handle_forecasting_function(self):
                 f"Can not infer the frequency for {self.node.name}. Please explictly set it."
             )
 
-        try_to_import_forecast()
-        from statsforecast import StatsForecast
-        from statsforecast.models import AutoARIMA, AutoCES, AutoETS, AutoTheta
-
-        model_dict = {
-            "AutoARIMA": AutoARIMA,
-            "AutoCES": AutoCES,
-            "AutoETS": AutoETS,
-            "AutoTheta": AutoTheta,
-        }
-
         season_dict = {  # https://pandas.pydata.org/docs/user_guide/timeseries.html#timeseries-offset-aliases
             "H": 24,
             "M": 12,
@@ -210,9 +221,68 @@ def handle_forecasting_function(self):
             frequency.split("-")[0] if "-" in frequency else frequency
         )  # shortens longer frequencies like Q-DEC
         season_length = season_dict[new_freq] if new_freq in season_dict else 1
-        model = StatsForecast(
-            [model_dict[model_name](season_length=season_length)], freq=new_freq
-        )
+
+
+        try_to_import_forecast()
+
+        """
+            Neuralforecast implementation
+        """
+        if library == "neuralforecast":
+            from neuralforecast import NeuralForecast
+            from neuralforecast.models import NBEATS
+            from neuralforecast.auto import AutoNBEATS
+            
+            model_dict = {
+                "AutoNBEATS": AutoNBEATS,
+                "NBEATS": NBEATS,
+            }
+
+            if "model" not in arg_map.keys():
+                arg_map["model"] = "NBEATS"
+
+            try:
+                model_name = arg_map["model"]
+            except:
+                raise ValueError(
+                    "Supported models: "+str(model_dict.keys())
+                )
+            
+            model = NeuralForecast(
+                [model_dict[model_name](input_size=2 * horizon, h=horizon, max_steps=50)], freq=new_freq
+            )
+
+
+
+        # """
+        #     Statsforecast implementation
+        # """
+        else:
+            from statsforecast import StatsForecast
+            from statsforecast.models import AutoARIMA, AutoCES, AutoETS, AutoTheta
+
+            model_dict = {
+                "AutoARIMA": AutoARIMA,
+                "AutoCES": AutoCES,
+                "AutoETS": AutoETS,
+                "AutoTheta": AutoTheta,
+            }
+
+            if "model" not in arg_map.keys():
+                arg_map["model"] = "AutoARIMA"
+
+            try:
+                model_name = arg_map["model"]
+            except:
+                raise ValueError(
+                    "Supported models: "+str(model_dict.keys())
+                )
+
+
+
+            model = StatsForecast(
+                [model_dict[model_name](season_length=season_length)], freq=new_freq
+            )
 
         model_dir = os.path.join(
             self.db.config.get_value("storage", "model_dir"), self.node.name
@@ -221,13 +291,13 @@ def handle_forecasting_function(self):
         model_path = os.path.join(
             self.db.config.get_value("storage", "model_dir"),
             self.node.name,
-            str(hashlib.sha256(data.to_string().encode()).hexdigest()) + ".pkl",
+            library+"_"+str(hashlib.sha256(data.to_string().encode()).hexdigest()) + ".pkl",
         )
 
         weight_file = Path(model_path)
         data["ds"] = pd.to_datetime(data["ds"])
         if not weight_file.exists():
-            model.fit(data)
+            model.fit(df=data)
             f = open(model_path, "wb")
             pickle.dump(model, f)
             f.close()
@@ -246,6 +316,12 @@ def handle_forecasting_function(self):
             FunctionMetadataCatalogEntry(
                 "id_column_rename", arg_map.get("id", "unique_id")
             ),
+            FunctionMetadataCatalogEntry(
+                "horizon", horizon
+            ),
+            FunctionMetadataCatalogEntry(
+                "library", library
+            ),
         ]
 
         return (
diff --git a/evadb/functions/forecast.py b/evadb/functions/forecast.py
index f7cfb72f9..25a75caa5 100644
--- a/evadb/functions/forecast.py
+++ b/evadb/functions/forecast.py
@@ -21,7 +21,6 @@
 from evadb.functions.abstract.abstract_function import AbstractFunction
 from evadb.functions.decorators.decorators import setup
 
-
 class ForecastModel(AbstractFunction):
     @property
     def name(self) -> str:
@@ -35,6 +34,8 @@ def setup(
         predict_column_rename: str,
         time_column_rename: str,
         id_column_rename: str,
+        horizon: int,
+        library: str
     ):
         f = open(model_path, "rb")
         loaded_model = pickle.load(f)
@@ -44,13 +45,14 @@ def setup(
         self.predict_column_rename = predict_column_rename
         self.time_column_rename = time_column_rename
         self.id_column_rename = id_column_rename
+        self.horizon = int(horizon)
+        self.library = library
 
     def forward(self, data) -> pd.DataFrame:
-        horizon = list(data.iloc[:, -1])[0]
-        assert (
-            type(horizon) is int
-        ), "Forecast UDF expects integral horizon in parameter."
-        forecast_df = self.model.predict(h=horizon)
+        if self.library == "statsforecast":
+            forecast_df = self.model.predict(h=self.horizon)
+        else:
+            forecast_df = self.model.predict()
         forecast_df.reset_index(inplace=True)
         forecast_df = forecast_df.rename(
             columns={
diff --git a/evadb/utils/generic_utils.py b/evadb/utils/generic_utils.py
index e7836f131..3e523314e 100644
--- a/evadb/utils/generic_utils.py
+++ b/evadb/utils/generic_utils.py
@@ -277,6 +277,13 @@ def try_to_import_forecast():
             """Could not import StatsForecast python package.
                 Please install it with `pip install statsforecast`."""
         )
+    try:
+        from neuralforecast import NeuralForecast  # noqa: F401
+    except ImportError:
+        raise ValueError(
+            """Could not import NeuralForecast python package.
+                Please install it with `pip install neuralforecast`."""
+        )
 
 
 def is_ray_available() -> bool:

From 65ed6e1521018304be1e9759a18ed979e7d0ab63 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Fri, 15 Sep 2023 02:04:53 -0400
Subject: [PATCH 09/23] Reuse trained model for smaller horizons instead of retraining

---
 evadb/executor/create_function_executor.py | 102 ++++++++++++---------
 evadb/functions/forecast.py                |   5 +-
 2 files changed, 60 insertions(+), 47 deletions(-)

diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index d9b3f0d80..5dbcaeb83 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -152,28 +152,30 @@ def handle_forecasting_function(self):
             impl_path = self.node.impl_path.absolute().as_posix()
         library = "statsforecast"
         supported_libraries = ["statsforecast", "neuralforecast"]
-        
+
         if "horizon" not in arg_map.keys():
             raise ValueError(
                 "Horizon must be provided while creating function of type FORECASTING"
             )
         try:
             horizon = int(arg_map["horizon"])
-        except:
-            raise ValueError(
-                    "Parameter horizon must be integral."
-                )
+        except Exception as e:
+            err_msg = f"{str(e)}. HORIZON must be integral."
+            logger.error(err_msg)
+            raise FunctionIODefinitionError(err_msg)
 
         if "library" in arg_map.keys():
             try:
                 assert arg_map["library"].lower() in supported_libraries
-            except:
-                raise ValueError(
-                    "EvaDB currently supports "+str(supported_libraries)+" only."
+            except Exception:
+                err_msg = (
+                    "EvaDB currently supports " + str(supported_libraries) + " only."
                 )
+                logger.error(err_msg)
+                raise FunctionIODefinitionError(err_msg)
+
             library = arg_map["library"].lower()
 
-        
         """
         The following rename is needed for statsforecast/neuralforecast, which requires the column name to be the following:
         - The unique_id (string, int or category) represents an identifier for the series.
@@ -196,7 +198,7 @@ def handle_forecasting_function(self):
 
         """
             Set or infer data frequency
-        """ 
+        """
 
         if "frequency" not in arg_map.keys():
             arg_map["frequency"] = pd.infer_freq(data["ds"])
@@ -222,7 +224,6 @@ def handle_forecasting_function(self):
         )  # shortens longer frequencies like Q-DEC
         season_length = season_dict[new_freq] if new_freq in season_dict else 1
 
-
         try_to_import_forecast()
 
         """
@@ -230,9 +231,9 @@ def handle_forecasting_function(self):
         """
         if library == "neuralforecast":
             from neuralforecast import NeuralForecast
-            from neuralforecast.models import NBEATS
             from neuralforecast.auto import AutoNBEATS
-            
+            from neuralforecast.models import NBEATS
+
             model_dict = {
                 "AutoNBEATS": AutoNBEATS,
                 "NBEATS": NBEATS,
@@ -242,18 +243,17 @@ def handle_forecasting_function(self):
                 arg_map["model"] = "NBEATS"
 
             try:
-                model_name = arg_map["model"]
-            except:
-                raise ValueError(
-                    "Supported models: "+str(model_dict.keys())
-                )
-            
+                model_here = model_dict[arg_map["model"]]
+            except Exception:
+                err_msg = "Supported models: " + str(model_dict.keys())
+                logger.error(err_msg)
+                raise FunctionIODefinitionError(err_msg)
+
             model = NeuralForecast(
-                [model_dict[model_name](input_size=2 * horizon, h=horizon, max_steps=50)], freq=new_freq
+                [model_here(input_size=2 * horizon, h=horizon, max_steps=50)],
+                freq=new_freq,
             )
 
-
-
         # """
         #     Statsforecast implementation
         # """
@@ -272,40 +272,56 @@ def handle_forecasting_function(self):
                 arg_map["model"] = "AutoARIMA"
 
             try:
-                model_name = arg_map["model"]
-            except:
-                raise ValueError(
-                    "Supported models: "+str(model_dict.keys())
-                )
-
-
+                model_here = model_dict[arg_map["model"]]
+            except Exception:
+                err_msg = "Supported models: " + str(model_dict.keys())
+                logger.error(err_msg)
+                raise FunctionIODefinitionError(err_msg)
 
             model = StatsForecast(
-                [model_dict[model_name](season_length=season_length)], freq=new_freq
+                [model_here(season_length=season_length)], freq=new_freq
             )
 
+        data["ds"] = pd.to_datetime(data["ds"])
+
         model_dir = os.path.join(
-            self.db.config.get_value("storage", "model_dir"), self.node.name
-        )
-        Path(model_dir).mkdir(parents=True, exist_ok=True)
-        model_path = os.path.join(
             self.db.config.get_value("storage", "model_dir"),
             self.node.name,
-            library+"_"+str(hashlib.sha256(data.to_string().encode()).hexdigest()) + ".pkl",
         )
+        Path(model_dir).mkdir(parents=True, exist_ok=True)
 
-        weight_file = Path(model_path)
-        data["ds"] = pd.to_datetime(data["ds"])
-        if not weight_file.exists():
+        model_save_name = (
+            library
+            + "_"
+            + str(hashlib.sha256(data.to_string().encode()).hexdigest())
+            + "_horizon"
+            + str(horizon)
+            + ".pkl"
+        )
+
+        model_path = os.path.join(model_dir, model_save_name)
+
+        existing_model_files = sorted(
+            os.listdir(model_dir),
+            key=lambda x: int(x.split("horizon")[1].split(".pkl")[0]),
+        )
+        existing_model_files = [
+            x
+            for x in existing_model_files
+            if int(x.split("horizon")[1].split(".pkl")[0]) >= horizon
+        ]
+        if len(existing_model_files) == 0:
             model.fit(df=data)
             f = open(model_path, "wb")
             pickle.dump(model, f)
             f.close()
+        elif not Path(model_path).exists():
+            model_path = os.path.join(model_dir, existing_model_files[-1])
 
         io_list = self._resolve_function_io(None)
 
         metadata_here = [
-            FunctionMetadataCatalogEntry("model_name", model_name),
+            FunctionMetadataCatalogEntry("model_name", arg_map["model"]),
             FunctionMetadataCatalogEntry("model_path", model_path),
             FunctionMetadataCatalogEntry(
                 "predict_column_rename", arg_map.get("predict", "y")
@@ -316,12 +332,8 @@ def handle_forecasting_function(self):
             FunctionMetadataCatalogEntry(
                 "id_column_rename", arg_map.get("id", "unique_id")
             ),
-            FunctionMetadataCatalogEntry(
-                "horizon", horizon
-            ),
-            FunctionMetadataCatalogEntry(
-                "library", library
-            ),
+            FunctionMetadataCatalogEntry("horizon", horizon),
+            FunctionMetadataCatalogEntry("library", library),
         ]
 
         return (
diff --git a/evadb/functions/forecast.py b/evadb/functions/forecast.py
index 25a75caa5..3073ec13f 100644
--- a/evadb/functions/forecast.py
+++ b/evadb/functions/forecast.py
@@ -21,6 +21,7 @@
 from evadb.functions.abstract.abstract_function import AbstractFunction
 from evadb.functions.decorators.decorators import setup
 
+
 class ForecastModel(AbstractFunction):
     @property
     def name(self) -> str:
@@ -35,7 +36,7 @@ def setup(
         time_column_rename: str,
         id_column_rename: str,
         horizon: int,
-        library: str
+        library: str,
     ):
         f = open(model_path, "rb")
         loaded_model = pickle.load(f)
@@ -60,5 +61,5 @@ def forward(self, data) -> pd.DataFrame:
                 "ds": self.time_column_rename,
                 self.model_name: self.predict_column_rename,
             }
-        )
+        )[: self.horizon]
         return forecast_df

From be242ee82aa3e3006cbf08d80c501b164ecf125d Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Mon, 25 Sep 2023 02:57:30 -0400
Subject: [PATCH 10/23] add support for exogenous variables

---
 evadb/executor/create_function_executor.py | 41 ++++++++++++++--------
 1 file changed, 27 insertions(+), 14 deletions(-)

diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index bb038b2cb..e711882da 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -276,16 +276,16 @@ def handle_forecasting_function(self):
         """
         if library == "neuralforecast":
             from neuralforecast import NeuralForecast
-            from neuralforecast.auto import AutoNBEATS
-            from neuralforecast.models import NBEATS
+            from neuralforecast.auto import AutoNBEATS, AutoNHITS
+            from neuralforecast.models import NHITS
 
             model_dict = {
-                "AutoNBEATS": AutoNBEATS,
-                "NBEATS": NBEATS,
+                "AutoNHITS": AutoNHITS,
+                "NHITS": NHITS,
             }
 
             if "model" not in arg_map.keys():
-                arg_map["model"] = "NBEATS"
+                arg_map["model"] = "AutoNHITS"
 
             try:
                 model_here = model_dict[arg_map["model"]]
@@ -293,11 +293,21 @@ def handle_forecasting_function(self):
                 err_msg = "Supported models: " + str(model_dict.keys())
                 logger.error(err_msg)
                 raise FunctionIODefinitionError(err_msg)
+            model_args = {}
+            if "exogenous" in arg_map.keys():
+                exogenous_args = [x.strip() for x in arg_map["exogenous"].strip().split(",")]
+                model_args["hist_exog_list"] = exogenous_args
+
+            if "auto" not in arg_map["model"].lower():
+                model_args["input_size"] = 2*horizon
+                model_args["max_steps"] = 50
+            
+            model_args["h"] = horizon
 
             model = NeuralForecast(
-                [model_here(input_size=2 * horizon, h=horizon, max_steps=50)],
-                freq=new_freq,
-            )
+                    [model_here(**model_args)],
+                    freq=new_freq,
+                )
 
         # """
         #     Statsforecast implementation
@@ -323,22 +333,25 @@ def handle_forecasting_function(self):
                 logger.error(err_msg)
                 raise FunctionIODefinitionError(err_msg)
 
-            model = StatsForecast(
-                [model_here(season_length=season_length)], freq=new_freq
-            )
+
+            
+            else:
+                model = StatsForecast(
+                    [model_here(season_length=season_length)], freq=new_freq
+                )
 
         data["ds"] = pd.to_datetime(data["ds"])
 
         model_dir = os.path.join(
             self.db.config.get_value("storage", "model_dir"),
             self.node.name,
+            library,
+            arg_map["model"]
         )
         Path(model_dir).mkdir(parents=True, exist_ok=True)
 
         model_save_name = (
-            library
-            + "_"
-            + str(hashlib.sha256(data.to_string().encode()).hexdigest())
+            str(hashlib.sha256(data.to_string().encode()).hexdigest())
             + "_horizon"
             + str(horizon)
             + ".pkl"

From 583e77868603fe4a0515edd3c972e6ac6808ecbf Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Mon, 25 Sep 2023 10:49:03 -0400
Subject: [PATCH 11/23] Fix exogenous support; add tests

---
 data/forecasting/AirPassengersPanel.csv       | 289 ++++++++++++++++++
 evadb/binder/statement_binder.py              |   8 +-
 evadb/executor/create_function_executor.py    |  18 +-
 .../long/test_model_forecasting.py            |  38 ++-
 4 files changed, 342 insertions(+), 11 deletions(-)
 create mode 100644 data/forecasting/AirPassengersPanel.csv

diff --git a/data/forecasting/AirPassengersPanel.csv b/data/forecasting/AirPassengersPanel.csv
new file mode 100644
index 000000000..a62fe6ef6
--- /dev/null
+++ b/data/forecasting/AirPassengersPanel.csv
@@ -0,0 +1,289 @@
+ds,unique_id,y,trend,ylagged
+1949-01-31,Airline1,112.0,0,112.0
+1949-02-28,Airline1,118.0,1,118.0
+1949-03-31,Airline1,132.0,2,132.0
+1949-04-30,Airline1,129.0,3,129.0
+1949-05-31,Airline1,121.0,4,121.0
+1949-06-30,Airline1,135.0,5,135.0
+1949-07-31,Airline1,148.0,6,148.0
+1949-08-31,Airline1,148.0,7,148.0
+1949-09-30,Airline1,136.0,8,136.0
+1949-10-31,Airline1,119.0,9,119.0
+1949-11-30,Airline1,104.0,10,104.0
+1949-12-31,Airline1,118.0,11,118.0
+1950-01-31,Airline1,115.0,12,112.0
+1950-02-28,Airline1,126.0,13,118.0
+1950-03-31,Airline1,141.0,14,132.0
+1950-04-30,Airline1,135.0,15,129.0
+1950-05-31,Airline1,125.0,16,121.0
+1950-06-30,Airline1,149.0,17,135.0
+1950-07-31,Airline1,170.0,18,148.0
+1950-08-31,Airline1,170.0,19,148.0
+1950-09-30,Airline1,158.0,20,136.0
+1950-10-31,Airline1,133.0,21,119.0
+1950-11-30,Airline1,114.0,22,104.0
+1950-12-31,Airline1,140.0,23,118.0
+1951-01-31,Airline1,145.0,24,115.0
+1951-02-28,Airline1,150.0,25,126.0
+1951-03-31,Airline1,178.0,26,141.0
+1951-04-30,Airline1,163.0,27,135.0
+1951-05-31,Airline1,172.0,28,125.0
+1951-06-30,Airline1,178.0,29,149.0
+1951-07-31,Airline1,199.0,30,170.0
+1951-08-31,Airline1,199.0,31,170.0
+1951-09-30,Airline1,184.0,32,158.0
+1951-10-31,Airline1,162.0,33,133.0
+1951-11-30,Airline1,146.0,34,114.0
+1951-12-31,Airline1,166.0,35,140.0
+1952-01-31,Airline1,171.0,36,145.0
+1952-02-29,Airline1,180.0,37,150.0
+1952-03-31,Airline1,193.0,38,178.0
+1952-04-30,Airline1,181.0,39,163.0
+1952-05-31,Airline1,183.0,40,172.0
+1952-06-30,Airline1,218.0,41,178.0
+1952-07-31,Airline1,230.0,42,199.0
+1952-08-31,Airline1,242.0,43,199.0
+1952-09-30,Airline1,209.0,44,184.0
+1952-10-31,Airline1,191.0,45,162.0
+1952-11-30,Airline1,172.0,46,146.0
+1952-12-31,Airline1,194.0,47,166.0
+1953-01-31,Airline1,196.0,48,171.0
+1953-02-28,Airline1,196.0,49,180.0
+1953-03-31,Airline1,236.0,50,193.0
+1953-04-30,Airline1,235.0,51,181.0
+1953-05-31,Airline1,229.0,52,183.0
+1953-06-30,Airline1,243.0,53,218.0
+1953-07-31,Airline1,264.0,54,230.0
+1953-08-31,Airline1,272.0,55,242.0
+1953-09-30,Airline1,237.0,56,209.0
+1953-10-31,Airline1,211.0,57,191.0
+1953-11-30,Airline1,180.0,58,172.0
+1953-12-31,Airline1,201.0,59,194.0
+1954-01-31,Airline1,204.0,60,196.0
+1954-02-28,Airline1,188.0,61,196.0
+1954-03-31,Airline1,235.0,62,236.0
+1954-04-30,Airline1,227.0,63,235.0
+1954-05-31,Airline1,234.0,64,229.0
+1954-06-30,Airline1,264.0,65,243.0
+1954-07-31,Airline1,302.0,66,264.0
+1954-08-31,Airline1,293.0,67,272.0
+1954-09-30,Airline1,259.0,68,237.0
+1954-10-31,Airline1,229.0,69,211.0
+1954-11-30,Airline1,203.0,70,180.0
+1954-12-31,Airline1,229.0,71,201.0
+1955-01-31,Airline1,242.0,72,204.0
+1955-02-28,Airline1,233.0,73,188.0
+1955-03-31,Airline1,267.0,74,235.0
+1955-04-30,Airline1,269.0,75,227.0
+1955-05-31,Airline1,270.0,76,234.0
+1955-06-30,Airline1,315.0,77,264.0
+1955-07-31,Airline1,364.0,78,302.0
+1955-08-31,Airline1,347.0,79,293.0
+1955-09-30,Airline1,312.0,80,259.0
+1955-10-31,Airline1,274.0,81,229.0
+1955-11-30,Airline1,237.0,82,203.0
+1955-12-31,Airline1,278.0,83,229.0
+1956-01-31,Airline1,284.0,84,242.0
+1956-02-29,Airline1,277.0,85,233.0
+1956-03-31,Airline1,317.0,86,267.0
+1956-04-30,Airline1,313.0,87,269.0
+1956-05-31,Airline1,318.0,88,270.0
+1956-06-30,Airline1,374.0,89,315.0
+1956-07-31,Airline1,413.0,90,364.0
+1956-08-31,Airline1,405.0,91,347.0
+1956-09-30,Airline1,355.0,92,312.0
+1956-10-31,Airline1,306.0,93,274.0
+1956-11-30,Airline1,271.0,94,237.0
+1956-12-31,Airline1,306.0,95,278.0
+1957-01-31,Airline1,315.0,96,284.0
+1957-02-28,Airline1,301.0,97,277.0
+1957-03-31,Airline1,356.0,98,317.0
+1957-04-30,Airline1,348.0,99,313.0
+1957-05-31,Airline1,355.0,100,318.0
+1957-06-30,Airline1,422.0,101,374.0
+1957-07-31,Airline1,465.0,102,413.0
+1957-08-31,Airline1,467.0,103,405.0
+1957-09-30,Airline1,404.0,104,355.0
+1957-10-31,Airline1,347.0,105,306.0
+1957-11-30,Airline1,305.0,106,271.0
+1957-12-31,Airline1,336.0,107,306.0
+1958-01-31,Airline1,340.0,108,315.0
+1958-02-28,Airline1,318.0,109,301.0
+1958-03-31,Airline1,362.0,110,356.0
+1958-04-30,Airline1,348.0,111,348.0
+1958-05-31,Airline1,363.0,112,355.0
+1958-06-30,Airline1,435.0,113,422.0
+1958-07-31,Airline1,491.0,114,465.0
+1958-08-31,Airline1,505.0,115,467.0
+1958-09-30,Airline1,404.0,116,404.0
+1958-10-31,Airline1,359.0,117,347.0
+1958-11-30,Airline1,310.0,118,305.0
+1958-12-31,Airline1,337.0,119,336.0
+1959-01-31,Airline1,360.0,120,340.0
+1959-02-28,Airline1,342.0,121,318.0
+1959-03-31,Airline1,406.0,122,362.0
+1959-04-30,Airline1,396.0,123,348.0
+1959-05-31,Airline1,420.0,124,363.0
+1959-06-30,Airline1,472.0,125,435.0
+1959-07-31,Airline1,548.0,126,491.0
+1959-08-31,Airline1,559.0,127,505.0
+1959-09-30,Airline1,463.0,128,404.0
+1959-10-31,Airline1,407.0,129,359.0
+1959-11-30,Airline1,362.0,130,310.0
+1959-12-31,Airline1,405.0,131,337.0
+1960-01-31,Airline1,417.0,132,360.0
+1960-02-29,Airline1,391.0,133,342.0
+1960-03-31,Airline1,419.0,134,406.0
+1960-04-30,Airline1,461.0,135,396.0
+1960-05-31,Airline1,472.0,136,420.0
+1960-06-30,Airline1,535.0,137,472.0
+1960-07-31,Airline1,622.0,138,548.0
+1960-08-31,Airline1,606.0,139,559.0
+1960-09-30,Airline1,508.0,140,463.0
+1960-10-31,Airline1,461.0,141,407.0
+1960-11-30,Airline1,390.0,142,362.0
+1960-12-31,Airline1,432.0,143,405.0
+1949-01-31,Airline2,412.0,144,412.0
+1949-02-28,Airline2,418.0,145,418.0
+1949-03-31,Airline2,432.0,146,432.0
+1949-04-30,Airline2,429.0,147,429.0
+1949-05-31,Airline2,421.0,148,421.0
+1949-06-30,Airline2,435.0,149,435.0
+1949-07-31,Airline2,448.0,150,448.0
+1949-08-31,Airline2,448.0,151,448.0
+1949-09-30,Airline2,436.0,152,436.0
+1949-10-31,Airline2,419.0,153,419.0
+1949-11-30,Airline2,404.0,154,404.0
+1949-12-31,Airline2,418.0,155,418.0
+1950-01-31,Airline2,415.0,156,412.0
+1950-02-28,Airline2,426.0,157,418.0
+1950-03-31,Airline2,441.0,158,432.0
+1950-04-30,Airline2,435.0,159,429.0
+1950-05-31,Airline2,425.0,160,421.0
+1950-06-30,Airline2,449.0,161,435.0
+1950-07-31,Airline2,470.0,162,448.0
+1950-08-31,Airline2,470.0,163,448.0
+1950-09-30,Airline2,458.0,164,436.0
+1950-10-31,Airline2,433.0,165,419.0
+1950-11-30,Airline2,414.0,166,404.0
+1950-12-31,Airline2,440.0,167,418.0
+1951-01-31,Airline2,445.0,168,415.0
+1951-02-28,Airline2,450.0,169,426.0
+1951-03-31,Airline2,478.0,170,441.0
+1951-04-30,Airline2,463.0,171,435.0
+1951-05-31,Airline2,472.0,172,425.0
+1951-06-30,Airline2,478.0,173,449.0
+1951-07-31,Airline2,499.0,174,470.0
+1951-08-31,Airline2,499.0,175,470.0
+1951-09-30,Airline2,484.0,176,458.0
+1951-10-31,Airline2,462.0,177,433.0
+1951-11-30,Airline2,446.0,178,414.0
+1951-12-31,Airline2,466.0,179,440.0
+1952-01-31,Airline2,471.0,180,445.0
+1952-02-29,Airline2,480.0,181,450.0
+1952-03-31,Airline2,493.0,182,478.0
+1952-04-30,Airline2,481.0,183,463.0
+1952-05-31,Airline2,483.0,184,472.0
+1952-06-30,Airline2,518.0,185,478.0
+1952-07-31,Airline2,530.0,186,499.0
+1952-08-31,Airline2,542.0,187,499.0
+1952-09-30,Airline2,509.0,188,484.0
+1952-10-31,Airline2,491.0,189,462.0
+1952-11-30,Airline2,472.0,190,446.0
+1952-12-31,Airline2,494.0,191,466.0
+1953-01-31,Airline2,496.0,192,471.0
+1953-02-28,Airline2,496.0,193,480.0
+1953-03-31,Airline2,536.0,194,493.0
+1953-04-30,Airline2,535.0,195,481.0
+1953-05-31,Airline2,529.0,196,483.0
+1953-06-30,Airline2,543.0,197,518.0
+1953-07-31,Airline2,564.0,198,530.0
+1953-08-31,Airline2,572.0,199,542.0
+1953-09-30,Airline2,537.0,200,509.0
+1953-10-31,Airline2,511.0,201,491.0
+1953-11-30,Airline2,480.0,202,472.0
+1953-12-31,Airline2,501.0,203,494.0
+1954-01-31,Airline2,504.0,204,496.0
+1954-02-28,Airline2,488.0,205,496.0
+1954-03-31,Airline2,535.0,206,536.0
+1954-04-30,Airline2,527.0,207,535.0
+1954-05-31,Airline2,534.0,208,529.0
+1954-06-30,Airline2,564.0,209,543.0
+1954-07-31,Airline2,602.0,210,564.0
+1954-08-31,Airline2,593.0,211,572.0
+1954-09-30,Airline2,559.0,212,537.0
+1954-10-31,Airline2,529.0,213,511.0
+1954-11-30,Airline2,503.0,214,480.0
+1954-12-31,Airline2,529.0,215,501.0
+1955-01-31,Airline2,542.0,216,504.0
+1955-02-28,Airline2,533.0,217,488.0
+1955-03-31,Airline2,567.0,218,535.0
+1955-04-30,Airline2,569.0,219,527.0
+1955-05-31,Airline2,570.0,220,534.0
+1955-06-30,Airline2,615.0,221,564.0
+1955-07-31,Airline2,664.0,222,602.0
+1955-08-31,Airline2,647.0,223,593.0
+1955-09-30,Airline2,612.0,224,559.0
+1955-10-31,Airline2,574.0,225,529.0
+1955-11-30,Airline2,537.0,226,503.0
+1955-12-31,Airline2,578.0,227,529.0
+1956-01-31,Airline2,584.0,228,542.0
+1956-02-29,Airline2,577.0,229,533.0
+1956-03-31,Airline2,617.0,230,567.0
+1956-04-30,Airline2,613.0,231,569.0
+1956-05-31,Airline2,618.0,232,570.0
+1956-06-30,Airline2,674.0,233,615.0
+1956-07-31,Airline2,713.0,234,664.0
+1956-08-31,Airline2,705.0,235,647.0
+1956-09-30,Airline2,655.0,236,612.0
+1956-10-31,Airline2,606.0,237,574.0
+1956-11-30,Airline2,571.0,238,537.0
+1956-12-31,Airline2,606.0,239,578.0
+1957-01-31,Airline2,615.0,240,584.0
+1957-02-28,Airline2,601.0,241,577.0
+1957-03-31,Airline2,656.0,242,617.0
+1957-04-30,Airline2,648.0,243,613.0
+1957-05-31,Airline2,655.0,244,618.0
+1957-06-30,Airline2,722.0,245,674.0
+1957-07-31,Airline2,765.0,246,713.0
+1957-08-31,Airline2,767.0,247,705.0
+1957-09-30,Airline2,704.0,248,655.0
+1957-10-31,Airline2,647.0,249,606.0
+1957-11-30,Airline2,605.0,250,571.0
+1957-12-31,Airline2,636.0,251,606.0
+1958-01-31,Airline2,640.0,252,615.0
+1958-02-28,Airline2,618.0,253,601.0
+1958-03-31,Airline2,662.0,254,656.0
+1958-04-30,Airline2,648.0,255,648.0
+1958-05-31,Airline2,663.0,256,655.0
+1958-06-30,Airline2,735.0,257,722.0
+1958-07-31,Airline2,791.0,258,765.0
+1958-08-31,Airline2,805.0,259,767.0
+1958-09-30,Airline2,704.0,260,704.0
+1958-10-31,Airline2,659.0,261,647.0
+1958-11-30,Airline2,610.0,262,605.0
+1958-12-31,Airline2,637.0,263,636.0
+1959-01-31,Airline2,660.0,264,640.0
+1959-02-28,Airline2,642.0,265,618.0
+1959-03-31,Airline2,706.0,266,662.0
+1959-04-30,Airline2,696.0,267,648.0
+1959-05-31,Airline2,720.0,268,663.0
+1959-06-30,Airline2,772.0,269,735.0
+1959-07-31,Airline2,848.0,270,791.0
+1959-08-31,Airline2,859.0,271,805.0
+1959-09-30,Airline2,763.0,272,704.0
+1959-10-31,Airline2,707.0,273,659.0
+1959-11-30,Airline2,662.0,274,610.0
+1959-12-31,Airline2,705.0,275,637.0
+1960-01-31,Airline2,717.0,276,660.0
+1960-02-29,Airline2,691.0,277,642.0
+1960-03-31,Airline2,719.0,278,706.0
+1960-04-30,Airline2,761.0,279,696.0
+1960-05-31,Airline2,772.0,280,720.0
+1960-06-30,Airline2,835.0,281,772.0
+1960-07-31,Airline2,922.0,282,848.0
+1960-08-31,Airline2,906.0,283,859.0
+1960-09-30,Airline2,808.0,284,763.0
+1960-10-31,Airline2,761.0,285,707.0
+1960-11-30,Airline2,690.0,286,662.0
+1960-12-31,Airline2,732.0,287,705.0
diff --git a/evadb/binder/statement_binder.py b/evadb/binder/statement_binder.py
index bee37f922..2b57229a6 100644
--- a/evadb/binder/statement_binder.py
+++ b/evadb/binder/statement_binder.py
@@ -126,10 +126,10 @@ def _bind_create_function_statement(self, node: CreateFunctionStatement):
                     elif column.name == arg_map.get("predict", "y"):
                         outputs.append(column)
                         required_columns.remove(column.name)
-                    else:
-                        raise BinderError(
-                            f"Unexpected column {column.name} found for forecasting function."
-                        )
+                    # else:
+                    #     raise BinderError(
+                    #         f"Unexpected column {column.name} found for forecasting function."
+                    #     )
                 assert (
                     len(required_columns) == 0
                 ), f"Missing required {required_columns} columns for forecasting function."
diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index e711882da..1393b9567 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -244,7 +244,7 @@ def handle_forecasting_function(self):
         """
             Set or infer data frequency
         """
-
+        
         if "frequency" not in arg_map.keys():
             arg_map["frequency"] = pd.infer_freq(data["ds"])
         frequency = arg_map["frequency"]
@@ -277,15 +277,17 @@ def handle_forecasting_function(self):
         if library == "neuralforecast":
             from neuralforecast import NeuralForecast
             from neuralforecast.auto import AutoNBEATS, AutoNHITS
-            from neuralforecast.models import NHITS
+            from neuralforecast.models import NBEATS, NHITS
 
             model_dict = {
+                "AutoNBEATS": AutoNBEATS,
                 "AutoNHITS": AutoNHITS,
+                "NBEATS": NBEATS,
                 "NHITS": NHITS,
             }
 
             if "model" not in arg_map.keys():
-                arg_map["model"] = "AutoNHITS"
+                arg_map["model"] = "NBEATS"
 
             try:
                 model_here = model_dict[arg_map["model"]]
@@ -342,17 +344,21 @@ def handle_forecasting_function(self):
 
         data["ds"] = pd.to_datetime(data["ds"])
 
+        encoding_text = data.to_string()
+        if "exogenous" in arg_map.keys():
+            encoding_text += "exogenous_"+str(sorted(exogenous_args))
+
         model_dir = os.path.join(
             self.db.config.get_value("storage", "model_dir"),
             self.node.name,
             library,
-            arg_map["model"]
+            arg_map["model"],
+            str(hashlib.sha256(encoding_text.encode()).hexdigest())
         )
         Path(model_dir).mkdir(parents=True, exist_ok=True)
 
         model_save_name = (
-            str(hashlib.sha256(data.to_string().encode()).hexdigest())
-            + "_horizon"
+            "horizon"
             + str(horizon)
             + ".pkl"
         )
diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index 2a9b266c7..2a807612f 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -30,6 +30,7 @@ def setUpClass(cls):
         # reset the catalog manager before running each test
         cls.evadb.catalog().reset()
 
+
         create_table_query = """
             CREATE TABLE AirData (\
             unique_id TEXT(30),\
@@ -37,6 +38,15 @@ def setUpClass(cls):
             y INTEGER);"""
         execute_query_fetch_all(cls.evadb, create_table_query)
 
+        create_table_query = """
+            CREATE TABLE AirDataPanel (\
+            unique_id TEXT(30),\
+            ds TEXT(30),\
+            y INTEGER,\
+            trend INTEGER,\
+            ylagged INTEGER);"""
+        execute_query_fetch_all(cls.evadb, create_table_query)
+
         create_table_query = """
             CREATE TABLE HomeData (\
             saledate TEXT(30),\
@@ -49,6 +59,10 @@ def setUpClass(cls):
         load_query = f"LOAD CSV '{path}' INTO AirData;"
         execute_query_fetch_all(cls.evadb, load_query)
 
+        path = f"{EvaDB_ROOT_DIR}/data/forecasting/ AirPassengersPanel.csv"
+        load_query = f"LOAD CSV '{path}' INTO AirDataPanel;"
+        execute_query_fetch_all(cls.evadb, load_query)
+
         path = f"{EvaDB_ROOT_DIR}/data/forecasting/home_sales.csv"
         load_query = f"LOAD CSV '{path}' INTO HomeData;"
         execute_query_fetch_all(cls.evadb, load_query)
@@ -69,13 +83,14 @@ def test_forecast(self):
         create_predict_udf = """
             CREATE FUNCTION AirForecast FROM
             (SELECT unique_id, ds, y FROM AirData)
+            HORIZON 12
             TYPE Forecasting
             PREDICT 'y';
         """
         execute_query_fetch_all(self.evadb, create_predict_udf)
 
         predict_query = """
-            SELECT AirForecast(12) order by y;
+            SELECT AirForecast() order by y;
         """
         result = execute_query_fetch_all(self.evadb, predict_query)
         self.assertEqual(len(result), 12)
@@ -83,6 +98,27 @@ def test_forecast(self):
             result.columns, ["airforecast.unique_id", "airforecast.ds", "airforecast.y"]
         )
 
+        create_predict_udf = """
+            CREATE FUNCTION AirPanelForecast FROM
+            (SELECT unique_id, ds, y, trend FROM AirDataPanel)
+            HORIZON 12
+            TYPE Forecasting
+            PREDICT 'y'
+            LIBRARY 'neuralforecast'
+            EXOGENOUS 'trend'
+            FREQUENCY 'M';
+        """
+        execute_query_fetch_all(self.evadb, create_predict_udf)
+
+        predict_query = """
+            SELECT AirPanelForecast() order by y;
+        """
+        result = execute_query_fetch_all(self.evadb, predict_query)
+        self.assertEqual(len(result), 12)
+        self.assertEqual(
+            result.columns, ["airpanelforecast.unique_id", "airpanelforecast.ds", "airpanelforecast.y"]
+        )
+
     @forecast_skip_marker
     def test_forecast_with_column_rename(self):
         create_predict_udf = """

From 52c563e2d81d27e68df9956ccf084a0b9f480d6f Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Mon, 25 Sep 2023 11:01:39 -0400
Subject: [PATCH 12/23] add tests

---
 .../source/reference/ai/model-forecasting.rst |  6 +++-
 evadb/executor/create_function_executor.py    | 28 ++++++++-----------
 setup.py                                      |  1 +
 .../long/test_model_forecasting.py            |  4 +--
 4 files changed, 20 insertions(+), 19 deletions(-)

diff --git a/docs/source/reference/ai/model-forecasting.rst b/docs/source/reference/ai/model-forecasting.rst
index ac6152783..be09f473a 100644
--- a/docs/source/reference/ai/model-forecasting.rst
+++ b/docs/source/reference/ai/model-forecasting.rst
@@ -53,8 +53,12 @@ EvaDB's default forecast framework is `statsforecast <https://nixtla.github.io/s
      - The name of the column that contains the datestamp, wihch should be of a format expected by Pandas, ideally YYYY-MM-DD for a date or YYYY-MM-DD HH:MM:SS for a timestamp. Please visit the `pandas documentation <https://pandas.pydata.org/docs/reference/api/pandas.to_datetime.html>`_ for details. If not provided, an auto increasing ID column will be used.
    * - ID
      - The name of column that represents an identifier for the series. If not provided, the whole table is considered as one series of data.
+   * - LIBRARY
+     - We can select one of `statsforecast` (default) or `neuralforecast`. `statsforecast` provides access to statistical forecasting methods, while `neuralforecast` gives access to deep-learning based forecasting methods.
    * - MODEL
-     - We can select one of AutoARIMA, AutoCES, AutoETS, AutoTheta. The default is AutoARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models.
+     - If LIBRARY is `statsforecast`, we can select one of AutoARIMA, AutoCES, AutoETS, AutoTheta. The default is AutoARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models. If LIBRARY is `neuralforecast`, we can select one of NHITS or NBEATS. The default is NBEATS. Check `Automatic Forecasting <https://nixtla.github.io/neuralforecast/models.nbeats.html>`_ for details.
+   * - EXOGENOUS
+     - The names of columns to be treated as exogenous variables, separated by comma. These columns would be considered for forecasting by the backend only for LIBRARY `neuralforecast`.
    * - Frequency
      - A string indicating the frequency of the data. The common used ones are D, W, M, Y, which repestively represents day-, week-, month- and year- end frequency. The default value is M. Check `pandas available frequencies <https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#offset-aliases>`_ for all available frequencies.
 
diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index 1393b9567..c88c86a06 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -244,7 +244,7 @@ def handle_forecasting_function(self):
         """
             Set or infer data frequency
         """
-        
+
         if "frequency" not in arg_map.keys():
             arg_map["frequency"] = pd.infer_freq(data["ds"])
         frequency = arg_map["frequency"]
@@ -297,19 +297,21 @@ def handle_forecasting_function(self):
                 raise FunctionIODefinitionError(err_msg)
             model_args = {}
             if "exogenous" in arg_map.keys():
-                exogenous_args = [x.strip() for x in arg_map["exogenous"].strip().split(",")]
+                exogenous_args = [
+                    x.strip() for x in arg_map["exogenous"].strip().split(",")
+                ]
                 model_args["hist_exog_list"] = exogenous_args
 
             if "auto" not in arg_map["model"].lower():
-                model_args["input_size"] = 2*horizon
+                model_args["input_size"] = 2 * horizon
                 model_args["max_steps"] = 50
-            
+
             model_args["h"] = horizon
 
             model = NeuralForecast(
-                    [model_here(**model_args)],
-                    freq=new_freq,
-                )
+                [model_here(**model_args)],
+                freq=new_freq,
+            )
 
         # """
         #     Statsforecast implementation
@@ -335,8 +337,6 @@ def handle_forecasting_function(self):
                 logger.error(err_msg)
                 raise FunctionIODefinitionError(err_msg)
 
-
-            
             else:
                 model = StatsForecast(
                     [model_here(season_length=season_length)], freq=new_freq
@@ -346,22 +346,18 @@ def handle_forecasting_function(self):
 
         encoding_text = data.to_string()
         if "exogenous" in arg_map.keys():
-            encoding_text += "exogenous_"+str(sorted(exogenous_args))
+            encoding_text += "exogenous_" + str(sorted(exogenous_args))
 
         model_dir = os.path.join(
             self.db.config.get_value("storage", "model_dir"),
             self.node.name,
             library,
             arg_map["model"],
-            str(hashlib.sha256(encoding_text.encode()).hexdigest())
+            str(hashlib.sha256(encoding_text.encode()).hexdigest()),
         )
         Path(model_dir).mkdir(parents=True, exist_ok=True)
 
-        model_save_name = (
-            "horizon"
-            + str(horizon)
-            + ".pkl"
-        )
+        model_save_name = "horizon" + str(horizon) + ".pkl"
 
         model_path = os.path.join(model_dir, model_save_name)
 
diff --git a/setup.py b/setup.py
index 4389b3c2e..c050fd9cd 100644
--- a/setup.py
+++ b/setup.py
@@ -120,6 +120,7 @@ def read(path, encoding="utf-8"):
 
 forecasting_libs = [
     "statsforecast" # MODEL TRAIN AND FINE TUNING
+    "neuralforecast" # MODEL TRAIN AND FINE TUNING
 ]
 
 ### NEEDED FOR DEVELOPER TESTING ONLY
diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index 2a807612f..d18649e59 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -30,7 +30,6 @@ def setUpClass(cls):
         # reset the catalog manager before running each test
         cls.evadb.catalog().reset()
 
-
         create_table_query = """
             CREATE TABLE AirData (\
             unique_id TEXT(30),\
@@ -116,7 +115,8 @@ def test_forecast(self):
         result = execute_query_fetch_all(self.evadb, predict_query)
         self.assertEqual(len(result), 12)
         self.assertEqual(
-            result.columns, ["airpanelforecast.unique_id", "airpanelforecast.ds", "airpanelforecast.y"]
+            result.columns,
+            ["airpanelforecast.unique_id", "airpanelforecast.ds", "airpanelforecast.y"],
         )
 
     @forecast_skip_marker

From 84a159e9c681feb75ac78ba1ec3c63618a0ac14a Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Mon, 25 Sep 2023 14:08:47 -0400
Subject: [PATCH 13/23] wip: fix test

---
 docs/source/reference/ai/model-forecasting.rst        | 2 +-
 setup.py                                              | 2 +-
 test/integration_tests/long/test_model_forecasting.py | 6 +++---
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/docs/source/reference/ai/model-forecasting.rst b/docs/source/reference/ai/model-forecasting.rst
index be09f473a..0234aefdf 100644
--- a/docs/source/reference/ai/model-forecasting.rst
+++ b/docs/source/reference/ai/model-forecasting.rst
@@ -56,7 +56,7 @@ EvaDB's default forecast framework is `statsforecast <https://nixtla.github.io/s
    * - LIBRARY
      - We can select one of `statsforecast` (default) or `neuralforecast`. `statsforecast` provides access to statistical forecasting methods, while `neuralforecast` gives access to deep-learning based forecasting methods.
    * - MODEL
-     - If LIBRARY is `statsforecast`, we can select one of AutoARIMA, AutoCES, AutoETS, AutoTheta. The default is AutoARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models. If LIBRARY is `neuralforecast`, we can select one of NHITS or NBEATS. The default is NBEATS. Check `Automatic Forecasting <https://nixtla.github.io/neuralforecast/models.nbeats.html>`_ for details.
+     - If LIBRARY is `statsforecast`, we can select one of AutoARIMA, AutoCES, AutoETS, AutoTheta. The default is AutoARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models. If LIBRARY is `neuralforecast`, we can select one of NHITS or NBEATS. The default is NBEATS. Check `NBEATS docs <https://nixtla.github.io/neuralforecast/models.nbeats.html>`_ for details.
    * - EXOGENOUS
      - The names of columns to be treated as exogenous variables, separated by comma. These columns would be considered for forecasting by the backend only for LIBRARY `neuralforecast`.
    * - Frequency
diff --git a/setup.py b/setup.py
index c050fd9cd..87833578d 100644
--- a/setup.py
+++ b/setup.py
@@ -119,7 +119,7 @@ def read(path, encoding="utf-8"):
 ludwig_libs = ["ludwig[hyperopt,distributed]"]  # MODEL TRAIN AND FINE TUNING
 
 forecasting_libs = [
-    "statsforecast" # MODEL TRAIN AND FINE TUNING
+    "statsforecast", # MODEL TRAIN AND FINE TUNING
     "neuralforecast" # MODEL TRAIN AND FINE TUNING
 ]
 
diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index d18649e59..1941a4c71 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -58,7 +58,7 @@ def setUpClass(cls):
         load_query = f"LOAD CSV '{path}' INTO AirData;"
         execute_query_fetch_all(cls.evadb, load_query)
 
-        path = f"{EvaDB_ROOT_DIR}/data/forecasting/ AirPassengersPanel.csv"
+        path = f"{EvaDB_ROOT_DIR}/data/forecasting/AirPassengersPanel.csv"
         load_query = f"LOAD CSV '{path}' INTO AirDataPanel;"
         execute_query_fetch_all(cls.evadb, load_query)
 
@@ -82,8 +82,8 @@ def test_forecast(self):
         create_predict_udf = """
             CREATE FUNCTION AirForecast FROM
             (SELECT unique_id, ds, y FROM AirData)
-            HORIZON 12
             TYPE Forecasting
+            HORIZON 12
             PREDICT 'y';
         """
         execute_query_fetch_all(self.evadb, create_predict_udf)
@@ -100,8 +100,8 @@ def test_forecast(self):
         create_predict_udf = """
             CREATE FUNCTION AirPanelForecast FROM
             (SELECT unique_id, ds, y, trend FROM AirDataPanel)
-            HORIZON 12
             TYPE Forecasting
+            HORIZON 12
             PREDICT 'y'
             LIBRARY 'neuralforecast'
             EXOGENOUS 'trend'

From 06a7db0bb21703084816d03ff65a9b72aedb4f49 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Mon, 25 Sep 2023 15:21:31 -0400
Subject: [PATCH 14/23] remove strict column check in test

---
 .../binder/test_statement_binder.py           | 88 +++++++++----------
 1 file changed, 44 insertions(+), 44 deletions(-)

diff --git a/test/unit_tests/binder/test_statement_binder.py b/test/unit_tests/binder/test_statement_binder.py
index 6a4ee08de..e267250f6 100644
--- a/test/unit_tests/binder/test_statement_binder.py
+++ b/test/unit_tests/binder/test_statement_binder.py
@@ -568,50 +568,50 @@ def test_bind_create_function_should_bind_forecast_with_renaming_columns(self):
             self.assertEqual(create_function_statement.inputs, expected_inputs)
             self.assertEqual(create_function_statement.outputs, expected_outputs)
 
-    def test_bind_create_function_should_raise_forecast_with_unexpected_columns(self):
-        with patch.object(StatementBinder, "bind"):
-            create_function_statement = MagicMock()
-            create_function_statement.function_type = "forecasting"
-            id_col_obj = ColumnCatalogEntry(
-                name="type",
-                type=MagicMock(),
-                array_type=MagicMock(),
-                array_dimensions=MagicMock(),
-            )
-            ds_col_obj = ColumnCatalogEntry(
-                name="saledate",
-                type=MagicMock(),
-                array_type=MagicMock(),
-                array_dimensions=MagicMock(),
-            )
-            y_col_obj = ColumnCatalogEntry(
-                name="ma",
-                type=MagicMock(),
-                array_type=MagicMock(),
-                array_dimensions=MagicMock(),
-            )
-            create_function_statement.query.target_list = [
-                TupleValueExpression(
-                    name=id_col_obj.name, table_alias="a", col_object=id_col_obj
-                ),
-                TupleValueExpression(
-                    name=ds_col_obj.name, table_alias="a", col_object=ds_col_obj
-                ),
-                TupleValueExpression(
-                    name=y_col_obj.name, table_alias="a", col_object=y_col_obj
-                ),
-            ]
-            create_function_statement.metadata = [
-                ("predict", "ma"),
-                ("time", "saledate"),
-            ]
-            binder = StatementBinder(StatementBinderContext(MagicMock()))
-
-            with self.assertRaises(BinderError) as cm:
-                binder._bind_create_function_statement(create_function_statement)
-
-            err_msg = "Unexpected column type found for forecasting function."
-            self.assertEqual(str(cm.exception), err_msg)
+    # def test_bind_create_function_should_raise_forecast_with_unexpected_columns(self):
+    #     with patch.object(StatementBinder, "bind"):
+    #         create_function_statement = MagicMock()
+    #         create_function_statement.function_type = "forecasting"
+    #         id_col_obj = ColumnCatalogEntry(
+    #             name="type",
+    #             type=MagicMock(),
+    #             array_type=MagicMock(),
+    #             array_dimensions=MagicMock(),
+    #         )
+    #         ds_col_obj = ColumnCatalogEntry(
+    #             name="saledate",
+    #             type=MagicMock(),
+    #             array_type=MagicMock(),
+    #             array_dimensions=MagicMock(),
+    #         )
+    #         y_col_obj = ColumnCatalogEntry(
+    #             name="ma",
+    #             type=MagicMock(),
+    #             array_type=MagicMock(),
+    #             array_dimensions=MagicMock(),
+    #         )
+    #         create_function_statement.query.target_list = [
+    #             TupleValueExpression(
+    #                 name=id_col_obj.name, table_alias="a", col_object=id_col_obj
+    #             ),
+    #             TupleValueExpression(
+    #                 name=ds_col_obj.name, table_alias="a", col_object=ds_col_obj
+    #             ),
+    #             TupleValueExpression(
+    #                 name=y_col_obj.name, table_alias="a", col_object=y_col_obj
+    #             ),
+    #         ]
+    #         create_function_statement.metadata = [
+    #             ("predict", "ma"),
+    #             ("time", "saledate"),
+    #         ]
+    #         binder = StatementBinder(StatementBinderContext(MagicMock()))
+
+    #         with self.assertRaises(BinderError) as cm:
+    #             binder._bind_create_function_statement(create_function_statement)
+
+    #         err_msg = "Unexpected column type found for forecasting function."
+    #         self.assertEqual(str(cm.exception), err_msg)
 
     def test_bind_create_function_should_raise_forecast_missing_required_columns(self):
         with patch.object(StatementBinder, "bind"):

From 32a204bc7d44a3088dd2cdec9f79d4da2aeeb9db Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Thu, 28 Sep 2023 14:05:25 -0400
Subject: [PATCH 15/23] Fix GPU issue with neuralforecast; fixed auto exog
 variables

---
 evadb/executor/create_function_executor.py | 32 ++++++++++++++--------
 1 file changed, 20 insertions(+), 12 deletions(-)

diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index c88c86a06..3cb9065f3 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -183,6 +183,7 @@ def handle_ultralytics_function(self):
 
     def handle_forecasting_function(self):
         """Handle forecasting functions"""
+        os.environ["CUDA_VISIBLE_DEVICES"] = ""
         aggregated_batch_list = []
         child = self.children[0]
         for batch in child.exec():
@@ -296,15 +297,17 @@ def handle_forecasting_function(self):
                 logger.error(err_msg)
                 raise FunctionIODefinitionError(err_msg)
             model_args = {}
-            if "exogenous" in arg_map.keys():
-                exogenous_args = [
-                    x.strip() for x in arg_map["exogenous"].strip().split(",")
+
+            if len(data.columns) >= 4:
+                exogenous_columns = [
+                    x for x in list(data.columns) if x not in ["ds", "y", "unique_id"]
                 ]
-                model_args["hist_exog_list"] = exogenous_args
+                model_args["hist_exog_list"] = exogenous_columns
 
             if "auto" not in arg_map["model"].lower():
                 model_args["input_size"] = 2 * horizon
-                model_args["max_steps"] = 50
+
+            model_args["early_stop_patience_steps"] = 20
 
             model_args["h"] = horizon
 
@@ -344,16 +347,15 @@ def handle_forecasting_function(self):
 
         data["ds"] = pd.to_datetime(data["ds"])
 
-        encoding_text = data.to_string()
-        if "exogenous" in arg_map.keys():
-            encoding_text += "exogenous_" + str(sorted(exogenous_args))
+        model_save_dir_name = library + "_" + arg_map["model"] + "_" + new_freq
+        if len(data.columns) >= 4:
+            model_save_dir_name += "_exogenous_" + str(sorted(exogenous_columns))
 
         model_dir = os.path.join(
             self.db.config.get_value("storage", "model_dir"),
             self.node.name,
-            library,
-            arg_map["model"],
-            str(hashlib.sha256(encoding_text.encode()).hexdigest()),
+            model_save_dir_name,
+            str(hashlib.sha256(data.to_string().encode()).hexdigest()),
         )
         Path(model_dir).mkdir(parents=True, exist_ok=True)
 
@@ -371,7 +373,11 @@ def handle_forecasting_function(self):
             if int(x.split("horizon")[1].split(".pkl")[0]) >= horizon
         ]
         if len(existing_model_files) == 0:
-            model.fit(df=data)
+            print("Training")
+            if library == "neuralforecast":
+                model.fit(df=data, val_size=horizon)
+            else:
+                model.fit(df=data)
             f = open(model_path, "wb")
             pickle.dump(model, f)
             f.close()
@@ -396,6 +402,8 @@ def handle_forecasting_function(self):
             FunctionMetadataCatalogEntry("library", library),
         ]
 
+        os.environ.pop("CUDA_VISIBLE_DEVICES", None)
+
         return (
             self.node.name,
             impl_path,

From 736d9e0b3a876dba0bfae48a717c8c9561d24cb2 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Thu, 28 Sep 2023 20:30:48 -0400
Subject: [PATCH 16/23] added auto support; updated docs

---
 .../source/reference/ai/model-forecasting.rst | 22 ++++++-----
 evadb/executor/create_function_executor.py    | 37 ++++++++++++++-----
 .../long/test_model_forecasting.py            |  4 +-
 3 files changed, 41 insertions(+), 22 deletions(-)

diff --git a/docs/source/reference/ai/model-forecasting.rst b/docs/source/reference/ai/model-forecasting.rst
index 5c46bae85..ff7c1803b 100644
--- a/docs/source/reference/ai/model-forecasting.rst
+++ b/docs/source/reference/ai/model-forecasting.rst
@@ -47,20 +47,22 @@ EvaDB's default forecast framework is `statsforecast <https://nixtla.github.io/s
 .. list-table:: Available Parameters
    :widths: 25 75
 
-   * - PREDICT (**required**) 
+   * - PREDICT (required) 
      - The name of the column we wish to forecast.
-   * - TIME
-     - The name of the column that contains the datestamp, wihch should be of a format expected by Pandas, ideally YYYY-MM-DD for a date or YYYY-MM-DD HH:MM:SS for a timestamp. Please visit the `pandas documentation <https://pandas.pydata.org/docs/reference/api/pandas.to_datetime.html>`_ for details. If not provided, an auto increasing ID column will be used.
-   * - ID
-     - The name of column that represents an identifier for the series. If not provided, the whole table is considered as one series of data.
-   * - LIBRARY
+   * - TIME (default: 'ds')
+     - The name of the column that contains the datestamp, which should be of a format expected by Pandas, ideally YYYY-MM-DD for a date or YYYY-MM-DD HH:MM:SS for a timestamp. Please visit the `pandas documentation <https://pandas.pydata.org/docs/reference/api/pandas.to_datetime.html>`_ for details. If relevant column is not found, an auto increasing ID column will be used.
+   * - ID (default: 'unique_id')
+     - The name of column that represents an identifier for the series. If relevant column is not found, the whole table is considered as one series of data.
+   * - LIBRARY (default: 'statsforecast')
      - We can select one of `statsforecast` (default) or `neuralforecast`. `statsforecast` provides access to statistical forecasting methods, while `neuralforecast` gives access to deep-learning based forecasting methods.
-   * - MODEL
+   * - MODEL (default: 'AutoARIMA')
      - If LIBRARY is `statsforecast`, we can select one of AutoARIMA, AutoCES, AutoETS, AutoTheta. The default is AutoARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models. If LIBRARY is `neuralforecast`, we can select one of NHITS or NBEATS. The default is NBEATS. Check `NBEATS docs <https://nixtla.github.io/neuralforecast/models.nbeats.html>`_ for details.
-   * - EXOGENOUS
+   * - AUTO (default: 'F')
      - The names of columns to be treated as exogenous variables, separated by comma. These columns would be considered for forecasting by the backend only for LIBRARY `neuralforecast`.
-   * - Frequency
-     - A string indicating the frequency of the data. The common used ones are D, W, M, Y, which repestively represents day-, week-, month- and year- end frequency. The default value is M. Check `pandas available frequencies <https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#offset-aliases>`_ for all available frequencies.
+   * - Frequency (default: 'auto')
+     - A string indicating the frequency of the data. The commonly used ones are D, W, M, Y, which respectively represent day-, week-, month- and year-end frequency. The default value is 'auto'. Check `pandas available frequencies <https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#offset-aliases>`_ for all available frequencies. If it is not provided or is set to 'auto', EvaDB attempts to infer the frequency from the data automatically.
+
+Note: If columns other than the required ones mentioned above are passed while creating the function, they will be treated as exogenous variables if LIBRARY is `neuralforecast` and AUTO is set to F. Otherwise, they are ignored.
 
 Below is an example query specifying the above parameters:
 
diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index 3cb9065f3..82570ea4e 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -246,7 +246,7 @@ def handle_forecasting_function(self):
             Set or infer data frequency
         """
 
-        if "frequency" not in arg_map.keys():
+        if "frequency" not in arg_map.keys() or arg_map["frequency"] == "auto":
             arg_map["frequency"] = pd.infer_freq(data["ds"])
         frequency = arg_map["frequency"]
         if frequency is None:
@@ -290,6 +290,12 @@ def handle_forecasting_function(self):
             if "model" not in arg_map.keys():
                 arg_map["model"] = "NBEATS"
 
+            if (
+                arg_map["model"].lower()[0] == "t"
+                and "auto" not in arg_map["model"].lower()
+            ):
+                arg_map["model"] = "Auto" + arg_map["model"]
+
             try:
                 model_here = model_dict[arg_map["model"]]
             except Exception:
@@ -298,16 +304,17 @@ def handle_forecasting_function(self):
                 raise FunctionIODefinitionError(err_msg)
             model_args = {}
 
-            if len(data.columns) >= 4:
-                exogenous_columns = [
-                    x for x in list(data.columns) if x not in ["ds", "y", "unique_id"]
-                ]
-                model_args["hist_exog_list"] = exogenous_columns
-
             if "auto" not in arg_map["model"].lower():
                 model_args["input_size"] = 2 * horizon
+                if len(data.columns) >= 4:
+                    exogenous_columns = [
+                        x
+                        for x in list(data.columns)
+                        if x not in ["ds", "y", "unique_id"]
+                    ]
+                    model_args["hist_exog_list"] = exogenous_columns
 
-            model_args["early_stop_patience_steps"] = 20
+                model_args["early_stop_patience_steps"] = 20
 
             model_args["h"] = horizon
 
@@ -333,6 +340,12 @@ def handle_forecasting_function(self):
             if "model" not in arg_map.keys():
                 arg_map["model"] = "AutoARIMA"
 
+            if (
+                arg_map["model"].lower()[0] == "t"
+                and "auto" not in arg_map["model"].lower()
+            ):
+                arg_map["model"] = "Auto" + arg_map["model"]
+
             try:
                 model_here = model_dict[arg_map["model"]]
             except Exception:
@@ -348,7 +361,11 @@ def handle_forecasting_function(self):
         data["ds"] = pd.to_datetime(data["ds"])
 
         model_save_dir_name = library + "_" + arg_map["model"] + "_" + new_freq
-        if len(data.columns) >= 4:
+        if (
+            len(data.columns) >= 4
+            and "auto" not in arg_map["model"].lower()
+            and library == "neuralforecast"
+        ):
             model_save_dir_name += "_exogenous_" + str(sorted(exogenous_columns))
 
         model_dir = os.path.join(
@@ -373,7 +390,7 @@ def handle_forecasting_function(self):
             if int(x.split("horizon")[1].split(".pkl")[0]) >= horizon
         ]
         if len(existing_model_files) == 0:
-            print("Training")
+            print("Training, please wait...")
             if library == "neuralforecast":
                 model.fit(df=data, val_size=horizon)
             else:
diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index 1941a4c71..f47ff328e 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -104,7 +104,6 @@ def test_forecast(self):
             HORIZON 12
             PREDICT 'y'
             LIBRARY 'neuralforecast'
-            EXOGENOUS 'trend'
             FREQUENCY 'M';
         """
         execute_query_fetch_all(self.evadb, create_predict_udf)
@@ -128,6 +127,7 @@ def test_forecast_with_column_rename(self):
                 WHERE bedrooms = 2
             )
             TYPE Forecasting
+            HORIZON 24
             PREDICT 'ma'
             ID 'type'
             TIME 'saledate'
@@ -136,7 +136,7 @@ def test_forecast_with_column_rename(self):
         execute_query_fetch_all(self.evadb, create_predict_udf)
 
         predict_query = """
-            SELECT HomeForecast(12);
+            SELECT HomeForecast();
         """
         result = execute_query_fetch_all(self.evadb, predict_query)
         self.assertEqual(len(result), 24)

From 06fb001cab01418f75ad166eb2f30cc5162c4281 Mon Sep 17 00:00:00 2001
From: Andy Xu <xzdandy@gmail.com>
Date: Fri, 29 Sep 2023 00:35:43 -0400
Subject: [PATCH 17/23] Update forecasting notebook.

---
 tutorials/16-homesale-forecasting.ipynb | 281 +++++++++++-------------
 1 file changed, 126 insertions(+), 155 deletions(-)

diff --git a/tutorials/16-homesale-forecasting.ipynb b/tutorials/16-homesale-forecasting.ipynb
index f2d81c9ff..82451bb69 100644
--- a/tutorials/16-homesale-forecasting.ipynb
+++ b/tutorials/16-homesale-forecasting.ipynb
@@ -8,7 +8,7 @@
       "collapsed_sections": [
         "GHToaA_NKiHY"
       ],
-      "authorship_tag": "ABX9TyPOmDfDbnc8CP+70g/FkjHR"
+      "authorship_tag": "ABX9TyO5CS+F9YOzKquzJseLZjOy"
     },
     "kernelspec": {
       "name": "python3",
@@ -70,7 +70,7 @@
           "base_uri": "https://localhost:8080/"
         },
         "id": "Z7PodOEEEDsQ",
-        "outputId": "0dcaa531-ae05-4c13-ab74-6dacdf6d8739"
+        "outputId": "37d49a92-bd41-4486-fad7-16ddecc88536"
       },
       "execution_count": 1,
       "outputs": [
@@ -93,7 +93,7 @@
             "After this operation, 51.5 MB of additional disk space will be used.\n",
             "Preconfiguring packages ...\n",
             "Selecting previously unselected package logrotate.\n",
-            "(Reading database ... 120901 files and directories currently installed.)\n",
+            "(Reading database ... 120895 files and directories currently installed.)\n",
             "Preparing to unpack .../00-logrotate_3.19.0-1ubuntu1.1_amd64.deb ...\n",
             "Unpacking logrotate (3.19.0-1ubuntu1.1) ...\n",
             "Selecting previously unselected package netbase.\n",
@@ -211,7 +211,7 @@
           "base_uri": "https://localhost:8080/"
         },
         "id": "UrlfWZOkEa4V",
-        "outputId": "1fc62319-0d3f-4f2a-bcc4-e408587e50fb"
+        "outputId": "4ab9906a-b4a1-4487-8f12-69b4efca2be5"
       },
       "execution_count": 2,
       "outputs": [
@@ -264,7 +264,7 @@
     {
       "cell_type": "code",
       "source": [
-        "%pip install --quiet \"evadb[postgres,forecasting] @ git+https://github.com/georgia-tech-db/evadb.git@a40c72ed6cb18993e2ae5bda28c7195f4de4f109\"\n",
+        "%pip install --quiet \"evadb[postgres,forecasting] @ git+https://github.com/georgia-tech-db/evadb.git@736d9e0b3a876dba0bfae48a717c8c9561d24cb2\"\n",
         "\n",
         "import evadb\n",
         "cursor = evadb.connect().cursor()"
@@ -274,7 +274,7 @@
           "base_uri": "https://localhost:8080/"
         },
         "id": "NoAykveeElqm",
-        "outputId": "de6547e5-670d-4fba-d081-30ffecc74849"
+        "outputId": "90d07f6e-cf75-4ca4-85e3-867d7db7b49f"
       },
       "execution_count": 4,
       "outputs": [
@@ -285,22 +285,26 @@
             "  Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n",
             "  Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n",
             "  Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m92.6/92.6 kB\u001b[0m \u001b[31m2.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m108.9/108.9 kB\u001b[0m \u001b[31m12.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m137.6/137.6 kB\u001b[0m \u001b[31m15.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m45.5/45.5 kB\u001b[0m \u001b[31m5.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m110.9/110.9 kB\u001b[0m \u001b[31m14.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m98.7/98.7 kB\u001b[0m \u001b[31m11.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m275.0/275.0 kB\u001b[0m \u001b[31m26.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.1/3.1 MB\u001b[0m \u001b[31m32.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[?25h\u001b[33mWARNING: Retrying (Retry(total=4, connect=None, read=None, redirect=None, status=None)) after connection broken by 'ProtocolError('Connection aborted.', RemoteDisconnected('Remote end closed connection without response'))': /simple/triad/\u001b[0m\u001b[33m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m57.0/57.0 kB\u001b[0m \u001b[31m6.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m169.2/169.2 kB\u001b[0m \u001b[31m20.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m154.6/154.6 kB\u001b[0m \u001b[31m15.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m92.6/92.6 kB\u001b[0m \u001b[31m3.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m108.9/108.9 kB\u001b[0m \u001b[31m7.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m137.6/137.6 kB\u001b[0m \u001b[31m10.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m45.5/45.5 kB\u001b[0m \u001b[31m3.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m110.9/110.9 kB\u001b[0m \u001b[31m9.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m162.6/162.6 kB\u001b[0m \u001b[31m9.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m98.7/98.7 kB\u001b[0m \u001b[31m6.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m727.7/727.7 kB\u001b[0m \u001b[31m18.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.5/62.5 MB\u001b[0m \u001b[31m10.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m275.0/275.0 kB\u001b[0m \u001b[31m23.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.1/3.1 MB\u001b[0m \u001b[31m84.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m57.0/57.0 kB\u001b[0m \u001b[31m6.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m169.2/169.2 kB\u001b[0m \u001b[31m18.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m154.7/154.7 kB\u001b[0m \u001b[31m15.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
             "\u001b[?25h  Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m303.2/303.2 kB\u001b[0m \u001b[31m32.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m144.2/144.2 kB\u001b[0m \u001b[31m17.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m135.3/135.3 kB\u001b[0m \u001b[31m17.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m313.3/313.3 kB\u001b[0m \u001b[31m27.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m805.2/805.2 kB\u001b[0m \u001b[31m60.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m101.7/101.7 kB\u001b[0m \u001b[31m12.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m144.2/144.2 kB\u001b[0m \u001b[31m17.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m135.3/135.3 kB\u001b[0m \u001b[31m13.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
             "\u001b[?25h  Building wheel for evadb (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
             "  Building wheel for fugue-sql-antlr (setup.py) ... \u001b[?25l\u001b[?25hdone\n"
           ]
@@ -310,7 +314,7 @@
           "name": "stderr",
           "text": [
             "Downloading: \"http://ml.cs.tsinghua.edu.cn/~chenxi/pytorch-models/mnist-b07bb66b.pth\" to /root/.cache/torch/hub/checkpoints/mnist-b07bb66b.pth\n",
-            "100%|██████████| 1.03M/1.03M [00:01<00:00, 898kB/s]\n",
+            "100%|██████████| 1.03M/1.03M [00:01<00:00, 723kB/s] \n",
             "Downloading: \"https://download.pytorch.org/models/fasterrcnn_resnet50_fpn_coco-258fb6c6.pth\" to /root/.cache/torch/hub/checkpoints/fasterrcnn_resnet50_fpn_coco-258fb6c6.pth\n"
           ]
         }
@@ -352,10 +356,10 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 81
+          "height": 80
         },
         "id": "IsP6rLZ2Ftxo",
-        "outputId": "eee82699-fd4f-4aa8-edac-a9f0e0575e98"
+        "outputId": "f8ab8a89-739c-42f5-fa9b-353d4e471251"
       },
       "execution_count": 5,
       "outputs": [
@@ -368,7 +372,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-559fd0c5-3aa0-4b5c-be1b-18203fb7d960\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-a33adaa7-4ec6-4065-a69d-cc379f825855\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -401,7 +405,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-559fd0c5-3aa0-4b5c-be1b-18203fb7d960')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-a33adaa7-4ec6-4065-a69d-cc379f825855')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -453,12 +457,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-559fd0c5-3aa0-4b5c-be1b-18203fb7d960 button.colab-df-convert');\n",
+              "        document.querySelector('#df-a33adaa7-4ec6-4065-a69d-cc379f825855 button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-559fd0c5-3aa0-4b5c-be1b-18203fb7d960');\n",
+              "        const element = document.querySelector('#df-a33adaa7-4ec6-4065-a69d-cc379f825855');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -505,7 +509,7 @@
       "metadata": {
         "id": "msbHcP_xJpFV"
       },
-      "execution_count": 23,
+      "execution_count": 6,
       "outputs": []
     },
     {
@@ -520,12 +524,12 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 81
+          "height": 80
         },
         "id": "MhYfovbzNB-k",
-        "outputId": "240995b6-2bba-4e34-e955-5ba9c4f1a171"
+        "outputId": "b8bb6814-2aab-4a54-cf63-7cf44d183628"
       },
-      "execution_count": 21,
+      "execution_count": 7,
       "outputs": [
         {
           "output_type": "execute_result",
@@ -536,7 +540,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-2f4467d1-bc66-4eb4-a385-4c27587b0c81\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-f85ea85d-bae8-465c-93a3-85a95523d220\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -569,7 +573,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-2f4467d1-bc66-4eb4-a385-4c27587b0c81')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-f85ea85d-bae8-465c-93a3-85a95523d220')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -621,12 +625,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-2f4467d1-bc66-4eb4-a385-4c27587b0c81 button.colab-df-convert');\n",
+              "        document.querySelector('#df-f85ea85d-bae8-465c-93a3-85a95523d220 button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-2f4467d1-bc66-4eb4-a385-4c27587b0c81');\n",
+              "        const element = document.querySelector('#df-f85ea85d-bae8-465c-93a3-85a95523d220');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -650,7 +654,7 @@
             ]
           },
           "metadata": {},
-          "execution_count": 21
+          "execution_count": 7
         }
       ]
     },
@@ -668,12 +672,12 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 81
+          "height": 80
         },
         "id": "OH8Fxn0SNYO3",
-        "outputId": "b0cbe3ac-f64a-454d-b39c-60735621c2df"
+        "outputId": "58ceacff-f392-4f27-c8ef-0873b81ba943"
       },
-      "execution_count": 24,
+      "execution_count": 8,
       "outputs": [
         {
           "output_type": "execute_result",
@@ -684,7 +688,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-5d8d200d-836d-40f6-9ae0-f48178dd0cd2\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-c862d78f-e497-4ce9-b8ba-7866064c775a\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -717,7 +721,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-5d8d200d-836d-40f6-9ae0-f48178dd0cd2')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-c862d78f-e497-4ce9-b8ba-7866064c775a')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -769,12 +773,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-5d8d200d-836d-40f6-9ae0-f48178dd0cd2 button.colab-df-convert');\n",
+              "        document.querySelector('#df-c862d78f-e497-4ce9-b8ba-7866064c775a button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-5d8d200d-836d-40f6-9ae0-f48178dd0cd2');\n",
+              "        const element = document.querySelector('#df-c862d78f-e497-4ce9-b8ba-7866064c775a');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -798,7 +802,7 @@
             ]
           },
           "metadata": {},
-          "execution_count": 24
+          "execution_count": 8
         }
       ]
     },
@@ -828,9 +832,9 @@
           "height": 143
         },
         "id": "20_IEby7N1Pe",
-        "outputId": "26159fd4-cbaf-4892-8e3f-53fa8124340c"
+        "outputId": "d0fc448b-7d7d-470d-d344-b877621cfc29"
       },
-      "execution_count": 25,
+      "execution_count": 9,
       "outputs": [
         {
           "output_type": "execute_result",
@@ -848,7 +852,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-22a08351-a2b3-41a9-a13a-aa90d6cf32be\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-9c810f53-59bd-43f3-888d-bfa546e8809c\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -905,7 +909,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-22a08351-a2b3-41a9-a13a-aa90d6cf32be')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-9c810f53-59bd-43f3-888d-bfa546e8809c')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -957,12 +961,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-22a08351-a2b3-41a9-a13a-aa90d6cf32be button.colab-df-convert');\n",
+              "        document.querySelector('#df-9c810f53-59bd-43f3-888d-bfa546e8809c button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-22a08351-a2b3-41a9-a13a-aa90d6cf32be');\n",
+              "        const element = document.querySelector('#df-9c810f53-59bd-43f3-888d-bfa546e8809c');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -982,8 +986,8 @@
               "  </div>\n",
               "\n",
               "\n",
-              "<div id=\"df-6d00b11c-1029-45d1-b8f4-646f93dc22c9\">\n",
-              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-6d00b11c-1029-45d1-b8f4-646f93dc22c9')\"\n",
+              "<div id=\"df-51a3551f-c044-4495-8869-677d2a65d50b\">\n",
+              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-51a3551f-c044-4495-8869-677d2a65d50b')\"\n",
               "            title=\"Suggest charts.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1102,7 +1106,7 @@
               "    }\n",
               "    (() => {\n",
               "      let quickchartButtonEl =\n",
-              "        document.querySelector('#df-6d00b11c-1029-45d1-b8f4-646f93dc22c9 button');\n",
+              "        document.querySelector('#df-51a3551f-c044-4495-8869-677d2a65d50b button');\n",
               "      quickchartButtonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "    })();\n",
@@ -1113,7 +1117,7 @@
             ]
           },
           "metadata": {},
-          "execution_count": 25
+          "execution_count": 9
         }
       ]
     },
@@ -1141,9 +1145,8 @@
     {
       "cell_type": "code",
       "source": [
-        "cursor.query(\"DROP FUNCTION IF EXISTS HomeSaleForecast;\").df()\n",
         "cursor.query(\"\"\"\n",
-        "  CREATE FUNCTION IF NOT EXISTS HomeSaleForecast FROM\n",
+        "  CREATE OR REPLACE FUNCTION HomeSaleForecast FROM\n",
         "    (\n",
         "      SELECT propertytype, datesold, price\n",
         "      FROM postgres_data.home_sales\n",
@@ -1151,6 +1154,7 @@
         "    )\n",
         "  TYPE Forecasting\n",
         "  PREDICT 'price'\n",
+        "  HORIZON 3\n",
         "  TIME 'datesold'\n",
         "  ID 'propertytype'\n",
         "  FREQUENCY 'W'\n",
@@ -1159,23 +1163,30 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 81
+          "height": 98
         },
         "id": "IFstPBI8UINv",
-        "outputId": "c5dcb3b1-47de-4a05-a41e-5a28e69abf80"
+        "outputId": "4a2d9c7b-cfb4-46df-a4c6-1a13c4da7b89"
       },
-      "execution_count": 39,
+      "execution_count": 10,
       "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "Training, please wait...\n"
+          ]
+        },
         {
           "output_type": "execute_result",
           "data": {
             "text/plain": [
-              "                                                   0\n",
-              "0  Function HomeSaleForecast successfully added t..."
+              "                                                  0\n",
+              "0  Function HomeSaleForecast added to the database."
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-60463c36-95ec-4d4e-b0a7-c3f86042b8fd\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-26fdae5c-6067-428e-bbb3-c53153ab4b8e\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -1200,7 +1211,7 @@
               "  <tbody>\n",
               "    <tr>\n",
               "      <th>0</th>\n",
-              "      <td>Function HomeSaleForecast successfully added t...</td>\n",
+              "      <td>Function HomeSaleForecast added to the database.</td>\n",
               "    </tr>\n",
               "  </tbody>\n",
               "</table>\n",
@@ -1208,7 +1219,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-60463c36-95ec-4d4e-b0a7-c3f86042b8fd')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-26fdae5c-6067-428e-bbb3-c53153ab4b8e')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1260,12 +1271,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-60463c36-95ec-4d4e-b0a7-c3f86042b8fd button.colab-df-convert');\n",
+              "        document.querySelector('#df-26fdae5c-6067-428e-bbb3-c53153ab4b8e button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-60463c36-95ec-4d4e-b0a7-c3f86042b8fd');\n",
+              "        const element = document.querySelector('#df-26fdae5c-6067-428e-bbb3-c53153ab4b8e');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -1289,7 +1300,7 @@
             ]
           },
           "metadata": {},
-          "execution_count": 39
+          "execution_count": 10
         }
       ]
     },
@@ -1306,17 +1317,17 @@
     {
       "cell_type": "code",
       "source": [
-        "cursor.query(\"SELECT HomeSaleForecast(3);\").df()"
+        "cursor.query(\"SELECT HomeSaleForecast();\").df()"
       ],
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 238
+          "height": 143
         },
         "id": "_7m-QQG5U3_C",
-        "outputId": "dba1c727-bf6d-4301-aaaf-0db3b5ebffd0"
+        "outputId": "6c0ce026-2da0-4177-a905-2adc952e003a"
       },
-      "execution_count": 40,
+      "execution_count": 11,
       "outputs": [
         {
           "output_type": "execute_result",
@@ -1326,21 +1337,15 @@
               "0                         house                2019-07-21   \n",
               "1                         house                2019-07-28   \n",
               "2                         house                2019-08-04   \n",
-              "3                          unit                2018-12-23   \n",
-              "4                          unit                2018-12-30   \n",
-              "5                          unit                2019-01-06   \n",
               "\n",
               "   homesaleforecast.price  \n",
-              "0            766572.93750  \n",
-              "1            766572.93750  \n",
-              "2            766572.93750  \n",
-              "3            417229.78125  \n",
-              "4            409601.65625  \n",
-              "5            402112.96875  "
+              "0             766572.9375  \n",
+              "1             766572.9375  \n",
+              "2             766572.9375  "
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-73cc57a4-60e1-49bb-8415-4f9c15ea8fe4\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-aa8b966b-71d0-40a1-9a89-3da41a56f161\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -1369,37 +1374,19 @@
               "      <th>0</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-21</td>\n",
-              "      <td>766572.93750</td>\n",
+              "      <td>766572.9375</td>\n",
               "    </tr>\n",
               "    <tr>\n",
               "      <th>1</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-28</td>\n",
-              "      <td>766572.93750</td>\n",
+              "      <td>766572.9375</td>\n",
               "    </tr>\n",
               "    <tr>\n",
               "      <th>2</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-08-04</td>\n",
-              "      <td>766572.93750</td>\n",
-              "    </tr>\n",
-              "    <tr>\n",
-              "      <th>3</th>\n",
-              "      <td>unit</td>\n",
-              "      <td>2018-12-23</td>\n",
-              "      <td>417229.78125</td>\n",
-              "    </tr>\n",
-              "    <tr>\n",
-              "      <th>4</th>\n",
-              "      <td>unit</td>\n",
-              "      <td>2018-12-30</td>\n",
-              "      <td>409601.65625</td>\n",
-              "    </tr>\n",
-              "    <tr>\n",
-              "      <th>5</th>\n",
-              "      <td>unit</td>\n",
-              "      <td>2019-01-06</td>\n",
-              "      <td>402112.96875</td>\n",
+              "      <td>766572.9375</td>\n",
               "    </tr>\n",
               "  </tbody>\n",
               "</table>\n",
@@ -1407,7 +1394,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-73cc57a4-60e1-49bb-8415-4f9c15ea8fe4')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-aa8b966b-71d0-40a1-9a89-3da41a56f161')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1459,12 +1446,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-73cc57a4-60e1-49bb-8415-4f9c15ea8fe4 button.colab-df-convert');\n",
+              "        document.querySelector('#df-aa8b966b-71d0-40a1-9a89-3da41a56f161 button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-73cc57a4-60e1-49bb-8415-4f9c15ea8fe4');\n",
+              "        const element = document.querySelector('#df-aa8b966b-71d0-40a1-9a89-3da41a56f161');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -1484,8 +1471,8 @@
               "  </div>\n",
               "\n",
               "\n",
-              "<div id=\"df-5dd181c2-a44d-4d15-88ce-fe36e7eedba4\">\n",
-              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-5dd181c2-a44d-4d15-88ce-fe36e7eedba4')\"\n",
+              "<div id=\"df-bddb3e5c-c7e2-421e-a4f5-c640ba0a210a\">\n",
+              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-bddb3e5c-c7e2-421e-a4f5-c640ba0a210a')\"\n",
               "            title=\"Suggest charts.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1604,7 +1591,7 @@
               "    }\n",
               "    (() => {\n",
               "      let quickchartButtonEl =\n",
-              "        document.querySelector('#df-5dd181c2-a44d-4d15-88ce-fe36e7eedba4 button');\n",
+              "        document.querySelector('#df-bddb3e5c-c7e2-421e-a4f5-c640ba0a210a button');\n",
               "      quickchartButtonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "    })();\n",
@@ -1615,7 +1602,7 @@
             ]
           },
           "metadata": {},
-          "execution_count": 40
+          "execution_count": 11
         }
       ]
     },
@@ -1631,33 +1618,35 @@
     {
       "cell_type": "code",
       "source": [
-        "cursor.query(\"SELECT * FROM (SELECT HomeSaleForecast(3)) AS T ORDER BY price;\").df()"
+        "cursor.query(\"SELECT HomeSaleForecast() ORDER BY price;\").df()"
       ],
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 238
+          "height": 143
         },
         "id": "abmrZiOzVO5S",
-        "outputId": "a09186b9-fa89-4763-9c21-e82224ea33a1"
+        "outputId": "350a729c-5859-4a43-fb00-dc193622a5a3"
       },
-      "execution_count": 42,
+      "execution_count": 12,
       "outputs": [
         {
           "output_type": "execute_result",
           "data": {
             "text/plain": [
-              "  T.propertytype T.datesold       T.price\n",
-              "0           unit 2019-01-06  402112.96875\n",
-              "1           unit 2018-12-30  409601.65625\n",
-              "2           unit 2018-12-23  417229.78125\n",
-              "3          house 2019-07-21  766572.93750\n",
-              "4          house 2019-07-28  766572.93750\n",
-              "5          house 2019-08-04  766572.93750"
+              "  homesaleforecast.propertytype homesaleforecast.datesold  \\\n",
+              "0                         house                2019-07-21   \n",
+              "1                         house                2019-07-28   \n",
+              "2                         house                2019-08-04   \n",
+              "\n",
+              "   homesaleforecast.price  \n",
+              "0             766572.9375  \n",
+              "1             766572.9375  \n",
+              "2             766572.9375  "
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-9d1a88a6-c6d9-454b-b030-43bccab80120\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-b84874cd-af94-4832-bc14-36045810ecde\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -1676,47 +1665,29 @@
               "  <thead>\n",
               "    <tr style=\"text-align: right;\">\n",
               "      <th></th>\n",
-              "      <th>T.propertytype</th>\n",
-              "      <th>T.datesold</th>\n",
-              "      <th>T.price</th>\n",
+              "      <th>homesaleforecast.propertytype</th>\n",
+              "      <th>homesaleforecast.datesold</th>\n",
+              "      <th>homesaleforecast.price</th>\n",
               "    </tr>\n",
               "  </thead>\n",
               "  <tbody>\n",
               "    <tr>\n",
               "      <th>0</th>\n",
-              "      <td>unit</td>\n",
-              "      <td>2019-01-06</td>\n",
-              "      <td>402112.96875</td>\n",
-              "    </tr>\n",
-              "    <tr>\n",
-              "      <th>1</th>\n",
-              "      <td>unit</td>\n",
-              "      <td>2018-12-30</td>\n",
-              "      <td>409601.65625</td>\n",
-              "    </tr>\n",
-              "    <tr>\n",
-              "      <th>2</th>\n",
-              "      <td>unit</td>\n",
-              "      <td>2018-12-23</td>\n",
-              "      <td>417229.78125</td>\n",
-              "    </tr>\n",
-              "    <tr>\n",
-              "      <th>3</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-21</td>\n",
-              "      <td>766572.93750</td>\n",
+              "      <td>766572.9375</td>\n",
               "    </tr>\n",
               "    <tr>\n",
-              "      <th>4</th>\n",
+              "      <th>1</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-28</td>\n",
-              "      <td>766572.93750</td>\n",
+              "      <td>766572.9375</td>\n",
               "    </tr>\n",
               "    <tr>\n",
-              "      <th>5</th>\n",
+              "      <th>2</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-08-04</td>\n",
-              "      <td>766572.93750</td>\n",
+              "      <td>766572.9375</td>\n",
               "    </tr>\n",
               "  </tbody>\n",
               "</table>\n",
@@ -1724,7 +1695,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-9d1a88a6-c6d9-454b-b030-43bccab80120')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-b84874cd-af94-4832-bc14-36045810ecde')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1776,12 +1747,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-9d1a88a6-c6d9-454b-b030-43bccab80120 button.colab-df-convert');\n",
+              "        document.querySelector('#df-b84874cd-af94-4832-bc14-36045810ecde button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-9d1a88a6-c6d9-454b-b030-43bccab80120');\n",
+              "        const element = document.querySelector('#df-b84874cd-af94-4832-bc14-36045810ecde');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -1801,8 +1772,8 @@
               "  </div>\n",
               "\n",
               "\n",
-              "<div id=\"df-db5d2477-0c07-43e8-b2ad-0d5b076494ce\">\n",
-              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-db5d2477-0c07-43e8-b2ad-0d5b076494ce')\"\n",
+              "<div id=\"df-78abaefd-84fb-41e0-ac5e-a231b6feda2e\">\n",
+              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-78abaefd-84fb-41e0-ac5e-a231b6feda2e')\"\n",
               "            title=\"Suggest charts.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1921,7 +1892,7 @@
               "    }\n",
               "    (() => {\n",
               "      let quickchartButtonEl =\n",
-              "        document.querySelector('#df-db5d2477-0c07-43e8-b2ad-0d5b076494ce button');\n",
+              "        document.querySelector('#df-78abaefd-84fb-41e0-ac5e-a231b6feda2e button');\n",
               "      quickchartButtonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "    })();\n",
@@ -1932,7 +1903,7 @@
             ]
           },
           "metadata": {},
-          "execution_count": 42
+          "execution_count": 12
         }
       ]
     }

From a36a1f55ef7afe5648b75a28cc26dfb0bc88bef0 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Fri, 29 Sep 2023 02:52:12 -0400
Subject: [PATCH 18/23] fixes

---
 .../source/reference/ai/model-forecasting.rst | 16 ++++---
 evadb/binder/statement_binder.py              |  4 --
 evadb/executor/create_function_executor.py    | 23 +++++-----
 evadb/utils/generic_utils.py                  |  7 ++-
 .../binder/test_statement_binder.py           | 45 -------------------
 5 files changed, 27 insertions(+), 68 deletions(-)

diff --git a/docs/source/reference/ai/model-forecasting.rst b/docs/source/reference/ai/model-forecasting.rst
index ff7c1803b..a445e8cf5 100644
--- a/docs/source/reference/ai/model-forecasting.rst
+++ b/docs/source/reference/ai/model-forecasting.rst
@@ -47,19 +47,21 @@ EvaDB's default forecast framework is `statsforecast <https://nixtla.github.io/s
 .. list-table:: Available Parameters
    :widths: 25 75
 
-   * - PREDICT (required) 
+   * - PREDICT (str, required) 
      - The name of the column we wish to forecast.
-   * - TIME (default: 'ds')
+   * - HORIZON (int, required) 
+     - The number of steps into the future we wish to forecast.
+   * - TIME (str, default: 'ds')
      - The name of the column that contains the datestamp, which should be of a format expected by Pandas, ideally YYYY-MM-DD for a date or YYYY-MM-DD HH:MM:SS for a timestamp. Please visit the `pandas documentation <https://pandas.pydata.org/docs/reference/api/pandas.to_datetime.html>`_ for details. If relevant column is not found, an auto increasing ID column will be used.
-   * - ID (default: 'unique_id')
+   * - ID (str, default: 'unique_id')
      - The name of column that represents an identifier for the series. If relevant column is not found, the whole table is considered as one series of data.
-   * - LIBRARY (default: 'statsforecast')
+   * - LIBRARY (str, default: 'statsforecast')
      - We can select one of `statsforecast` (default) or `neuralforecast`. `statsforecast` provides access to statistical forecasting methods, while `neuralforecast` gives access to deep-learning based forecasting methods.
-   * - MODEL (default: 'AutoARIMA')
+   * - MODEL (str, default: 'AutoARIMA')
      - If LIBRARY is `statsforecast`, we can select one of AutoARIMA, AutoCES, AutoETS, AutoTheta. The default is AutoARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models. If LIBRARY is `neuralforecast`, we can select one of NHITS or NBEATS. The default is NBEATS. Check `NBEATS docs <https://nixtla.github.io/neuralforecast/models.nbeats.html>`_ for details.
-   * - AUTO (default: 'F')
+   * - AUTO (str, default: 'F')
      - The names of columns to be treated as exogenous variables, separated by comma. These columns would be considered for forecasting by the backend only for LIBRARY `neuralforecast`.
-   * - Frequency (default: 'auto')
+   * - Frequency (str, default: 'auto')
      - A string indicating the frequency of the data. The common used ones are D, W, M, Y, which repestively represents day-, week-, month- and year- end frequency. The default value is M. Check `pandas available frequencies <https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#offset-aliases>`_ for all available frequencies. If it is not provided, the frequency is attempted to be determined automatically.
 
 Note: If columns other than the ones required as mentioned above are passed while creating the function, they will be treated as exogenous variables if LIBRARY is `neuralforecast` and the AUTO is set to F. In other situations, they would be ignored.
diff --git a/evadb/binder/statement_binder.py b/evadb/binder/statement_binder.py
index 57f069349..eb881c483 100644
--- a/evadb/binder/statement_binder.py
+++ b/evadb/binder/statement_binder.py
@@ -126,10 +126,6 @@ def _bind_create_function_statement(self, node: CreateFunctionStatement):
                     elif column.name == arg_map.get("predict", "y"):
                         outputs.append(column)
                         required_columns.remove(column.name)
-                    # else:
-                    #     raise BinderError(
-                    #         f"Unexpected column {column.name} found for forecasting function."
-                    #     )
                 assert (
                     len(required_columns) == 0
                 ), f"Missing required {required_columns} columns for forecasting function."
diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index 82570ea4e..b61c368fa 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -38,7 +38,8 @@
 from evadb.utils.generic_utils import (
     load_function_class_from_file,
     string_comparison_case_insensitive,
-    try_to_import_forecast,
+    try_to_import_statsforecast,
+    try_to_import_neuralforecast,
     try_to_import_ludwig,
     try_to_import_sklearn,
     try_to_import_torch,
@@ -270,12 +271,12 @@ def handle_forecasting_function(self):
         )  # shortens longer frequencies like Q-DEC
         season_length = season_dict[new_freq] if new_freq in season_dict else 1
 
-        try_to_import_forecast()
 
         """
             Neuralforecast implementation
         """
         if library == "neuralforecast":
+            try_to_import_neuralforecast()
             from neuralforecast import NeuralForecast
             from neuralforecast.auto import AutoNBEATS, AutoNHITS
             from neuralforecast.models import NBEATS, NHITS
@@ -291,7 +292,8 @@ def handle_forecasting_function(self):
                 arg_map["model"] = "NBEATS"
 
             if (
-                arg_map["model"].lower()[0] == "t"
+                "auto" in arg_map.keys()
+                and arg_map["auto"].lower()[0] == "t"
                 and "auto" not in arg_map["model"].lower()
             ):
                 arg_map["model"] = "Auto" + arg_map["model"]
@@ -327,6 +329,7 @@ def handle_forecasting_function(self):
         #     Statsforecast implementation
         # """
         else:
+            try_to_import_statsforecast()
             from statsforecast import StatsForecast
             from statsforecast.models import AutoARIMA, AutoCES, AutoETS, AutoTheta
 
@@ -341,7 +344,8 @@ def handle_forecasting_function(self):
                 arg_map["model"] = "AutoARIMA"
 
             if (
-                arg_map["model"].lower()[0] == "t"
+                "auto" in arg_map.keys()
+                and arg_map["auto"].lower()[0] == "t"
                 and "auto" not in arg_map["model"].lower()
             ):
                 arg_map["model"] = "Auto" + arg_map["model"]
@@ -353,10 +357,9 @@ def handle_forecasting_function(self):
                 logger.error(err_msg)
                 raise FunctionIODefinitionError(err_msg)
 
-            else:
-                model = StatsForecast(
-                    [model_here(season_length=season_length)], freq=new_freq
-                )
+            model = StatsForecast(
+                [model_here(season_length=season_length)], freq=new_freq
+            )
 
         data["ds"] = pd.to_datetime(data["ds"])
 
@@ -370,7 +373,7 @@ def handle_forecasting_function(self):
 
         model_dir = os.path.join(
             self.db.config.get_value("storage", "model_dir"),
-            self.node.name,
+            "tsforecasting",
             model_save_dir_name,
             str(hashlib.sha256(data.to_string().encode()).hexdigest()),
         )
@@ -394,7 +397,7 @@ def handle_forecasting_function(self):
             if library == "neuralforecast":
                 model.fit(df=data, val_size=horizon)
             else:
-                model.fit(df=data)
+                model.fit(df=data[["ds","y","unique_id"]])
             f = open(model_path, "wb")
             pickle.dump(model, f)
             f.close()
diff --git a/evadb/utils/generic_utils.py b/evadb/utils/generic_utils.py
index 30890a45c..1f76fdd67 100644
--- a/evadb/utils/generic_utils.py
+++ b/evadb/utils/generic_utils.py
@@ -270,7 +270,7 @@ def try_to_import_ray():
         )
 
 
-def try_to_import_forecast():
+def try_to_import_statsforecast():
     try:
         from statsforecast import StatsForecast  # noqa: F401
     except ImportError:
@@ -278,6 +278,8 @@ def try_to_import_forecast():
             """Could not import StatsForecast python package.
                 Please install it with `pip install statsforecast`."""
         )
+
+def try_to_import_neuralforecast():
     try:
         from neuralforecast import NeuralForecast  # noqa: F401
     except ImportError:
@@ -326,7 +328,8 @@ def is_ludwig_available() -> bool:
 
 def is_forecast_available() -> bool:
     try:
-        try_to_import_forecast()
+        try_to_import_statsforecast()
+        try_to_import_neuralforecast()
         return True
     except ValueError:  # noqa: E722
         return False
diff --git a/test/unit_tests/binder/test_statement_binder.py b/test/unit_tests/binder/test_statement_binder.py
index e267250f6..3de8d1745 100644
--- a/test/unit_tests/binder/test_statement_binder.py
+++ b/test/unit_tests/binder/test_statement_binder.py
@@ -568,51 +568,6 @@ def test_bind_create_function_should_bind_forecast_with_renaming_columns(self):
             self.assertEqual(create_function_statement.inputs, expected_inputs)
             self.assertEqual(create_function_statement.outputs, expected_outputs)
 
-    # def test_bind_create_function_should_raise_forecast_with_unexpected_columns(self):
-    #     with patch.object(StatementBinder, "bind"):
-    #         create_function_statement = MagicMock()
-    #         create_function_statement.function_type = "forecasting"
-    #         id_col_obj = ColumnCatalogEntry(
-    #             name="type",
-    #             type=MagicMock(),
-    #             array_type=MagicMock(),
-    #             array_dimensions=MagicMock(),
-    #         )
-    #         ds_col_obj = ColumnCatalogEntry(
-    #             name="saledate",
-    #             type=MagicMock(),
-    #             array_type=MagicMock(),
-    #             array_dimensions=MagicMock(),
-    #         )
-    #         y_col_obj = ColumnCatalogEntry(
-    #             name="ma",
-    #             type=MagicMock(),
-    #             array_type=MagicMock(),
-    #             array_dimensions=MagicMock(),
-    #         )
-    #         create_function_statement.query.target_list = [
-    #             TupleValueExpression(
-    #                 name=id_col_obj.name, table_alias="a", col_object=id_col_obj
-    #             ),
-    #             TupleValueExpression(
-    #                 name=ds_col_obj.name, table_alias="a", col_object=ds_col_obj
-    #             ),
-    #             TupleValueExpression(
-    #                 name=y_col_obj.name, table_alias="a", col_object=y_col_obj
-    #             ),
-    #         ]
-    #         create_function_statement.metadata = [
-    #             ("predict", "ma"),
-    #             ("time", "saledate"),
-    #         ]
-    #         binder = StatementBinder(StatementBinderContext(MagicMock()))
-
-    #         with self.assertRaises(BinderError) as cm:
-    #             binder._bind_create_function_statement(create_function_statement)
-
-    #         err_msg = "Unexpected column type found for forecasting function."
-    #         self.assertEqual(str(cm.exception), err_msg)
-
     def test_bind_create_function_should_raise_forecast_missing_required_columns(self):
         with patch.object(StatementBinder, "bind"):
             create_function_statement = MagicMock()

From 09bee128b3037d1ea535fcaa1a37feeec6cd6ede Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Fri, 29 Sep 2023 18:56:29 -0400
Subject: [PATCH 19/23] Fix horizon issue for multi uniqueids

---
 evadb/executor/create_function_executor.py            | 7 +++----
 evadb/functions/forecast.py                           | 2 +-
 evadb/utils/generic_utils.py                          | 1 +
 test/integration_tests/long/test_model_forecasting.py | 2 +-
 4 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index b61c368fa..bf624efb1 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -38,10 +38,10 @@
 from evadb.utils.generic_utils import (
     load_function_class_from_file,
     string_comparison_case_insensitive,
-    try_to_import_statsforecast,
-    try_to_import_neuralforecast,
     try_to_import_ludwig,
+    try_to_import_neuralforecast,
     try_to_import_sklearn,
+    try_to_import_statsforecast,
     try_to_import_torch,
     try_to_import_ultralytics,
 )
@@ -271,7 +271,6 @@ def handle_forecasting_function(self):
         )  # shortens longer frequencies like Q-DEC
         season_length = season_dict[new_freq] if new_freq in season_dict else 1
 
-
         """
             Neuralforecast implementation
         """
@@ -397,7 +396,7 @@ def handle_forecasting_function(self):
             if library == "neuralforecast":
                 model.fit(df=data, val_size=horizon)
             else:
-                model.fit(df=data[["ds","y","unique_id"]])
+                model.fit(df=data[["ds", "y", "unique_id"]])
             f = open(model_path, "wb")
             pickle.dump(model, f)
             f.close()
diff --git a/evadb/functions/forecast.py b/evadb/functions/forecast.py
index 3073ec13f..1571f6c4f 100644
--- a/evadb/functions/forecast.py
+++ b/evadb/functions/forecast.py
@@ -61,5 +61,5 @@ def forward(self, data) -> pd.DataFrame:
                 "ds": self.time_column_rename,
                 self.model_name: self.predict_column_rename,
             }
-        )[: self.horizon]
+        )[: self.horizon * forecast_df["unique_id"].nunique()]
         return forecast_df
diff --git a/evadb/utils/generic_utils.py b/evadb/utils/generic_utils.py
index 1f76fdd67..e99f8a06a 100644
--- a/evadb/utils/generic_utils.py
+++ b/evadb/utils/generic_utils.py
@@ -279,6 +279,7 @@ def try_to_import_statsforecast():
                 Please install it with `pip install statsforecast`."""
         )
 
+
 def try_to_import_neuralforecast():
     try:
         from neuralforecast import NeuralForecast  # noqa: F401
diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index f47ff328e..ab4f9ea8d 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -127,7 +127,7 @@ def test_forecast_with_column_rename(self):
                 WHERE bedrooms = 2
             )
             TYPE Forecasting
-            HORIZON 24
+            HORIZON 12
             PREDICT 'ma'
             ID 'type'
             TIME 'saledate'

From b4220006b78013778f113e3efa8f0ad6146c9d92 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Fri, 29 Sep 2023 19:29:17 -0400
Subject: [PATCH 20/23] update docs

---
 docs/source/reference/ai/model-forecasting.rst | 14 +++++++++++++-
 1 file changed, 13 insertions(+), 1 deletion(-)

diff --git a/docs/source/reference/ai/model-forecasting.rst b/docs/source/reference/ai/model-forecasting.rst
index a445e8cf5..a00381e72 100644
--- a/docs/source/reference/ai/model-forecasting.rst
+++ b/docs/source/reference/ai/model-forecasting.rst
@@ -73,8 +73,20 @@ Below is an example query specifying the above parameters:
    CREATE FUNCTION IF NOT EXISTS HomeRentalForecast FROM
    (SELECT saledate, ma, type FROM HomeData)
    TYPE Forecasting
+   HORIZON 12
    PREDICT 'ma'
    TIME 'saledate'
    ID 'type'
-   MODEL 'AutoCES'
    Frequency 'W';
+
+Below is an example query with `neuralforecast` with `trend` column as exogenous:
+
+.. code-block:: sql
+   
+    CREATE FUNCTION AirPanelForecast FROM
+    (SELECT unique_id, ds, y, trend FROM AirDataPanel)
+    TYPE Forecasting
+    HORIZON 12
+    PREDICT 'y'
+    LIBRARY 'neuralforecast'
+    FREQUENCY 'M';
\ No newline at end of file

From e176bd4062dfd95e613909379efc6fab448db0f8 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Sat, 30 Sep 2023 00:01:42 -0400
Subject: [PATCH 21/23] fix exogenous for auto; made default

---
 .../source/reference/ai/model-forecasting.rst | 13 +++---
 evadb/executor/create_function_executor.py    | 45 ++++++++++---------
 .../long/test_model_forecasting.py            |  2 +-
 3 files changed, 31 insertions(+), 29 deletions(-)

diff --git a/docs/source/reference/ai/model-forecasting.rst b/docs/source/reference/ai/model-forecasting.rst
index a00381e72..8285ad76b 100644
--- a/docs/source/reference/ai/model-forecasting.rst
+++ b/docs/source/reference/ai/model-forecasting.rst
@@ -57,14 +57,14 @@ EvaDB's default forecast framework is `statsforecast <https://nixtla.github.io/s
      - The name of column that represents an identifier for the series. If relevant column is not found, the whole table is considered as one series of data.
    * - LIBRARY (str, default: 'statsforecast')
      - We can select one of `statsforecast` (default) or `neuralforecast`. `statsforecast` provides access to statistical forecasting methods, while `neuralforecast` gives access to deep-learning based forecasting methods.
-   * - MODEL (str, default: 'AutoARIMA')
-     - If LIBRARY is `statsforecast`, we can select one of AutoARIMA, AutoCES, AutoETS, AutoTheta. The default is AutoARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models. If LIBRARY is `neuralforecast`, we can select one of NHITS or NBEATS. The default is NBEATS. Check `NBEATS docs <https://nixtla.github.io/neuralforecast/models.nbeats.html>`_ for details.
-   * - AUTO (str, default: 'F')
-     - The names of columns to be treated as exogenous variables, separated by comma. These columns would be considered for forecasting by the backend only for LIBRARY `neuralforecast`.
+   * - MODEL (str, default: 'ARIMA')
+     - If LIBRARY is `statsforecast`, we can select one of ARIMA, CES, ETS, Theta. The default is ARIMA. Check `Automatic Forecasting <https://nixtla.github.io/statsforecast/src/core/models_intro.html#automatic-forecasting>`_ to learn details about these models. If LIBRARY is `neuralforecast`, we can select one of NHITS or NBEATS. The default is NBEATS. Check `NBEATS docs <https://nixtla.github.io/neuralforecast/models.nbeats.html>`_ for details.
+   * - AUTO (str, default: 'T')
+     - If set to 'T', it enables automatic hyperparameter optimization. Must be set to 'T' for the `statsforecast` library. One may set this parameter to 'F' if LIBRARY is `neuralforecast` for faster (but less reliable) results. Only the first letter of the value is checked, case-insensitively, so 'true' and 'false' are also accepted.
    * - Frequency (str, default: 'auto')
      - A string indicating the frequency of the data. The common used ones are D, W, M, Y, which repestively represents day-, week-, month- and year- end frequency. The default value is M. Check `pandas available frequencies <https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#offset-aliases>`_ for all available frequencies. If it is not provided, the frequency is attempted to be determined automatically.
 
-Note: If columns other than the ones required as mentioned above are passed while creating the function, they will be treated as exogenous variables if LIBRARY is `neuralforecast` and the AUTO is set to F. In other situations, they would be ignored.
+Note: If columns other than the required ones mentioned above are passed while creating the function, they will be treated as exogenous variables if LIBRARY is `neuralforecast`. Otherwise, they are ignored.
 
 Below is an example query specifying the above parameters:
 
@@ -79,7 +79,7 @@ Below is an example query specifying the above parameters:
    ID 'type'
    Frequency 'W';
 
-Below is an example query with `neuralforecast` with `trend` column as exogenous:
+Below is an example query that uses `neuralforecast`, treats the `trend` column as an exogenous variable, and disables automatic hyperparameter optimization:
 
 .. code-block:: sql
    
@@ -89,4 +89,5 @@ Below is an example query with `neuralforecast` with `trend` column as exogenous
     HORIZON 12
     PREDICT 'y'
     LIBRARY 'neuralforecast'
+    AUTO 'f'
     FREQUENCY 'M';
\ No newline at end of file
diff --git a/evadb/executor/create_function_executor.py b/evadb/executor/create_function_executor.py
index bf624efb1..8f4b5ad27 100644
--- a/evadb/executor/create_function_executor.py
+++ b/evadb/executor/create_function_executor.py
@@ -290,9 +290,8 @@ def handle_forecasting_function(self):
             if "model" not in arg_map.keys():
                 arg_map["model"] = "NBEATS"
 
-            if (
-                "auto" in arg_map.keys()
-                and arg_map["auto"].lower()[0] == "t"
+            if "auto" not in arg_map.keys() or (
+                arg_map["auto"].lower()[0] == "t"
                 and "auto" not in arg_map["model"].lower()
             ):
                 arg_map["model"] = "Auto" + arg_map["model"]
@@ -307,15 +306,21 @@ def handle_forecasting_function(self):
 
             if "auto" not in arg_map["model"].lower():
                 model_args["input_size"] = 2 * horizon
-                if len(data.columns) >= 4:
-                    exogenous_columns = [
-                        x
-                        for x in list(data.columns)
-                        if x not in ["ds", "y", "unique_id"]
-                    ]
-                    model_args["hist_exog_list"] = exogenous_columns
-
                 model_args["early_stop_patience_steps"] = 20
+            else:
+                model_args["config"] = {
+                    "input_size": 2 * horizon,
+                    "early_stop_patience_steps": 20,
+                }
+
+            if len(data.columns) >= 4:
+                exogenous_columns = [
+                    x for x in list(data.columns) if x not in ["ds", "y", "unique_id"]
+                ]
+                if "auto" not in arg_map["model"].lower():
+                    model_args["hist_exog_list"] = exogenous_columns
+                else:
+                    model_args["config"]["hist_exog_list"] = exogenous_columns
 
             model_args["h"] = horizon
 
@@ -328,6 +333,10 @@ def handle_forecasting_function(self):
         #     Statsforecast implementation
         # """
         else:
+            if "auto" in arg_map.keys() and arg_map["auto"].lower()[0] != "t":
+                raise RuntimeError(
+                    "Statsforecast implementation only supports automatic hyperparameter optimization. Please set AUTO to true."
+                )
             try_to_import_statsforecast()
             from statsforecast import StatsForecast
             from statsforecast.models import AutoARIMA, AutoCES, AutoETS, AutoTheta
@@ -340,13 +349,9 @@ def handle_forecasting_function(self):
             }
 
             if "model" not in arg_map.keys():
-                arg_map["model"] = "AutoARIMA"
+                arg_map["model"] = "ARIMA"
 
-            if (
-                "auto" in arg_map.keys()
-                and arg_map["auto"].lower()[0] == "t"
-                and "auto" not in arg_map["model"].lower()
-            ):
+            if "auto" not in arg_map["model"].lower():
                 arg_map["model"] = "Auto" + arg_map["model"]
 
             try:
@@ -363,11 +368,7 @@ def handle_forecasting_function(self):
         data["ds"] = pd.to_datetime(data["ds"])
 
         model_save_dir_name = library + "_" + arg_map["model"] + "_" + new_freq
-        if (
-            len(data.columns) >= 4
-            and "auto" not in arg_map["model"].lower()
-            and library == "neuralforecast"
-        ):
+        if len(data.columns) >= 4 and library == "neuralforecast":
             model_save_dir_name += "_exogenous_" + str(sorted(exogenous_columns))
 
         model_dir = os.path.join(
diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index ab4f9ea8d..24b37db05 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -112,7 +112,7 @@ def test_forecast(self):
             SELECT AirPanelForecast() order by y;
         """
         result = execute_query_fetch_all(self.evadb, predict_query)
-        self.assertEqual(len(result), 12)
+        self.assertEqual(len(result), 24)
         self.assertEqual(
             result.columns,
             ["airpanelforecast.unique_id", "airpanelforecast.ds", "airpanelforecast.y"],

From 68265d3b138babfe4a20091bc5fa7a67b56072f5 Mon Sep 17 00:00:00 2001
From: americast <sayan.sinha@cc.gatech.edu>
Date: Sat, 30 Sep 2023 00:42:42 -0400
Subject: [PATCH 22/23] turn auto off for neuralforecast test to avoid TLE
 error

---
 test/integration_tests/long/test_model_forecasting.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/test/integration_tests/long/test_model_forecasting.py b/test/integration_tests/long/test_model_forecasting.py
index 24b37db05..47ffe65a8 100644
--- a/test/integration_tests/long/test_model_forecasting.py
+++ b/test/integration_tests/long/test_model_forecasting.py
@@ -104,6 +104,7 @@ def test_forecast(self):
             HORIZON 12
             PREDICT 'y'
             LIBRARY 'neuralforecast'
+            AUTO 'false'
             FREQUENCY 'M';
         """
         execute_query_fetch_all(self.evadb, create_predict_udf)

From 267443d52441709396fccbec13d1224ff38b6e25 Mon Sep 17 00:00:00 2001
From: Andy Xu <xzdandy@gmail.com>
Date: Sat, 30 Sep 2023 05:14:02 -0400
Subject: [PATCH 23/23] Update the Notebook

---
 tutorials/16-homesale-forecasting.ipynb | 232 ++++++++++++++----------
 1 file changed, 140 insertions(+), 92 deletions(-)

diff --git a/tutorials/16-homesale-forecasting.ipynb b/tutorials/16-homesale-forecasting.ipynb
index 82451bb69..82f0eafc1 100644
--- a/tutorials/16-homesale-forecasting.ipynb
+++ b/tutorials/16-homesale-forecasting.ipynb
@@ -8,7 +8,7 @@
       "collapsed_sections": [
         "GHToaA_NKiHY"
       ],
-      "authorship_tag": "ABX9TyO5CS+F9YOzKquzJseLZjOy"
+      "authorship_tag": "ABX9TyOZ3w3qGhWQ6hZO9onIutni"
     },
     "kernelspec": {
       "name": "python3",
@@ -70,7 +70,7 @@
           "base_uri": "https://localhost:8080/"
         },
         "id": "Z7PodOEEEDsQ",
-        "outputId": "37d49a92-bd41-4486-fad7-16ddecc88536"
+        "outputId": "7b01f944-0b6a-4c91-e7cd-0251d2b66ab1"
       },
       "execution_count": 1,
       "outputs": [
@@ -211,7 +211,7 @@
           "base_uri": "https://localhost:8080/"
         },
         "id": "UrlfWZOkEa4V",
-        "outputId": "4ab9906a-b4a1-4487-8f12-69b4efca2be5"
+        "outputId": "af5143e2-9e7c-45c9-fc2b-247f1d241ae4"
       },
       "execution_count": 2,
       "outputs": [
@@ -264,7 +264,7 @@
     {
       "cell_type": "code",
       "source": [
-        "%pip install --quiet \"evadb[postgres,forecasting] @ git+https://github.com/georgia-tech-db/evadb.git@736d9e0b3a876dba0bfae48a717c8c9561d24cb2\"\n",
+        "%pip install --quiet \"evadb[postgres,forecasting] @ git+https://github.com/georgia-tech-db/evadb.git@68265d3b138babfe4a20091bc5fa7a67b56072f5\"\n",
         "\n",
         "import evadb\n",
         "cursor = evadb.connect().cursor()"
@@ -274,7 +274,7 @@
           "base_uri": "https://localhost:8080/"
         },
         "id": "NoAykveeElqm",
-        "outputId": "90d07f6e-cf75-4ca4-85e3-867d7db7b49f"
+        "outputId": "e6a44278-1571-461f-c673-572400d3962f"
       },
       "execution_count": 4,
       "outputs": [
@@ -285,26 +285,26 @@
             "  Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n",
             "  Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n",
             "  Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m92.6/92.6 kB\u001b[0m \u001b[31m3.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m108.9/108.9 kB\u001b[0m \u001b[31m7.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m137.6/137.6 kB\u001b[0m \u001b[31m10.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m45.5/45.5 kB\u001b[0m \u001b[31m3.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m110.9/110.9 kB\u001b[0m \u001b[31m9.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m162.6/162.6 kB\u001b[0m \u001b[31m9.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m98.7/98.7 kB\u001b[0m \u001b[31m6.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m727.7/727.7 kB\u001b[0m \u001b[31m18.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.5/62.5 MB\u001b[0m \u001b[31m10.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m275.0/275.0 kB\u001b[0m \u001b[31m23.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.1/3.1 MB\u001b[0m \u001b[31m84.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m57.0/57.0 kB\u001b[0m \u001b[31m6.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m169.2/169.2 kB\u001b[0m \u001b[31m18.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m154.7/154.7 kB\u001b[0m \u001b[31m15.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m92.6/92.6 kB\u001b[0m \u001b[31m2.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m108.9/108.9 kB\u001b[0m \u001b[31m6.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m137.6/137.6 kB\u001b[0m \u001b[31m8.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m45.5/45.5 kB\u001b[0m \u001b[31m3.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m110.9/110.9 kB\u001b[0m \u001b[31m8.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m162.6/162.6 kB\u001b[0m \u001b[31m12.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m98.7/98.7 kB\u001b[0m \u001b[31m11.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m727.7/727.7 kB\u001b[0m \u001b[31m19.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.5/62.5 MB\u001b[0m \u001b[31m8.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m275.0/275.0 kB\u001b[0m \u001b[31m21.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.1/3.1 MB\u001b[0m \u001b[31m79.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m57.0/57.0 kB\u001b[0m \u001b[31m6.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m169.2/169.2 kB\u001b[0m \u001b[31m18.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m154.7/154.7 kB\u001b[0m \u001b[31m19.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
             "\u001b[?25h  Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m313.3/313.3 kB\u001b[0m \u001b[31m27.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m805.2/805.2 kB\u001b[0m \u001b[31m60.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m101.7/101.7 kB\u001b[0m \u001b[31m12.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m144.2/144.2 kB\u001b[0m \u001b[31m17.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
-            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m135.3/135.3 kB\u001b[0m \u001b[31m13.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m313.3/313.3 kB\u001b[0m \u001b[31m28.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m805.2/805.2 kB\u001b[0m \u001b[31m63.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m101.7/101.7 kB\u001b[0m \u001b[31m12.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m144.2/144.2 kB\u001b[0m \u001b[31m17.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m135.3/135.3 kB\u001b[0m \u001b[31m13.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
             "\u001b[?25h  Building wheel for evadb (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
             "  Building wheel for fugue-sql-antlr (setup.py) ... \u001b[?25l\u001b[?25hdone\n"
           ]
@@ -314,7 +314,7 @@
           "name": "stderr",
           "text": [
             "Downloading: \"http://ml.cs.tsinghua.edu.cn/~chenxi/pytorch-models/mnist-b07bb66b.pth\" to /root/.cache/torch/hub/checkpoints/mnist-b07bb66b.pth\n",
-            "100%|██████████| 1.03M/1.03M [00:01<00:00, 723kB/s] \n",
+            "100%|██████████| 1.03M/1.03M [00:01<00:00, 745kB/s]\n",
             "Downloading: \"https://download.pytorch.org/models/fasterrcnn_resnet50_fpn_coco-258fb6c6.pth\" to /root/.cache/torch/hub/checkpoints/fasterrcnn_resnet50_fpn_coco-258fb6c6.pth\n"
           ]
         }
@@ -356,10 +356,10 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 80
+          "height": 0
         },
         "id": "IsP6rLZ2Ftxo",
-        "outputId": "f8ab8a89-739c-42f5-fa9b-353d4e471251"
+        "outputId": "9260345f-eb8f-4f19-e1a4-9078ca6e1da3"
       },
       "execution_count": 5,
       "outputs": [
@@ -372,7 +372,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-a33adaa7-4ec6-4065-a69d-cc379f825855\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-29ae7fc7-40ef-40c7-b947-6548b58f4cfd\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -405,7 +405,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-a33adaa7-4ec6-4065-a69d-cc379f825855')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-29ae7fc7-40ef-40c7-b947-6548b58f4cfd')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -457,12 +457,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-a33adaa7-4ec6-4065-a69d-cc379f825855 button.colab-df-convert');\n",
+              "        document.querySelector('#df-29ae7fc7-40ef-40c7-b947-6548b58f4cfd button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-a33adaa7-4ec6-4065-a69d-cc379f825855');\n",
+              "        const element = document.querySelector('#df-29ae7fc7-40ef-40c7-b947-6548b58f4cfd');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -524,10 +524,10 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 80
+          "height": 0
         },
         "id": "MhYfovbzNB-k",
-        "outputId": "b8bb6814-2aab-4a54-cf63-7cf44d183628"
+        "outputId": "d9a17118-c063-419f-8bc8-5ca0552c0769"
       },
       "execution_count": 7,
       "outputs": [
@@ -540,7 +540,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-f85ea85d-bae8-465c-93a3-85a95523d220\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-4d0cdb80-4eee-4d94-aa91-5aebfd7fb52e\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -573,7 +573,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-f85ea85d-bae8-465c-93a3-85a95523d220')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-4d0cdb80-4eee-4d94-aa91-5aebfd7fb52e')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -625,12 +625,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-f85ea85d-bae8-465c-93a3-85a95523d220 button.colab-df-convert');\n",
+              "        document.querySelector('#df-4d0cdb80-4eee-4d94-aa91-5aebfd7fb52e button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-f85ea85d-bae8-465c-93a3-85a95523d220');\n",
+              "        const element = document.querySelector('#df-4d0cdb80-4eee-4d94-aa91-5aebfd7fb52e');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -672,10 +672,10 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 80
+          "height": 0
         },
         "id": "OH8Fxn0SNYO3",
-        "outputId": "58ceacff-f392-4f27-c8ef-0873b81ba943"
+        "outputId": "f4644c76-34e6-40e2-cc1b-97ce126fbec8"
       },
       "execution_count": 8,
       "outputs": [
@@ -688,7 +688,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-c862d78f-e497-4ce9-b8ba-7866064c775a\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-e3785f9c-3835-4927-8f61-ebf3df88ad0f\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -721,7 +721,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-c862d78f-e497-4ce9-b8ba-7866064c775a')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-e3785f9c-3835-4927-8f61-ebf3df88ad0f')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -773,12 +773,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-c862d78f-e497-4ce9-b8ba-7866064c775a button.colab-df-convert');\n",
+              "        document.querySelector('#df-e3785f9c-3835-4927-8f61-ebf3df88ad0f button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-c862d78f-e497-4ce9-b8ba-7866064c775a');\n",
+              "        const element = document.querySelector('#df-e3785f9c-3835-4927-8f61-ebf3df88ad0f');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -829,10 +829,10 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 143
+          "height": 0
         },
         "id": "20_IEby7N1Pe",
-        "outputId": "d0fc448b-7d7d-470d-d344-b877621cfc29"
+        "outputId": "814eed8d-08a6-461c-f4db-c69df70eaa8e"
       },
       "execution_count": 9,
       "outputs": [
@@ -852,7 +852,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-9c810f53-59bd-43f3-888d-bfa546e8809c\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-0e563703-5371-4843-9922-706e50252362\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -909,7 +909,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-9c810f53-59bd-43f3-888d-bfa546e8809c')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-0e563703-5371-4843-9922-706e50252362')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -961,12 +961,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-9c810f53-59bd-43f3-888d-bfa546e8809c button.colab-df-convert');\n",
+              "        document.querySelector('#df-0e563703-5371-4843-9922-706e50252362 button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-9c810f53-59bd-43f3-888d-bfa546e8809c');\n",
+              "        const element = document.querySelector('#df-0e563703-5371-4843-9922-706e50252362');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -986,8 +986,8 @@
               "  </div>\n",
               "\n",
               "\n",
-              "<div id=\"df-51a3551f-c044-4495-8869-677d2a65d50b\">\n",
-              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-51a3551f-c044-4495-8869-677d2a65d50b')\"\n",
+              "<div id=\"df-ccb7f586-ad2f-4319-ac4e-a77adfc48df2\">\n",
+              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-ccb7f586-ad2f-4319-ac4e-a77adfc48df2')\"\n",
               "            title=\"Suggest charts.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1106,7 +1106,7 @@
               "    }\n",
               "    (() => {\n",
               "      let quickchartButtonEl =\n",
-              "        document.querySelector('#df-51a3551f-c044-4495-8869-677d2a65d50b button');\n",
+              "        document.querySelector('#df-ccb7f586-ad2f-4319-ac4e-a77adfc48df2 button');\n",
               "      quickchartButtonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "    })();\n",
@@ -1166,7 +1166,7 @@
           "height": 98
         },
         "id": "IFstPBI8UINv",
-        "outputId": "4a2d9c7b-cfb4-46df-a4c6-1a13c4da7b89"
+        "outputId": "018c4b18-0b3f-4abe-f3b7-2fdb72314303"
       },
       "execution_count": 10,
       "outputs": [
@@ -1186,7 +1186,7 @@
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-26fdae5c-6067-428e-bbb3-c53153ab4b8e\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-3e5e52d8-7246-48e9-9de9-bde38db4377e\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -1219,7 +1219,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-26fdae5c-6067-428e-bbb3-c53153ab4b8e')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-3e5e52d8-7246-48e9-9de9-bde38db4377e')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1271,12 +1271,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-26fdae5c-6067-428e-bbb3-c53153ab4b8e button.colab-df-convert');\n",
+              "        document.querySelector('#df-3e5e52d8-7246-48e9-9de9-bde38db4377e button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-26fdae5c-6067-428e-bbb3-c53153ab4b8e');\n",
+              "        const element = document.querySelector('#df-3e5e52d8-7246-48e9-9de9-bde38db4377e');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -1322,10 +1322,10 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 143
+          "height": 238
         },
         "id": "_7m-QQG5U3_C",
-        "outputId": "6c0ce026-2da0-4177-a905-2adc952e003a"
+        "outputId": "1382ac30-d554-4ea5-e4c9-c7b4a73d28c0"
       },
       "execution_count": 11,
       "outputs": [
@@ -1337,15 +1337,21 @@
               "0                         house                2019-07-21   \n",
               "1                         house                2019-07-28   \n",
               "2                         house                2019-08-04   \n",
+              "3                          unit                2018-12-23   \n",
+              "4                          unit                2018-12-30   \n",
+              "5                          unit                2019-01-06   \n",
               "\n",
               "   homesaleforecast.price  \n",
-              "0             766572.9375  \n",
-              "1             766572.9375  \n",
-              "2             766572.9375  "
+              "0            766572.93750  \n",
+              "1            766572.93750  \n",
+              "2            766572.93750  \n",
+              "3            417229.78125  \n",
+              "4            409601.65625  \n",
+              "5            402112.96875  "
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-aa8b966b-71d0-40a1-9a89-3da41a56f161\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-b8a75a44-e813-4591-bbe6-c74e1d18f1aa\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -1374,19 +1380,37 @@
               "      <th>0</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-21</td>\n",
-              "      <td>766572.9375</td>\n",
+              "      <td>766572.93750</td>\n",
               "    </tr>\n",
               "    <tr>\n",
               "      <th>1</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-28</td>\n",
-              "      <td>766572.9375</td>\n",
+              "      <td>766572.93750</td>\n",
               "    </tr>\n",
               "    <tr>\n",
               "      <th>2</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-08-04</td>\n",
-              "      <td>766572.9375</td>\n",
+              "      <td>766572.93750</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>3</th>\n",
+              "      <td>unit</td>\n",
+              "      <td>2018-12-23</td>\n",
+              "      <td>417229.78125</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>4</th>\n",
+              "      <td>unit</td>\n",
+              "      <td>2018-12-30</td>\n",
+              "      <td>409601.65625</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>5</th>\n",
+              "      <td>unit</td>\n",
+              "      <td>2019-01-06</td>\n",
+              "      <td>402112.96875</td>\n",
               "    </tr>\n",
               "  </tbody>\n",
               "</table>\n",
@@ -1394,7 +1418,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-aa8b966b-71d0-40a1-9a89-3da41a56f161')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-b8a75a44-e813-4591-bbe6-c74e1d18f1aa')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1446,12 +1470,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-aa8b966b-71d0-40a1-9a89-3da41a56f161 button.colab-df-convert');\n",
+              "        document.querySelector('#df-b8a75a44-e813-4591-bbe6-c74e1d18f1aa button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-aa8b966b-71d0-40a1-9a89-3da41a56f161');\n",
+              "        const element = document.querySelector('#df-b8a75a44-e813-4591-bbe6-c74e1d18f1aa');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -1471,8 +1495,8 @@
               "  </div>\n",
               "\n",
               "\n",
-              "<div id=\"df-bddb3e5c-c7e2-421e-a4f5-c640ba0a210a\">\n",
-              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-bddb3e5c-c7e2-421e-a4f5-c640ba0a210a')\"\n",
+              "<div id=\"df-41b652c8-2bb2-4dc5-b6f0-067ec80ebe1e\">\n",
+              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-41b652c8-2bb2-4dc5-b6f0-067ec80ebe1e')\"\n",
               "            title=\"Suggest charts.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1591,7 +1615,7 @@
               "    }\n",
               "    (() => {\n",
               "      let quickchartButtonEl =\n",
-              "        document.querySelector('#df-bddb3e5c-c7e2-421e-a4f5-c640ba0a210a button');\n",
+              "        document.querySelector('#df-41b652c8-2bb2-4dc5-b6f0-067ec80ebe1e button');\n",
               "      quickchartButtonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "    })();\n",
@@ -1623,10 +1647,10 @@
       "metadata": {
         "colab": {
           "base_uri": "https://localhost:8080/",
-          "height": 143
+          "height": 238
         },
         "id": "abmrZiOzVO5S",
-        "outputId": "350a729c-5859-4a43-fb00-dc193622a5a3"
+        "outputId": "8bb5f0f0-38a2-4b0a-88b3-3b721c7e69d5"
       },
       "execution_count": 12,
       "outputs": [
@@ -1635,18 +1659,24 @@
           "data": {
             "text/plain": [
               "  homesaleforecast.propertytype homesaleforecast.datesold  \\\n",
-              "0                         house                2019-07-21   \n",
-              "1                         house                2019-07-28   \n",
-              "2                         house                2019-08-04   \n",
+              "0                          unit                2019-01-06   \n",
+              "1                          unit                2018-12-30   \n",
+              "2                          unit                2018-12-23   \n",
+              "3                         house                2019-07-21   \n",
+              "4                         house                2019-07-28   \n",
+              "5                         house                2019-08-04   \n",
               "\n",
               "   homesaleforecast.price  \n",
-              "0             766572.9375  \n",
-              "1             766572.9375  \n",
-              "2             766572.9375  "
+              "0            402112.96875  \n",
+              "1            409601.65625  \n",
+              "2            417229.78125  \n",
+              "3            766572.93750  \n",
+              "4            766572.93750  \n",
+              "5            766572.93750  "
             ],
             "text/html": [
               "\n",
-              "  <div id=\"df-b84874cd-af94-4832-bc14-36045810ecde\" class=\"colab-df-container\">\n",
+              "  <div id=\"df-9171c022-047f-4486-9c15-5944c7164286\" class=\"colab-df-container\">\n",
               "    <div>\n",
               "<style scoped>\n",
               "    .dataframe tbody tr th:only-of-type {\n",
@@ -1673,21 +1703,39 @@
               "  <tbody>\n",
               "    <tr>\n",
               "      <th>0</th>\n",
+              "      <td>unit</td>\n",
+              "      <td>2019-01-06</td>\n",
+              "      <td>402112.96875</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>1</th>\n",
+              "      <td>unit</td>\n",
+              "      <td>2018-12-30</td>\n",
+              "      <td>409601.65625</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>2</th>\n",
+              "      <td>unit</td>\n",
+              "      <td>2018-12-23</td>\n",
+              "      <td>417229.78125</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>3</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-21</td>\n",
-              "      <td>766572.9375</td>\n",
+              "      <td>766572.93750</td>\n",
               "    </tr>\n",
               "    <tr>\n",
-              "      <th>1</th>\n",
+              "      <th>4</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-07-28</td>\n",
-              "      <td>766572.9375</td>\n",
+              "      <td>766572.93750</td>\n",
               "    </tr>\n",
               "    <tr>\n",
-              "      <th>2</th>\n",
+              "      <th>5</th>\n",
               "      <td>house</td>\n",
               "      <td>2019-08-04</td>\n",
-              "      <td>766572.9375</td>\n",
+              "      <td>766572.93750</td>\n",
               "    </tr>\n",
               "  </tbody>\n",
               "</table>\n",
@@ -1695,7 +1743,7 @@
               "    <div class=\"colab-df-buttons\">\n",
               "\n",
               "  <div class=\"colab-df-container\">\n",
-              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-b84874cd-af94-4832-bc14-36045810ecde')\"\n",
+              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-9171c022-047f-4486-9c15-5944c7164286')\"\n",
               "            title=\"Convert this dataframe to an interactive table.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1747,12 +1795,12 @@
               "\n",
               "    <script>\n",
               "      const buttonEl =\n",
-              "        document.querySelector('#df-b84874cd-af94-4832-bc14-36045810ecde button.colab-df-convert');\n",
+              "        document.querySelector('#df-9171c022-047f-4486-9c15-5944c7164286 button.colab-df-convert');\n",
               "      buttonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "\n",
               "      async function convertToInteractive(key) {\n",
-              "        const element = document.querySelector('#df-b84874cd-af94-4832-bc14-36045810ecde');\n",
+              "        const element = document.querySelector('#df-9171c022-047f-4486-9c15-5944c7164286');\n",
               "        const dataTable =\n",
               "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
               "                                                    [key], {});\n",
@@ -1772,8 +1820,8 @@
               "  </div>\n",
               "\n",
               "\n",
-              "<div id=\"df-78abaefd-84fb-41e0-ac5e-a231b6feda2e\">\n",
-              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-78abaefd-84fb-41e0-ac5e-a231b6feda2e')\"\n",
+              "<div id=\"df-f8f058a9-86dc-41a1-9c67-2e6bb752a956\">\n",
+              "  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-f8f058a9-86dc-41a1-9c67-2e6bb752a956')\"\n",
               "            title=\"Suggest charts.\"\n",
               "            style=\"display:none;\">\n",
               "\n",
@@ -1892,7 +1940,7 @@
               "    }\n",
               "    (() => {\n",
               "      let quickchartButtonEl =\n",
-              "        document.querySelector('#df-78abaefd-84fb-41e0-ac5e-a231b6feda2e button');\n",
+              "        document.querySelector('#df-f8f058a9-86dc-41a1-9c67-2e6bb752a956 button');\n",
               "      quickchartButtonEl.style.display =\n",
               "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
               "    })();\n",