Lumiwealth · brettelliot · Nov 28, 2024 · Dec 9, 2024 · Dec 9, 2024 · Dec 9, 2024
@@ -412,8 +412,11 @@ def get_start_datetime_and_ts_unit(self, length, timestep, start_dt=None, start_
         # Convert timestep string to timedelta and get start datetime
         td, ts_unit = self.convert_timestep_str_to_timedelta(timestep)
 
-        # Multiply td by length to get the end datetime
-        td *= length
+        if ts_unit == "day":
+            # Scale td by length * 1.5 (overflow) and add 3 days for long weekends; td is the span subtracted from start_dt below
+            td = (td * length * 1.5) + timedelta(days=3)
+        else:
+            td *= length
 
         if start_dt is not None:
             start_datetime = start_dt - td

diff --git a/lumibot/entities/data.py b/lumibot/entities/data.py
@@ -480,6 +480,11 @@ def _get_bars_dict(self, dt, length=1, timestep=None, timeshift=0):
 
         # Get bars.
         end_row = self.get_iter_count(dt) - timeshift
+        if self.df.index[end_row] != dt:
+            # If dt is not in the dataframe, get_iter_count returns the last bar before dt, which is end_row.
+            # That bar must be included, and the selection at the end is exclusive of end_row, so add 1 here.
+            # NOTE(review): end_row already has timeshift subtracted, so with timeshift != 0 this may fire even when dt is present - confirm.
+            end_row += 1
         start_row = end_row - length
 
         if start_row < 0:

@@ -411,20 +411,6 @@ def get_missing_dates(df_all, asset, start, end):
     dates = pd.Series(df_all.index.date).unique()
     missing_dates = sorted(set(trading_dates) - set(dates))
 
-    # TODO: This code works AFAIK, But when i enable it the tests for "test_polygon_missing_day_caching" and
-    # i don't know why nor how to fix this code or the tests. So im leaving it disabled for now. If you have problems
-    # with NANs in cached polygon data, you can try to enable this code and fix the tests.
-
-    # # Find any dates with nan values in the df_all DataFrame
-    # missing_dates += df_all[df_all.isnull().all(axis=1)].index.date.tolist()
-    #
-    # # make sure the dates are unique
-    # missing_dates = list(set(missing_dates))
-    # missing_dates.sort()
-    #
-    # # finally, filter out any dates that are not in start/end range (inclusive)
-    # missing_dates = [d for d in missing_dates if start.date() <= d <= end.date()]
-
     return missing_dates
 
 

@@ -17,9 +17,7 @@
 
 # Global parameters
 # API Key for testing Polygon.io
-POLYGON_API_KEY = os.environ.get("POLYGON_API_KEY")
-POLYGON_IS_PAID_SUBSCRIPTION = os.getenv("POLYGON_IS_PAID_SUBSCRIPTION", "true").lower() not in {'false', '0', 'f', 'n', 'no'}
-
+from lumibot.credentials import POLYGON_CONFIG
 
 class TestExampleStrategies:
     def test_stock_bracket(self):
@@ -208,7 +206,14 @@ def test_limit_and_trailing_stops(self):
         assert round(results["total_return"] * 100, 1) >= 0.7
         assert round(results["max_drawdown"]["drawdown"] * 100, 1) <= 0.2
 
-    @pytest.mark.skipif(POLYGON_API_KEY == '<your key here>', reason="This test requires a Polygon.io API key")
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["API_KEY"],
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        POLYGON_CONFIG['API_KEY'] == '<your key here>',
+        reason="This test requires a Polygon.io API key"
+    )
     def test_options_hold_to_expiry(self):
         """
         Test the example strategy OptionsHoldToExpiry by running a backtest and checking that the strategy object is
@@ -227,7 +232,7 @@ def test_options_hold_to_expiry(self):
             show_plot=False,
             show_tearsheet=False,
             save_tearsheet=False,
-            polygon_api_key=POLYGON_API_KEY,
+            polygon_api_key=POLYGON_CONFIG["API_KEY"],
         )
 
         trades_df = strat_obj.broker._trade_event_log_df

@@ -20,8 +20,7 @@
 from datetime import timedelta
 
 # Global parameters
-# API Key for testing Polygon.io
-from lumibot.credentials import POLYGON_API_KEY
+from lumibot.credentials import POLYGON_CONFIG
 
 
 class PolygonBacktestStrat(Strategy):
@@ -204,7 +203,18 @@ def verify_backtest_results(self, poly_strat_obj):
         )
         assert "fill" not in poly_strat_obj.order_time_tracker[stoploss_order_id]
 
-    @pytest.mark.skipif(POLYGON_API_KEY == '<your key here>', reason="This test requires a Polygon.io API key")
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["API_KEY"],
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        POLYGON_CONFIG['API_KEY'] == '<your key here>',
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["IS_PAID_SUBSCRIPTION"],
+        reason="This test requires a paid Polygon.io API key"
+    )
     def test_polygon_restclient(self):
         """
         Test Polygon REST Client with Lumibot Backtesting and real API calls to Polygon. Using the Amazon stock
@@ -219,7 +229,7 @@ def test_polygon_restclient(self):
         data_source = PolygonDataBacktesting(
             datetime_start=backtesting_start,
             datetime_end=backtesting_end,
-            api_key=POLYGON_API_KEY,
+            api_key=POLYGON_CONFIG['API_KEY'],
         )
         broker = BacktestingBroker(data_source=data_source)
         poly_strat_obj = PolygonBacktestStrat(
@@ -232,7 +242,18 @@ def test_polygon_restclient(self):
         assert results
         self.verify_backtest_results(poly_strat_obj)
 
-    @pytest.mark.skipif(POLYGON_API_KEY == '<your key here>', reason="This test requires a Polygon.io API key")
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["API_KEY"],
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        POLYGON_CONFIG['API_KEY'] == '<your key here>',
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["IS_PAID_SUBSCRIPTION"],
+        reason="This test requires a paid Polygon.io API key"
+    )
     def test_intraday_daterange(self):
         tzinfo = pytz.timezone("America/New_York")
         backtesting_start = datetime.datetime(2024, 2, 7).astimezone(tzinfo)
@@ -241,7 +262,7 @@ def test_intraday_daterange(self):
         data_source = PolygonDataBacktesting(
             datetime_start=backtesting_start,
             datetime_end=backtesting_end,
-            api_key=POLYGON_API_KEY,
+            api_key=POLYGON_CONFIG['API_KEY'],
         )
         broker = BacktestingBroker(data_source=data_source)
         poly_strat_obj = PolygonBacktestStrat(
@@ -256,7 +277,18 @@ def test_intraday_daterange(self):
         # Assert the end datetime is before the market open of the next trading day.
         assert broker.datetime == datetime.datetime.fromisoformat("2024-02-12 08:30:00-05:00")
 
-    @pytest.mark.skipif(POLYGON_API_KEY == '<your key here>', reason="This test requires a Polygon.io API key")
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["API_KEY"],
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        POLYGON_CONFIG['API_KEY'] == '<your key here>',
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["IS_PAID_SUBSCRIPTION"],
+        reason="This test requires a paid Polygon.io API key"
+    )
     def test_polygon_legacy_backtest(self):
         """
         Do the same backtest as test_polygon_restclient() but using the legacy backtest() function call instead of
@@ -283,7 +315,18 @@ def test_polygon_legacy_backtest(self):
         assert results
         self.verify_backtest_results(poly_strat_obj)
 
-    @pytest.mark.skipif(POLYGON_API_KEY == '<your key here>', reason="This test requires a Polygon.io API key")
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["API_KEY"],
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        POLYGON_CONFIG['API_KEY'] == '<your key here>',
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["IS_PAID_SUBSCRIPTION"],
+        reason="This test requires a paid Polygon.io API key"
+    )
     def test_polygon_legacy_backtest2(self):
         """Test that the legacy backtest() function call works without returning the startegy object"""
         # Parameters: True = Live Trading | False = Backtest
@@ -300,7 +343,7 @@ def test_polygon_legacy_backtest2(self):
             show_plot=False,
             show_tearsheet=False,
             save_tearsheet=False,
-            polygon_api_key=POLYGON_API_KEY,  # Testing the legacy parameter name while DeprecationWarning is active
+            polygon_api_key=POLYGON_CONFIG['API_KEY'],  # Testing the legacy parameter name while DeprecationWarning is active
         )
         assert results
 
@@ -349,14 +392,25 @@ def test_pull_source_symbol_bars_with_api_call(self, polygon_data_backtesting, m
 
 class TestPolygonDataSource:
 
-    @pytest.mark.skipif(POLYGON_API_KEY == '<your key here>', reason="This test requires a Polygon.io API key")
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["API_KEY"],
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        POLYGON_CONFIG['API_KEY'] == '<your key here>',
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["IS_PAID_SUBSCRIPTION"],
+        reason="This test requires a paid Polygon.io API key"
+    )
     def test_get_historical_prices(self):
         tzinfo = pytz.timezone("America/New_York")
         start = datetime.datetime(2024, 2, 5).astimezone(tzinfo)
         end = datetime.datetime(2024, 2, 10).astimezone(tzinfo)
 
         data_source = PolygonDataBacktesting(
-            start, end, api_key=POLYGON_API_KEY
+            start, end, api_key=POLYGON_CONFIG['API_KEY']
         )
         data_source._datetime = datetime.datetime(2024, 2, 7, 10).astimezone(tzinfo)
         # This call will set make the data source use minute bars.

@@ -16,9 +16,7 @@
 from lumibot.tools import get_trading_days
 
 # Global parameters
-# API Key for testing Polygon.io
-from lumibot.credentials import POLYGON_API_KEY
-from lumibot.credentials import TRADIER_CONFIG, ALPACA_CONFIG
+from lumibot.credentials import TRADIER_CONFIG, ALPACA_CONFIG, POLYGON_CONFIG
 
 
 logger = logging.getLogger(__name__)
@@ -59,7 +57,20 @@ class TestDatasourceBacktestingGetHistoricalPricesDailyData:
     @classmethod
     def setup_class(cls):
         pass
-
+
+    # noinspection PyMethodMayBeStatic
+    def get_first_trading_day_after_thanksgiving(self, year):  # test helper; `year` is the calendar year to evaluate
+        # Thanksgiving is the fourth Thursday in November: step from Nov 1 to the first Thursday (weekday 3), then add 21 days
+        thanksgiving = datetime(year, 11, 1) + timedelta(days=(3 - datetime(year, 11, 1).weekday() + 28) % 7 + 21)
+        # The day after Thanksgiving (a Friday) is used as the first trading day after the holiday
+        first_trading_day = thanksgiving + timedelta(days=1)
+
+        # Defensive roll-forward to Monday if that day were a weekend; it is a Friday by construction, so this is not expected to run
+        if first_trading_day.weekday() >= 5:  # 5 = Saturday, 6 = Sunday
+            first_trading_day += timedelta(days=(7 - first_trading_day.weekday()))
+
+        return first_trading_day  # built from datetime(year, 11, 1), so no tzinfo is attached
+
     # noinspection PyMethodMayBeStatic
     def check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(
             self, bars: Bars,
@@ -117,6 +128,13 @@ def check_dividends_and_adjusted_returns(self, bars):
             rtol=0
         )
 
+    def test_get_first_trading_day_after_thanksgiving(self):  # checks the Thanksgiving helper against two known years
+        first_trading_day_after_thanksgiving = self.get_first_trading_day_after_thanksgiving(2019)
+        assert first_trading_day_after_thanksgiving == datetime(2019, 11, 29)  # Thanksgiving 2019 was Thursday, Nov 28
+
+        first_trading_day_after_thanksgiving = self.get_first_trading_day_after_thanksgiving(2023)
+        assert first_trading_day_after_thanksgiving == datetime(2023, 11, 24)  # Thanksgiving 2023 was Thursday, Nov 23
+
     def test_pandas_backtesting_data_source_get_historical_prices_daily_bars(self, pandas_data_fixture):
         """
         This tests that the pandas data_source calculates adjusted returns for bars and that they
@@ -131,20 +149,65 @@ def test_pandas_backtesting_data_source_get_historical_prices_daily_bars(self, p
         )
         bars = data_source.get_historical_prices(asset=self.asset, length=self.length, timestep=self.timestep)
         check_bars(bars=bars, length=self.length)
-        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(bars, backtesting_start=backtesting_start)
+        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(
+            bars,
+            backtesting_start=backtesting_start
+        )
         self.check_dividends_and_adjusted_returns(bars)
 
-    @pytest.mark.skip(reason="This test exposes a possible bug in data.py that we have not investigated yet.")
-    @pytest.mark.skipif(POLYGON_API_KEY == '<your key here>', reason="This test requires a Polygon.io API key")
+        # First trading day after Thanksgiving test
+        backtesting_start = datetime(2019, 11, 2)
+        backtesting_end = self.get_first_trading_day_after_thanksgiving(2019)
+        data_source = PandasData(
+            datetime_start=backtesting_start,
+            datetime_end=backtesting_end,
+            pandas_data=pandas_data_fixture
+        )
+        bars = data_source.get_historical_prices(asset=self.asset, length=self.length, timestep=self.timestep)
+        check_bars(bars=bars, length=self.length)
+        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(
+            bars,
+            backtesting_start=backtesting_start
+        )
+
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["API_KEY"],
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        POLYGON_CONFIG['API_KEY'] == '<your key here>',
+        reason="This test requires a Polygon.io API key"
+    )
+    @pytest.mark.skipif(
+        not POLYGON_CONFIG["IS_PAID_SUBSCRIPTION"],
+        reason="This test requires a paid Polygon.io API key"
+    )
     def test_polygon_backtesting_data_source_get_historical_prices_daily_bars(self):
-        backtesting_end = datetime.now() - timedelta(days=1)
-        backtesting_start = backtesting_end - timedelta(days=self.length * 2 + 5)
+        last_year = datetime.now().year - 1  # previous calendar year, so both windows below use fixed dates in the past
+        backtesting_start = datetime(last_year, 3, 25)
+        backtesting_end = datetime(last_year, 4, 25)
         data_source = PolygonDataBacktesting(
-            backtesting_start, backtesting_end, api_key=POLYGON_API_KEY
+            backtesting_start, backtesting_end, api_key=POLYGON_CONFIG["API_KEY"]
         )
         bars = data_source.get_historical_prices(asset=self.asset, length=self.length, timestep=self.timestep)
         check_bars(bars=bars, length=self.length)
-        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(bars, backtesting_start=backtesting_start)
+        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(
+            bars,
+            backtesting_start=backtesting_start
+        )
+
+        # Second scenario: the backtest window ends on the first trading day after Thanksgiving
+        backtesting_start = datetime(last_year, 11, 2)
+        backtesting_end = self.get_first_trading_day_after_thanksgiving(last_year)
+        data_source = PolygonDataBacktesting(
+            backtesting_start, backtesting_end, api_key=POLYGON_CONFIG["API_KEY"]
+        )
+        bars = data_source.get_historical_prices(asset=self.asset, length=self.length, timestep=self.timestep)
+        check_bars(bars=bars, length=self.length)
+        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(
+            bars,
+            backtesting_start=backtesting_start
+        )
 
     def test_yahoo_backtesting_data_source_get_historical_prices_daily_bars(self, pandas_data_fixture):
         """
@@ -161,10 +224,27 @@ def test_yahoo_backtesting_data_source_get_historical_prices_daily_bars(self, pa
         bars = data_source.get_historical_prices(asset=self.asset, length=self.length, timestep=self.timestep)
         check_bars(bars=bars, length=self.length)
         self.check_dividends_and_adjusted_returns(bars)
-        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(bars, backtesting_start=backtesting_start)
+        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(
+            bars,
+            backtesting_start=backtesting_start
+        )
+
+        # First trading day after Thanksgiving test
+        backtesting_start = datetime(2019, 11, 2)
+        backtesting_end = self.get_first_trading_day_after_thanksgiving(2019)
+        data_source = YahooDataBacktesting(
+            datetime_start=backtesting_start,
+            datetime_end=backtesting_end,
+            pandas_data=pandas_data_fixture
+        )
+        bars = data_source.get_historical_prices(asset=self.asset, length=self.length, timestep=self.timestep)
+        check_bars(bars=bars, length=self.length)
+        self.check_date_of_last_bar_is_date_of_last_trading_date_before_backtest_start(
+            bars,
+            backtesting_start=backtesting_start
+        )
 
 
-# @pytest.mark.skip()
 class TestDatasourceGetHistoricalPricesDailyData:
     """These tests check the daily Bars returned from get_historical_prices for live data sources."""
 
@@ -202,8 +282,10 @@ def check_date_of_last_bar_is_correct_for_live_data_sources(self, bars):
             # if it's not a trading day, the last bar the bar should from the last trading day
             assert bars.df.index[-1].date() == self.trading_days.index[-1].date()
 
-    # @pytest.mark.skip()
-    @pytest.mark.skipif(not ALPACA_CONFIG['API_KEY'], reason="This test requires an alpaca API key")
+    @pytest.mark.skipif(
+        not ALPACA_CONFIG['API_KEY'],
+        reason="This test requires an alpaca API key"
+    )
     @pytest.mark.skipif(
         ALPACA_CONFIG['API_KEY'] == '<your key here>',
         reason="This test requires an alpaca API key"
@@ -225,7 +307,6 @@ def test_alpaca_data_source_get_historical_prices_daily_bars(self):
         check_bars(bars=bars, length=1, check_timezone=False)
         self.check_date_of_last_bar_is_correct_for_live_data_sources(bars)
 
-    # @pytest.mark.skip()
     @pytest.mark.skipif(not TRADIER_CONFIG['ACCESS_TOKEN'], reason="No Tradier credentials provided.")
     def test_tradier_data_source_get_historical_prices_daily_bars(self):
         data_source = TradierData(