pandas-dev · AbhijitPatill · Jul 19, 2025 · Jul 19, 2025
diff --git a/bad_lines.csv b/bad_lines.csv
@@ -0,0 +1,4 @@
+name,age
+Alice,30
+Bob,not_a_number
+Charlie,40,extra_column
diff --git a/n_bad_lines-parserwarning b/n_bad_lines-parserwarning
diff --git a/pandas/io/parsers/readers.py b/pandas/io/parsers/readers.py
@@ -668,23 +668,26 @@ def _validate_names(names: Sequence[Hashable] | None) -> None:
             raise ValueError("Names should be an ordered collection.")
 
 
-def _read(
-    filepath_or_buffer: FilePath | ReadCsvBuffer[bytes] | ReadCsvBuffer[str], kwds
-) -> DataFrame | TextFileReader:
-    """Generic reader of line files."""
-    # if we pass a date_format and parse_dates=False, we should not parse the
-    # dates GH#44366
-    if kwds.get("parse_dates", None) is None:
-        if kwds.get("date_format", None) is None:
-            kwds["parse_dates"] = False
-        else:
-            kwds["parse_dates"] = True
+def _read(filepath_or_buffer, kwds):
+    import warnings
+
+    from pandas.errors import ParserWarning
 
-    # Extract some of the arguments (pass chunksize on).
     iterator = kwds.get("iterator", False)
     chunksize = kwds.get("chunksize", None)
 
-    # Check type of encoding_errors
+    # Your inserted warning
+    on_bad_lines = kwds.get("on_bad_lines", "error")
+    index_col = kwds.get("index_col", None)
+
+    if callable(on_bad_lines) and index_col is not None:
+        warnings.warn(
+            "When using a callable for on_bad_lines with index_col set, "
+            "ParserWarning should be explicitly handled. This behavior may change.",
+            ParserWarning,
+            stacklevel=3,
+        )
+
     errors = kwds.get("encoding_errors", "strict")
     if not isinstance(errors, str):
         raise ValueError(

diff --git a/pandas/tests/io/parser/test_read_csv_warn.py b/pandas/tests/io/parser/test_read_csv_warn.py
@@ -0,0 +1,14 @@
+import pandas as pd
+
+
+def my_bad_line_handler(bad_line):
+    print("Bad line encountered:", bad_line)
+
+
+df = pd.read_csv(
+    "test.csv",  # make sure this file exists in same folder or adjust the path
+    on_bad_lines=my_bad_line_handler,
+    index_col=0,
+    engine="python",  # ✅ add this line
+)
+print(df)