mssql-python/mssql_python/connection.py at 0e0b5f9c0ad25394881d482cd93deba45f2d2338 · microsoft/mssql-python · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
"""
Copyright (c) Microsoft Corporation.
Licensed under the MIT license.
This module defines the Connection class, which is used to manage a connection to a database.
The class provides methods to establish a connection, create cursors, commit transactions,
roll back transactions, and close the connection.
Resource Management:
- All cursors created from this connection are tracked internally.
- When close() is called on the connection, all open cursors are automatically closed.
- Do not use any cursor after the connection is closed; doing so will raise an exception.
- Cursors are also cleaned up automatically when no longer referenced, to prevent memory leaks.
"""
import codecs
import re
import threading
import weakref
from functools import lru_cache
from typing import Any

from mssql_python.cursor import Cursor
from mssql_python.helpers import add_driver_to_connection_str, sanitize_connection_string, sanitize_user_input, log
from mssql_python import ddbc_bindings
from mssql_python.pooling import PoolingManager
from mssql_python.exceptions import InterfaceError, ProgrammingError
from mssql_python.auth import process_connection_string
from mssql_python.constants import ConstantsDDBC

# Pseudo SQL type used as the key for column-name (metadata) decoding settings.
SQL_WMETADATA = -99
# Threshold used to decide whether an info type is string-based.
INFO_TYPE_STRING_THRESHOLD = 10000

# Encoding names treated as UTF-16, i.e. those that default to SQL_WCHAR.
UTF16_ENCODINGS = frozenset(('utf-16', 'utf-16le', 'utf-16be'))

@lru_cache(maxsize=128)
def _lookup_encoding(encoding: str) -> bool:
    """Return True when ``codecs.lookup()`` can resolve *encoding* (memoised)."""
    try:
        codecs.lookup(encoding)
    except (LookupError, ValueError):
        # LookupError: no codec is registered under that name.
        # ValueError: the name cannot even be handed to the codec registry
        # (for example it contains an embedded NUL character).
        return False
    return True


def _validate_encoding(encoding: str) -> bool:
    """
    Cached encoding validation using codecs.lookup().

    Args:
        encoding (str): The encoding name to validate.

    Returns:
        bool: True if encoding is a string naming a codec known to Python,
        False otherwise (including when ``encoding`` is not a string).

    Note:
        Results are memoised with an LRU cache limited to 128 entries, so
        repeated validation of the same name does not hit codecs.lookup() again.
        Non-string input is rejected before the cache is consulted, which also
        keeps unhashable values from raising inside the cache layer.
    """
    if not isinstance(encoding, str):
        return False
    return _lookup_encoding(encoding)

# Import all DB-API 2.0 exception classes for Connection attributes
from mssql_python.exceptions import (
    Warning,
    Error,
    InterfaceError,
    DatabaseError,
    DataError,
    OperationalError,
    IntegrityError,
    InternalError,
    ProgrammingError,
    NotSupportedError,
)
from mssql_python.constants import GetInfoConstants


class Connection:
    """
    A class to manage a connection to a database, compliant with DB-API 2.0 specifications.

    This class provides methods to establish a connection to a database, create cursors,
    commit transactions, roll back transactions, and close the connection. It is designed
    to be used in a context where database operations are required, such as executing queries
    and fetching results.

    The Connection class supports the Python context manager protocol (with statement).
    When used as a context manager, it will automatically close the connection when
    exiting the context, ensuring proper resource cleanup.

    Example usage:
        with connect(connection_string) as conn:
            cursor = conn.cursor()
            cursor.execute("INSERT INTO table VALUES (?)", [value])
        # Connection is automatically closed when exiting the with block

    For long-lived connections, use without context manager:
        conn = connect(connection_string)
        try:
            # Multiple operations...
        finally:
            conn.close()

    Methods:
        __init__(connection_str="", autocommit=False, attrs_before=None, timeout=0, **kwargs) -> None:
        connect_to_db() -> None:
        cursor() -> Cursor:
        execute(sql, *args) -> Cursor:
        commit() -> None:
        rollback() -> None:
        close() -> None:
        __enter__() -> Connection:
        __exit__() -> None:
        setautocommit(value=False) -> None:
        setencoding(encoding=None, ctype=None) -> None:
        getencoding() -> dict:
        setdecoding(sqltype, encoding=None, ctype=None) -> None:
        getdecoding(sqltype) -> dict:
        add_output_converter(sqltype, func) -> None:
        get_output_converter(sqltype) -> callable or None:
        remove_output_converter(sqltype) -> None:
        clear_output_converters() -> None:

    Properties:
        timeout: query timeout in seconds handed to cursors created by cursor().
        autocommit: current autocommit mode of the underlying connection.
        searchescape: search-pattern escape character, looked up once and cached.
    """

    # DB-API 2.0 Exception attributes
    # These allow users to catch exceptions using connection.Error, connection.ProgrammingError, etc.
    # Each name on the right-hand side is the module-level exception class imported above.
    Warning = Warning
    Error = Error
    InterfaceError = InterfaceError
    DatabaseError = DatabaseError
    DataError = DataError
    OperationalError = OperationalError
    IntegrityError = IntegrityError
    InternalError = InternalError
    ProgrammingError = ProgrammingError
    NotSupportedError = NotSupportedError

    def __init__(self, connection_str: str = "", autocommit: bool = False, attrs_before: dict = None, timeout: int = 0, **kwargs) -> None:
        """
        Initialize the connection object and open the underlying native connection.

        Args:
            connection_str (str): The base connection string to connect with.
            autocommit (bool): Initial autocommit mode applied once the native
                connection has been created.
            attrs_before (dict, optional): Connection attributes handed to the native
                connection at creation time. The mapping is copied, so the caller's
                dictionary is never modified.
            timeout (int): Query timeout in seconds passed to cursors created from
                this connection. Zero means no timeout.
            **kwargs: Additional key/value pairs merged into the connection string
                (see _construct_connection_string for the accepted keys).

        Returns:
            None

        Raises:
            ValueError: If an access token supplied through attrs_before as bytes
                fails validation.
            Errors raised while creating the native connection or while setting the
            autocommit mode propagate unchanged.
        """
        self.connection_str = self._construct_connection_string(
            connection_str, **kwargs
        )
        # Work on a private copy: authentication processing below may add entries,
        # and those must not leak into the dictionary owned by the caller.
        self._attrs_before = dict(attrs_before) if attrs_before else {}

        # Validate access token if provided directly via attrs_before
        if ConstantsDDBC.SQL_COPT_SS_ACCESS_TOKEN.value in self._attrs_before:
            from mssql_python.auth import validate_access_token_struct
            token_struct = self._attrs_before[ConstantsDDBC.SQL_COPT_SS_ACCESS_TOKEN.value]
            # Only byte-like tokens are checked here; other types are passed through as-is.
            if isinstance(token_struct, (bytes, bytearray)):
                try:
                    validate_access_token_struct(bytes(token_struct))
                except ValueError as e:
                    raise ValueError(f"Invalid access token in attrs_before: {e}") from e

        # Initialize encoding settings with defaults for Python 3
        # Python 3 only has str (which is Unicode), so we use utf-16le by default
        self._encoding_settings = {
            'encoding': 'utf-16le',
            'ctype': ConstantsDDBC.SQL_WCHAR.value
        }

        # Initialize decoding settings with Python 3 defaults
        self._decoding_settings = {
            ConstantsDDBC.SQL_CHAR.value: {
                'encoding': 'utf-8',
                'ctype': ConstantsDDBC.SQL_CHAR.value
            },
            ConstantsDDBC.SQL_WCHAR.value: {
                'encoding': 'utf-16le',
                'ctype': ConstantsDDBC.SQL_WCHAR.value
            },
            SQL_WMETADATA: {
                'encoding': 'utf-16le',
                'ctype': ConstantsDDBC.SQL_WCHAR.value
            }
        }

        # If the connection string mentions "authentication" (case-insensitive), let the
        # auth module rewrite it. The result is a (connection string, extra attributes)
        # pair; any extra attributes are merged into our private attrs_before copy.
        if re.search(r"authentication", self.connection_str, re.IGNORECASE):
            connection_result = process_connection_string(self.connection_str)
            self.connection_str = connection_result[0]
            if connection_result[1]:
                self._attrs_before.update(connection_result[1])

        self._closed = False
        self._timeout = timeout

        # WeakSet holds weak references only, so a cursor that is no longer referenced
        # elsewhere can be garbage collected and then disappears from the set on its own.
        # TODO: Think and implement scenarios for multi-threaded access to cursors
        self._cursors = weakref.WeakSet()

        # Initialize output converters dictionary and its lock for thread safety
        self._output_converters = {}
        self._converters_lock = threading.Lock()

        # Auto-enable pooling if the user never initialized the pooling manager
        if not PoolingManager.is_initialized():
            PoolingManager.enable()
        self._pooling = PoolingManager.is_enabled()
        self._conn = ddbc_bindings.Connection(self.connection_str, self._pooling, self._attrs_before)
        self.setautocommit(autocommit)

    def _construct_connection_string(self, connection_str: str = "", **kwargs) -> str:
        """
        Construct the connection string by concatenating the connection string
        with key/value pairs from kwargs.

        Only a fixed set of keyword names is recognised (matched case-insensitively):
        host/server, user/uid, password/pwd, database, encrypt and
        trust_server_certificate. Any other keyword is ignored.

        Args:
            connection_str (str): The base connection string.
            **kwargs: Additional key/value pairs for the connection string.

        Returns:
            str: The constructed connection string.
        """
        # Accepted keyword names (lower-cased) -> connection string keyword.
        keyword_aliases = {
            "host": "Server",
            "server": "Server",
            "user": "Uid",
            "uid": "Uid",
            "password": "Pwd",
            "pwd": "Pwd",
            "database": "Database",
            "encrypt": "Encrypt",
            "trust_server_certificate": "TrustServerCertificate",
        }

        # Add the driver attribute to the connection string
        conn_str = add_driver_to_connection_str(connection_str)

        # Add additional key-value pairs to the connection string
        for key, value in kwargs.items():
            odbc_key = keyword_aliases.get(key.lower())
            if odbc_key is None:
                continue
            # Nothing visible here guarantees the base string ends with ';'.
            # Without a separator the new key would fuse with the previous value.
            existing = conn_str.rstrip()
            if existing and not existing.endswith(";"):
                conn_str += ";"
            # NOTE(review): values are inserted verbatim; a value containing ';'
            # (e.g. a password) is not escaped here - confirm whether callers
            # are expected to brace-quote such values themselves.
            conn_str += f"{odbc_key}={value};"

        log('info', "Final connection string: %s", sanitize_connection_string(conn_str))

        return conn_str

    @property
    def timeout(self) -> int:
        """
        Get the current query timeout setting in seconds.

        Returns:
            int: The timeout value in seconds. Zero means no timeout (wait indefinitely).
        """
        return self._timeout

    @timeout.setter
    def timeout(self, value: int) -> None:
        """
        Store a new query timeout on this connection.

        Args:
            value (int): The timeout value in seconds. Zero means no timeout.

        Returns:
            None

        Raises:
            TypeError: If value is not an integer.
            ValueError: If value is negative.

        Note:
            The stored value is what cursor() passes to each cursor it creates.
        """
        is_integer = isinstance(value, int)
        if not is_integer:
            raise TypeError("Timeout must be an integer")

        is_negative = value < 0
        if is_negative:
            raise ValueError("Timeout cannot be negative")

        self._timeout = value
        log('info', f"Query timeout set to {value} seconds")

    @property
    def autocommit(self) -> bool:
        """
        Report the autocommit mode of the underlying native connection.

        Returns:
            bool: True if autocommit is enabled, False otherwise.
        """
        native_connection = self._conn
        return native_connection.get_autocommit()

    @autocommit.setter
    def autocommit(self, value: bool) -> None:
        """
        Change the autocommit mode and log the new setting.

        Delegates to setautocommit() and then writes an info-level log entry.

        Args:
            value (bool): True to enable autocommit, False to disable it.

        Returns:
            None
        """
        requested_mode = value
        self.setautocommit(requested_mode)
        log('info', "Autocommit mode set to %s.", requested_mode)

    def setautocommit(self, value: bool = False) -> None:
        """
        Forward the requested autocommit mode to the native connection.

        Args:
            value (bool): True to enable autocommit, False to disable it.

        Returns:
            None

        Raises:
            DatabaseError: If there is an error while setting the autocommit mode.
        """
        native_connection = self._conn
        native_connection.set_autocommit(value)

    def setencoding(self, encoding=None, ctype=None):
        """
        Sets the text encoding for SQL statements and text parameters.

        Since Python 3 only has str (which is Unicode), this method configures
        how text is encoded when sending to the database.

        Args:
            encoding (str, optional): The encoding to use. This must be a valid Python
                encoding that converts text to bytes. If None, defaults to 'utf-16le'.
            ctype (int, optional): The C data type to use when passing data:
                SQL_CHAR or SQL_WCHAR. If not provided, SQL_WCHAR is used for
                UTF-16 variants (the names in UTF16_ENCODINGS and any alias Python
                resolves to a UTF-16 codec, e.g. 'utf_16_le'). SQL_CHAR is used for
                all other encodings.

        Returns:
            None

        Raises:
            ProgrammingError: If the encoding is not a string, is not known to
                Python, or if ctype is neither SQL_CHAR nor SQL_WCHAR.
            InterfaceError: If the connection is closed.

        Example:
            # For databases that only communicate with UTF-8
            cnxn.setencoding(encoding='utf-8')

            # For explicitly using SQL_CHAR
            cnxn.setencoding(encoding='utf-8', ctype=mssql_python.SQL_CHAR)
        """
        if self._closed:
            raise InterfaceError(
                driver_error="Connection is closed",
                ddbc_error="Connection is closed",
            )

        # Set default encoding if not provided
        if encoding is None:
            encoding = 'utf-16le'

        # A non-string name can never be a codec; reject it here so the caller gets
        # the documented ProgrammingError instead of a TypeError from the codec lookup.
        if not isinstance(encoding, str) or not _validate_encoding(encoding):
            # Log the sanitized encoding for security
            log('warning', "Invalid encoding attempted: %s", sanitize_user_input(str(encoding)))
            raise ProgrammingError(
                driver_error=f"Unsupported encoding: {encoding}",
                ddbc_error=f"The encoding '{encoding}' is not supported by Python",
            )

        # Canonical codec name, used only to recognise UTF-16 aliases below.
        canonical_name = codecs.lookup(encoding).name

        # Normalize the stored name with casefold for robust Unicode handling
        encoding = encoding.casefold()

        # Set default ctype based on encoding if not provided
        if ctype is None:
            utf16_codec_names = ('utf-16', 'utf-16-le', 'utf-16-be')
            if encoding in UTF16_ENCODINGS or canonical_name in utf16_codec_names:
                ctype = ConstantsDDBC.SQL_WCHAR.value
            else:
                ctype = ConstantsDDBC.SQL_CHAR.value

        # Validate ctype
        valid_ctypes = [ConstantsDDBC.SQL_CHAR.value, ConstantsDDBC.SQL_WCHAR.value]
        if ctype not in valid_ctypes:
            # Log the sanitized ctype for security
            log('warning', "Invalid ctype attempted: %s", sanitize_user_input(str(ctype)))
            raise ProgrammingError(
                driver_error=f"Invalid ctype: {ctype}",
                ddbc_error=f"ctype must be SQL_CHAR ({ConstantsDDBC.SQL_CHAR.value}) or SQL_WCHAR ({ConstantsDDBC.SQL_WCHAR.value})",
            )

        # Store the encoding settings
        self._encoding_settings = {
            'encoding': encoding,
            'ctype': ctype
        }

        # Log with sanitized values for security
        log('info', "Text encoding set to %s with ctype %s",
            sanitize_user_input(encoding), sanitize_user_input(str(ctype)))

    def getencoding(self):
        """
        Gets the current text encoding settings.

        Returns:
            dict: A dictionary containing 'encoding' and 'ctype' keys.

        Raises:
            InterfaceError: If the connection is closed.

        Example:
            settings = cnxn.getencoding()
            print(f"Current encoding: {settings['encoding']}")
            print(f"Current ctype: {settings['ctype']}")
        """
        if self._closed:
            raise InterfaceError(
                driver_error="Connection is closed",
                ddbc_error="Connection is closed",
            )

        return self._encoding_settings.copy()

    def setdecoding(self, sqltype, encoding=None, ctype=None):
        """
        Sets the text decoding used when reading SQL_CHAR and SQL_WCHAR from the database.

        This method configures how text data is decoded when reading from the database.
        In Python 3, all text is Unicode (str), so this primarily affects the encoding
        used to decode bytes from the database.

        Args:
            sqltype (int): The SQL type being configured: SQL_CHAR, SQL_WCHAR, or SQL_WMETADATA.
                SQL_WMETADATA is a special flag for configuring column name decoding.
            encoding (str, optional): The Python encoding to use when decoding the data.
                If None, 'utf-8' is used for SQL_CHAR and 'utf-16le' otherwise.
            ctype (int, optional): The C data type to request from SQLGetData:
                SQL_CHAR or SQL_WCHAR. If None, SQL_WCHAR is used for UTF-16 variants
                (the names in UTF16_ENCODINGS and any alias Python resolves to a
                UTF-16 codec, e.g. 'utf_16_le') and SQL_CHAR for everything else.

        Returns:
            None

        Raises:
            ProgrammingError: If the sqltype, encoding, or ctype is invalid
                (a non-string encoding counts as invalid).
            InterfaceError: If the connection is closed.

        Example:
            # Configure SQL_CHAR to use UTF-8 decoding
            cnxn.setdecoding(mssql_python.SQL_CHAR, encoding='utf-8')

            # Configure column metadata decoding
            cnxn.setdecoding(mssql_python.SQL_WMETADATA, encoding='utf-16le')

            # Use explicit ctype
            cnxn.setdecoding(mssql_python.SQL_WCHAR, encoding='utf-16le', ctype=mssql_python.SQL_WCHAR)
        """
        if self._closed:
            raise InterfaceError(
                driver_error="Connection is closed",
                ddbc_error="Connection is closed",
            )

        # Validate sqltype
        valid_sqltypes = [
            ConstantsDDBC.SQL_CHAR.value,
            ConstantsDDBC.SQL_WCHAR.value,
            SQL_WMETADATA
        ]
        if sqltype not in valid_sqltypes:
            log('warning', "Invalid sqltype attempted: %s", sanitize_user_input(str(sqltype)))
            raise ProgrammingError(
                driver_error=f"Invalid sqltype: {sqltype}",
                ddbc_error=f"sqltype must be SQL_CHAR ({ConstantsDDBC.SQL_CHAR.value}), SQL_WCHAR ({ConstantsDDBC.SQL_WCHAR.value}), or SQL_WMETADATA ({SQL_WMETADATA})",
            )

        # Set default encoding based on sqltype if not provided
        if encoding is None:
            if sqltype == ConstantsDDBC.SQL_CHAR.value:
                encoding = 'utf-8'  # Default for SQL_CHAR in Python 3
            else:  # SQL_WCHAR or SQL_WMETADATA
                encoding = 'utf-16le'  # Default for SQL_WCHAR in Python 3

        # A non-string name can never be a codec; reject it here so the caller gets
        # the documented ProgrammingError instead of a TypeError from the codec lookup.
        if not isinstance(encoding, str) or not _validate_encoding(encoding):
            log('warning', "Invalid encoding attempted: %s", sanitize_user_input(str(encoding)))
            raise ProgrammingError(
                driver_error=f"Unsupported encoding: {encoding}",
                ddbc_error=f"The encoding '{encoding}' is not supported by Python",
            )

        # Canonical codec name, used only to recognise UTF-16 aliases below.
        canonical_name = codecs.lookup(encoding).name

        # Normalize the stored name the same way setencoding() does
        encoding = encoding.casefold()

        # Set default ctype based on encoding if not provided
        if ctype is None:
            utf16_codec_names = ('utf-16', 'utf-16-le', 'utf-16-be')
            if encoding in UTF16_ENCODINGS or canonical_name in utf16_codec_names:
                ctype = ConstantsDDBC.SQL_WCHAR.value
            else:
                ctype = ConstantsDDBC.SQL_CHAR.value

        # Validate ctype
        valid_ctypes = [ConstantsDDBC.SQL_CHAR.value, ConstantsDDBC.SQL_WCHAR.value]
        if ctype not in valid_ctypes:
            log('warning', "Invalid ctype attempted: %s", sanitize_user_input(str(ctype)))
            raise ProgrammingError(
                driver_error=f"Invalid ctype: {ctype}",
                ddbc_error=f"ctype must be SQL_CHAR ({ConstantsDDBC.SQL_CHAR.value}) or SQL_WCHAR ({ConstantsDDBC.SQL_WCHAR.value})",
            )

        # Store the decoding settings for the specified sqltype
        self._decoding_settings[sqltype] = {
            'encoding': encoding,
            'ctype': ctype
        }

        # Log with sanitized values for security
        sqltype_name = {
            ConstantsDDBC.SQL_CHAR.value: "SQL_CHAR",
            ConstantsDDBC.SQL_WCHAR.value: "SQL_WCHAR",
            SQL_WMETADATA: "SQL_WMETADATA"
        }.get(sqltype, str(sqltype))

        log('info', "Text decoding set for %s to %s with ctype %s",
            sqltype_name, sanitize_user_input(encoding), sanitize_user_input(str(ctype)))

    def getdecoding(self, sqltype):
        """
        Return a copy of the decoding settings stored for one SQL type.

        Args:
            sqltype (int): The SQL type to get settings for: SQL_CHAR, SQL_WCHAR, or SQL_WMETADATA.

        Returns:
            dict: A dictionary containing 'encoding' and 'ctype' keys for the specified sqltype.
            It is a copy, so changing it does not affect the connection.

        Raises:
            ProgrammingError: If the sqltype is invalid.
            InterfaceError: If the connection is closed.

        Example:
            settings = cnxn.getdecoding(mssql_python.SQL_CHAR)
            print(f"SQL_CHAR encoding: {settings['encoding']}")
            print(f"SQL_CHAR ctype: {settings['ctype']}")
        """
        if self._closed:
            raise InterfaceError(
                driver_error="Connection is closed",
                ddbc_error="Connection is closed",
            )

        # Only these three keys are ever configured for decoding.
        sql_char = ConstantsDDBC.SQL_CHAR.value
        sql_wchar = ConstantsDDBC.SQL_WCHAR.value
        accepted_sqltypes = (sql_char, sql_wchar, SQL_WMETADATA)

        if sqltype not in accepted_sqltypes:
            raise ProgrammingError(
                driver_error=f"Invalid sqltype: {sqltype}",
                ddbc_error=f"sqltype must be SQL_CHAR ({ConstantsDDBC.SQL_CHAR.value}), SQL_WCHAR ({ConstantsDDBC.SQL_WCHAR.value}), or SQL_WMETADATA ({SQL_WMETADATA})",
            )

        stored_settings = self._decoding_settings[sqltype]
        return stored_settings.copy()

    @property
    def searchescape(self):
        """
        The ODBC search pattern escape character, as reported by
        getinfo(SQL_SEARCH_PATTERN_ESCAPE), used to escape special characters
        such as '%' and '_' in LIKE clauses. These are driver specific.

        The value is looked up on first access and cached on the instance. If the
        lookup fails or yields something that is not a string, a backslash is used.

        Returns:
            str: The search pattern escape character (a backslash by default).
        """
        # Serve the cached value when an earlier access already resolved it.
        if hasattr(self, '_searchescape'):
            return self._searchescape

        try:
            reported = self.getinfo(GetInfoConstants.SQL_SEARCH_PATTERN_ESCAPE.value)
            # Anything that is not a string is replaced by the backslash default.
            self._searchescape = reported if isinstance(reported, str) else '\\'
        except Exception as e:
            # Only the exception type is logged, so no sensitive detail is exposed.
            log('warning', f"Failed to retrieve search escape character, using default '\\'. Exception: {type(e).__name__}")
            self._searchescape = '\\'
        return self._searchescape

    def cursor(self) -> Cursor:
        """
        Return a new Cursor object using the connection.

        The cursor is created with this connection's current timeout and is added
        to the connection's weak set of tracked cursors before being returned.

        Returns:
            Cursor: A new cursor object for executing SQL queries.

        Raises:
            InterfaceError: If the connection is closed.
            DatabaseError: If there is an error while creating the cursor.
        """
        if self._closed:
            raise InterfaceError(
                driver_error="Cannot create cursor on closed connection",
                ddbc_error="Cannot create cursor on closed connection",
            )

        cursor = Cursor(self, timeout=self._timeout)
        self._cursors.add(cursor)  # Track the cursor
        return cursor

    def add_output_converter(self, sqltype, func) -> None:
        """
        Register an output converter function for the given SQL type.

        The converter is stored in this connection's converter dictionary while
        holding the converters lock. If the native connection object exposes an
        add_output_converter method, the registration is forwarded to it as well.

        ⚠️ WARNING: Registering an output converter will cause the supplied Python function
        to be executed on every matching database value. Do not register converters from
        untrusted sources, as this can result in arbitrary code execution and security
        vulnerabilities. This API should never be exposed to untrusted or external input.

        Args:
            sqltype (int): The integer SQL type value to convert, which can be one of the
                          defined standard constants (e.g. SQL_VARCHAR) or a database-specific
                          value (e.g. -151 for the SQL Server 2008 geometry data type).
            func (callable): The converter function which will be called with a single parameter,
                            the value, and should return the converted value. If the value is NULL
                            then the parameter passed to the function will be None, otherwise it
                            will be a bytes object.

        Returns:
            None
        """
        converters_lock = self._converters_lock
        with converters_lock:
            self._output_converters[sqltype] = func
            native_connection = self._conn
            # Forward only when the native implementation supports it.
            if hasattr(native_connection, 'add_output_converter'):
                native_connection.add_output_converter(sqltype, func)
        log('info', f"Added output converter for SQL type {sqltype}")

    def get_output_converter(self, sqltype):
        """
        Get the output converter function for the specified SQL type.

        Thread-safe implementation that protects the converters dictionary with a lock.

        Args:
            sqltype (int or type): The SQL type value or Python type to get the converter for

        Returns:
            callable or None: The converter function or None if no converter is registered

        Note:
            ⚠️ The returned converter function will be executed on database values. Only use
            converters from trusted sources.
        """
        with self._converters_lock:
            return self._output_converters.get(sqltype)

    def remove_output_converter(self, sqltype):
        """
        Remove the output converter registered for the given SQL type, if any.

        The converters dictionary is modified while holding the converters lock.
        When an entry was present and the native connection object exposes a
        remove_output_converter method, the removal is forwarded to it as well.

        Args:
            sqltype (int or type): The SQL type value to remove the converter for

        Returns:
            None
        """
        with self._converters_lock:
            was_registered = sqltype in self._output_converters
            if was_registered:
                self._output_converters.pop(sqltype)
                native_connection = self._conn
                # Forward only when the native implementation supports it.
                if hasattr(native_connection, 'remove_output_converter'):
                    native_connection.remove_output_converter(sqltype)
        log('info', f"Removed output converter for SQL type {sqltype}")

    def clear_output_converters(self) -> None:
        """
        Drop every registered output converter.

        The converters dictionary is emptied while holding the converters lock.
        If the native connection object exposes a clear_output_converters method,
        it is called as well.

        Returns:
            None
        """
        converters_lock = self._converters_lock
        with converters_lock:
            self._output_converters.clear()
            native_connection = self._conn
            # Forward only when the native implementation supports it.
            if hasattr(native_connection, 'clear_output_converters'):
                native_connection.clear_output_converters()
        log('info', "Cleared all output converters")

    def execute(self, sql: str, *args: Any) -> Cursor:
        """
        Creates a new Cursor object, calls its execute method, and returns the new cursor.

        This is a convenience method that is not part of the DB API. Since a new Cursor
        is allocated by each call, this should not be used if more than one SQL statement
        needs to be executed on the connection.

        Note on cursor lifecycle management:
        - Each call creates a new cursor through cursor(), which registers it in the
          connection's internal WeakSet
        - For long-running applications or loops, explicitly call cursor.close() when done
          to release resources immediately rather than waiting for garbage collection
        - If execution fails, the cursor is closed here before the error is re-raised

        Args:
            sql (str): The SQL query to execute.
            *args: Parameters to be passed to the query.

        Returns:
            Cursor: A new cursor with the executed query.

        Raises:
            DatabaseError: If there is an error executing the query.
            InterfaceError: If the connection is closed.

        Example:
            # Automatic cleanup (cursor goes out of scope after the operation)
            row = connection.execute("SELECT name FROM users WHERE id = ?", 123).fetchone()

            # Manual cleanup for more explicit resource management
            cursor = connection.execute("SELECT * FROM large_table")
            try:
                # Use cursor...
                rows = cursor.fetchall()
            finally:
                cursor.close()  # Explicitly release resources
        """
        # cursor() already adds the new cursor to self._cursors, so no second
        # registration is needed here.
        cursor = self.cursor()
        try:
            cursor.execute(sql, *args)
        except Exception:
            # Close the cursor to avoid leaking resources, but never let a cleanup
            # failure replace the execution error the caller needs to see.
            try:
                cursor.close()
            except Exception as close_error:
                log('warning', "Failed to close cursor after execution error: %s",
                    type(close_error).__name__)
            raise
        return cursor

    def batch_execute(self, statements, params=None, reuse_cursor=None, auto_close=False):
        """
        Execute multiple SQL statements in order using a single cursor.

        All statements run sequentially on one cursor, which avoids allocating a new
        cursor per statement. Execution stops at the first statement that raises.

        Args:
            statements (list): List of SQL statements to execute
            params (list, optional): List of parameter sets corresponding to statements.
                Each item can be None, a single parameter, or a sequence of parameters;
                a non-None item is passed as the second argument to ``cursor.execute``.
                If None, no parameters will be used for any statement.
            reuse_cursor (Cursor, optional): Existing cursor to reuse instead of creating a new one.
                If None, a new cursor will be created. A reused cursor is never closed
                by this method, neither on success nor on failure.
            auto_close (bool): Whether to close the cursor after successful execution if a
                new one was created. Defaults to False. Has no effect if reuse_cursor is provided.

        Returns:
            tuple: (results, cursor) where:
                - results is a list with one entry per statement: the ``fetchall()`` rows
                  when the statement produced a result set (``cursor.description`` is not
                  None), otherwise ``cursor.rowcount``
                - cursor is the cursor used for execution (useful if you want to keep using it)

        Raises:
            TypeError: If statements is not a list or if params is provided but not a list
            ValueError: If params is provided but has different length than statements
            DatabaseError: If there is an error executing any of the statements
            InterfaceError: If the connection is closed

        Note:
            When a statement fails, a cursor that was created by this call is closed
            before the exception propagates, regardless of ``auto_close``: the caller
            never receives that cursor, so leaving it open would only leak it.

        Example:
            # Execute multiple statements with a single cursor
            results, _ = conn.batch_execute([
                "INSERT INTO users VALUES (?, ?)",
                "UPDATE stats SET count = count + 1",
                "SELECT * FROM users"
            ], [
                (1, "user1"),
                None,
                None
            ])

            # Last result contains the SELECT results
            for row in results[-1]:
                print(row)

            # Reuse an existing cursor
            my_cursor = conn.cursor()
            results, _ = conn.batch_execute([
                "SELECT * FROM table1",
                "SELECT * FROM table2"
            ], reuse_cursor=my_cursor)

            # Cursor remains open for further use
            my_cursor.execute("SELECT * FROM table3")
        """
        # Validate inputs before touching the connection so bad arguments never
        # allocate a cursor.
        if not isinstance(statements, list):
            raise TypeError("statements must be a list of SQL statements")

        if params is None:
            # No parameters supplied: pair every statement with None
            params = [None] * len(statements)
        elif not isinstance(params, list):
            raise TypeError("params must be a list of parameter sets")
        elif len(params) != len(statements):
            raise ValueError("params list must have the same length as statements list")

        # Determine which cursor to use
        is_new_cursor = reuse_cursor is None
        cursor = self.cursor() if is_new_cursor else reuse_cursor
        total = len(statements)

        # Execute statements and collect results
        results = []
        try:
            for i, (stmt, param) in enumerate(zip(statements, params), start=1):
                try:
                    # Execute the statement with parameters if provided
                    if param is not None:
                        cursor.execute(stmt, param)
                    else:
                        cursor.execute(stmt)

                    if cursor.description is not None:
                        # The statement produced a result set (SELECT or similar)
                        results.append(cursor.fetchall())
                    else:
                        # No result set (INSERT, UPDATE, DELETE or similar)
                        results.append(cursor.rowcount)

                    log('debug', f"Executed batch statement {i}/{total}")

                except Exception as e:
                    # If a statement fails, include statement context in the log
                    log('error', f"Error executing statement {i}/{total}: {e}")
                    raise

        except Exception:
            # Only a cursor created here is closed: the caller cannot reach it once
            # the exception propagates. A caller-supplied cursor stays open, as
            # documented for reuse_cursor / auto_close.
            if is_new_cursor:
                try:
                    cursor.close()
                    log('debug', "Automatically closed cursor after batch execution error")
                except Exception as close_err:
                    # Never let a cleanup failure mask the original error
                    log('warning', f"Error closing cursor after execution failure: {close_err}")
            # Re-raise the original exception
            raise

        # Close the cursor if requested and we created a new one
        if is_new_cursor and auto_close:
            cursor.close()
            log('debug', "Automatically closed cursor after batch execution")

        return results, cursor

    def getinfo(self, info_type):
        """
        Return general information about the driver and data source.

        Args:
            info_type (int): The type of information to return. See the ODBC
                             SQLGetInfo documentation for the supported values.

        Returns:
            The requested information. The type of the returned value depends
            on the information requested. It will be a string, integer, or boolean.

        Raises:
            DatabaseError: If there is an error retrieving the information.
            InterfaceError: If the connection is closed.
        """
        if self._closed:
            raise InterfaceError(
                driver_error="Cannot get info on closed connection",
                ddbc_error="Cannot get info on closed connection",
            )

        # Check that info_type is an integer
        if not isinstance(info_type, int):
            raise ValueError(f"info_type must be an integer, got {type(info_type).__name__}")

        # Check for invalid info_type values
        if info_type < 0:
            log('warning', f"Invalid info_type: {info_type}. Must be a positive integer.")
            return None

        # Get the raw result from the C++ layer
        try:
            raw_result = self._conn.get_info(info_type)
        except Exception as e:
            # Log the error and return None for invalid info types
            log('warning', f"getinfo({info_type}) failed: {e}")
            return None

        if raw_result is None:
            return None

        # Check if the result is already a simple type
        if isinstance(raw_result, (str, int, bool)):
            return raw_result

        # If it's a dictionary with data and metadata
        if isinstance(raw_result, dict) and "data" in raw_result:
            # Extract data and metadata from the raw result
            data = raw_result["data"]
            length = raw_result["length"]

            # Debug logging to understand the issue better
            log('debug', f"getinfo: info_type={info_type}, length={length}, data_type={type(data)}")

            # Define constants for different return types
            # String types - these return strings in pyodbc
            string_type_constants = {
                GetInfoConstants.SQL_DATA_SOURCE_NAME.value,
                GetInfoConstants.SQL_DRIVER_NAME.value,
                GetInfoConstants.SQL_DRIVER_VER.value,
                GetInfoConstants.SQL_SERVER_NAME.value,
                GetInfoConstants.SQL_USER_NAME.value,
                GetInfoConstants.SQL_DRIVER_ODBC_VER.value,
                GetInfoConstants.SQL_IDENTIFIER_QUOTE_CHAR.value,
                GetInfoConstants.SQL_CATALOG_NAME_SEPARATOR.value,
                GetInfoConstants.SQL_CATALOG_TERM.value,
                GetInfoConstants.SQL_SCHEMA_TERM.value,
                GetInfoConstants.SQL_TABLE_TERM.value,
                GetInfoConstants.SQL_KEYWORDS.value,
                GetInfoConstants.SQL_PROCEDURE_TERM.value,
                GetInfoConstants.SQL_SPECIAL_CHARACTERS.value,
                GetInfoConstants.SQL_SEARCH_PATTERN_ESCAPE.value
            }

            # Boolean 'Y'/'N' types
            yn_type_constants = {
                GetInfoConstants.SQL_ACCESSIBLE_PROCEDURES.value,
                GetInfoConstants.SQL_ACCESSIBLE_TABLES.value,
                GetInfoConstants.SQL_DATA_SOURCE_READ_ONLY.value,
                GetInfoConstants.SQL_EXPRESSIONS_IN_ORDERBY.value,
                GetInfoConstants.SQL_LIKE_ESCAPE_CLAUSE.value,
                GetInfoConstants.SQL_MULTIPLE_ACTIVE_TXN.value,
                GetInfoConstants.SQL_NEED_LONG_DATA_LEN.value,
                GetInfoConstants.SQL_PROCEDURES.value
            }

            # Numeric type constants that return integers
            numeric_type_constants = {
                GetInfoConstants.SQL_MAX_COLUMN_NAME_LEN.value,
                GetInfoConstants.SQL_MAX_TABLE_NAME_LEN.value,
                GetInfoConstants.SQL_MAX_SCHEMA_NAME_LEN.value,
                GetInfoConstants.SQL_MAX_CATALOG_NAME_LEN.value,
                GetInfoConstants.SQL_MAX_IDENTIFIER_LEN.value,
                GetInfoConstants.SQL_MAX_STATEMENT_LEN.value,
                GetInfoConstants.SQL_MAX_DRIVER_CONNECTIONS.value,
                GetInfoConstants.SQL_NUMERIC_FUNCTIONS.value,
                GetInfoConstants.SQL_STRING_FUNCTIONS.value,
                GetInfoConstants.SQL_DATETIME_FUNCTIONS.value,
                GetInfoConstants.SQL_TXN_CAPABLE.value,
                GetInfoConstants.SQL_DEFAULT_TXN_ISOLATION.value,
                GetInfoConstants.SQL_CURSOR_COMMIT_BEHAVIOR.value
            }

            # Determine the type of information we're dealing with
            is_string_type = info_type > INFO_TYPE_STRING_THRESHOLD or info_type in string_type_constants
            is_yn_type = info_type in yn_type_constants
            is_numeric_type = info_type in numeric_type_constants

            # Process the data based on type
            if is_string_type:
                # For string data, ensure we properly handle the byte array
                if isinstance(data, bytes):
                    # Make sure we use the correct amount of data based on length
                    actual_data = data[:length]

                    # Now decode the string data
                    try:
                        return actual_data.decode('utf-8').rstrip('\0')
                    except UnicodeDecodeError:
                        try:
                            return actual_data.decode('latin1').rstrip('\0')
                        except Exception as e:
                            log('error', f"Failed to decode string in getinfo: {e}. Returning None to avoid silent corruption.")
                            # Explicitly return None to signal decoding failure
                            return None
                else:
                    # If it's not bytes, return as is
                    return data
            elif is_yn_type:
                # For Y/N types, pyodbc returns a string 'Y' or 'N'
                if isinstance(data, bytes) and length >= 1:
                    byte_val = data[0]
                    if byte_val in (b'Y'[0], b'y'[0], 1):
                        return 'Y'
                    else: