Skip to content

Commit 7569baa

Browse files
committed
Work in progress: low-level dtype preservation not yet fixed
1 parent 2fa5d5d commit 7569baa

File tree

9 files changed

+449
-71
lines changed

9 files changed

+449
-71
lines changed

.gitignore

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -141,3 +141,6 @@ doc/source/savefig/
141141
# Pyodide/WASM related files #
142142
##############################
143143
/.pyodide-xbuildenv-*
144+
145+
146+
.venv/

local_test.py

Lines changed: 167 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,167 @@
1+
#!/usr/bin/env python3
2+
"""
3+
Working test script that reproduces the exact failing test cases
4+
"""
5+
6+
import pandas as pd
7+
import pyarrow as pa
8+
from pandas.core.arrays import ArrowExtensionArray
9+
10+
def test_timestamp():
    """Reproduce the failing timestamp case: an identity map() over an
    Arrow-backed ns/US-Eastern array should keep its dtype unchanged.
    Returns True when the dtypes match (i.e. the upstream test would pass)."""
    print("=== Testing Timestamp Case ===")

    # Build an ns-precision, tz-aware Arrow array containing a missing value.
    stamps = pd.to_datetime(['2020-01-01 01:01:01.000001']).tz_localize('US/Eastern')
    ns_dtype = pd.ArrowDtype(pa.timestamp('ns', tz='US/Eastern'))
    arr = ArrowExtensionArray._from_sequence([pd.NA, stamps[0]], dtype=ns_dtype)

    def _describe(header, ea):
        # Dump the dtype details the upstream test compares on.
        print(header)
        print(f" dtype: {ea.dtype}")
        print(f" pyarrow_dtype: {ea.dtype.pyarrow_dtype}")
        print(f" unit: {ea.dtype.pyarrow_dtype.unit}")
        print(f" timezone: {ea.dtype.pyarrow_dtype.tz}")
        print(f" values: {ea}")
        print()

    _describe("Original array:", arr)

    # The identity map is where dtype information was being lost.
    print("Testing map operation:")
    mapped = arr.map(lambda x: x, na_action='ignore')

    _describe("Result array:", mapped)

    same_dtype = arr.dtype == mapped.dtype
    print(f"Timestamp dtypes equal: {same_dtype}")

    if same_dtype:
        print("✅ Timestamp test would pass!")
    else:
        print("❌ TIMESTAMP TEST WOULD FAIL!")
        print(f"Expected: {arr.dtype}")
        print(f"Got: {mapped.dtype}")

    return same_dtype
def test_integer():
    """Reproduce the failing integer case: an identity map() over an
    Arrow-backed int64 array should keep its dtype unchanged.
    Returns True when the dtypes match (i.e. the upstream test would pass)."""
    print("\n=== Testing Integer Case ===")

    # Arrow int64 array with a missing value, mirroring the failing test.
    arr = ArrowExtensionArray._from_sequence(
        [pd.NA, 1], dtype=pd.ArrowDtype(pa.int64())
    )

    print("Original array:")
    print(f" dtype: {arr.dtype}")
    print(f" pyarrow_dtype: {arr.dtype.pyarrow_dtype}")
    print(f" values: {arr}")
    print(f" _pa_array.type: {arr._pa_array.type}")
    print()

    # The identity map is where dtype information was being lost.
    print("Testing map operation:")
    mapped = arr.map(lambda x: x, na_action='ignore')

    print("Result array:")
    print(f" dtype: {mapped.dtype}")
    print(f" pyarrow_dtype: {mapped.dtype.pyarrow_dtype}")
    print(f" values: {mapped}")
    print()

    same_dtype = arr.dtype == mapped.dtype
    print(f"Integer dtypes equal: {same_dtype}")

    if same_dtype:
        print("✅ Integer test would pass!")
    else:
        print("❌ INTEGER TEST WOULD FAIL!")
        print(f"Expected: {arr.dtype}")
        print(f"Got: {mapped.dtype}")

    return same_dtype
def test_cast_pointwise_directly():
    """Exercise ArrowExtensionArray._cast_pointwise_result directly:
    given a result array with the 'wrong' dtype, casting back against the
    original should restore the original dtype (timestamp and integer cases)."""
    print("\n=== Testing _cast_pointwise_result directly ===")

    # --- timestamp: ns original vs us 'wrong' result ---------------------
    print("Testing timestamp cast:")
    stamps = pd.to_datetime(['2020-01-01 01:01:01.000001']).tz_localize('US/Eastern')
    good_ts = ArrowExtensionArray._from_sequence(
        [pd.NA, stamps[0]], dtype=pd.ArrowDtype(pa.timestamp('ns', tz='US/Eastern'))
    )
    bad_ts = ArrowExtensionArray._from_sequence(
        [pd.NA, stamps[0]], dtype=pd.ArrowDtype(pa.timestamp('us', tz='US/Eastern'))
    )

    print(f"Original (ns): {good_ts.dtype}")
    print(f"Wrong (us): {bad_ts.dtype}")

    try:
        restored = good_ts._cast_pointwise_result(bad_ts)
        print(f"Fixed result: {restored.dtype}")
        print(f"Timestamp fix works: {good_ts.dtype == restored.dtype}")
    except Exception as e:
        print(f"Timestamp cast error: {e}")

    # --- integer: int64 original vs double 'wrong' result -----------------
    print("\nTesting integer cast:")
    good_int = ArrowExtensionArray._from_sequence(
        [pd.NA, 1], dtype=pd.ArrowDtype(pa.int64())
    )
    bad_int = ArrowExtensionArray._from_sequence(
        [pd.NA, 1.0], dtype=pd.ArrowDtype(pa.float64())
    )

    print(f"Original (int64): {good_int.dtype}")
    print(f"Wrong (double): {bad_int.dtype}")

    try:
        restored = good_int._cast_pointwise_result(bad_int)
        print(f"Fixed result: {restored.dtype}")
        print(f"Integer fix works: {good_int.dtype == restored.dtype}")
    except Exception as e:
        print(f"Integer cast error: {e}")
def debug_pa_array_creation():
    """Show what type pa.array(..., from_pandas=True) infers for integer,
    float, and mixed-NA inputs — type inference here is the suspected cause
    of the dtype loss."""
    print("\n=== Debugging pa.array() behavior ===")

    def _probe(header, values):
        # Print the inferred Arrow type for one input list.
        print(header)
        inferred = pa.array(values, from_pandas=True)
        print(f" Input: {values}")
        print(f" Result type: {inferred.type}")

    _probe("Testing pa.array with integer values:", [None, 1])
    _probe("Testing pa.array with float values:", [None, 1.0])
    # Mixed pd.NA + int is the case most likely to trip inference.
    _probe("Testing pa.array with mixed NA/int values:", [pd.NA, 1])
if __name__ == "__main__":
    # Run every reproduction and print a pass/fail summary at the end.
    banner = "=" * 60
    print("Testing Arrow dtype preservation issues...")
    print(banner)

    timestamp_ok = test_timestamp()
    integer_ok = test_integer()
    test_cast_pointwise_directly()
    debug_pa_array_creation()

    def _verdict(ok):
        # Human-readable pass/fail tag for the summary lines.
        return '✅ PASS' if ok else '❌ FAIL'

    print("\n" + banner)
    print("SUMMARY:")
    print(f"Timestamp test: {_verdict(timestamp_ok)}")
    print(f"Integer test: {_verdict(integer_ok)}")

pandas/_libs/lib.pyx

Lines changed: 32 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -2913,12 +2913,38 @@ def maybe_convert_objects(ndarray[object] objects,
29132913
result[mask] = 1
29142914
result = IntegerArray(result, mask)
29152915
elif result is floats and convert_to_nullable_dtype:
2916-
from pandas.core.arrays import FloatingArray
2917-
2918-
# Set these values to 1.0 to be deterministic, match
2919-
# FloatingDtype._internal_fill_value
2920-
result[mask] = 1.0
2921-
result = FloatingArray(result, mask)
2916+
# Try to preserve integer EAs: if all valid values are integer-like,
2917+
# downcast to an IntegerArray instead of FloatingArray.
2918+
cvals = result[~mask]
2919+
if cvals.size == 0:
2920+
all_int_like = True
2921+
saw_negative = False
2922+
else:
2923+
all_int_like = np.all(np.isfinite(cvals)) and np.all(cvals == np.trunc(cvals))
2924+
saw_negative = np.any(cvals < 0)
2925+
2926+
if all_int_like:
2927+
from pandas.core.arrays import IntegerArray
2928+
# choose signedness from data
2929+
signed = bool(saw_negative)
2930+
# choose itemsize: reuse largest seen, else default to 8 bytes
2931+
itemsize = itemsize_max if itemsize_max > 0 else 8
2932+
if itemsize not in (1, 2, 4, 8):
2933+
itemsize = 8
2934+
# build dtype code like 'i8' / 'u8'
2935+
code = ('i' if signed else 'u') + str(itemsize)
2936+
int_vals = cvals.astype(code, copy=False)
2937+
vals = np.empty(result.shape, dtype=int_vals.dtype)
2938+
vals[~mask] = int_vals
2939+
# match IntegerDtype._internal_fill_value deterministically
2940+
vals[mask] = 1
2941+
return IntegerArray(vals, mask)
2942+
else:
2943+
from pandas.core.arrays import FloatingArray
2944+
# Set these values to 1.0 to be deterministic, match
2945+
# FloatingDtype._internal_fill_value
2946+
result[mask] = 1.0
2947+
result = FloatingArray(result, mask)
29222948

29232949
if result is uints or result is ints or result is floats or result is complexes:
29242950
# cast to the largest itemsize when all values are NumPy scalars

pandas/_libs/tslibs/timedeltas.pyx

Lines changed: 13 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@ from cpython.object cimport (
1717
)
1818

1919
import numpy as np
20+
import pyarrow as pa
2021

2122
cimport numpy as cnp
2223
from numpy cimport (
@@ -2311,8 +2312,8 @@ class Timedelta(_Timedelta):
23112312
# see also: item_from_zerodim
23122313
item = cnp.PyArray_ToScalar(cnp.PyArray_DATA(other), other)
23132314
return self.__mul__(item)
2314-
return other * self.to_timedelta64()
2315-
2315+
result = other * self.to_timedelta64()
2316+
return type(self)(pa.array(result))
23162317
return NotImplemented
23172318

23182319
__rmul__ = __mul__
@@ -2323,6 +2324,8 @@ class Timedelta(_Timedelta):
23232324
other = Timedelta(other)
23242325
if other is NaT:
23252326
return np.nan
2327+
if other._value == 0:
2328+
return NaT # np.NaT attribute error
23262329
if other._creso != self._creso:
23272330
self, other = self._maybe_cast_to_matching_resos(other)
23282331
return self._value/ float(other._value)
@@ -2337,6 +2340,9 @@ class Timedelta(_Timedelta):
23372340
other = int(other)
23382341
if isinstance(other, cnp.floating):
23392342
other = float(other)
2343+
if isinstance(other, Timedelta): # ratio
2344+
return self._value / other._value
2345+
# scaling
23402346
return Timedelta._from_value_and_reso(
23412347
<int64_t>(self._value/ other), self._creso
23422348
)
@@ -2346,7 +2352,8 @@ class Timedelta(_Timedelta):
23462352
# see also: item_from_zerodim
23472353
item = cnp.PyArray_ToScalar(cnp.PyArray_DATA(other), other)
23482354
return self.__truediv__(item)
2349-
return self.to_timedelta64() / other
2355+
result = self.to_timedelta64() / other
2356+
return type(self)(pa.array(result))
23502357

23512358
return NotImplemented
23522359

@@ -2372,8 +2379,8 @@ class Timedelta(_Timedelta):
23722379
# TODO: if other.dtype.kind == "m" and other.dtype != self.asm8.dtype
23732380
# then should disallow for consistency with scalar behavior; requires
23742381
# deprecation cycle. (or changing scalar behavior)
2375-
return other / self.to_timedelta64()
2376-
2382+
result = other / self.to_timedelta64()
2383+
return type(self)(pa.array(result))
23772384
return NotImplemented
23782385

23792386
def __floordiv__(self, other):
@@ -2426,7 +2433,7 @@ class Timedelta(_Timedelta):
24262433
return self // other.item()
24272434
else:
24282435
return self.to_timedelta64() // other
2429-
2436+
24302437
raise TypeError(f"Invalid dtype {other.dtype} for __floordiv__")
24312438

24322439
return NotImplemented

0 commit comments

Comments
 (0)