o
    vhq%                     @  s@  d Z ddlmZ ddlZddlmZ ddlZddlZddl	m
Z
 ddlmZ ddlZddlmZ ddlmZ ddlmZ dd	lmZ dd
lmZ ddlmZ dd Zejddgddd Zejdd Zejdd Z ejdd Z!ejdd Z"ejdd Z#ejdd Z$G dd  d ej%Z&G d!d" d"ej'Z(d#d$ Z)dS )%aj  
This file contains a minimal set of tests for compliance with the extension
array interface test suite, and should contain no other tests.
The test suite for the full functionality of the array is located in
`pandas/tests/arrays/`.

The tests in this file are inherited from the BaseExtensionTests, and only
minimal tweaks should be applied to get the tests passing (by overwriting a
parent method).

Additional tests should either be added to one of the BaseExtensionTests
classes (if they are relevant for the extension interface for all dtypes), or
be added to the array-specific tests in `pandas/tests/arrays/`.

    )annotationsN)cast)HAS_PYARROW)StorageExtensionDtypeis_string_dtype)ArrowStringArrayStringDtype)string_dtype_highest_priority)basec                 C  st   |s| S | j jdkr| S td}| j}t|d }|g |d | j||d  j}|jdks4J t	| |S )Npyarrow   )
dtypestoragepytestimportorskip	_pa_arraylenchunked_arraychunks
num_chunkstype)arrchunkedpaarrow_arraysplit r   `/var/www/html/hyperkenya/venv/lib/python3.10/site-packages/pandas/tests/extension/test_string.pymaybe_split_array%   s   
r    TF)paramsc                 C  s   | j S N)param)requestr   r   r   r   6   s   r   c                 C  s   | \}}t ||dS )N)r   na_valuer	   )string_dtype_argumentsr   r%   r   r   r   r   ;   s   r   c                 C  st   t jdjttjdd}|d |d kr,t jdjttjdd}|d |d ks|  j|| d}t	||S )Nr   d   )sizer      r   )
nprandomdefault_rngchoiceliststringascii_lettersconstruct_array_type_from_sequencer    )r   r   stringsr   r   r   r   dataA   s   
r5   c                 C  s"   |   jtjdg| d}t||S )zLength 2 array with [NA, Valid]Ar*   r2   r3   pdNAr    r   r   r   r   r   r   data_missingK   s   
r;   c                 C  s    |   jg d| d}t||S )N)BCr6   r*   )r2   r3   r    r:   r   r   r   data_for_sortingR   s   
r>   c                 C  s$   |   jdtjdg| d}t||S )Nr<   r6   r*   r7   r:   r   r   r   data_missing_for_sortingX   s   
r?   c              	   C  s0   |   jddtjtjddddg| d}t||S )Nr<   r6   r=   r*   r7   r:   r   r   r   data_for_grouping^   s   
r@   c                      s   e Zd Z fddZdd Z fddZ fddZ fd	d
Zdd Z fddZ	 fddZ
dd Zdd Zd*ddZd+ddZd+d d!Zd,d"d#Zd$d% Z fd&d'Z fd(d)Z  ZS )-TestStringArrayc                   s|   t  | |jtju r|d|j dksJ d S |jdkr<tt |dks*J W d    d S 1 s5w   Y  d S d S )Nzstring[]r   zstring[pyarrow_numpy])	supertest_eq_with_strr%   r8   r9   r   tmassert_produces_warningFutureWarningselfr   	__class__r   r   rD   g   s   
"z TestStringArray.test_eq_with_strc                 C  s   t |sJ d S r"   r   rH   r   r   r   test_is_not_string_typeq   s   z'TestStringArray.test_is_not_string_typec                   s@   |j tju r|st||j}|du sJ d S t | d S )NF)r%   r+   nanr   is_dtypenamerC   test_is_dtype_from_name)rI   r   using_infer_stringresultrJ   r   r   rP   v   s   z'TestStringArray.test_is_dtype_from_namec                   s`   |j tju r(|s(tjtdd ||j W d    d S 1 s!w   Y  d S t 	| d S )Nz Cannot construct a 'StringDtype'match)
r%   r+   rM   r   raises	TypeErrorconstruct_from_stringrO   rC   #test_construct_from_string_own_name)rI   r   rQ   rJ   r   r   rX   }   s
   "z3TestStringArray.test_construct_from_string_own_namec                   (   |j jdkrtjdd t | d S Nr   /2D support not implemented for ArrowStringArrayreason)r   r   r   skiprC   	test_viewrI   r5   rJ   r   r   r_         zTestStringArray.test_viewc                 C  s   d S r"   r   r`   r   r   r   test_from_dtype   s   zTestStringArray.test_from_dtypec                   rY   rZ   )r   r   r   r^   rC   test_transposer`   rJ   r   r   rc      ra   zTestStringArray.test_transposec                   rY   rZ   )r   r   r   r^   rC   test_setitem_preserves_viewsr`   rJ   r   r   rd      ra   z,TestStringArray.test_setitem_preserves_viewsc                 C  s"   |  }|dg }t|| d S )Nr)   )dropnarE   assert_extension_array_equal)rI   r;   rR   expectedr   r   r   test_dropna_array   s   
z!TestStringArray.test_dropna_arrayc                 C  s`   ||    }|d }||}||usJ t|| |jdd}||us(J t|| d S )Nr   backfill)method)isnafillnarE   rf   )rI   r5   validrR   r   r   r   test_fillna_no_op_returns_copy   s   
z.TestStringArray.test_fillna_no_op_returns_copyop_namestrreturn4type[Exception] | tuple[type[Exception], ...] | Nonec                 C  s(   |dv rt S |dv rt S |dv rt S d S )N)__mod____rmod__
__divmod____rdivmod____pow____rpow__)__mul____rmul__)__truediv____rtruediv____floordiv____rfloordiv____sub____rsub__)rV   )rI   ro   objotherr   r   r   _get_expected_exception   s   z'TestStringArray._get_expected_exceptionser	pd.Seriesboolc                 C  s   |dv p|j jtju o|dv S )N)minmaxsum)anyall)r   r%   r+   rM   rI   r   ro   r   r   r   _supports_reduction   s   z#TestStringArray._supports_reductionc                 C  s   t |jtsJ |dv S )N)cummincummaxcumsum)
isinstancer   r   r   r   r   r   _supports_accumulation   s   z&TestStringArray._supports_accumulationc                 C  s|   t tt|}|dv r%|}t|tst|nd }t|tr$t||}n|jtj	u r/tj
}n
|jdkr7d}nd}||S )N)__add____radd__r   zbool[pyarrow]boolean)r   r
   rE   	get_dtyper   rp   r   r%   r+   rM   bool_r   astype)rI   ro   r   r   pointwise_resultr   cast_todtype_otherr   r   r   _cast_pointwise_result   s   



z&TestStringArray._cast_pointwise_resultc                 C  s   t |}| |||d d S )Nabc)r8   Series_compare_other)rI   r5   comparison_opr   r   r   r   test_compare_scalar   s   
z#TestStringArray.test_compare_scalarc                   sP   t |dj}|r |jtju r |jdkr tjjdd}|	| t
 | d S )Nr)   pythonmThe pointwise operation result will be inferred to string[nan, pyarrow], which does not match the input dtyper\   )nextr   r%   r8   r9   r   r   markxfailapplymarkerrC   test_combine_add)rI   data_repeatedrQ   r$   r   r   rJ   r   r   r      s   
z TestStringArray.test_combine_addc                   sV   |j }|r"|dkr"|jtju r"ts|jdkr"tjjdd}|	| t
 || d S )Nr   r   r   r\   )r   r%   r8   r9   r   r   r   r   r   r   rC   test_arith_series_with_array)rI   r5   all_arithmetic_operatorsrQ   r$   r   r   rJ   r   r   r      s   

z,TestStringArray.test_arith_series_with_array)ro   rp   rq   rr   )r   r   ro   rp   rq   r   )ro   rp   )__name__
__module____qualname__rD   rL   rP   rX   r_   rb   rc   rd   rh   rn   r   r   r   r   r   r   r   __classcell__r   r   rJ   r   rA   f   s$    




rA   c                   @  s    e Zd Zejdddd ZdS )Test2DCompatT)autousec                 C  s   t |trtjdd d S d S )Nr[   r\   )r   r   r   r^   r`   r   r   r   arrow_not_supported  s   
z Test2DCompat.arrow_not_supportedN)r   r   r   r   fixturer   r   r   r   r   r      s    
r   c                 C  sr   | \}}}|  g d}tj|d< |rt|}d}tjt|d || W d    d S 1 s2w   Y  d S )N)r   r   r)   zOsearchsorted requires array to be sorted, which is impossible with NAs present.rS   )taker8   r9   r   r   rU   
ValueErrorsearchsorted)r>   	as_seriesbcar   msgr   r   r    test_searchsorted_with_na_raises  s   


"r   )*__doc__
__future__r   r0   typingr   numpyr+   r   pandas.compatr   pandas.core.dtypes.baser   pandasr8   pandas._testing_testingrE   pandas.api.typesr   pandas.core.arraysr   pandas.core.arrays.string_r
   'pandas.tests.arrays.string_.test_stringr   pandas.tests.extensionr   r    r   r   r   r5   r;   r>   r?   r@   ExtensionTestsrA   Dim2CompatTestsr   r   r   r   r   r   <module>   sD    


	



 