B
    <ÓFd^Œ  ã               @   sŒ  d Z ddlmZmZmZ ddlZddlZddlZddl	m
Z
 ddlmZmZ ddl	mZ ddlmZ ddlmZ ddlmZ ejd d	k r–dd
lmZ ej
jjZddddddddddddgZdd„ Zdd„ Zdd„ Zdd„ Zd=dd „Zd>d!d„Zd"d#„ Z d$d%„ Z!d?d'd(„Z"d@d)d*„Z#dAd+d,„Z$dBd.d„Z%dCd/d„Z&dDd0d1„Z'd2d„ Z(d3d„ Z)dEd4d„Z*dFd5d„Z+dGd6d„Z,dHd7d„Z-dId;d„Z.dJd<d„Z/dS )KzÆ
Collection of utilities to manipulate structured arrays.

Most of these functions were initially implemented by John Hunter for
matplotlib.  They have been rewritten and extended for convenience.

é    )ÚdivisionÚabsolute_importÚprint_functionN)ÚndarrayÚrecarray)ÚMaskedArray)ÚMaskedRecords)Ú_is_string_like)Ú
basestringé   )ÚzipÚappend_fieldsÚdrop_fieldsÚfind_duplicatesÚget_fieldstructureÚjoin_byÚmerge_arraysÚrec_append_fieldsÚrec_drop_fieldsÚrec_joinÚrecursive_fill_fieldsÚrename_fieldsÚstack_arraysc          	   C   sj   |j }x^|jD ]T}y| | }W n tk
r4   wY nX |j jrNt||| ƒ q||| dt|ƒ…< qW |S )al  
    Fills fields from output with fields from input,
    with support for nested structures.

    Parameters
    ----------
    input : ndarray
        Input array.
    output : ndarray
        Output array.

    Notes
    -----
    * `output` should be at least the same size as `input`

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> a = np.array([(1, 10.), (2, 20.)], dtype=[('A', int), ('B', float)])
    >>> b = np.zeros((3,), dtype=a.dtype)
    >>> rfn.recursive_fill_fields(a, b)
    array([(1, 10.0), (2, 20.0), (0, 0.0)],
          dtype=[('A', '<i4'), ('B', '<f8')])

    N)ÚdtypeÚnamesÚ
ValueErrorr   Úlen)ÚinputÚoutputÚnewdtypeÚfieldÚcurrent© r"   úI/opt/alt/python37/lib64/python3.7/site-packages/numpy/lib/recfunctions.pyr   "   s    c             C   sT   g }| j }x<|D ]4}| | }|j r:| |tt|ƒƒf¡ q| |¡ qW t|ƒpRdS )aù  
    Returns the field names of the input datatype as a tuple.

    Parameters
    ----------
    adtype : dtype
        Input datatype

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> rfn.get_names(np.empty((1,), dtype=int)) is None
    True
    >>> rfn.get_names(np.empty((1,), dtype=[('A',int), ('B', float)]))
    ('A', 'B')
    >>> adtype = np.dtype([('a', int), ('b', [('ba', int), ('bb', int)])])
    >>> rfn.get_names(adtype)
    ('a', ('b', ('ba', 'bb')))
    N)r   ÚappendÚtupleÚ	get_names)ÚadtypeÚ	listnamesr   Únamer!   r"   r"   r#   r&   I   s    
r&   c             C   sJ   g }| j }x2|D ]*}| |¡ | | }|j r| t|ƒ¡ qW t|ƒpHdS )a2  
    Returns the field names of the input datatype as a tuple. Nested structure
    are flattend beforehand.

    Parameters
    ----------
    adtype : dtype
        Input datatype

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> rfn.get_names_flat(np.empty((1,), dtype=int)) is None
    True
    >>> rfn.get_names_flat(np.empty((1,), dtype=[('A',int), ('B', float)]))
    ('A', 'B')
    >>> adtype = np.dtype([('a', int), ('b', [('ba', int), ('bb', int)])])
    >>> rfn.get_names_flat(adtype)
    ('a', 'b', 'ba', 'bb')
    N)r   r$   ÚextendÚget_names_flatr%   )r'   r(   r   r)   r!   r"   r"   r#   r+   h   s    

r+   c             C   sd   | j }|dkr| jS g }x>|D ]6}| j| \}}|j rF| t|ƒ¡ q| ||f¡ qW t|ƒS dS )aD  
    Flatten a structured data-type description.

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> ndtype = np.dtype([('a', '<i4'), ('b', [('ba', '<f8'), ('bb', '<i4')])])
    >>> rfn.flatten_descr(ndtype)
    (('a', dtype('int32')), ('ba', dtype('float64')), ('bb', dtype('int32')))

    N)r   ÚdescrÚfieldsr*   Úflatten_descrr$   r%   )Úndtyper   r,   r    ÚtypÚ_r"   r"   r#   r.   ‡   s    
r.   Fc             C   s|   g }|r(xf| D ]}|  t|jƒ¡ qW nHxF| D ]>}|j}|jp@d}t|ƒdkr`| d|jf¡ q.|  |j¡ q.W t |¡jS )zî
    Combine the dtype description of a series of arrays.

    Parameters
    ----------
    seqarrays : sequence of arrays
        Sequence of arrays
    flatten : {boolean}, optional
        Whether to collapse nested descriptions.
    r"   é   Ú )r*   r.   r   r   r   r$   r,   Únp)Ú	seqarraysÚflattenr   Úar!   r   r"   r"   r#   Ú	zip_descr¡   s    


r8   c             C   s¢   |dkri }| j }x†|D ]~}| | }|j rV|r:|g||< ng ||< | t|||ƒ¡ qdd„ | |g ¡pjg D ƒ}|r€| |¡ n
|rŠ|g}|pg ||< qW |p dS )ab  
    Returns a dictionary with fields indexing lists of their parent fields.

    This function is used to simplify access to fields nested in other fields.

    Parameters
    ----------
    adtype : np.dtype
        Input datatype
    lastname : optional
        Last processed field name (used internally during recursion).
    parents : dictionary
        Dictionary of parent fields (used interbally during recursion).

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> ndtype =  np.dtype([('A', int),
    ...                     ('B', [('BA', int),
    ...                            ('BB', [('BBA', int), ('BBB', int)])])])
    >>> rfn.get_fieldstructure(ndtype)
    ... # XXX: possible regression, order of BBA and BBB is swapped
    {'A': [], 'B': [], 'BA': ['B'], 'BB': ['B'], 'BBA': ['B', 'BB'], 'BBB': ['B', 'BB']}

    Nc             S   s   g | ]}|‘qS r"   r"   )Ú.0r1   r"   r"   r#   ú
<listcomp>á   s    z&get_fieldstructure.<locals>.<listcomp>)r   Úupdater   Úgetr$   )r'   ZlastnameÚparentsr   r)   r!   Z
lastparentr"   r"   r#   r   »   s"    
c             c   sB   x<| D ]4}t |tjƒr4x"tt|ƒƒD ]
}|V  q$W q|V  qW dS )zu
    Returns an iterator of concatenated fields from a sequence of arrays,
    collapsing any nested structure.

    N)Ú
isinstancer4   ÚvoidÚ_izip_fields_flatr%   )ÚiterableÚelementÚfr"   r"   r#   r@   ê   s
    
r@   c             c   s|   xv| D ]n}t |dƒr8t|tƒs8xTt|ƒD ]
}|V  q(W qt|tjƒrntt|ƒƒdkrnxt|ƒD ]
}|V  q^W q|V  qW dS )zP
    Returns an iterator of concatenated fields from a sequence of arrays.

    Ú__iter__r2   N)Úhasattrr>   r
   Ú_izip_fieldsr4   r?   r   r%   )rA   rB   rC   r"   r"   r#   rF   ø   s    


rF   Tc             c   sT   |r
t }nt}tjd dkr$tj}ntj}x$|| d|iŽD ]}t||ƒƒV  q:W dS )a*  
    Returns an iterator of concatenated items from a sequence of arrays.

    Parameters
    ----------
    seqarrays : sequence of arrays
        Sequence of arrays.
    fill_value : {None, integer}
        Value used to pad shorter iterables.
    flatten : {True, False},
        Whether to
    r   r   Ú	fillvalueN)r@   rF   ÚsysÚversion_infoÚ	itertoolsÚzip_longestZizip_longestr%   )r5   Ú
fill_valuer6   ZzipfuncrK   Útupr"   r"   r#   Úizip_records	  s    rN   c             C   s>   t | tƒsd}|r"|r:|  t¡} nt | ¡} |r:|  t¡} | S )z€
    Private function: return a recarray, a ndarray, a MaskedArray
    or a MaskedRecords depending on the input parameters
    F)r>   r   Úviewr   ÚmaÚfilledr   )r   ÚusemaskÚ
asrecarrayr"   r"   r#   Ú_fix_output&  s    


rT   c             C   s\   | j j}| j| j| j  }}}x8|p&i  ¡ D ](\}}||kr,|||< ||| || < q,W | S )zp
    Update the fill_value and masked data of `output`
    from the default given in a dictionary defaults.
    )r   r   ÚdataÚmaskrL   Úitems)r   Údefaultsr   rU   rV   rL   ÚkÚvr"   r"   r#   Ú_fix_defaults7  s    r[   éÿÿÿÿc             C   sÎ  t | ƒdkrt | d ¡} t| ttjfƒr˜| j}|rHt| fdd|jkr|  	¡ } |j
s`d|fg}|rt|rnt}q‚t}n|r~t}nt}| j||dS | f} ndd„ | D ƒ} td	d
„ | D ƒƒ}t|ƒ}t| |d}	g }
g }|rþxÚt| |ƒD ]Ì\}}|| }| 	¡  ¡ }t |¡ 	¡ }|rzt||jƒ}t|ttjfƒr‚t |jƒdkrV| ¡ d }d}n"tj||jdd}tjd|jd}nd}d}|
 t ||g| ¡¡ | t ||g| ¡¡ qæW tt|
|dƒ}tjtj||	|dtt||dƒd}|rÊ| t¡}nÌxžt| |ƒD ]\}}|| }| 	¡  ¡ }|r|t||jƒ}t|ttjfƒr€t |jƒdkrh| ¡ d }ntj||jdd}nd}|
 t ||g| ¡¡ q
W tjtt|
|dƒ|	|d}|rÊ| t¡}|S )aÃ  
    Merge arrays field by field.

    Parameters
    ----------
    seqarrays : sequence of ndarrays
        Sequence of arrays
    fill_value : {float}, optional
        Filling value used to pad missing data on the shorter arrays.
    flatten : {False, True}, optional
        Whether to collapse nested fields.
    usemask : {False, True}, optional
        Whether to return a masked array or not.
    asrecarray : {False, True}, optional
        Whether to return a recarray (MaskedRecords) or not.

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> rfn.merge_arrays((np.array([1, 2]), np.array([10., 20., 30.])))
    masked_array(data = [(1, 10.0) (2, 20.0) (--, 30.0)],
                 mask = [(False, False) (False, False) (True, False)],
           fill_value = (999999, 1e+20),
                dtype = [('f0', '<i4'), ('f1', '<f8')])

    >>> rfn.merge_arrays((np.array([1, 2]), np.array([10., 20., 30.])),
    ...              usemask=False)
    array([(1, 10.0), (2, 20.0), (-1, 30.0)],
          dtype=[('f0', '<i4'), ('f1', '<f8')])
    >>> rfn.merge_arrays((np.array([1, 2]).view([('a', int)]),
    ...               np.array([10., 20., 30.])),
    ...              usemask=False, asrecarray=True)
    rec.array([(1, 10.0), (2, 20.0), (-1, 30.0)],
              dtype=[('a', '<i4'), ('f1', '<f8')])

    Notes
    -----
    * Without a mask, the missing value will be filled with something,
    * depending on what its corresponding type:
            -1      for integers
            -1.0    for floating point numbers
            '-'     for characters
            '-1'    for strings
            True    for boolean values
    * XXX: I just obtained these values empirically
    r2   r   T)r6   r3   )r   Útypec             S   s   g | ]}t  |¡‘qS r"   )r4   Ú
asanyarray)r9   Ú_mr"   r"   r#   r:   ‘  s    z merge_arrays.<locals>.<listcomp>c             s   s   | ]}|j V  qd S )N)Úsize)r9   r7   r"   r"   r#   ú	<genexpr>“  s    zmerge_arrays.<locals>.<genexpr>)r   Zndmin)r2   )r   N)r   Úcount)rV   )r   r4   r^   r>   r   r?   r   r8   r,   Úravelr   r   r   r   rO   r%   Úmaxr   Z	__array__rP   ZgetmaskarrayÚ_check_fill_valueÚitemÚarrayZonesr$   rJ   ÚchainrN   ZfromiterÚlist)r5   rL   r6   rR   rS   ZseqdtypeZseqtypeZsizesZ	maxlengthr   ZseqdataZseqmaskr7   ÚnZ	nbmissingrU   rV   ZfvalZfmskr   r"   r"   r#   r   E  s|    1


c                s`   t |ƒr|g}nt|ƒ}‡ fdd„‰ ˆ | j|ƒ}|s8dS tj| j|d}t| |ƒ}t|||dS )av  
    Return a new array with fields in `drop_names` dropped.

    Nested fields are supported.

    Parameters
    ----------
    base : array
        Input array
    drop_names : string or sequence
        String or sequence of strings corresponding to the names of the
        fields to drop.
    usemask : {False, True}, optional
        Whether to return a masked array or not.
    asrecarray : string or sequence, optional
        Whether to return a recarray or a mrecarray (`asrecarray=True`) or
        a plain ndarray or masked array with flexible dtype. The default
        is False.

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> a = np.array([(1, (2, 3.0)), (4, (5, 6.0))],
    ...   dtype=[('a', int), ('b', [('ba', float), ('bb', int)])])
    >>> rfn.drop_fields(a, 'a')
    array([((2.0, 3),), ((5.0, 6),)],
          dtype=[('b', [('ba', '<f8'), ('bb', '<i4')])])
    >>> rfn.drop_fields(a, 'ba')
    array([(1, (3,)), (4, (6,))],
          dtype=[('a', '<i4'), ('b', [('bb', '<i4')])])
    >>> rfn.drop_fields(a, ['ba', 'bb'])
    array([(1,), (4,)],
          dtype=[('a', '<i4')])
    c                s`   | j }g }xP|D ]H}| | }||kr&q|j rJˆ ||ƒ}|rX| ||f¡ q| ||f¡ qW |S )N)r   r$   )r/   Ú
drop_namesr   r   r)   r!   r,   )Ú_drop_descrr"   r#   rl   ö  s    

z drop_fields.<locals>._drop_descrN)r   )rR   rS   )r	   Úsetr   r4   ÚemptyÚshaper   rT   )Úbaserk   rR   rS   r   r   r"   )rl   r#   r   Î  s    #
c                s:   ‡ fdd„|D ƒ}t jˆ j|d}tˆ |ƒ}t|||dS )aŒ  
    Return a new array keeping only the fields in `keep_names`,
    and preserving the order of those fields.

    Parameters
    ----------
    base : array
        Input array
    keep_names : string or sequence
        String or sequence of strings corresponding to the names of the
        fields to keep. Order of the names will be preserved.
    usemask : {False, True}, optional
        Whether to return a masked array or not.
    asrecarray : string or sequence, optional
        Whether to return a recarray or a mrecarray (`asrecarray=True`) or
        a plain ndarray or masked array with flexible dtype. The default
        is False.
    c                s   g | ]}|ˆ j | f‘qS r"   )r   )r9   rj   )rp   r"   r#   r:   !  s    z _keep_fields.<locals>.<listcomp>)r   )rR   rS   )r4   rn   ro   r   rT   )rp   Z
keep_namesrR   rS   r   r   r"   )rp   r#   Ú_keep_fields  s    
rq   c             C   s   t | |dddS )zK
    Returns a new numpy.recarray with fields in `drop_names` dropped.
    FT)rR   rS   )r   )rp   rk   r"   r"   r#   r   '  s    c                s"   ‡ fdd„‰ ˆ | j |ƒ}|  |¡S )aÂ  
    Rename the fields from a flexible-datatype ndarray or recarray.

    Nested fields are supported.

    Parameters
    ----------
    base : ndarray
        Input array whose fields must be modified.
    namemapper : dictionary
        Dictionary mapping old field names to their new version.

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> a = np.array([(1, (2, [3.0, 30.])), (4, (5, [6.0, 60.]))],
    ...   dtype=[('a', int),('b', [('ba', float), ('bb', (float, 2))])])
    >>> rfn.rename_fields(a, {'a':'A', 'bb':'BB'})
    array([(1, (2.0, [3.0, 30.0])), (4, (5.0, [6.0, 60.0]))],
          dtype=[('A', '<i4'), ('b', [('ba', '<f8'), ('BB', '<f8', 2)])])

    c                sV   g }xL| j D ]B}| ||¡}| | }|j r@| |ˆ ||ƒf¡ q| ||f¡ qW |S )N)r   r<   r$   )r/   Ú
namemapperr   r)   Znewnamer!   )Ú_recursive_rename_fieldsr"   r#   rs   E  s    z/rename_fields.<locals>._recursive_rename_fields)r   rO   )rp   rr   r   r"   )rs   r#   r   .  s    c       	      C   sL  t |ttfƒr,t|ƒt|ƒkrBd}t|ƒ‚nt |tƒrB|g}|g}|dkrndd„ |D ƒ}dd„ t||ƒD ƒ}n`t |ttfƒs‚|g}t|ƒt|ƒkr¸t|ƒdkr¬|t|ƒ }nd}t|ƒ‚dd„ t|||ƒD ƒ}t| ||d	} t|ƒdkrút|d
||d}n| ¡ }t	j
tt| ƒt|ƒƒ| jj|jj d}t| |ƒ}t||ƒ}t|||dS )a  
    Add new fields to an existing array.

    The names of the fields are given with the `names` arguments,
    the corresponding values with the `data` arguments.
    If a single field is appended, `names`, `data` and `dtypes` do not have
    to be lists but just values.

    Parameters
    ----------
    base : array
        Input array to extend.
    names : string, sequence
        String or sequence of strings corresponding to the names
        of the new fields.
    data : array or sequence of arrays
        Array or sequence of arrays storing the fields to add to the base.
    dtypes : sequence of datatypes, optional
        Datatype or sequence of datatypes.
        If None, the datatypes are estimated from the `data`.
    fill_value : {float}, optional
        Filling value used to pad missing data on the shorter arrays.
    usemask : {False, True}, optional
        Whether to return a masked array or not.
    asrecarray : {False, True}, optional
        Whether to return a recarray (MaskedRecords) or not.

    z7The number of arrays does not match the number of namesNc             S   s   g | ]}t j|d dd‘qS )FT)ÚcopyÚsubok)r4   rg   )r9   r7   r"   r"   r#   r:   }  s    z!append_fields.<locals>.<listcomp>c             S   s"   g | ]\}}|  ||jfg¡‘qS r"   )rO   r   )r9   r)   r7   r"   r"   r#   r:   ~  s    r2   z5The dtypes argument must be None, a dtype, or a list.c             S   s0   g | ](\}}}t j|d d|d ||fg¡‘qS )FT)rt   ru   r   )r4   rg   rO   )r9   r7   rj   Údr"   r"   r#   r:   ˆ  s   )rR   rL   T)r6   rR   rL   )r   )rR   rS   )r>   r%   ri   r   r   r
   r   r   ÚpoprP   Ú
masked_allrd   r   r,   r   rT   )	rp   r   rU   ÚdtypesrL   rR   rS   Úmsgr   r"   r"   r#   r   U  s:    




c             C   s   t | |||dddS )aM  
    Add new fields to an existing array.

    The names of the fields are given with the `names` arguments,
    the corresponding values with the `data` arguments.
    If a single field is appended, `names`, `data` and `dtypes` do not have
    to be lists but just values.

    Parameters
    ----------
    base : array
        Input array to extend.
    names : string, sequence
        String or sequence of strings corresponding to the names
        of the new fields.
    data : array or sequence of arrays
        Array or sequence of arrays storing the fields to add to the base.
    dtypes : sequence of datatypes, optional
        Datatype or sequence of datatypes.
        If None, the datatypes are estimated from the `data`.

    See Also
    --------
    append_fields

    Returns
    -------
    appended_array : np.recarray
    TF)rU   ry   rS   rR   )r   )rp   r   rU   ry   r"   r"   r#   r   š  s    
c             C   s:  t | tƒr| S t| ƒdkr"| d S dd„ | D ƒ}dd„ |D ƒ}dd„ |D ƒ}dd„ |D ƒ}|d }	|	j}
dd„ |
D ƒ}xÒ|dd	… D ]Â}x¼|jD ]²}|d pžd
}||kr¾|
 |¡ | |¡ q| |¡}|
| }|rt |d ¡t |d ¡krBt|ƒ}|d |d< t	|ƒ|
|< q|d |d krt
dt|
ƒ| |d f ƒ‚qW q„W t|
ƒdkrdt |¡}nÂt t |¡f|
¡}t tjd|f ¡}g }x”t|||d	d… |dd	… ƒD ]r\}}}}|jj}|d	krè||dt|ƒ  ||…< n8x6|D ].}|| || ||…< ||krî| |¡ qîW q°W tt||ƒ||dS )a³  
    Superposes arrays fields by fields

    Parameters
    ----------
    arrays : array or sequence
        Sequence of input arrays.
    defaults : dictionary, optional
        Dictionary mapping field names to the corresponding default values.
    usemask : {True, False}, optional
        Whether to return a MaskedArray (or MaskedRecords is
        `asrecarray==True`) or a ndarray.
    asrecarray : {False, True}, optional
        Whether to return a recarray (or MaskedRecords if `usemask==True`)
        or just a flexible-type ndarray.
    autoconvert : {False, True}, optional
        Whether automatically cast the type of the field to the maximum.

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> x = np.array([1, 2,])
    >>> rfn.stack_arrays(x) is x
    True
    >>> z = np.array([('A', 1), ('B', 2)], dtype=[('A', '|S3'), ('B', float)])
    >>> zz = np.array([('a', 10., 100.), ('b', 20., 200.), ('c', 30., 300.)],
    ...   dtype=[('A', '|S3'), ('B', float), ('C', float)])
    >>> test = rfn.stack_arrays((z,zz))
    >>> test
    masked_array(data = [('A', 1.0, --) ('B', 2.0, --) ('a', 10.0, 100.0) ('b', 20.0, 200.0)
     ('c', 30.0, 300.0)],
                 mask = [(False, False, True) (False, False, True) (False, False, False)
     (False, False, False) (False, False, False)],
           fill_value = ('N/A', 1e+20, 1e+20),
                dtype = [('A', '|S3'), ('B', '<f8'), ('C', '<f8')])

    r2   r   c             S   s   g | ]}t  |¡ ¡ ‘qS r"   )r4   r^   rc   )r9   r7   r"   r"   r#   r:   ç  s    z stack_arrays.<locals>.<listcomp>c             S   s   g | ]}t |ƒ‘qS r"   )r   )r9   r7   r"   r"   r#   r:   è  s    c             S   s   g | ]
}|j ‘qS r"   )r   )r9   r7   r"   r"   r#   r:   é  s    c             S   s   g | ]
}|j ‘qS r"   )r   )r9   rv   r"   r"   r#   r:   ê  s    c             S   s   g | ]}|d  ‘qS )r   r"   )r9   r1   r"   r"   r#   r:   î  s    Nr3   r\   zIncompatible type '%s' <> '%s'zf%i)rR   rS   )r>   r   r   r,   r$   Úindexr4   r   ri   r%   Ú	TypeErrorÚdictrP   Úconcatenaterx   ÚsumZcumsumZr_r   r   rT   r[   )ZarraysrX   rR   rS   Zautoconvertr5   Znrecordsr/   ZfldnamesZdtype_lZnewdescrr   Zdtype_nr,   r)   ÚnameidxZcurrent_descrr   ÚoffsetÚseenr7   rj   ÚiÚjr"   r"   r#   r   ¼  sT    '


 ,



c             C   sà   t  | ¡ ¡ } t| jƒ}| }|rBx|| D ]}|| }q*W || }| ¡ }|| }| ¡ }	|	dd… |	dd… k}
|rŒ|j}d|
|dd… < t  dg|
f¡}
|
dd… |
dd…  |
dd…< | | |
 }|rØ|||
 fS |S dS )aa  
    Find the duplicates in a structured array along a given key

    Parameters
    ----------
    a : array-like
        Input array
    key : {string, None}, optional
        Name of the fields along which to check the duplicates.
        If None, the search is performed by records
    ignoremask : {True, False}, optional
        Whether masked data should be discarded or considered as duplicates.
    return_index : {False, True}, optional
        Whether to return the indices of the duplicated values.

    Examples
    --------
    >>> from numpy.lib import recfunctions as rfn
    >>> ndtype = [('a', int)]
    >>> a = np.ma.array([1, 1, 1, 2, 2, 3, 3],
    ...         mask=[0, 0, 1, 0, 0, 0, 1]).view(ndtype)
    >>> rfn.find_duplicates(a, ignoremask=True, return_index=True)
    ... # XXX: judging by the output, the ignoremask flag has no effect
    Nr\   r2   F)	r4   r^   rc   r   r   ÚargsortrQ   Z
recordmaskr~   )r7   ÚkeyZ
ignoremaskZreturn_indexr-   rp   rC   ZsortidxZ
sortedbaseZ
sorteddataÚflagZ
sortedmaskÚ
duplicatesr"   r"   r#   r     s(    
 ÚinnerÚ1Ú2c	       )         sÖ  |dkrt d| ƒ‚tˆ tƒr$ˆ f‰ ttˆ ƒƒtˆ ƒkr^t‡ fdd„tˆ ƒD ƒƒ}	t d|	 ƒ‚x<ˆ D ]4}
|
|jjkr€t d|
 ƒ‚|
|jjkrdt d|
 ƒ‚qdW | 	¡ }| 	¡ }t|ƒ}|jj|jj }}t 
t|ƒt|ƒ¡ ˆ ¡rü|sü|süd}|d	7 }t |ƒ‚‡ fd
d„|D ƒ}t||ƒ}t||ƒ}t ||f¡}|jˆ d}|| }t dg|dd… |dd… kf¡}|dd… |dd…  |dd…< || }|||k  }|||k | }t|ƒt|ƒ }}|dkrÒd\}}nœ|dkr2||  }t ||||k  f¡}t ||||k | f¡}t|ƒ| t|ƒ|  }}n<|dkrn||  }t ||||k  f¡}t|ƒ| d }}|| ||  }}dd„ |jjD ƒ}| ‡ fdd„|jjD ƒ¡ tdd„ |D ƒƒ} xª|jjD ]ž}!t|!ƒ}!|!d }
|
| krN| |!¡}"||" }#|
ˆ krt|!d |#d ƒ|#d< n0|#d  |7  < |!d  |7  < | |"d |!¡ n|  |!d ¡ | |!¡ qÊW dd„ |D ƒ}t||ƒ}$tj|$| | f|d}%|%jj} x€|D ]x}&||& }'|&| ksÚ|&|krâ|sâ|&ˆ krâ|&|7 }&|%|& }#|'d|… |#d|…< |dkrª|'|d… |#|$|$| …< qªW x„|D ]|}&||& }'|&| ks\|&|krd|sd|&ˆ krd|&|7 }&|%|& }#|'d|… |#d|…< |dkr,|r,|'|d… |#| d…< q,W |%jˆ d t||d}(tt|%|ƒf|(ŽS )a<  
    Join arrays `r1` and `r2` on key `key`.

    The key should be either a string or a sequence of string corresponding
    to the fields used to join the array.  An exception is raised if the
    `key` field cannot be found in the two input arrays.  Neither `r1` nor
    `r2` should have any duplicates along `key`: the presence of duplicates
    will make the output quite unreliable. Note that duplicates are not
    looked for by the algorithm.

    Parameters
    ----------
    key : {string, sequence}
        A string or a sequence of strings corresponding to the fields used
        for comparison.
    r1, r2 : arrays
        Structured arrays.
    jointype : {'inner', 'outer', 'leftouter'}, optional
        If 'inner', returns the elements common to both r1 and r2.
        If 'outer', returns the common elements as well as the elements of
        r1 not in r2 and the elements of not in r2.
        If 'leftouter', returns the common elements and the elements of r1
        not in r2.
    r1postfix : string, optional
        String appended to the names of the fields of r1 that are present
        in r2 but absent of the key.
    r2postfix : string, optional
        String appended to the names of the fields of r2 that are present
        in r1 but absent of the key.
    defaults : {dictionary}, optional
        Dictionary mapping field names to the corresponding default values.
    usemask : {True, False}, optional
        Whether to return a MaskedArray (or MaskedRecords is
        `asrecarray==True`) or a ndarray.
    asrecarray : {False, True}, optional
        Whether to return a recarray (or MaskedRecords if `usemask==True`)
        or just a flexible-type ndarray.

    Notes
    -----
    * The output is sorted along the key.
    * A temporary array is formed by dropping the fields not in the key for
      the two arrays and concatenating the result. This array is then
      sorted, and the common entries selected. The output is constructed by
      filling the fields with the selected entries. Matching is not
      preserved if there are some duplicates...

    )r‰   ÚouterÚ	leftouterzWThe 'jointype' argument should be in 'inner', 'outer' or 'leftouter' (got '%s' instead)c             3   s*   | ]"\}}|ˆ |d  d… kr|V  qdS )r2   Nr"   )r9   rj   Úx)r†   r"   r#   ra   Š  s    zjoin_by.<locals>.<genexpr>zduplicate join key %rzr1 does not have key field %rzr2 does not have key field %rz8r1 and r2 contain common names, r1postfix and r2postfix zcan't be emptyc                s   g | ]}|ˆ kr|‘qS r"   r"   )r9   rj   )r†   r"   r#   r:   £  s    zjoin_by.<locals>.<listcomp>)ÚorderFr2   Nr\   r‰   )r   r   rŒ   r   r   c             S   s   g | ]}t |ƒ‘qS r"   )ri   )r9   r1   r"   r"   r#   r:   Ã  s    c             3   s"   | ]}|d  ˆ krt |ƒV  qdS )r   N)ri   )r9   r1   )r†   r"   r#   ra   Å  s    c             s   s   | ]}|d  V  qdS )r   Nr"   )r9   r1   r"   r"   r#   ra   Ç  s    c             S   s   g | ]}t |ƒ‘qS r"   )r%   )r9   r1   r"   r"   r#   r:   Ü  s    )r   )rŒ   r   )rR   rS   )r   r>   r
   r   rm   ÚnextÚ	enumerater   r   rc   ÚintersectionÚ
differencerq   rP   r~   r…   r4   r,   r*   ri   r{   rd   Úinsertr$   rx   Úsortr}   rT   r[   ))r†   Úr1Úr2ÚjointypeÚ	r1postfixÚ	r2postfixrX   rR   rS   Údupr)   Znb1Zr1namesZr2namesrz   Zkey1Zr1kZr2kZauxZidx_sortZflag_inZidx_inZidx_1Zidx_2Zr1cmnZr2cmnZr1spcZr2spcZidx_outÚs1Ús2r/   r   Zdescr€   r!   Zcmnr   rC   ZselectedÚkwargsr"   )r†   r#   r   L  s¬    3



$ 









$

$c             C   s$   t ||||ddd}t| ||f|ŽS )z¨
    Join arrays `r1` and `r2` on keys.
    Alternative to join_by, that always returns a np.recarray.

    See Also
    --------
    join_by : equivalent function
    FT)r˜   r™   rš   rX   rR   rS   )r}   r   )r†   r–   r—   r˜   r™   rš   rX   rž   r"   r"   r#   r   ù  s    
)F)NN)NT)TF)N)r\   FFF)TF)TF)Nr\   TF)N)NTFF)NTF)r‰   rŠ   r‹   NTF)r‰   rŠ   r‹   N)0Ú__doc__Z
__future__r   r   r   rH   rJ   Znumpyr4   Znumpy.marP   r   r   r   Znumpy.ma.mrecordsr   Znumpy.lib._iotoolsr	   Znumpy.compatr
   rI   Zfuture_builtinsr   Zcorere   Ú__all__r   r&   r+   r.   r8   r   r@   rF   rN   rT   r[   r   r   rq   r   r   r   r   r   r   r   r   r"   r"   r"   r#   Ú<module>   s\   

'

/


 
 	
@
' 
D
" 
Y
6 
 - 