U
    Nvf')                     @   s   d Z ddlZddlZddlZddlZddlZddlZddlZejZ	G dd de
ZG dd de
ZG dd de	ZG d	d
 d
eZdddZdS )zb
Fast cryptographic hash of Python objects, with a special case for fast
hashing of numpy arrays.
    Nc                   @   s   e Zd ZdZdd ZdS )_ConsistentSetza Class used to ensure the hash of Sets is preserved
        whatever the order of its items.
    c              	   C   sB   zt || _W n. ttjfk
r<   t dd |D | _Y nX d S )Nc                 s   s   | ]}t |V  qd S Nhash).0e r   2/tmp/pip-unpacked-wheel-dylwa62s/joblib/hashing.py	<genexpr>%   s     z*_ConsistentSet.__init__.<locals>.<genexpr>)sortedZ	_sequence	TypeErrordecimalInvalidOperation)selfZset_sequencer   r   r	   __init__   s    z_ConsistentSet.__init__N__name__
__module____qualname____doc__r   r   r   r   r	   r      s   r   c                   @   s   e Zd ZdZdd ZdS )_MyHashz7 Class used to hash objects that won't normally pickle c                 G   s
   || _ d S r   )args)r   r   r   r   r	   r   +   s    z_MyHash.__init__Nr   r   r   r   r	   r   (   s   r   c                   @   s   e Zd ZdZdddZdddZdd	 Zd
d Zdej	fddZ
ej Ze
eee< e
eee< e
eee< e
eeej< dd Zdd Zeeee < dS )HasherzW A subclass of pickler, to do cryptographic hashing, rather than
        pickling.
    md5c                 C   s0   t  | _d}tj| | j|d t|| _d S )N   )protocol)ioBytesIOstreamPicklerr   hashlibnew_hash)r   	hash_namer   r   r   r	   r   4   s    
zHasher.__init__Tc              
   C   sv   z|  | W n> tjk
rL } z| jd||f f7  _ W 5 d }~X Y nX | j }| j| |rr| j S d S )Nz"PicklingError while hashing %r: %r)	dumppicklePicklingErrorr   r   getvaluer"   update	hexdigest)r   objZreturn_digestr   dumpsr   r   r	   r   =   s    
zHasher.hashc                 C   s   t |tjti jfr|t|dr*|jj}n|j}|j}t|tt	krTt
||j}n(|d krht
||}n|jj}t
|||}t| | d S )N__func__)
isinstancetypes
MethodTypetypepophasattrr,   r   __self__r%   r   	__class__r   save)r   r*   	func_nameinstclsr   r   r	   r5   H   s    

zHasher.savec                 C   s"   t |ttfrd S t| | d S r   )r-   bytesstrr   memoize)r   r*   r   r   r	   r;   [   s    zHasher.memoizeNc                 C   s   t ||d}|d= ztj| |f| W nl tjk
r   tj| |f| t|dd }|dkr|}|d krn|j}tj| }t	||st
||| Y nX d S )N)namepackr=   r   __main__)dictr   save_globalr%   r&   getattrr   sysmodulesr2   setattr)r   r*   r<   r=   kwargsmoduleZmy_namemodr   r   r	   r@   f   s    

zHasher.save_globalc              
   C   sP   zt | tt| W n2 tk
rJ   t | ttdd |D  Y nX d S )Nc                 s   s   | ]\}}t ||fV  qd S r   r   )r   kvr   r   r	   r
      s   z)Hasher._batch_setitems.<locals>.<genexpr>)r   _batch_setitemsiterr   r   )r   itemsr   r   r	   rJ      s    zHasher._batch_setitemsc                 C   s   t | t| d S r   )r   r5   r   )r   Z	set_itemsr   r   r	   save_set   s    zHasher.save_set)r   )T)r   r   r   r   r   r   r5   r;   structr=   r@   r   dispatchcopyr0   lenobjectr%   r$   rJ   rM   setr   r   r   r	   r   /   s   
	

r   c                   @   s"   e Zd ZdZd	ddZdd ZdS )
NumpyHasherz7 Special case the hasher for when numpy is loaded.
    r   Fc                 C   s@   || _ tj| |d ddl}|| _t|dr6|j| _nt| _dS )a  
            Parameters
            ----------
            hash_name: string
                The hash algorithm to be used
            coerce_mmap: boolean
                Make no difference between np.memmap and np.ndarray
                objects.
        r#   r   N	getbuffer)	coerce_mmapr   r   numpynpr2   rV   
_getbuffer
memoryview)r   r#   rW   rY   r   r   r	   r      s    


zNumpyHasher.__init__c                 C   s   t || jjr|jjs|jdkr*| }n&|jjr8|}n|jj	rH|j
}n| }| j| || jj | jrt || jjr| jj}n|j}|d|j|j|jff}n6t || jjr| jdd | jt| dS t| | dS )z Subclass the save method, to hash ndarray subclass, rather
            than pickling them. Off course, this is a total abuse of
            the Pickler class.
        r   ZHASHEDZ_HASHED_DTYPEzutf-8N)r-   rY   ZndarrayZdtypeZ	hasobjectshapeflattenflagsc_contiguousf_contiguousTr"   r(   rZ   viewZuint8rW   Zmemmapr4   stridesencoder%   r+   r   r5   )r   r*   Zobj_c_contiguousklassr   r   r	   r5      s(    


zNumpyHasher.saveN)r   F)r   r   r   r   r   r5   r   r   r   r	   rT      s   
rT   r   Fc                 C   sH   d}||krt d||dtjkr4t||d}n
t|d}|| S )aj   Quick calculation of a hash to identify uniquely Python objects
        containing numpy arrays.

        Parameters
        ----------
        hash_name: 'md5' or 'sha1'
            Hashing algorithm used. sha1 is supposedly safer, but md5 is
            faster.
        coerce_mmap: boolean
            Make no difference between np.memmap and np.ndarray
    )r   sha1zAValid options for 'hash_name' are {}. Got hash_name={!r} instead.rX   )r#   rW   rU   )
ValueErrorformatrB   rC   rT   r   r   )r*   r#   rW   Zvalid_hash_namesZhasherr   r   r	   r      s     

r   )r   F)r   r%   r    rB   r.   rN   r   r   _Picklerr   rR   r   r   r   rT   r   r   r   r   r	   <module>   s   	kZ