o
    ;D©iÖ<  ã                   @   sB  d dl mZmZmZ d dlmZ d dlmZ d dlm	Z	 d dl
mZmZ d dlmZ d dlmZ 			d)dd„Zee_G dd„ deƒZdd„ Z	
	d*dd„Zee_	
	d)dd„Zee_d*dd„Zee_			
d+dd„Zee_G dd„ deƒZdd„ Zd,dd„Zee_G dd „ d eƒZd!d"„ Zd#d$„ Zee_G d%d&„ d&eƒZd'd(„ Zd	S )-é    )Úabsolute_importÚprint_functionÚdivision)ÚCounter)Únext)Ú
Comparable)ÚheaderÚTable)Úsort)ÚcutFNTc              	   C   s   t | ||||||dS )a÷	  
    Return rows in `a` that are not in `b`. E.g.::

        >>> import petl as etl
        >>> a = [['foo', 'bar', 'baz'],
        ...      ['A', 1, True],
        ...      ['C', 7, False],
        ...      ['B', 2, False],
        ...      ['C', 9, True]]
        >>> b = [['x', 'y', 'z'],
        ...      ['B', 2, False],
        ...      ['A', 9, False],
        ...      ['B', 3, True],
        ...      ['C', 9, True]]
        >>> aminusb = etl.complement(a, b)
        >>> aminusb
        +-----+-----+-------+
        | foo | bar | baz   |
        +=====+=====+=======+
        | 'A' |   1 | True  |
        +-----+-----+-------+
        | 'C' |   7 | False |
        +-----+-----+-------+

        >>> bminusa = etl.complement(b, a)
        >>> bminusa
        +-----+---+-------+
        | x   | y | z     |
        +=====+===+=======+
        | 'A' | 9 | False |
        +-----+---+-------+
        | 'B' | 3 | True  |
        +-----+---+-------+

    Note that the field names of each table are ignored - rows are simply
    compared following a lexical sort. See also the
    :func:`petl.transform.setops.recordcomplement` function.

    If `presorted` is True, it is assumed that the data are already sorted by
    the given key, and the `buffersize`, `tempdir` and `cache` arguments are
    ignored. Otherwise, the data are sorted, see also the discussion of the
    `buffersize`, `tempdir` and `cache` arguments under the
    :func:`petl.transform.sorts.sort` function.

    Note that the default behaviour is not strictly set-like, because 
    duplicate rows are counted separately, e.g.::
    
        >>> a = [['foo', 'bar'],
        ...      ['A', 1],
        ...      ['B', 2],
        ...      ['B', 2],
        ...      ['C', 7]]
        >>> b = [['foo', 'bar'],
        ...      ['B', 2]]
        >>> aminusb = etl.complement(a, b)
        >>> aminusb
        +-----+-----+
        | foo | bar |
        +=====+=====+
        | 'A' |   1 |
        +-----+-----+
        | 'B' |   2 |
        +-----+-----+
        | 'C' |   7 |
        +-----+-----+

    This behaviour can be changed with the `strict` keyword argument, e.g.::

        >>> aminusb = etl.complement(a, b, strict=True)
        >>> aminusb
        +-----+-----+
        | foo | bar |
        +=====+=====+
        | 'A' |   1 |
        +-----+-----+
        | 'C' |   7 |
        +-----+-----+

    .. versionchanged:: 1.1.0
    
    If `strict` is `True` then strict set-like behaviour is used, i.e., 
    only rows in `a` not found in `b` are returned.

    ©Ú	presortedÚ
buffersizeÚtempdirÚcacheÚstrict)ÚComplementView)ÚaÚbr   r   r   r   r   © r   úN/var/www/Datamplify/venv/lib/python3.10/site-packages/petl/transform/setops.pyÚ
complement   s   
Wÿr   c                   @   s"   e Zd Z		ddd„Zdd„ ZdS )	r   FNTc                 C   s@   |r	|| _ || _nt||||d| _ t||||d| _|| _d S ©N)r   r   r   )r   r   r
   r   )Úselfr   r   r   r   r   r   r   r   r   r   Ú__init__k   s   ÿÿ
zComplementView.__init__c                 C   ó   t | j| j| jƒS ©N)Úitercomplementr   r   r   ©r   r   r   r   Ú__iter__w   ó   zComplementView.__iter__©FNNTF©Ú__name__Ú
__module__Ú__qualname__r   r   r   r   r   r   r   i   s
    
ÿr   c           	      c   sV   dd„ t | ƒD ƒ}dd„ t |ƒD ƒ}tt|ƒƒ}t|ƒ |V  zt|ƒ}W n
 ty0   Y d S w zt|ƒ}W n tyL   |V  |D ]}|V  qCY d S w 	 |d u sZt|ƒt|ƒk rn|V  zt|ƒ}W nF tym   Y d S w ||kr˜zt|ƒ}W n
 ty‚   Y d S w |s—zt|ƒ}W n ty–   d }Y nw nzt|ƒ}W n ty©   d }Y nw qN)Nc                 s   ó    | ]}t |ƒV  qd S r   ©Útuple©Ú.0Úrowr   r   r   Ú	<genexpr>}   ó   € z!itercomplement.<locals>.<genexpr>c                 s   r&   r   r'   r)   r   r   r   r,   ~   r-   )Úiterr(   r   ÚStopIterationr   )	ÚtaÚtbr   ÚitaÚitbÚahdrr   r   r+   r   r   r   r   {   s\   €ÿÿþÿÿÿýÿìr   c           	      C   sL   t | ƒ}t |ƒ}t|ƒt|ƒksJ dƒ‚t|g|¢R Ž }t| |||||dS )a(  
    Find records in `a` that are not in `b`. E.g.::

        >>> import petl as etl
        >>> a = [['foo', 'bar', 'baz'],
        ...      ['A', 1, True],
        ...      ['C', 7, False],
        ...      ['B', 2, False],
        ...      ['C', 9, True]]
        >>> b = [['bar', 'foo', 'baz'],
        ...      [2, 'B', False],
        ...      [9, 'A', False],
        ...      [3, 'B', True],
        ...      [9, 'C', True]]
        >>> aminusb = etl.recordcomplement(a, b)
        >>> aminusb
        +-----+-----+-------+
        | foo | bar | baz   |
        +=====+=====+=======+
        | 'A' |   1 | True  |
        +-----+-----+-------+
        | 'C' |   7 | False |
        +-----+-----+-------+

        >>> bminusa = etl.recordcomplement(b, a)
        >>> bminusa
        +-----+-----+-------+
        | bar | foo | baz   |
        +=====+=====+=======+
        |   3 | 'B' | True  |
        +-----+-----+-------+
        |   9 | 'A' | False |
        +-----+-----+-------+

    Note that both tables must have the same set of fields, but that the order
    of the fields does not matter. See also the
    :func:`petl.transform.setops.complement` function.

    See also the discussion of the `buffersize`, `tempdir` and `cache` arguments
    under the :func:`petl.transform.sorts.sort` function.

    z,both tables must have the same set of fields©r   r   r   r   )r   Úsetr   r   )	r   r   r   r   r   r   ÚhaÚhbÚbvr   r   r   Úrecordcomplement¨   s   /
ÿr:   c           	   	   C   sH   |s
t | ƒ} t |ƒ}t|| d||||d}t| |d||||d}||fS )a;  
    Find the difference between rows in two tables. Returns a pair of tables.
    E.g.::

        >>> import petl as etl
        >>> a = [['foo', 'bar', 'baz'],
        ...      ['A', 1, True],
        ...      ['C', 7, False],
        ...      ['B', 2, False],
        ...      ['C', 9, True]]
        >>> b = [['x', 'y', 'z'],
        ...      ['B', 2, False],
        ...      ['A', 9, False],
        ...      ['B', 3, True],
        ...      ['C', 9, True]]
        >>> added, subtracted = etl.diff(a, b)
        >>> # rows in b not in a
        ... added
        +-----+---+-------+
        | x   | y | z     |
        +=====+===+=======+
        | 'A' | 9 | False |
        +-----+---+-------+
        | 'B' | 3 | True  |
        +-----+---+-------+

        >>> # rows in a not in b
        ... subtracted
        +-----+-----+-------+
        | foo | bar | baz   |
        +=====+=====+=======+
        | 'A' |   1 | True  |
        +-----+-----+-------+
        | 'C' |   7 | False |
        +-----+-----+-------+

    Convenient shorthand for ``(complement(b, a), complement(a, b))``. See also
    :func:`petl.transform.setops.complement`.

    If `presorted` is True, it is assumed that the data are already sorted by
    the given key, and the `buffersize`, `tempdir` and `cache` arguments are
    ignored. Otherwise, the data are sorted, see also the discussion of the
    `buffersize`, `tempdir` and `cache` arguments under the
    :func:`petl.transform.sorts.sort` function.

    .. versionchanged:: 1.1.0

    If `strict` is `True` then strict set-like behaviour is used.

    Tr   )r
   r   )	r   r   r   r   r   r   r   ÚaddedÚ
subtractedr   r   r   Údiffã   s   5
ÿ
ÿr=   c                 C   s0   t || ||||d}t | |||||d}||fS )aF  
    Find the difference between records in two tables. E.g.::

        >>> import petl as etl
        >>> a = [['foo', 'bar', 'baz'],
        ...      ['A', 1, True],
        ...      ['C', 7, False],
        ...      ['B', 2, False],
        ...      ['C', 9, True]]
        >>> b = [['bar', 'foo', 'baz'],
        ...      [2, 'B', False],
        ...      [9, 'A', False],
        ...      [3, 'B', True],
        ...      [9, 'C', True]]
        >>> added, subtracted = etl.recorddiff(a, b)
        >>> added
        +-----+-----+-------+
        | bar | foo | baz   |
        +=====+=====+=======+
        |   3 | 'B' | True  |
        +-----+-----+-------+
        |   9 | 'A' | False |
        +-----+-----+-------+

        >>> subtracted
        +-----+-----+-------+
        | foo | bar | baz   |
        +=====+=====+=======+
        | 'A' |   1 | True  |
        +-----+-----+-------+
        | 'C' |   7 | False |
        +-----+-----+-------+

    Convenient shorthand for
    ``(recordcomplement(b, a), recordcomplement(a, b))``. See also
    :func:`petl.transform.setops.recordcomplement`.

    See also the discussion of the `buffersize`, `tempdir` and `cache`
    arguments under the :func:`petl.transform.sorts.sort` function.

    .. versionchanged:: 1.1.0

    If `strict` is `True` then strict set-like behaviour is used.

    r5   )r:   )r   r   r   r   r   r   r;   r<   r   r   r   Ú
recorddiff%  s   
/ÿ
ÿr>   c                 C   s   t | |||||dS )aQ  
    Return rows in `a` that are also in `b`. E.g.::

        >>> import petl as etl
        >>> table1 = [['foo', 'bar', 'baz'],
        ...           ['A', 1, True],
        ...           ['C', 7, False],
        ...           ['B', 2, False],
        ...           ['C', 9, True]]
        >>> table2 = [['x', 'y', 'z'],
        ...           ['B', 2, False],
        ...           ['A', 9, False],
        ...           ['B', 3, True],
        ...           ['C', 9, True]]
        >>> table3 = etl.intersection(table1, table2)
        >>> table3
        +-----+-----+-------+
        | foo | bar | baz   |
        +=====+=====+=======+
        | 'B' |   2 | False |
        +-----+-----+-------+
        | 'C' |   9 | True  |
        +-----+-----+-------+

    If `presorted` is True, it is assumed that the data are already sorted by
    the given key, and the `buffersize`, `tempdir` and `cache` arguments are
    ignored. Otherwise, the data are sorted, see also the discussion of the
    `buffersize`, `tempdir` and `cache` arguments under the
    :func:`petl.transform.sorts.sort` function.

    )r   r   r   r   )ÚIntersectionView)r   r   r   r   r   r   r   r   r   Úintersection^  s   
"ÿr@   c                   @   s"   e Zd Z		ddd„Zdd„ ZdS )	r?   FNTc                 C   s<   |r
|| _ || _d S t||||d| _ t||||d| _d S r   )r   r   r
   )r   r   r   r   r   r   r   r   r   r   r   ‰  s   
ÿÿzIntersectionView.__init__c                 C   ó   t | j| jƒS r   )Úiterintersectionr   r   r   r   r   r   r   ”  ó   zIntersectionView.__iter__©FNNTr"   r   r   r   r   r?   ‡  s
    
ÿr?   c                 c   s°    t | ƒ}t |ƒ}t|ƒ}t|ƒ t|ƒV  z7tt|ƒƒ} tt|ƒƒ}	 t| ƒt|ƒk r3tt|ƒƒ} n| |krG| V  tt|ƒƒ} tt|ƒƒ}ntt|ƒƒ}q$ tyW   Y d S w r   )r.   r   r(   r   r/   )r   r   r2   r3   r4   r   r   r   rB   ˜  s*   €
ø	ÿrB   c                 C   s   t | ||dS )a  
    Alternative implementation of :func:`petl.transform.setops.complement`,
    where the complement is executed by constructing an in-memory set for all
    rows found in the right hand table, then iterating over rows from the
    left hand table.

    May be faster and/or more resource efficient where the right table is small
    and the left table is large.
    
    .. versionchanged:: 1.1.0
    
    If `strict` is `True` then strict set-like behaviour is used, i.e., 
    only rows in `a` not found in `b` are returned.

    )r   )ÚHashComplementView©r   r   r   r   r   r   Úhashcomplement®  s   rG   c                   @   s   e Zd Zddd„Zdd„ ZdS )rE   Fc                 C   s   || _ || _|| _d S r   rF   )r   r   r   r   r   r   r   r   Ç  s   
zHashComplementView.__init__c                 C   r   r   )Úiterhashcomplementr   r   r   r   r   r   r   r   Ì  r    zHashComplementView.__iter__N©Fr"   r   r   r   r   rE   Å  s    
rE   c           	      c   s|    t | ƒ}t|ƒ}t|ƒV  t |ƒ}t|ƒ tdd„ |D ƒƒ}|D ]}t|ƒ}|| dkr8|s7||  d8  < q!|V  q!d S )Nc                 s   r&   r   r'   r)   r   r   r   r,   Ø  r-   z%iterhashcomplement.<locals>.<genexpr>r   é   ©r.   r   r(   r   )	r   r   r   r2   r4   r3   ÚbcntÚarÚtr   r   r   rH   Ð  s   €
€úrH   c                 C   s
   t | |ƒS )au  
    Alternative implementation of
    :func:`petl.transform.setops.intersection`, where the intersection
    is executed by constructing an in-memory set for all rows found in the
    right hand table, then iterating over rows from the left hand table.

    May be faster and/or more resource efficient where the right table is small
    and the left table is large.

    )ÚHashIntersectionView©r   r   r   r   r   Úhashintersectionâ  s   
rQ   c                   @   s   e Zd Zdd„ Zdd„ ZdS )rO   c                 C   s   || _ || _d S r   rP   )r   r   r   r   r   r   r   ö  s   
zHashIntersectionView.__init__c                 C   rA   r   )Úiterhashintersectionr   r   r   r   r   r   r   ú  rC   zHashIntersectionView.__iter__Nr"   r   r   r   r   rO   ô  s    rO   c                 c   sv    t | ƒ}t|ƒ}t|ƒV  t |ƒ}t|ƒ tdd„ |D ƒƒ}|D ]}t|ƒ}|| dkr8|V  ||  d8  < q!d S )Nc                 s   r&   r   r'   r)   r   r   r   r,     r-   z'iterhashintersection.<locals>.<genexpr>r   rJ   rK   )r   r   r2   r4   r3   rL   rM   rN   r   r   r   rR   þ  s   €
€ürR   r!   )NNTFrD   rI   ) Ú
__future__r   r   r   Úcollectionsr   Úpetl.compatr   Úpetl.comparisonr   Úpetl.util.baser   r	   Úpetl.transform.sortsr
   Úpetl.transform.basicsr   r   r   r   r:   r=   r>   r@   r?   rB   rG   rE   rH   rQ   rO   rR   r   r   r   r   Ú<module>   sJ    
ÿ[-
ÿ8
ÿ?
6
ÿ&
