U
    SZfP                  
   @   s   d dl mZ d dlmZmZ d dlmZ d dlm	Z	 d dl
mZ edZedZedZd	d
 Zd*ddZd+ddZdd Zdd Zdd Zdd Zdd Zd,ddZdd Zd d! Zd"d# Zd-d(d)ZdS ).    )Number)
exceptionsoptional_importsN)
graph_objs)make_subplotsZpandasZnumpyzscipy.statsc                 C   s   t | t}t |}t |}t j|ddd}t j|ddd}t j|ddd}|| }d| }t |||| k }	t |||| k }
||||||	|
d	S )
z6
    Calculate statistics for use in violin plot.
    2   Zlinear)interpolation   lowerK   Zhigher      ?)minmaxq1q2q3d1d2)npasarrayfloatr   r   Z
percentile)dataxvals_minvals_maxr   r   r   ZiqrZwhisker_distr   r    r   A/tmp/pip-unpacked-wheel-5ksk5baj/plotly/figure_factory/_violin.py
calc_stats   s$    

r   #1f77b4rgb(0, 0, 0)c                    sH    fddt t D }tj dd|d|tjjd|ddd	dd

S )zG
    Produces a sideways probability distribution fig violin plot.
    c                    s4   g | ],}d d  |  d d |  d qS )z(pdf(y), y)=({:0.2f}z, ))format).0ir   yr   r   
<listcomp>-   s   z$make_half_violin.<locals>.<listcomp>lines Ztonextxg      ?Zspline)widthcolorshapetext)
r   r&   modenamer-   fill	fillcolorline	hoverinfoZopacity)rangelenr   ScatterscatterLine)r   r&   r1   Z	linecolorr-   r   r%   r   make_half_violin)   s    
r9   c              	   C   s4   t j| | | gt|  t jj|dddddddS )z2
    Returns a rugplot fig for a violin plot.
    zline-ew-open)r+   symbolmarkersr)   Fr&   )r&   r   markerr.   r/   
showlegendr3   )r   r6   r5   r7   Marker)valsZpdf_maxdistancer+   r   r   r   make_violin_rugplot@   s    rA   c              	   C   s(   t jddg| |gddt jjddddS )z?
    Returns the scatterplot fig of most of a violin plot.
    r   r)   r(   r   
rgb(0,0,0)r*   r+   )r   r&   r/   r.   r2   )r   r6   r7   r8   )r   r   r   r   r   make_non_outlier_intervalO   s    rD   c              	   C   sB   t jddg| |gdd|  dd| gdt jjdddd	d
S )z@
    Makes the upper and lower quartiles for a violin plot.
    r   zlower-quartile: r    zupper-quartile: r(      rB   rC   r-   )r   r&   r-   r.   r2   r3   )r   r6   r"   r7   r8   )r   r   r   r   r   make_quartiles\   s    rF   c              	   C   s.   t jdg| gdd|  gdtddddd	S )
z;
    Formats the 'median' hovertext for a violin plot.
    r   zmedian: r    r;   Zsquarezrgb(255,255,255))r:   r+   r-   )r   r&   r-   r.   r<   r3   )r   r6   r"   dict)r   r   r   r   make_medianm   s    
rH   c              
   C   s    t jj| |ddddddd}|S )z-
    Makes the x-axis for a violin plot.
    Fr)   )titler4   showgridzerolineshowlinemirrorticksshowticklabels)r   layoutZXAxis)Zxaxis_titleZxaxis_rangexaxisr   r   r   
make_XAxis{   s    
rR   c              
   C   s    t jj| dddddddd}|S )z-
    Makes the y-axis for a violin plot.
    TrE   F)rI   rO   Z	autorangeZticklenrL   rK   rJ   rM   )r   rP   ZYAxis)Zyaxis_titleyaxisr   r   r   
make_YAxis   s    
rT   Tc                 C   s  t | t} t| d }t| d }t| d }t| d }t| d }t| d }t| d }	t| }
t ||d}|
|}t |}|rd	| d
 nd}| | d |d g}t| ||dt|||dt	||	t
||t|g}|r|t| |||d ||fS )z?
    Refer to FigureFactory.create_violin() for docstring.
    r   r   r   r   r   r   r   d   g       @
   r   g?)r1   )r@   r+   )r   r   r   r   scipy_statsZgaussian_kdeZlinspacer   r9   rD   rF   rH   appendrA   )r?   r1   rugplotr   r   r   r   r   r   r   ZpdfZxxyyZmax_pdfr@   plot_xrange	plot_datar   r   r   
violinplot   s2    

r]   c                 C   s4  g }| | D ]}||kr| | q|r0|  | |g}t|}td|dddd}d}t|D ]\}}t||| t	}|t|krd}t
||| |d\}}t }|D ]}||d|d  q|d7 }|d d	|d t|| |i qb|d d
dtdi |d j|
ddd||	d |S )u
    Refer to FigureFactory.create_violin() for docstring.

    Returns fig for violin plot without colorscale.

       T皙?FZrowscolsZshared_yaxesZhorizontal_spacingZ
print_gridr   r1   rY   rP   xaxis{}yaxis{}r)   closestrI   r=   	hovermodeautosizeheightr*   )rX   sortgroupbyr5   r   	enumerater   r   	get_groupr   r]   r   Layoutappend_traceupdater"   rR   rT   )r   data_headergroup_headercolorsuse_colorscalegroup_statsrY   rk   rj   r*   rI   
group_namer/   gbLfigZcolor_indexkgrr?   r\   r[   rP   itemr   r   r   violin_no_colorscale   sT          
	r~   c           !      C   s  g }| | D ]}||kr| | q|r0|  |D ]}||kr4tdq4| |g}t|}td|dddd}t|d tj	}t|d tj	}g }|D ]}| ||  qt
|}t|}t|D ]\}}t||| t}|| | ||  }t|||}t|d||d	\}}t }|D ]}||d|d  q.|d
 d|d t|| |i qtjdgdgdtd||d|d gd|d ggdddd} || d| |d
 ddtdi |d
 j|
ddd||	d |S )zr
    Refer to FigureFactory.create_violin() for docstring.

    Returns fig for violin plot with colorscale.

    zRAll values/groups in the index column must be represented as a key in group_stats.r_   Tr`   Fra   r   zrgb{}rc   rP   rd   r;      )sizeZcminZcmaxZ
colorscaleZ	showscale)r   r&   r.   r<   r=   re   r)   rf   rg   )rX   rk   r   PlotlyErrorrl   r5   r   clrsZcolor_parserZunlabel_rgbr   r   rm   r   r   rn   r   Zfind_intermediate_colorr]   r"   r   ro   rp   rq   rR   r6   rG   rT   )!r   rr   rs   rt   ru   rv   rY   rk   rj   r*   rI   rw   r/   grouprx   ry   rz   ZlowcolorZ	highcolorZgroup_stats_valueskeyZ	max_valueZ	min_valuer{   r|   r?   ZintermedZintermed_colorr\   r[   rP   r}   Ztrace_dummyr   r   r   violin_colorscale  s          
	r   c                 C   s4  g }| | D ]}||kr| | q|r0|  |D ]}||kr4tdq4| |g}t|}td|dddd}t|D ]~\}}t	|
|| t}t||| |d\}}t }|D ]}||d|d  q|d d	|d t|| |i qz|d d
dtdi |d j|
ddd||	d |S )r^   zMIf colors is a dictionary, all the group names must appear as keys in colors.r_   Tr`   Fra   rc   rP   rd   re   r)   rf   rg   )rX   rk   r   r   rl   r5   r   rm   r   r   rn   r   r]   r   ro   rp   rq   r"   rR   rT   )r   rr   rs   rt   ru   rv   rY   rk   rj   r*   rI   rw   r/   r   rx   ry   rz   r{   r|   r?   r\   r[   rP   r}   r   r   r   violin_dictn  sN        	r   F  X  Violin and Rug Plotc                 C   s  t |trt|d}nt|d}|dkrt | trjt| dkrNtdt	dd | D sjtdt
rt | t
jjjr|dkrtd| | j } t| |d |d	\}}tj|
d
tjjdd|d
|	td|tddd	}|d td
d
dd tj||d}|S t | t
jjjs*td|dkr>td|d
krt |trtt| |||||||||	|
}|S t| |||||||||	|
}|S ndt |trtdt|dk rtdt |tstdt| |||||||||	|
}|S dS )a}  
    **deprecated**, use instead the plotly.graph_objects trace
    :class:`plotly.graph_objects.Violin`.

    :param (list|array) data: accepts either a list of numerical values,
        a list of dictionaries all with identical keys and at least one
        column of numeric values, or a pandas dataframe with at least one
        column of numbers.
    :param (str) data_header: the header of the data column to be used
        from an inputted pandas dataframe. Not applicable if 'data' is
        a list of numeric values.
    :param (str) group_header: applicable if grouping data by a variable.
        'group_header' must be set to the name of the grouping variable.
    :param (str|tuple|list|dict) colors: either a plotly scale name,
        an rgb or hex color, a color tuple, a list of colors or a
        dictionary. An rgb color is of the form 'rgb(x, y, z)' where
        x, y and z belong to the interval [0, 255] and a color tuple is a
        tuple of the form (a, b, c) where a, b and c belong to [0, 1].
        If colors is a list, it must contain valid color types as its
        members.
    :param (bool) use_colorscale: only applicable if grouping by another
        variable. Will implement a colorscale based on the first 2 colors
        of param colors. This means colors must be a list with at least 2
        colors in it (Plotly colorscales are accepted since they map to a
        list of two rgb colors). Default = False
    :param (dict) group_stats: a dictionary where each key is a unique
        value from the group_header column in data. Each value must be a
        number and will be used to color the violin plots if a colorscale
        is being used.
    :param (bool) rugplot: determines if a rugplot is draw on violin plot.
        Default = True
    :param (bool) sort: determines if violins are sorted
        alphabetically (True) or by input order (False). Default = False
    :param (float) height: the height of the violin plot.
    :param (float) width: the width of the violin plot.
    :param (str) title: the title of the violin plot.

    Example 1: Single Violin Plot

    >>> from plotly.figure_factory import create_violin
    >>> import plotly.graph_objs as graph_objects

    >>> import numpy as np
    >>> from scipy import stats

    >>> # create list of random values
    >>> data_list = np.random.randn(100)

    >>> # create violin fig
    >>> fig = create_violin(data_list, colors='#604d9e')

    >>> # plot
    >>> fig.show()

    Example 2: Multiple Violin Plots with Qualitative Coloring

    >>> from plotly.figure_factory import create_violin
    >>> import plotly.graph_objs as graph_objects

    >>> import numpy as np
    >>> import pandas as pd
    >>> from scipy import stats

    >>> # create dataframe
    >>> np.random.seed(619517)
    >>> Nr=250
    >>> y = np.random.randn(Nr)
    >>> gr = np.random.choice(list("ABCDE"), Nr)
    >>> norm_params=[(0, 1.2), (0.7, 1), (-0.5, 1.4), (0.3, 1), (0.8, 0.9)]

    >>> for i, letter in enumerate("ABCDE"):
    ...     y[gr == letter] *=norm_params[i][1]+ norm_params[i][0]
    >>> df = pd.DataFrame(dict(Score=y, Group=gr))

    >>> # create violin fig
    >>> fig = create_violin(df, data_header='Score', group_header='Group',
    ...                    sort=True, height=600, width=1000)

    >>> # plot
    >>> fig.show()

    Example 3: Violin Plots with Colorscale

    >>> from plotly.figure_factory import create_violin
    >>> import plotly.graph_objs as graph_objects

    >>> import numpy as np
    >>> import pandas as pd
    >>> from scipy import stats

    >>> # create dataframe
    >>> np.random.seed(619517)
    >>> Nr=250
    >>> y = np.random.randn(Nr)
    >>> gr = np.random.choice(list("ABCDE"), Nr)
    >>> norm_params=[(0, 1.2), (0.7, 1), (-0.5, 1.4), (0.3, 1), (0.8, 0.9)]

    >>> for i, letter in enumerate("ABCDE"):
    ...     y[gr == letter] *=norm_params[i][1]+ norm_params[i][0]
    >>> df = pd.DataFrame(dict(Score=y, Group=gr))

    >>> # define header params
    >>> data_header = 'Score'
    >>> group_header = 'Group'

    >>> # make groupby object with pandas
    >>> group_stats = {}
    >>> groupby_data = df.groupby([group_header])

    >>> for group in "ABCDE":
    ...     data_from_group = groupby_data.get_group(group)[data_header]
    ...     # take a stat of the grouped data
    ...     stat = np.median(data_from_group)
    ...     # add to dictionary
    ...     group_stats[group] = stat

    >>> # create violin fig
    >>> fig = create_violin(df, data_header='Score', group_header='Group',
    ...                     height=600, width=1000, use_colorscale=True,
    ...                     group_stats=group_stats)

    >>> # plot
    >>> fig.show()
    ZrgbNr   zRIf data is a list, it must be nonempty and contain either numbers or dictionaries.c                 s   s   | ]}t |tV  qd S )N)
isinstancer   )r#   elementr   r   r   	<genexpr>P  s     z create_violin.<locals>.<genexpr>z0If data is a list, it must contain only numbers.zVdata_header must be the column name with the desired numeric data for the violin plot.rc   F   )r   r)   rf   )	rI   ri   fontrj   r=   r*   rQ   rS   rh   rS   )rL   rO   rN   )r   rP   zGError. You must use a pandas DataFrame if you are using a group header.zFThe colors param cannot be a dictionary if you are using a colorscale.r   zHcolors must be a list with at least 2 colors. A Plotly scale is allowed.z,Your group_stats param must be a dictionary.)r   rG   r   Zvalidate_colors_dictZvalidate_colorslistr5   r   r   allpdcoreframeZ	DataFramevaluestolistr]   r   ro   rP   ZFontrR   rT   rq   ZFigurer   r~   r   )r   rr   rs   rt   ru   rv   rY   rk   rj   r*   rI   Zvalid_colorsr\   r[   rP   rz   r   r   r   create_violin  s     


  


r   )r   r   )r   )r   T)
NNNFNTFr   r   r   )Znumbersr   Zplotlyr   r   Zplotly.colorsrt   r   Zplotly.graph_objsr   Zplotly.subplotsr   Z
get_moduler   r   rW   r   r9   rA   rD   rF   rH   rR   rT   r]   r~   r   r   r   r   r   r   r   <module>   s<   





'CgJ          