U
    b                     @  s`   d dl mZ d dlZd dlmZmZmZmZ d dl	m
Z
 d dlZd dlmZ G dd deZdS )    )annotationsN)FilePath
ReadBufferScalarStorageOptions)import_optional_dependency)BaseExcelReaderc                      s   e Zd ZdZd+ddd fddZedd	 Zdd
ddZeddddZeddddZ	ddddZ
ddddZdddddZddd d!Zddd"d#Zddd$d%Zdd&dd'd(Zddd)d*Z  ZS ),	ODFReadera"  
    Read tables out of OpenDocument formatted files.

    Parameters
    ----------
    filepath_or_buffer : str, path to be parsed or
        an open readable stream.
    storage_options : dict, optional
        passed to fsspec for appropriate URLs (see ``_get_filepath_or_buffer``)
    NzFilePath | ReadBuffer[bytes]r   )filepath_or_bufferstorage_optionsc                   s   t d t j||d d S )NZodf)r   )r   super__init__)selfr
   r   	__class__ >/tmp/pip-unpacked-wheel-ck39h295/pandas/io/excel/_odfreader.pyr      s    zODFReader.__init__c                 C  s   ddl m} |S )Nr   )OpenDocument)odf.opendocumentr   )r   r   r   r   r   _workbook_class&   s    zODFReader._workbook_class)r
   c                 C  s   ddl m} ||S )Nr   )load)r   r   )r   r
   r   r   r   r   load_workbook,   s    zODFReader.load_workbookstr)returnc                 C  s   dS )z'Property for compat with other readers. r   )r   r   r   r   empty_value1   s    zODFReader.empty_valuez	list[str]c                 C  s&   ddl m} | j|}dd |D S )z4Return a list of sheet names present in the documentr   Tablec                 S  s   g | ]}| d qS name)getAttribute).0tr   r   r   
<listcomp><   s     z)ODFReader.sheet_names.<locals>.<listcomp>)	odf.tabler   bookgetElementsByType)r   r   tablesr   r   r   sheet_names6   s    zODFReader.sheet_namesint)indexc                 C  s*   ddl m} | | | j|}|| S )Nr   r   )r$   r   Zraise_if_bad_sheet_by_indexr%   r&   )r   r*   r   r'   r   r   r   get_sheet_by_index>   s    
zODFReader.get_sheet_by_indexr   c                 C  s^   ddl m} | | | j|}|D ]}|d|kr&|  S q&|   td| dd S )Nr   r   r   zsheet z
 not found)r$   r   Zraise_if_bad_sheet_by_namer%   r&   r    close
ValueError)r   r   r   r'   tabler   r   r   get_sheet_by_nameE   s    

zODFReader.get_sheet_by_nameboolzlist[list[Scalar]])convert_floatr   c                   sr  ddl m}m}m} | j}| j}||h ||}d}	d}
g }|D ]} fdd|jD }d}g }|D ]f}|j|kr| ||}n| j}| 	|}|| jkr||7 }qj|
| jg|  d}|
|g|  qj|
t|k rt|}
| |}| |r|	|7 }	qF|
| jgg|	  d}	t|D ]}|| q&qF|D ].}t||
k r>|
| jg|
t|   q>|S )z9
        Parse an ODF Table into a list of lists
        r   )CoveredTableCell	TableCellTableRowc                   s   g | ]}|j  kr|qS r   )qname)r!   x
cell_namesr   r   r#   g   s     
 z,ODFReader.get_sheet_data.<locals>.<listcomp>)r$   r2   r3   r4   r5   r&   
childNodes_get_cell_valuer   _get_column_repeatextendlen_get_row_repeat_is_empty_rowrangeappend)r   Zsheetr1   r2   r3   r4   Zcovered_cell_nameZtable_cell_nameZ
sheet_rowsZ
empty_rowsZmax_row_lenr.   Z	sheet_rowZsheet_cellsZempty_cellsZ	table_rowZ
sheet_cellvalueZcolumn_repeatZ
row_repeat_rowr   r7   r   get_sheet_dataR   sF    






zODFReader.get_sheet_datac                 C  s"   ddl m} t|j|dfdS )z
        Return number of times this row was repeated
        Repeating an empty row appeared to be a common way
        of representing sparse rows in the table.
        r   TABLENSznumber-rows-repeated   odf.namespacesrG   r)   
attributesget)r   rD   rG   r   r   r   r>      s    zODFReader._get_row_repeatc                 C  s"   ddl m} t|j|dfdS )Nr   rF   znumber-columns-repeatedrH   rI   )r   cellrG   r   r   r   r;      s    zODFReader._get_column_repeatc                 C  s$   |j D ]}t|j dkr dS qdS )z4
        Helper function to find empty rows
        r   FT)r9   r=   )r   rD   columnr   r   r   r?      s    
zODFReader._is_empty_rowr   c                 C  s@  ddl m} t|dkrtjS |j|df}|dkrJt|dkrFdS dS |d krX| jS |d	krt|j|d
f}|rt	|}||kr|S |S |dkr|j|d
f}t|S |dkr| 
|S |dkr|j|d
f}t|S |dkr|j|df}t|S |dkr&tt|}| S |   td| d S )Nr   )OFFICENSz#N/Az
value-typebooleanTRUETFfloatrB   
percentagestringcurrencydatez
date-valuetimezUnrecognized type )rJ   rO   r   npnanrK   rL   r   rR   r)   _get_cell_string_valuepdZto_datetimerW   r,   r-   )r   rM   r1   rO   Z	cell_typeZ
cell_valuevalZstampr   r   r   r:      sB    



zODFReader._get_cell_valuec           	      C  s   ddl m} ddlm} ddlm} | j}g }|jD ]^}t||r|j|krtt	|j
|dfd}|d|  q|| | q6|t| q6d|S )	z
        Find and decode OpenDocument text:s tags that represent
        a run length encoded sequence of space characters.
        r   )Element)TEXTNS)ScrH    r   )Zodf.elementr]   rJ   r^   Zodf.textr_   r5   r9   
isinstancer)   rK   rL   rA   rZ   r   join)	r   rM   r]   r^   r_   Ztext_srB   fragmentspacesr   r   r   rZ      s    


z ODFReader._get_cell_string_value)N)__name__
__module____qualname____doc__r   propertyr   r   r   r(   r+   r/   rE   r>   r;   r?   r:   rZ   __classcell__r   r   r   r   r	      s$    
=

(r	   )
__future__r   ZnumpyrX   Zpandas._typingr   r   r   r   Zpandas.compat._optionalr   Zpandasr[   Zpandas.io.excel._baser   r	   r   r   r   r   <module>   s   