o
    @gF                      @  s   d dl mZ d dlmZmZ d dlZd dlmZm	Z	m
Z
mZ d dlmZ d dlmZ d dlZd dlmZ d dlmZ erHd d	lmZ d d
lmZ eed dG dd ded ZdS )    )annotations)TYPE_CHECKINGcastN)FilePath
ReadBufferScalarStorageOptions)import_optional_dependency)doc)_shared_docs)BaseExcelReaderOpenDocument)NaTTypestorage_options)r   c                      s   e Zd Z		d-d. fd
dZed/ddZd0ddZed1ddZed2ddZd3ddZ	d4ddZ
	d5d6d"d#Zd7d$d%Zd7d&d'Zd8d)d*Zd1d+d,Z  ZS )9	ODFReaderNfilepath_or_bufferFilePath | ReadBuffer[bytes]r   StorageOptions | Noneengine_kwargsdict | NonereturnNonec                   s   t d t j|||d dS )aF  
        Read tables out of OpenDocument formatted files.

        Parameters
        ----------
        filepath_or_buffer : str, path to be parsed or
            an open readable stream.
        {storage_options}
        engine_kwargs : dict, optional
            Arbitrary keyword arguments passed to excel engine.
        odf)r   r   N)r	   super__init__)selfr   r   r   	__class__ a/var/www/html/development/chatbot/venv/lib/python3.10/site-packages/pandas/io/excel/_odfreader.pyr       s   
zODFReader.__init__type[OpenDocument]c                 C  s   ddl m} |S )Nr   r   )odf.opendocumentr   )r   r   r   r   r    _workbook_class8   s   zODFReader._workbook_classr   c                 C  s   ddl m} ||fi |S )Nr   )load)r"   r$   )r   r   r   r$   r   r   r    load_workbook>   s   zODFReader.load_workbookstrc                 C  s   dS )z'Property for compat with other readers. r   )r   r   r   r    empty_valueE   s   zODFReader.empty_value	list[str]c                 C  s&   ddl m} | j|}dd |D S )z4Return a list of sheet names present in the documentr   Tablec                 S  s   g | ]}| d qS )name)getAttribute).0tr   r   r    
<listcomp>P   s    z)ODFReader.sheet_names.<locals>.<listcomp>)	odf.tabler+   bookgetElementsByType)r   r+   tablesr   r   r    sheet_namesJ   s   zODFReader.sheet_namesindexintc                 C  s*   ddl m} | | | j|}|| S )Nr   r*   )r1   r+   raise_if_bad_sheet_by_indexr2   r3   )r   r6   r+   r4   r   r   r    get_sheet_by_indexR   s   
zODFReader.get_sheet_by_indexr,   c                 C  sZ   ddl m} | | | j|}|D ]}|d|kr |  S q|   td| d)Nr   r*   r,   zsheet z
 not found)r1   r+   raise_if_bad_sheet_by_namer2   r3   r-   close
ValueError)r   r,   r+   r4   tabler   r   r    get_sheet_by_nameY   s   
zODFReader.get_sheet_by_namefile_rows_needed
int | Nonelist[list[Scalar | NaTType]]c                   s  ddl m}m}m} | j}| j}||h ||}d}	d}
g }|D ]} fdd|jD }d}g |D ]2}|j|krB| |}n| j}| 	|}|| jkrT||7 }q5
| jg|  d}
|g|  q5|
tk rrt}
| |}tdkr|	|7 }	n|
| jgg|	  d}	|
fddt|D  |durt||kr nq#|D ]}t||
k r|
| jg|
t|   q|S )z9
        Parse an ODF Table into a list of lists
        r   )CoveredTableCell	TableCellTableRowc                   s$   g | ]}t |d r|j v r|qS )qname)hasattrrE   )r.   x)
cell_namesr   r    r0   }   s    
z,ODFReader.get_sheet_data.<locals>.<listcomp>c                 3  s    | ]} V  qd S Nr   )r.   _)	table_rowr   r    	<genexpr>   s    z+ODFReader.get_sheet_data.<locals>.<genexpr>N)r1   rB   rC   rD   rE   r3   
childNodes_get_cell_valuer(   _get_column_repeatextendlen_get_row_repeatrange)r   sheetr?   rB   rC   rD   covered_cell_nametable_cell_name
sheet_rows
empty_rowsmax_row_lenr=   	sheet_rowsheet_cellsempty_cells
sheet_cellvaluecolumn_repeat
row_repeatrowr   )rH   rK   r    get_sheet_dataf   sP   







zODFReader.get_sheet_datac                 C  "   ddl m} t|j|dfdS )z
        Return number of times this row was repeated
        Repeating an empty row appeared to be a common way
        of representing sparse rows in the table.
        r   TABLENSznumber-rows-repeated   odf.namespacesre   r7   
attributesget)r   ra   re   r   r   r    rR      s   zODFReader._get_row_repeatc                 C  rc   )Nr   rd   znumber-columns-repeatedrf   rg   )r   cellre   r   r   r    rO      s   zODFReader._get_column_repeatScalar | NaTTypec                 C  s:  ddl m} t|dkrtjS |j|df}|dkr%t|dkr#dS dS |d u r,| jS |d	krFt|j|d
f}t	|}||krD|S |S |dkrV|j|d
f}t|S |dkr_| 
|S |dkro|j|d
f}t|S |dkr|j|df}t|S |dkrtt|}tt| S |   td| )Nr   )OFFICENSz#N/Az
value-typebooleanTRUETFfloatr^   
percentagestringcurrencydatez
date-valuetimezUnrecognized type )rh   rm   r&   npnanri   rj   r(   rp   r7   _get_cell_string_valuepd	Timestampr   r   ru   r;   r<   )r   rk   rm   	cell_type
cell_valuevalstampr   r   r    rN      s@   

zODFReader._get_cell_valuec                 C  s   ddl m} ddlm} ddlm} ddlm} | j}| j}g }|j	D ]8}	t
|	|rS|	j|krDt|	j|dfd}
|d|
  q%|	j|krJq%|| |	 q%|t|	d	 q%d
|S )z
        Find and decode OpenDocument text:s tags that represent
        a run length encoded sequence of space characters.
        r   )Element)TEXTNS)
Annotation)Scrf    
r'   )odf.elementr   rh   r   
odf.officer   odf.textr   rE   rM   
isinstancer7   ri   rj   appendrx   r&   stripjoin)r   rk   r   r   r   r   office_annotationtext_sr^   fragmentspacesr   r   r    rx      s"   




z ODFReader._get_cell_string_value)NN)r   r   r   r   r   r   r   r   )r   r!   )r   r   r   r   )r   r&   )r   r)   )r6   r7   )r,   r&   rI   )r?   r@   r   rA   )r   r7   )r   rl   )__name__
__module____qualname__r   propertyr#   r%   r(   r5   r9   r>   rb   rR   rO   rN   rx   __classcell__r   r   r   r    r      s&    



D


'r   r   )
__future__r   typingr   r   numpyrv   pandas._typingr   r   r   r   pandas.compat._optionalr	   pandas.util._decoratorsr
   pandasry   pandas.core.shared_docsr   pandas.io.excel._baser   r"   r   pandas._libs.tslibs.nattyper   r   r   r   r   r    <module>   s    