
    	h:                     N    S r SSKr " S S\5      r " S S5      r " S S5      rg)	z
This module contains a tokenizer for Excel formulae.

The tokenizer is based on the Javascript tokenizer found at
http://ewbi.blogs.com/develops/2004/12/excel_formula_p.html written by Eric
Bachtal
    Nc                       \ rS rSrSrSrg)TokenizerError   z$Base class for all Tokenizer errors. N)__name__
__module____qualname____firstlineno____doc____static_attributes__r       L/var/www/html/env/lib/python3.13/site-packages/openpyxl/formula/tokenizer.pyr   r      s    .r   r   c                   
   \ rS rSrSr\R                  " S5      r\R                  " S5      r\R                  " S5      \R                  " S5      S.r	Sr
S	rS
 rS rS rS rS rS rS rS rS rS rS rSS jrS rS rSrg)	Tokenizer   aB  
A tokenizer for Excel worksheet formulae.

Converts a str string representing an Excel formula (in A1 notation)
into a sequence of `Token` objects.

`formula`: The str string to tokenize

Tokenizer defines a method `._parse()` to parse the formula into tokens,
which can then be accessed through the `.items` attribute.

z^[1-9](\.[0-9]+)?[Ee]$z[ \n]+z"(?:[^"]*"")*[^"]*"(?!")z'(?:[^']*'')*[^']*'(?!')"')z#NULL!z#DIV/0!z#VALUE!z#REF!z#NAME?z#NUM!z#N/Az#GETTING_DATAz,;}) +-*/^&=><%c                 h    Xl         / U l        / U l        SU l        / U l        U R                  5         g )Nr   )formulaitemstoken_stackoffsettoken_parse)selfr   s     r   __init__Tokenizer.__init__.   s-    

r   c           
      \   U R                   (       a  gU R                  (       d  gU R                  S   S:X  a  U =R                   S-  sl         O>U R                  R                  [	        U R                  [        R
                  5      5        gSU R                  4SU R                  4SU R                  4SU R                  4S	U R                  4S
U R                  4SU R                  4SU R                  4SU R                  44	n0 nU H)  u  p4UR                  [        R!                  X45      5        M+     U R                   [#        U R                  5      :  a  U R%                  5       (       a  M:  U R                  U R                      nXPR&                  ;   a  U R)                  5         XR;   a  U =R                   X%   " 5       -  sl         O0U R*                  R                  U5        U =R                   S-  sl         U R                   [#        U R                  5      :  a  M  U R)                  5         g)z5Populate self.items with the tokens from the formula.Nr   =   z"'[# 
z
+-*/^&=><%z{()}z;,)r   r   r   appendTokenLITERAL_parse_string_parse_brackets_parse_error_parse_whitespace_parse_operator_parse_opener_parse_closer_parse_separatorupdatedictfromkeyslencheck_scientific_notationTOKEN_ENDERS
save_tokenr   )r   	consumers
dispatchercharsconsumer	curr_chars         r   r   Tokenizer._parse7   s   ;;||\\!_#KK1KJJeDLL%--@AD&&'$&&'$##$$(()4))*4//04%%&4%%&4(()

	 
(OEdmmE<=  )kkC----//T[[1I---!&z466 

!!),q  kkC-- 	r   c                    U R                  SS9  U R                  U R                     nUS;   d   eU R                  U   nUR	                  U R                  U R                  S 5      nUc%  US:X  a  SOSn[        SU S	U R                   35      eUR                  S
5      nUS:X  a/  U R                  R                  [        R                  U5      5        OU R                  R                  U5        [        U5      $ )ay  
Parse a "-delimited string or '-delimited link.

The offset must be pointing to either a single quote ("'") or double
quote ('"') character. The strings are parsed according to Excel
rules where to escape the delimiter you just double it up. E.g.,
"abc""def" in Excel is parsed as 'abc"def' in Python.

Returns the number of characters matched. (Does not update
self.offset)

:
can_followr   Nr   stringlinkz%Reached end of formula while parsing z in r   )assert_empty_tokenr   r   STRING_REGEXESmatchr   groupr   r'   r(   make_operandr   r5   )r   delimregexrG   subtypes        r   r*   Tokenizer._parse_string_   s     	3/T[[)
"""##E*DLL67="'3,hFG #H	QUVZVbVbUc!deeAC<JJe0078JJe$5zr   c                    U R                   U R                     S:X  d   e[        R                  " SU R                   U R                  S 5       Vs/ s H  oR	                  5       S4PM     nn[        R                  " SU R                   U R                  S 5       Vs/ s H  oR	                  5       S4PM     nnSn[        X#-   5       HW  u  pVXF-  nUS:X  d  M  US-   nU R                  R                  U R                   U R                  U R                  U-    5        Us  $    [        SU R                    35      es  snf s  snf )	z|
Consume all the text between square brackets [].

Returns the number of characters matched. (Does not update
self.offset)

r"   z\[Nr!   z\]r   zEncountered unmatched '[' in )	r   r   refinditerstartsortedr   r'   r   )r   tleftsrights
open_countidx
open_closeouter_rights           r   r+   Tokenizer._parse_brackets{   s4    ||DKK(C///UDLL$>?A? %&'')Q? 	 A ++eT\\$++,%?@B@ '(779b/@ 	 B 
%en5OC$JQ!Ag

!!LLT[[;-FGI""  6 <T\\NKLLABs   D<Ec                    U R                  SS9  U R                  U R                     S:X  d   eU R                  U R                  S nU R                   H  nUR	                  U5      (       d  M  U R
                  R                  [        R                  SR                  U R                  5      U-   5      5        U R                  SS2	 [        U5      s  $    [        SU R                   SU R                   S35      e)	z
Consume the text following a '#' as an error.

Looks for a match in self.ERROR_CODES and returns the number of
characters matched. (Does not update self.offset)

!rA   r#   N zInvalid error code at position  in 'r   )rE   r   r   ERROR_CODES
startswithr   r'   r(   rI   joinr   r5   r   )r   
subformulaerrs      r   r,   Tokenizer._parse_error   s     	3/||DKK(C///\\$++,/
##C$$S))

!!%"4"4RWWTZZ5H35N"OPJJqM3x	 $
 >t{{m5QUQ]Q]P^^_`aar   c                 T   U R                   U R                     S;   d   eU R                  R                  [	        U R                   U R                     [        R
                  5      5        U R                  R                  U R                   U R                  S 5      R                  5       $ )zn
Consume a string of consecutive spaces.

Returns the number of spaces found. (Does not update self.offset).

)r$   r%   N)	r   r   r   r'   r(   WSPACE	WSPACE_RErG   endr   s    r   r-   Tokenizer._parse_whitespace   sv     ||DKK(K777

%T[[ 95<<HI~~##DLL$>?CCEEr   c                    U R                   U R                  U R                  S-    S;   aX  U R                  R                  [	        U R                   U R                  U R                  S-    [        R
                  5      5        gU R                   U R                     nUS;   d   eUS:X  a  [	        S[        R                  5      nGOUS;   a  [	        U[        R
                  5      nOU R                  (       d  [	        U[        R                  5      nO[        S [        U R                  5       5       S5      nU=(       ae    UR                  [        R                  :H  =(       dA    UR                  [        R                  :H  =(       d    UR                  [        R                  :H  nU(       a  [	        U[        R
                  5      nO[	        U[        R                  5      nU R                  R                  U5        g)	z}
Consume the characters constituting an operator.

Returns the number of characters consumed. (Does not update
self.offset)

   )z>=z<=z<>z
%*/^&=><+-%z*/^&=><c              3   f   #    U  H'  nUR                   [        R                  :w  d  M#  Uv   M)     g 7fN)typer(   rg   ).0is     r   	<genexpr>,Tokenizer._parse_operator.<locals>.<genexpr>   s)      4$8qFFell2 $8s   "1	1Nr!   )r   r   r   r'   r(   OP_INOP_POSTOP_PREnextreversedrL   CLOSErq   OPERAND)r   r=   r   previs_infixs        r   r.   Tokenizer._parse_operator   sm    <<DKK!O48JJJJeT[[q9  LL-	L(((#u}}-E)#)U[[1E)U\\2E 4HTZZ$8 459;D + .99-.99- 
 i5i6

% r   c                    U R                   U R                     S;   d   eU R                   U R                     S:X  a&  U R                  5         [        R	                  S5      nOiU R
                  (       aC  SR                  U R
                  5      S-   nU R
                  SS2	 [        R	                  U5      nO[        R	                  S5      nU R                  R                  U5        U R                  R                  U5        g)zi
Consumes a ( or { character.

Returns the number of characters consumed. (Does not update
self.offset)

)({r   r^   r   Nr!   )
r   r   rE   r(   make_subexpr   rb   r   r'   r   )r   r   token_values      r   r/   Tokenizer._parse_opener   s     ||DKK(J666<<$+##%%%c*EZZ''$**-3K

1%%k2E%%c*E

% &r   c                 F   U R                   U R                     S;   d   eU R                  R                  5       R	                  5       nUR
                  U R                   U R                     :w  a  [        SU R                   -  5      eU R                  R                  U5        g)zi
Consumes a } or ) character.

Returns the number of characters consumed. (Does not update
self.offset)

))}zMismatched ( and { pair in '%s'r!   )	r   r   r   pop
get_closervaluer   r   r'   )r   r   s     r   r0   Tokenizer._parse_closer   s     ||DKK(J666  $$&113;;$,,t{{33 1DLL@B B

% r   c                    U R                   U R                     nUS;   d   eUS:X  a  [        R                  S5      nO_ U R                  S   R
                  nU[        R                  :X  a  [        S[        R                  5      nO[        R                  S5      n U R                  R                  U5        g! [         a    [        S[        R                  5      n NBf = f)zi
Consumes a ; or , character.

Returns the number of characters consumed. (Does not update
self.offset)

);,r   rO   r   r!   )r   r   r(   make_separatorr   rq   PARENrv   
IndexErrorr   r'   )r   r=   r   top_types       r   r1   Tokenizer._parse_separator   s     LL-	J&&&((-E6++B/44 u{{*!#u{{3E!005E

%   0c5;;/0s   B9 9$C C c                 H   U R                   U R                     nUS;   a  [        U R                  5      S:  aj  U R                  R                  SR                  U R                  5      5      (       a1  U R                  R                  U5        U =R                  S-  sl        gg)z
Consumes a + or - character if part of a number in sci. notation.

Returns True if the character was consumed and self.offset was
updated, False otherwise.

z+-r!   r^   TF)r   r   r5   r   SN_RErG   rb   r'   )r   r=   s     r   r6   #Tokenizer.check_scientific_notation  sv     LL-	

Oq(JJ$$RWWTZZ%899JJi(KK1Kr   c                     U R                   (       a:  U R                   S   U;  a&  [        SU R                   SU R                   S35      egg)a
  
Ensure that there's no token currently being parsed.

Or if there is a token being parsed, it must end with a character in
can_follow.

If there are unconsumed token contents, it means we hit an unexpected
token transition. In this case, we raise a TokenizerError

rO   z!Unexpected character at position r_   r   N)r   r   r   r   )r   rB   s     r   rE   Tokenizer.assert_empty_token'  sJ     ::$**R.
: #DT[[MQVW[WcWcVdde!fgg ;:r   c                     U R                   (       aW  U R                  R                  [        R	                  SR                  U R                   5      5      5        U R                   SS2	 gg)z9If there's a token being parsed, add it to the item list.r^   N)r   r   r'   r(   rI   rb   rj   s    r   r8   Tokenizer.save_token5  sC    ::JJe001DEF

1 r   c                     U R                   (       d  gU R                   S   R                  [        R                  :X  a  U R                   S   R                  $ SSR                  S U R                    5       5      -   $ )z+Convert the parsed tokens back to a string.r^   r   r    c              3   8   #    U  H  oR                   v   M     g 7frp   )r   )rr   r   s     r   rt   #Tokenizer.render.<locals>.<genexpr>A  s     AjU[[js   )r   rq   r(   r)   r   rb   rj   s    r   renderTokenizer.render;  sX    zzZZ]5==0::a=&&&RWWAdjjAAAAr   )r   r   r   r   r   N)r   )r   r   r	   r
   r   rP   compiler   rh   rF   r`   r7   r   r   r*   r+   r,   r-   r.   r/   r0   r1   r6   rE   r8   r   r   r   r   r   r   r      s     JJ01E

9%I ZZ23ZZ23N5K$L&P8M2b$	F$L, 2"hBr   r   c                       \ rS rSrSr/ SQrSrSrSrSr	Sr
S	rS
rSrSrSrSS jrSrSrSrSrSrS r\S 5       rSrSr\S S j5       rS rSrSr\S 5       rSr g)!r(   iD  a  
A token in an Excel formula.

Tokens have three attributes:

* `value`: The string value parsed that led to this token
* `type`: A string identifying the type of token
* `subtype`: A string identifying subtype of the token (optional, and
             defaults to "")

r   rq   rL   r)   r|   FUNCARRAYr   SEPzOPERATOR-PREFIXzOPERATOR-INFIXzOPERATOR-POSTFIXzWHITE-SPACEc                 (    Xl         X l        X0l        g rp   r   )r   r   type_rL   s       r   r   Token.__init___  s    
	r   TEXTNUMBERLOGICALERRORRANGEc                 d    SR                  U R                  U R                  U R                  5      $ )Nz{0} {1} {2}:)formatrq   rL   r   rj   s    r   __repr__Token.__repr__q  s#    %%diitzzJJr   c                 B   UR                  S5      (       a  U R                  nONUR                  S5      (       a  U R                  nO+US;   a  U R                  nO [	        U5        U R
                  nU " XR                  U5      $ ! [         a    U R                  n N+f = f)zCreate an operand token.r   r#   )TRUEFALSE)	ra   r   r   r   floatr   
ValueErrorr   r|   clsr   rL   s      r   rI   Token.make_operandt  s     C  hhGc""iiG''kkG$e** 5++w//  $))$s   B BBOPENr{   c                 N   US   S;   d   eU(       a/  [         R                  " SU5      (       d   e[        R                  nO>US;   a  [        R                  nO'US;   a  [        R
                  nO[        R                  nUS;   a  U R                  OU R                  nU " XU5      $ )zu
Create a subexpression token.

`value`: The value of the token
`func`: If True, force the token to be of type FUNC

rO   )r   r   r   r   z.+\(|\)z{}z()r&   )rP   rG   r(   r   r   r   r{   r   )r   r   funcr   rL   s        r   r   Token.make_subexp  s     Ry000088K////JJEd]KKEd]KKEJJE$}#))#((5))r   c                 (   U R                   U R                  U R                  U R                  4;   d   eU R                  U R
                  :X  d   eU R                   U R                  :X  a  SOSnU R                  XR                   U R                  :H  S9$ )z6Return a closing token that matches this token's type.r   r   )r   )rq   r   r   r   rL   r   r   )r   r   s     r   r   Token.get_closer  st    yyTYY

DJJ????||tyy(((yyDJJ.CII,BCCr   ARGROWc                 t    US;   d   eUS:X  a  U R                   OU R                  nU " XR                  U5      $ )zCreate a separator token)r   r   r   )r   r   r   r   s      r   r   Token.make_separator  s8     
""""c\#''sww5''7++r   )rL   rq   r   N)r^   )F)!r   r   r	   r
   r   	__slots__r)   r|   r   r   r   r   rx   rv   rw   rg   r   r   r   r   r   r   r   classmethodrI   r   r{   r   r   r   r   r   r   r   r   r   r(   r(   D  s    
 -IGGDEE
CFE GF DFGEEK 0 02 DE* **D C
C, ,r   r(   )r   rP   	Exceptionr   r   r(   r   r   r   <module>r      s6    
/Y /qB qBh	z, z,r   