
    i                     1   U d dl Z d dlZd dlZd dlZd dlZd dlZd dlmZ d dlmZm	Z	m
Z
mZmZ d dlmZ d dlZd dlmZ d dlmZ d dlZd dlmZmZmZ d dlmZmZmZm Z m!Z! d dl"m#Z# d dl$m%Z% d d	l&m'Z' d d
l(m)Z) d dl*m+Z+ d dlm,Z,m-Z-m.Z. d dl/m0Z1 d dl2m3Z3m4Z4 ddl5m6Z6m7Z7 ddlm8Z8m9Z9m:Z:  ed      Z; ed      Z<eejz                  j|                  ejz                  j~                  f   Z@e
eAd<    ej                  eC      ZDej                  j                  ZFej                  j                  ZGej                  j                  ZHej                  j                  ZIej                  j                  ZJ eg eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj`                  eFj                  eFj                  eFj                  eFj                  eFj                  eFj                  e)eFj                  eFj                  eFj                  eFj                  j                  eFj                  j                  eHj                  eIj                        Zui  e       euZveFj                  eFj                  eFj                  eFj                  j                  eFj                  eFj                  eFj                  eFj<                  eFj`                  eFj                  eFj                   eFj                  eFj                  eFj                  j                  eFj
                  eFj                  eFj                  eFj                  gZeeejz                  j                  ejz                  j~                  f      eAd<    eeve       dee@ee@   f   deee<e;f   gee<e;f   f   fdZ eeFj<                  g      dej                  dej                  depdepdedej                  fd       Z eeFj`                        dej                  d ej                  d!e	ej                     d"e	ej                     d#edeej                  ej                  ej                  f   fd$       Z eeFj&                  j                  g      ddd%d&ej(                  d'e	ej*                  j,                     d(e	ej*                  j,                     ddfd)       Z eeFj.                  g      e!	 	 dd*ej                  d'e	ej*                  j,                     d(e	ej*                  j,                     dej                  fd+              Z eeFj0                  g      d,eeepej(                  f      d-ej*                  j,                  d.edej                  fd/       Z eeFj                  g      dd0d*ej                  d1epd2ej                  d3ej                  d4ej*                  j,                  dej                  fd5       Z eeFj2                  j                  g      d,eeepej(                  f      d6eep   d.edej                  fd7       Z eeFj4                  g      dej                  dej                  d!ej                  d8eep   d9eepeep   f   d:eepeep   f   d;eepeep   f   d<ed=eep   d>epd?ee   deej                  ej                  ej                  f   fd@       Z eeFj6                  j8                  g      dd*ej                  dAepdej                  fdB       Z eeFj<                  g      e 	 ddCej                  dDej                  dEe	ej>                     dej                  fdF              Z eeFj@                  g      e 	 	 	 ddCej                  dGej                  dHej                  dEe	ej>                     dIej*                  j,                  d4ej*                  j,                  dej                  fdJ              Z eeFjB                  g      e 	 ddCej                  dKej                  dEe	ej>                     dej                  fdL              Z eeFjD                  j                  g      	 ddMeej                     d1epdej                  fdN       Z eeFjF                  g      d*ej                  dej                  fdO       Z eeFjH                  g      dd0d*ej                  dPej                  d4e	ej*                  j,                     dej                  fdQ       Z eeFjJ                  g      dCej                  dej                  fdR       Z eeFjL                  eFjN                  g      dCej                  dej                  fdS       Z eeFjP                  eGjP                  g      dCej                  dTej                  dej                  fdU       Z eeFjR                  eGjR                  g      dCej                  dTej                  dej                  fdV       Z eeFjT                        	 	 ddCej                  d1e	ep   dXedej                  fdY       Z eeFjV                        	 	 ddCej                  d1e	ep   dXedej                  fdZ       Z eeFjX                  g      dCej                  d1epd[epd\epdej                  f
d]       Z eeFjZ                  j                  g      dCej                  d,eeepej(                  f      dej                  fd^       Z eeFjZ                  j>                  g      dCej                  d_ej>                  dej                  fd`       ZdCej                  deej                  ej`                  f   fdaZ eeFjd                        ddddWdWejf                  dbdCej                  d-eepef   d_e	ej>                     dce	ejh                     dde	ejj                     deedfedgejl                  dej                  fdh       Zddejf                  didjedkej                  f   dCej                  d_e	ej>                     dde	ejj                     dgejl                  d.edej                  fdlZ eeFjp                        dCej                  d.edej                  fdm       Z eeFjr                        dCej                  d.edej                  fdn       Z eeFjt                  j                        dCej                  doepd.edej                  fdp       Z eeFjt                  jv                        dCej                  dqepdoepd.edej                  f
dr       Z eeFjz                  j                        doepd,eeepej(                  f      d.edej                  fds       Z eeHj                  j                        	 ddej                  d!ej                  d"e	ej                     dej                  fdt       Zs eeIj                  j                        dej                  duej                  dvej                  d!ej                  dwej                  dxej                  d"ej                  dyej                  dzej                  d{epdej                  fd|       Zt eej                  j                  j|                        d}ej                  dej                  fd~       Z eeFj                  g      e 	 	 	 ddej                  dej                  depdepdedej                  fd              Z eeFj                  j                        	 ddCeej                     deej                     deej                     dedeej                     f
d       Z eeFj                  j                        	 ddCeej                     deej                     deej                     dedeej                     f
d       Z eeFj                  j                        deej                     deej                     d!ej*                  j,                  deej                     fd       Z eeFj                  j                        deej                     deej                     deej*                  j,                     deej                     fd       ZeFj                  j                  j                  ej                  j                  j                         eeFj                        dej                  d!ej                  d"ej                  ej                     dej                  ej                     dej                  ej                     dedededeej                  ej                  ej                  f   fd              Ze j                  deeedkef   f   fd       Zdeeedkef   f   fdZ eeFj                        dCej                  dej                  dej                  dej                  fd       Z eeJj                  j                        dej                  depdepd#ed_ej>                  deej                  ej                  f   fd       Z eeFj                        	 ddCej                  d2ej                  dej                  dedej                  f
d       Z eeFj                        	 ddCej                  d2ej                  dej                  dedej                  f
d       Z eeFj                  j                        e dej                  dej                  d1epdej>                  dej                  f
d              Z| eeFj                        dddCej                  d1epd2ej                  dej                  dededej                  fd       Zd*ej                  deep   d9e	eepeep   f      d:eepeep   f   d;eepeep   f   ded1epdeej                  ej                  f   fdZ eeFj                        	 	 	 	 dd*ej                  deep   d9e	eepeep   f      d:eepeep   f   d;eepeep   f   dedeej                  ej                  f   fd       Z eeFj                        	 	 	 	 dd*ej                  deep   d9e	eepeep   f      d:eepeep   f   d;eepeep   f   dedeej                  ej                  f   fd       Z eeFj                        d*ej                  deep   deej                  ej                  f   fd       Z eeFj                  j                        dWdWddddej                  dCej*                  j,                  dedede	e   de	ej                     dej                  fd       Z eeFj                        	 	 	 	 ddCej                  dej                  dededede	ej                     deej                  ej                  f   fd       Z eeFj                  j                        	 ddej                  de	ep   dej                  fd       Z	 	 	 	 	 ddej                  d!ej                  d"e	ej                     d9eep   d:eep   d;eep   d>epdej                  fdZy)    N)Callable)AnyOptional	TypeAliasTypeVarUnion)	ParamSpec)core_aten_decompositionsget_decompositionsremove_decompositions)_grid_sampler_2d
_index_addembedding_dense_backwardpw_cast_for_opmath"pw_cast_for_opmath_non_tensor_args)extra_random_decomps)counters)	is_fbcode)	out_dtype)pad_listlike)elementwise_dtypesELEMENTWISE_TYPE_PROMOTION_KINDtype_to_dtype)native_layer_norm)guard_or_falsestatically_known_true   )configinductor_prims)is_gpu,needs_fallback_due_to_atomic_add_limitationsuse_scatter_fallback_T_P_GenericOperatordecomps_to_excludeopsreturnc                     t        | t              r| n| gD ]!  }|t        v st        j	                  d|        # t        j                  | t              S )Nzduplicate decomp: %s)
isinstancelistdecompositionslogwarningdecompregister_decomposition)r'   ops     W/var/www/html/engine/venv/lib/python3.12/site-packages/torch/_inductor/decomposition.pyr0   r0      sL      T*c 5KK.45 ((n==    grad_outputindicesnum_weightspadding_idxscale_grad_by_freqc                 D    | j                   rt        S t        | ||||      S N)is_xpuNotImplementeddecomp_embedding_dense_backward)r4   r5   r6   r7   r8   s        r2   _embedding_dense_backwardr>      s,     *Wk;8J r3   inputnormalized_shapeweightbiasepsc                 D    | j                   rt        S t        | ||||      S r:   )is_mtiar<   decomp_native_layer_norm)r?   r@   rA   rB   rC   s        r2   _native_layer_normrG      s%     }}#E+;VT3OOr3   )minmaxsymbolrH   rI   c                     y r:    )rJ   rH   rI   s      r2   sym_constrain_range_for_sizerM      s     r3   xc                 R    || j                  |      } || j                  |      } | S r:   )	clamp_min	clamp_max)rN   rH   rI   s      r2   clamprR      s/     KK
KKHr3   size
fill_valuekwargsc                     |j                  d      }|.t        t        |            |d<   t        j                  | |fi |S t
        S )Ndtype)getr   typetorchfullr<   )rS   rT   rU   rW   s       r2   r[   r[      sF     JJwE}'Z(89wzz$
5f55r3   alphadimindextensorr]   c                ~    t               s#| j                  t        j                  k(  rt        S t        | |||d|      S )NF)inplacer]   )r   rW   rZ   bfloat16r<   r   )rN   r^   r_   r`   r]   s        r2   	index_addrd      s3     ;177enn4!S%eLLr3   physical_layoutc                 H   t        |      t        t        t        |                  k(  }|rt        j                  | fi |S dgt        |       z  }t        |      D ]
  \  }}|||<    t        j                  |D cg c]  }| |   	 c}fi |j                  |      S c c}w Nr   )r+   rangelenrZ   empty	enumeratepermute)rS   re   rU   is_identitypermpls          r2   empty_permutedrq      s     '4c/6J0K+LLK{{4*6**sSYo. 	DAqDG	{{_=DG=HHPPQUVV=s   <B
bias_sizesstridepaddingdilation
transposedoutput_paddinggroupsoutput_maskc                 .   |
d   rt        | j                  j                        st        S t        j                  | dgt        t        d| j                                     z         }t        j                  | |||||||||	|
d   |
d   dg      \  }}}|||fS )N   r   r   F)
r    devicerY   r<   atensumr+   rh   r^   convolution_backward)r4   r?   rA   rr   rs   rt   ru   rv   rw   rx   ry   	grad_biasgrad_inpgrad_weight_s                  r2   r   r      s     q>(:(:(?(?!@qcDq+//:K1L,M&MNI#88	QQ/ Hk1 k9--r3   decimalsc                 H    d|z  }t         j                  | |z        d|z  z  S )Ng      $@g      ?)r}   round)rN   r   ten_pow_decimalss      r2   	round_decr     s,    X~::a**+s5E/EFFr3   selfbatch2r   c                    t         j                  r| j                  j                  dvrkt	        | j
                  d   dk(        st	        |j
                  d   dk(        r5| j                  d      |j                  d      z  j                  d      }|S | j                  j                  dk(  rt	        | j                  d      dk(        ryt	        |j                  d      dk(        r\t        d   dxx   dz  cc<   t        j                  | j                  d      |j                  d      z  dd	
      j                  d      S t        S )Ncpumpsr   r{   r^   r   inductordecompose_bmmTr^   keepdim)r   coordinate_descent_tuningr|   rY   r   shape	unsqueezer~   rS   r   rZ   squeezer<   )r   r   r   outs       r2   bmmr   %  s    ''DKK,<,<N,R A!!348MLLOq 9
 >>"%(8(8(;;@@Q@GCJ{{5  1!238MKKOq 9
 Z 1Q6199Q&.."44!Til r3   mat1mat2betac                    | j                   j                  dk(  r7t        |j                  d      dk(        rt        |j                  d      dk(        rgt        d   dxx   dz  cc<   t        j                  |j                  d      |j                  d      z  dd      j                  d      }||z  || z  z   S t        |j                  d      dk(        ryt        |j                  d      d	k        r\t        |j                  d      d	k        r?t        d   dxx   dz  cc<   |j                  |z  j                  dd      }||z  || z  z   S t        S )
Nr   r   r   r   r   decompose_addmmTr      )r|   rY   r   rS   r   rZ   r~   r   r   r   Tr<   )r   r   r   r   r   r]   r   s          r2   addmmr   ?  s2    {{5  1!238MIIbMQ9
 Z !23q83))Q$,,r"224il  3;,,!$))A,!"34tyy|r12tyy|r12Z !23q8366D=%%!T%:C3;,,r3   input2c                    t         j                  r| j                  j                  dvrit	        | j
                  d   dk(        st	        |j
                  d   dk(        r3| j                  d      |j                  d      z  j                  d      S | j                  j                  dk(  rVt	        | j                  d      dk(        rt	        | j                  d      dkD        rt	        |j                  d      dk(        ri| j                  |j                  k(  rPt        t        j                  |       t        j                  |      z   dk        rt        d	   d
xx   dz  cc<   | |z  S t	        | j                  d      dk(        ryt	        |j                  d      dk(        r\t        d	   d
xx   dz  cc<   t        j                  | j                  d      |j                  d      z  dd      j                  d      S t        S )Nr   r   r   r{   r   r   r       r   decompose_mmTr   )r   r   r|   rY   r   r   r   r~   rS   rW   r   rZ   numelr   r   r<   )r   r   r   s      r2   mmr   ]  s    ''DKK,<,<N,R A!!348MLLOq 9
 NN1%(8(8(;;@@Q@GG{{5 !$))B-1"45%diilQ&67%fkk!n&9:v||+D 1EKK4G GBNOZ 0A50&=  1!238MKKOq 9
 Z 0A5099Q&.."44!Til r3   tensorsc                    dt         j                  dt        ffd}t        t	        ||             t              dk(  rRt        | dt        j                  id   }d   }||j                  k(  r|j                         S |j                  |      S dt              cxk  rt        |       k  r#n n t        j                  j                        S t              dkD  rt        fdD              rd   }t        |j                         }dk  rt        |j                         z   n|j#                  t                      |j%                        j&                  | j)                  dz         j                         S t*        S )	NrN   r(   c                     t        | j                        dk(  rt        | j                  d   dk(        ryt        | j                        k  rt        | j                     dk(        ryy)Nr   r   FT)ri   r   r   )rN   r^   s    r2   non_empty_tensorzcat.<locals>.non_empty_tensor  sU    " qww<1
a!@QWW.1B"Cr3   r   type_promotion_kindr   rW   c              3   ,   K   | ]  }|d    u   yw)r   NrL   ).0tfiltered_tensorss     r2   	<genexpr>zcat.<locals>.<genexpr>  s!      )%&a  )s   )rZ   Tensorboolr+   filterri   r   r   DEFAULTrW   clonetor}   catdefaultallr   insertr   expandflattenr<   )r   r^   r   promoted_dtype
filtered_tinpr   r   s    `     @r2   r   r     s   
ELL T 2 F#3W=>
!+
 ? G G
  &a(
 !1!11 	
 ^4	

 
S!"	1S\	1xx 0#66 q S )*:) & q!SYY&)AgcC		N"3S#./0(s}}S!((%088cAgFLLNN r3   c                 "   | j                         ret        j                  t        j                  | j                        t        d      t        j                  | j                  | j                              S t        | t        j                        \  }}t        j                  t        j                  || j                        }t        j                  | dk  |d      }t        j                  t        j                  |       t        d      |      S )Nnan)r   rW   r|   r   g        )
is_complexrZ   whereisnanrealfloatatan2imagr   r   INT_TO_FLOATscalar_tensormathpir|   )rN   r   rW   r   rets        r2   angler     s    ||~{{KKuu{{166166/J
 	
 "	;HHHAu 
		TWWE!((	CB
++a!eR
%C;;u{{1~uU|S99r3   yc                   t        j                  |       xr | j                         }t        j                  |      xr |j                         }|r|st        S dt         j                  dt
        fd}d}| j                  dk(  r|j                  dk(  rd}| j                  dk(  r| j                  d      } |j                  dk(  r|j                  d      }|}|||z  }t        j                  | j                  |j                        } ||       s ||      rt        S dt         j                  dt         j                  fd}	| dz   } |dz   } |	| j                  | j                  j                              }
 |	|j                  |j                  j                              }t        j                  |
|z   d	
      j                  |      }|r|d   S |S )Nr`   r(   c                 N    | j                   dk(  ry| j                         d   dk7  S )Nr   Fr   r   )ndimrs   )r`   s    r2   _requires_fallbackzadd.<locals>._requires_fallback  s'    ;;!}}r"a''r3   Fr   Tr   c                     | j                   ^ }}|dz  dk7  rt        d      g ||dz  d}| j                  |      }|S )zNReshape tensor from [*initial_dims, last_dim] to *initial_dims, last_dim/2, 2]r{   r   zQThe size of the last dimension must be even to reshape it to [..., last_dim/2, 2])r   AssertionErrorview)r`   initial_dimslast_dim	new_shapereshaped_tensors        r2   reshape_tensor_complexz#add.<locals>.reshape_tensor_complex  s^     #),,x a<1 c 
 6l5HM515	 ++i0r3   )	start_dim)rZ   	is_tensorr   r<   r   r   r   reshapepromote_typesrW   r   r   r   )rN   r   r]   x_is_complex_tensory_is_complex_tensorr   output_size_zerozcomplex_typer   
x_reshaped
z_reshapedresults                r2   addr     s     //!,?//!,?&9(5<< (D ( vv{qvv{vv{IIaLvv{IIaL	AAI&&qww8L! 21 5u||  $ 	
AA	AA'qvv||(<=J'qvv||(<=J]]:
2bAFF|TFayMr3   c                 2    | j                         rt        S | S r:   )r   r<   r   s    r2   conj_physicalr     s    Kr3   c                     | S r:   rL   r   s    r2   liftr   #  s    Kr3   otherc                 b    t        j                  t        j                  |      || kD  z  | |      S r:   rZ   r   r   r   r   s     r2   fminr   (  '    ;;u{{5)UT\:D%HHr3   c                 b    t        j                  t        j                  |      || k  z  | |      S r:   r   r   s     r2   fmaxr   -  r   r3   Fr   c                 x    | j                   t        j                  k(  rt        j                  | ||      S t        S Nr   )rW   rZ   r   anyr<   r   r^   r   s      r2   amaxr   2  -     zzUZZyy388r3   c                 x    | j                   t        j                  k(  rt        j                  | ||      S t        S r   )rW   rZ   r   r   r<   r   s      r2   aminr  =  r   r3   startlengthc                 N    t        j                  | |||      j                         S r:   )rZ   narrowr   )r   r^   r  r  s       r2   narrow_copyr  H  s"     <<c5&17799r3   c                 J    t         j                  | |      j                         S r:   )r}   r   r   )r   rS   s     r2   view_copy_defaultr	  R  s    
 99T4 &&((r3   rW   c                 @    | j                  |      j                         S r:   )r   r   )r   rW   s     r2   view_copy_dtyper  Z  s    
 775>!!r3   c                     t        j                  |       \  }}|D cg c]  }| j                  |    }}dgt        |      z  }t	        |      D ]
  \  }}|||<    ||fS c c}w rg   )utils3compute_elementwise_output_logical_to_physical_permr   ri   rk   )r   re   r   rp   r   permutationro   s          r2   _get_shape_permutation_liker  b  sx     RRSWXOQ$34qTZZ]4E4#E
"K/* 1A ; 5s   A )rW   layoutr|   
pin_memoryrequires_gradmemory_formatr  r|   r  r  r  c          	         || j                   n|}|| j                  n|}|| j                  n|}|t        j                  k7  r8t        j
                  | j                  ||||||      }|j                  |      S |t        j                  k(  sJ t        |       \  }	}
t        j
                  |	||||||      }|
t        t        t        |
                  k(  r|S |j                  |
      j                         S )N)rW   r  r|   r  r  r  )rW   r  r|   rZ   preserve_formatr[   r   r   stridedr  r+   rh   ri   rl   r   )r   rT   rW   r  r|   r  r  r  r   r   r  s              r2   	full_liker  o  s      -DJJUE"NT[[F"NT[[F---JJ!'
 yy}y55 &&&8>{!'
 $uS%5677M~~k*0022r3   )rW   r|   r  rand_fn.c                j   ||j                   n|}||j                  n|}|t        j                  k7  r& | |j                  f||d|j                  |      S t        |      \  }} | |f||d|}|t        t        t        |                  k(  r|S |j                  |      j                         S )Nr   r  )rW   r|   rZ   r  r   r   r  r+   rh   ri   rl   r   )	r  r   rW   r|   r  rU   r   r  r   s	            r2   
_rand_liker    s      -DJJUE"NT[[F---JJ

 	

 "="
)	* 5T:E; 	F d5[!1233>>+&,,..r3   c                 8    t        t        j                  | fi |S r:   )r  rZ   randr   rU   s     r2   	rand_liker     s    ejj$1&11r3   c                 8    t        t        j                  | fi |S r:   )r  rZ   randnr  s     r2   
randn_liker#    s    ekk42622r3   highc                 v    t        t        j                  t        j                  j
                  d|      | fi |S rg   r  	functoolspartialr}   randintlow)r   r$  rU   s      r2   randint_liker+    s-    i''(8(8!TBDSFSSr3   r*  c                 v    t        t        j                  t        j                  j
                  ||      | fi |S r:   r&  )r   r*  r$  rU   s       r2   randint_like_lowr-    s/     i''(8(8#tDdUfUUr3   c                 F    t        j                  j                  d| |fi |S rg   )r}   r)  r*  )r$  rS   rU   s      r2   r)  r)    s"     <<AtT4V44r3   c                     t         j                  j                  j                  |      }t         j                  j                  j	                  | |||j                         d         S rg   )rZ   r'   
_quantized$wrapped_fbgemm_pack_gemm_matrix_fp16!wrapped_fbgemm_linear_fp16_weightrS   )r?   rA   rB   packed_weights       r2   #linear_dynamic_fp16_unpacked_weightr4    sO     II((MMfUM99AA}dFKKM!$4 r3   input_scaleinput_zero_pointweight_scaleweight_zero_point	out_scaleout_zero_pointout_channelc
           	          t         j                  j                  j                  ||||      }
t         j                  j                  j	                  | |||
|||	      S r:   )rZ   r'   r0  _wrapped_linear_prepack#_wrapped_quantized_linear_prepacked)r?   r5  r6  rA   r7  r8  rB   r9  r:  r;  r3  s              r2   wrapped_quantized_linearr?    s\     II((@@/M 99CC r3   packedc                     dt         j                  dt         j                  fd} || dddf         } || ddd f         }| dd df   j                  t         j                        |z  |z   S )Nu8r(   c                      fddD        \  }}}}t         j                  dk(  r4||dz  z   |dz  z   |dz  z   j                  t        j                        d   S |dz  |dz  z   |dz  z   |z   j                  t        j                        d   S )Nc              3   f   K   | ](  }d |f   j                  t        j                         * yw.N)r   rZ   int32)r   nrB  s     r2   r   zPq_embedding_bag_byte_unpack_decomp.<locals>.bitcast_u8_to_f32.<locals>.<genexpr>  s&     GQbajmmEKK0Gs   .1)r   r   r{      little   r      rE  )sys	byteorderr   rZ   float32)rB  rN   r   r   ws   `    r2   bitcast_u8_to_f32z=q_embedding_bag_byte_unpack_decomp.<locals>.bitcast_u8_to_f32  s    G,G
1a==H$aLAG,R8>>u}}MiXX"Wb)Q!V4q8>>u}}MiXXr3   .i)rZ   r   r   rN  )r@  rP  scalesoffsetss       r2   "q_embedding_bag_byte_unpack_decomprT    sz    Yell Yu|| Y vc2b5j12FsBCx 01G#ss(u}}-6@@r3   agridinterpolation_modepadding_modealign_cornersc                     | j                   t        j                   d      k(  xr' |dk(  xr  | j                  t        j                         }t	        | |||||      }|S )Nr   r   r  )rV  rW  rX  rY  _expand_grid)r|   rZ   is_contiguouscontiguous_formatdecomp_grid_sampler_2d)rU  rV  rW  rX  rY  r[  outputs          r2   grid_sampler_2dr`    sm     	
ELL'' 	C!#	COO%*A*AOBL $	-!#!F Mr3   left_tensorsright_tensorsscalarc                     t         j                  j                  | t         j                  j                  ||      |      S Nr\   )r}   _foreach_addList_foreach_mulr   ra  rb  rc  s       r2   _foreach_addcmul_scalarrj  /  <     !!d$$\=A "  r3   c                     t         j                  j                  | t         j                  j                  ||      |      S re  )r}   rf  rg  _foreach_divri  s       r2   _foreach_addcdiv_scalarrn  ;  rk  r3   start_tensorsend_tensorsc           	          t         j                  j                  | t         j                  j	                  t         j
                  j                  ||       |            S r:   )r}   rf  rg  rh  Scalar_foreach_sub)ro  rp  rA   s      r2   _foreach_lerp_scalarrt  G  sL     !!  "";>	
 r3   scalarsc           	          t         j                  j                  | t         j                  j	                  t         j
                  j                  ||       |            S r:   )r}   rf  rg  rh  
ScalarListrs  )ro  rp  ru  s      r2   _foreach_lerp_scalarlistrx  U  sL     !!$$"";>	
 r3   running_meanrunning_vartrainingexponential_average_factorepsilonc           
          t         j                  | |||||||      \  }}	}
|r||	|
fS ||j                  d      |j                  d      fS )Nr   )r}   native_batch_norm	new_zeros)r?   rA   rB   ry  rz  r{  r|  r}  rU  bcs              r2   miopen_batch_normr  c  sl     $$"	GAq! 1ay	 r3   c                      i t         t        S r:   )r,   r   rL   r3   r2   fast_random_decompsr    s    5n5 455r3   c                      t         j                  rt        S t         j                  rHt        j	                  t
        j                  j                  j                  j                  d       t        S t               S )z"decomps can change based on configN)r   fallback_randomr,   "fallback_embedding_bag_byte_unpackpoprZ   r'   	quantizedembedding_bag_byte_unpackr   r  rL   r3   r2   select_decomp_tabler    sP    00599..HHPPRVW  r3   masksourcec                    ddl m}m}  || j                  |j                        rt
        j                  | |g      \  } }|j                  d      j                  d      dz
  }d | ||fD        \  }}}t
        j                  |||gd      }	t        j                  ||	|      j                  | j                        S t        S )Nr   )BackendFeaturehas_backend_featurer   r   c              3   <   K   | ]  }|j                           y wr:   )r   )r   rN   s     r2   r   z!masked_scatter.<locals>.<genexpr>  s     ,WQQYY[,Ws   )codegen.commonr  r  r|   MASKED_SCATTER_WITH_INDEXr}   broadcast_tensorsr   cumsum_unsafe_masked_indexrZ   r   r   r   r<   )
r   r  r  r  r  
source_idx	self_flat	mask_flatsource_flatr   s
             r2   masked_scatterr    s     D4;;(P(PQ ++T4L9
d\\"%,,Q/!3
,W4vBV,W)	9k**;	J<QRS{{9fi8==djjIIr3   	quant_min	quant_maxc                    t        j                  |       \  }}||z
  t        ||z
        z  }t        j                  |t        j                  |g            }|t        j
                  ||z        j                  t         j                        z
  }t        j                  |||      }|j                  t         j                        |j                  t         j                        fS r:   )rZ   aminmaxr   rI   r   r   r   intrR   float64int64)	r?   r  r  rC   rW   min_valmax_valscale
zero_points	            r2   choose_qparams_tensorr    s     }}U+GWw%	I(=">>EIIeU\\3%01EU[[59<<UYYGGJZI>J88EMM"JMM%++$>>>r3   
accumulatec                     | j                         }t        j                  ||g|j                  |j                        |      }|j                  | j                        S r:   )r   rZ   	index_putr   r   )r   r_   r  r  	flatteneds        r2   putr    sL     IE7FNN5;;7I TZZ((r3   c                 V    t         j                  | |||      }| j                  |      S )N)r  )r}   r  copy_)r   r_   r  r  r   s        r2   put_r    s(     ((4:(
>C::c?r3   r_  input_dtypec                     | |z  }t        j                  ||d      }t        j                  | ||      }| j                  |k7  r|j                  |      }|j                         S )NTr   )rZ   r~   r   fmarW   r   
contiguous)r4   r_  r^   r  new_grad_outputsum_new_grad
grad_inputs          r2   _softmax_backward_datar    sc     "F*O99_#tDL##VG\?KJ K']];/
  ""r3   Tinclude_selfsrcreduction_typer  c                   |dk(  rt        | j                        s| j                  j                  xs | j                  j                  }t	        j
                  |      }|r)| }t	        j
                  |       j                  |||      }	nN| j                  ||d      }t	        j                  |       j                  |||      }	|	j                  |	dk  d      }	|j                  |||      }|r||	z  S ||	z  S t        t        j                  j                  || j                  |j                  |j                  j                  d      rt         S | j"                  |dz   d  j%                         | j"                  d | j%                         z  }
|j%                         g| j"                  |dz   d  | j"                  d | }g t'        | j(                  |z
  | j(                        dt'        d| j(                  |z
        }|j+                  t        j,                        j/                  |
      j1                  |      j3                  |      }| j5                  |||||      S )Nmeanr   r   Tr  )r!   rW   is_floating_pointr   rZ   	ones_likerd   
index_fill
zeros_likemasked_fillr"   r}   scatter_reduce_twor|   rY   r<   r   r   rh   r   r   r  repeat_interleaver   rl   scatter_reduce)r   r^   r_   r  r  r  true_divisiononesr   countsrepeatsindex_shapern   scatter_indexs                 r2   index_reducer    s    (T

) 

44M

8M8Ms#C__T*44S%FF//#ua0C%%d+55c5$GF''
A6FmmC,,sV|?#-?  

		

 jjq#))+djj#.>.D.D.FFG;;=L4::cAgi#8L4::ds;KLKNU499s?DII.NNE!TYY_4MND		7	#				  !   r3   kernel_size	ceil_modec                 2   |dk(  rdg|z  }|dk(  rdg|z  }|s|}t        ||      }t        ||      }t        ||      }t        ||      }t        j                  t        j                  |      }t
        j                  j                  j                  ||      s0|t        j                  t
        j                        j                  kD  rt        S t        j                  | |||||      \  }}	t        j                  |	|| j                   | d  |||      }
||
fS )Nr   r   )n_dim)r   r'  reduceoperatormulrZ   	_inductorlowering%should_fallback_max_pool_with_indicesiinfoint8rI   r<   prims!_low_memory_max_pool_with_offsets'_low_memory_max_pool_offsets_to_indicesr   )rN   r  rs   rt   ru   r  r^   window_sizevalsrS  r5   s              r2   _max_pool_with_indicesr    s"    1}39!|#) {C0KHc*H7C(G&#&F""8<<=K 	  FFs 	G 	
 UZZ0444;;	MD' ;;	G =r3   c           	      &    t        | |||||d      S )Nr{   r   r  rN   r  rs   rt   ru   r  s         r2   max_pool2d_with_indicesr  T        "	;9! r3   c           	      &    t        | |||||d      S )NrH  r   r  r  s         r2   max_pool3d_with_indicesr  b  r  r3   output_sizec                     | j                   ^ }}}|\  }}|dk(  s|dk(  r:g |||}| j                  |      | j                  |t        j                        fS ||z  dk(  r(||z  dk(  r ||z  ||z  g}t        j                  | |      S t        S )Nr   r   )r   	new_emptyrZ   r  r}   r  r<   )	rN   r  batchh_inw_inh_outw_outo_sizer  s	            r2   adaptive_max_pool2dr  p  s     UD$LE5zUaZ'5'%''{{6"AKKekkK$JJJe|qTE\Q.u}dem4++A{;;r3   	out_int32rightsidesortersorted_sequencer  r  r  r  c                ~    t         j                  | t        j                  |g| j                        ||||      d   S )Nr|   r  r   )r}   searchsortedrZ   r`   r|   )r  r   r  r  r  r  s         r2   searchsorted_scalarr    sK     dVO$:$:;   	 	r3   noiselowerupper	generatorc                    |rS| dk  }t         j                  | |||      }t        j                  || |z  |       }t        j                  ||d      }	||	fS ||z   dz  }
t         j	                  | |
      t        j
                         fS )Nr   )r   r   r{   )r}   uniformrZ   r   
leaky_relur   )r   r  r  r  r{  r   not_positiverr_  	noise_outnegative_slopes              r2   rrelu_with_noise_functionalr    s     qyLLueyLA\4!8T:KKa3	y  %-1,t^4ellnDDr3   repeatc                 N   t         j                  j                  rt        S |t	        |      t
        urt        S | j                  j                  dk(  rt        S | j                  t        j                  t        j                  fv sJ | j                  dk(  sJ | j                  d      }t        j                  || j                        }t        j                  ||| j                  t        j                  k(  d      }t        j                  || j!                  d      dz
        S )Nr   r   r   r  T)r  r  )rI   )r   tritonautotune_at_compile_timer<   rY   r  r|   rW   rZ   rF  r  r   r  aranger  rR   rS   )r	  r  r  posr5   s        r2   repeat_interleave_Tensorr    s    
 }}-- d;/s:}}U"<<EKK5555;;!]]1F
,,{6==
9C   ;DG ;;wFKKNQ$677r3   r   r  c           	      8   | j                         dk(  r|j                         dk(  sJ d       |d   }|d   }|d   }| j                  d      }|j                  d      }t        j                  j	                  ||||df|df|df|      }	|	j                  d      S )NrH  z,Expect (N,C_in,L) and (C_out,C_in//groups,K)r   r   r   )rs   rt   ru   rx   )r^   r   r}   conv2dr   r   )
r?   rA   rB   rs   rt   ru   rx   input_2d	weight_2dout_2ds
             r2   conv1d_to_conv2dr    s     99;!

 1 61
 AYFajG{H r"H  $I [[  {!A ! F >>"r3   )NNr:   )Nr   r   )NF)r   r   F)F)Nr   r   F)g      ?gUUUUUU?FN)Nr  r  r  r   )r'  loggingr   r  rL  typingcollections.abcr   r   r   r   r   r   typing_extensionsr	   rZ   torch._decomp_decompr/   torch._prims_common_prims_commonr  $torch.ao.quantization.fx._decomposedr
   r   r   torch._decomp.decompositionsr   r^  r   r   r=   r   r   $torch._decomp.decompositions_for_rngr   torch._dynamo.utilsr   torch._environmentr   !torch._higher_order_ops.out_dtyper   torch._inductor.utilsr   r   r   r   torch._refsr   rF   %torch.fx.experimental.symbolic_shapesr   r    r   r   r    r!   r"   r#   r$   _opsOperatorBaseOpOverloadPacketr%   __annotations__	getLogger__name__r-   r'   r}   r  r  r0  quantized_decomposed_adaptive_avg_pool2d_backwardindex_selectaddmvr  bitwise_and_bitwise_or_
clamp_min_distelu
empty_likeflipgeluhardtanhlcmr  linalg_vector_norm_log_softmax max_pool2d_with_indices_backward_native_batch_norm_legit#_native_batch_norm_legit_functional$_native_batch_norm_legit_no_training_batch_norm_with_update"_batch_norm_with_update_functional_batch_norm_no_updatebatch_norm_backwardr  native_group_normnll_loss2d_backwardpermute_copyrrelu_with_noise_backward_softmaxsin_sqrt__to_copytril_indicestriu_indicesunbind_copyr  upsample_bilinear2dvecr4  r?  inductor_decompositionsr,   _unsafe_indexr  #_unsafe_masked_index_put_accumulate+_scaled_dot_product_flash_attention_for_cpur   r  rQ   rP   rd   gluselect_scatterslice_scattersplitr   r   r~   unbindbaddbmmr&   r+   
OpOverloadr0   r   r>   	ShapeTyper   tuplerG   rM   SymInttypesNumberrR   r[   rq   r   r   r   r   r   rW   r   r   r   r   r   r   r   detach_r   r   r   r  r  	view_copyr	  r  
StrideTyper  r  r  r  r|   r  r  r   r#  r+  	low_dtyper-  r)  r  rT  r`  _foreach_addcmulrr  rj  _foreach_addcdivrn  _foreach_lerprt  rw  rx  r  py_impl_CDispatchKeyAutogradcachedictr  r  r  choose_qparamsr`   r  r  r  r  strr  r  r  r  r  r  r  	Generatorr  r  r  rL   r3   r2   <module>rt     s       
  $ ; ; '   # + 
  F ( ( 7 . 
 F W $  T]t_#	JJUZZ888 )  g!yy~~		II	YY!!
yy55 ,+**++ 	

+ 		+
 	+ 	+ 	+ 			+ 	+ 	+ 			+ 			+ 	+ 	+ 	+  	!+" 	#+$ 	--%+& 	%%'+( 	00)+* 	11++, 	$$-+. 	///+0 	""1+2 	  3+4 	5+6 	7+8 	9+: 	  ;+< 	=+> 	&&?+@ 	A+B 			C+D 	

E+F 	G+H 	I+J 	K+L 	M+N 	O+P 	  $$Q+R 	55S+T 	++U+- \ K,.J2IJ
 	,,44<<NNNN!!NNHHJJLLHHKKLL%W Duzz44ejj6Q6QQRS * n&8 9>	&6!77	8>xB (2r6"223> 6678\\  	
  \\ 9" ../
P<<
Poo
P U\\"
P 5<<
 	
P
 

P 5<<u||34
P 0
P ::BBCD )-(,	LL 
%++$$	% 
%++$$	%	
 
 E %# )-(,	||		%++$$	%	 
%++$$	%	 \\		 $ &	 $	
uS%,,&'
(	""	 	 \\		 %	 () !"M||M	M <<M LL	M ;;M \\M *M* ,,4456W
uS%,,&'
(W#YW W \\	W 7W  2234..<<. LL. S		.
 #tCy.!. 3S	>". CcN#. . I. . d. 5<<u||34. 5.@ ,,-.G G GU\\ G /G
 
# (,
,,LL $ \\	  $0 %
 (,  !
,,
,, ,, $	
 ++

 ;; \\  &8 	" (, 
,, LL  $  \\	   # N ))*+ :%,,:	: \\: ,:z %:U\\ :ell : &:& 
#
 +/	@||@||@ EKK&&'	@
 \\@ $@F ++,-   . DLL12u||   3 EJJ/0Iu|| IELL IU\\ I 1I EJJ/0Iu|| IELL IU\\ I 1I 		" 
,,	#  \\	 # 		" 
,,	#  \\	 # ))*+:
,,:	: : 	:
 \\: ,: //01)
,,)
uS%,,&'
() \\) 2) --./"
,,";;" \\" 0"
 
,,
 
5??E,,,-
  '
 $(%)%)).)>)>)3
,,)3c5j!)3 EKK 	)3
 U\\")3 U\\")3 )3 )3 &&)3 \\)3 ()3` $(%)).)>)>/c5<<'(/
,,/ EKK 	/
 U\\"/ &&/ / \\/@ '2ELL 2C 2ELL 2 (2 (3U\\ 3S 3U\\ 3 )3 ))112Tu|| T3 T# T%,, T 3T ))334V
,,V V(+V7:V
\\V 5V ,,-5
5
uS%,,&'
(5 5 \\	5 .5 	EEMMN $(<<LL 5<<
  \\	 O 
;;CCD<< ll LL	
 ,, || ,, || LL  \\ E4 		++EEF
Au|| 
A 
A G
A --./  ||
,,  	
  \\  0: --445
 	
u||
u||$ % 	
 
%,, 6 --445
 	
u||
u||$ % 	
 
%,, 6 **112
%
ell#
 KK
 
%,,	
 3
 **556
%
ell#
 %++$$%
 
%,,	
 7
 ''(<(<(E(EF../<<LL //%,,
' //%,,/	
 .  !&  5<<u||34 0 G< 6T#xS'9"9: 6 6!T#xS'9"9: ! ++,
,,
,, LL \\	 -$ ,;;BBC?<<?? ? 
	?
 ;;? 5<<%&? D? !
 	
)
,,
)<<
) LL
) 	
)
 \\
) "
) 		"
 	
,,<< LL 	
 \\ # 33;;<##LL# 
# 	#
 \\#  =#( ))* 1
,,1	1 <<1 
	1
 1 1 \\1 +1h5||5c5 U3S	>*+5 3S	>"	5
 CcN#5 5 
5 5<<%&5p 445 /3%&&'
||
c
 U3S	>*+
 3S	>"	

 CcN#
 
 5<<%&
 6
 445 /3%&&'
||
c
 U3S	>*+
 3S	>"	

 CcN#
 
 5<<%&
 6
 001||"&s)
5<<%& 2" ))001
 %)	\\	
++

	 		
 	 3-	 U\\"	 \\	 2	& 889 %+/E
,,E<<E E 	E
 E (E 5<<%&E :E& ..556 "&8LL8#8 \\8 784 $()<<)LL) 5<<
 ) #J	)
 3Z) Cj) ) \\)r3   