
    i                     /   U d dl Z d dlZd dlZd dlZd dlZd dlZd dlmZmZmZm	Z	m
Z
 d dlmZmZ d dlZd dlmZ d dlmZ d dlZd dlmZmZmZ d dlmZmZmZmZm Z  d dl!m"Z" d dl#m$Z$ d dl%m&Z& d d	l'm(Z( d d
l)m*Z* d dlm+Z+m,Z,m-Z- d dl.m/Z/m0Z0 ddl1m2Z2m3Z3 ddlm4Z4m5Z5m6Z6  e	d      Z7 ed      Z8e
ejr                  jt                  ejr                  jv                  f   Z<ee=d<    ej|                  e?      Z@ej                  j                  ZBej                  j                  ZCej                  j                  ZDej                  j                  ZEej                  j                  ZF eg eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  eBj                  e(eBj                  eBj                  eBj                  eBj                  j                  eBj                  j                  eDj                  eEj                        Zri  e       erZseBj                  eBj                  eBj                  eBj                  j                  eBj                  eBj                  eBj                  eBj:                  eBj                  eBj                  eBj                  eBj                  eBj                   j                  eBj                  eBj                  eBj                  eBj
                  gZee
ejr                  j                  ejr                  jv                  f      e=d<    eese       de
e<ee<   f   deee8e7f   gee8e7f   f   fdZ eeBj:                  g      dej                  dej                  demdemdedej                  fd       Z eeBj                  j                  g      ddddej                  deej                  j                     d eej                  j                     ddfd!       Z eeBj                   g      e 	 	 dd"ej                  deej                  j                     d eej                  j                     dej                  fd#              Z eeBj"                  g      d$ee
emej                  f      d%ej                  j                  d&edej                  fd'       Z eeBj                  g      dd(d"ej                  d)emd*ej                  d+ej                  d,ej                  j                  dej                  fd-       Z| eeBj$                  j                  g      d$ee
emej                  f      d.eem   d&edej                  fd/       Z eeBj&                  g      dej                  d0ej                  d1ej                  d2eem   d3e
emeem   f   d4e
emeem   f   d5e
emeem   f   d6ed7eem   d8emd9ee   deej                  ej                  ej                  f   fd:       Z eeBj*                  j,                  g      dd"ej                  d;emdej                  fd<       Z eeBj0                  g      e	 dd=ej                  d>ej                  d?eej2                     dej                  fd@              Z eeBj4                  g      e	 	 	 dd=ej                  dAej                  dBej                  d?eej2                     dCej                  j                  d,ej                  j                  dej                  fdD              Z eeBj6                  g      e	 dd=ej                  dEej                  d?eej2                     dej                  fdF              Z eeBj8                  j                  g      	 ddGeej                     d)emdej                  fdH       Z eeBj:                  g      d"ej                  dej                  fdI       Z eeBj<                  g      dd(d"ej                  dJej                  d,eej                  j                     dej                  fdK       Z eeBj>                  g      d=ej                  dej                  fdL       Z eeBj@                  eBjB                  g      d=ej                  dej                  fdM       Z eeBjD                  eCjD                  g      d=ej                  dNej                  dej                  fdO       Z eeBjF                  eCjF                  g      d=ej                  dNej                  dej                  fdP       Z eeBjH                        	 	 dd=ej                  d)eem   dRedej                  fdS       Z eeBjJ                        	 	 dd=ej                  d)eem   dRedej                  fdT       Z eeBjL                  g      d=ej                  d)emdUemdVemdej                  f
dW       Z eeBjN                  j                  g      d=ej                  d$ee
emej                  f      dej                  fdX       Z eeBjN                  j2                  g      d=ej                  dYej2                  dej                  fdZ       Zd=ej                  deejT                  ejV                  f   fd[Z eeBjZ                        ddddQdQej\                  d\d=ej                  d%e
emef   dYeej2                     d]eej`                     d^eejb                     d_ed`edaejd                  dej                  fdb       Zddej\                  dcddedeej                  f   d=ej                  dYeej2                     d^eejb                     daejd                  d&edej                  fdfZ eeBjh                        d=ej                  d&edej                  fdg       Z eeBjj                        d=ej                  d&edej                  fdh       Z eeBjl                  j                        d=ej                  diemd&edej                  fdj       Z eeBjl                  jn                        d=ej                  dkemdiemd&edej                  f
dl       Z eeBjr                  j                        diemd$ee
emej                  f      d&edej                  fdm       Z eeDj                  j                        	 dd0ej                  d1ej                  dneej                     dej                  fdo       Zp eeEj                  j                        d0ej                  dpej                  dqej                  d1ej                  drej                  dsej                  dnej                  dtej                  duej                  dvemdej                  fdw       Zq eej                  j                  jt                        dxej                  dej                  fdy       Z eeBjx                  g      e	 	 	 ddzej                  d{ej                  d|emd}emd~edej                  fd              Z eeBjz                  j|                        	 dd=eej                     deej                     deej                     dedeej                     f
d       Z eeBj                  j|                        	 dd=eej                     deej                     deej                     dedeej                     f
d       Z eeBj                  j|                        deej                     deej                     d1ej                  j                  deej                     fd       Z eeBj                  j                        deej                     deej                     deej                  j                     deej                     fd       ZeBj                  j                  j                  ej                  j                  j                         eeBj                        d0ej                  d1ej                  dnej                  ej                     dej                  ej                     dej                  ej                     dedededeej                  ej                  ej                  f   fd              Ze j                  deeedeef   f   fd       Zdeeedeef   f   fdZ eeBj                        d=ej                  dej                  dej                  dej                  fd       Z eeFj                  j                        d0ej                  demdemdedYej2                  deej                  ej                  f   fd       Z eeBj                        	 dd=ej                  d*ej                  dej                  dedej                  f
d       Z eeBj                        	 dd=ej                  d*ej                  dej                  dedej                  f
d       Z eeBj                  j                        edej                  dej                  d)emdej2                  dej                  f
d              Zy eeBj                        ddd=ej                  d)emd*ej                  dej                  dededej                  fd       Zd"ej                  deem   d3ee
emeem   f      d4e
emeem   f   d5e
emeem   f   ded)emdeej                  ej                  f   fdZ eeBj                        	 	 	 	 dd"ej                  deem   d3ee
emeem   f      d4e
emeem   f   d5e
emeem   f   dedeej                  ej                  f   fd       Z eeBj                        	 	 	 	 dd"ej                  deem   d3ee
emeem   f      d4e
emeem   f   d5e
emeem   f   dedeej                  ej                  f   fd       Z eeBj                        d"ej                  deem   deej                  ej                  f   fd       Z eeBj                  j|                        dQdQddddej                  d=ej                  j                  dededee   deej                     dej                  fd       Z eeBj                        	 	 	 	 dd=ej                  dej                  dedededeej                     deej                  ej                  f   fd       Z eeBj                  j                        	 ddej                  deem   dej                  fd       Zy)    N)AnyCallableOptionalTypeVarUnion)	ParamSpec	TypeAlias)core_aten_decompositionsget_decompositionsremove_decompositions)_grid_sampler_2d
_index_addembedding_dense_backwardpw_cast_for_opmath"pw_cast_for_opmath_non_tensor_args)extra_random_decomps)counters)	is_fbcode)	out_dtype)pad_listlike)elementwise_dtypesELEMENTWISE_TYPE_PROMOTION_KINDtype_to_dtype)guard_or_falsestatically_known_true   )configinductor_prims)is_gpu,needs_fallback_due_to_atomic_add_limitationsuse_scatter_fallback_T_P_GenericOperatordecomps_to_excludeopsreturnc                     t        | t              r| n| gD ]!  }|t        v st        j	                  d|        # t        j                  | t              S )Nzduplicate decomp: %s)
isinstancelistdecompositionslogwarningdecompregister_decomposition)r&   ops     W/var/www/html/engine/venv/lib/python3.12/site-packages/torch/_inductor/decomposition.pyr/   r/      sL      T*c 5KK.45 ((n==    grad_outputindicesnum_weightspadding_idxscale_grad_by_freqc                 D    | j                   rt        S t        | ||||      S N)is_xpuNotImplementeddecomp_embedding_dense_backward)r3   r4   r5   r6   r7   s        r1   _embedding_dense_backwardr=      s,     *Wk;8J r2   )minmaxsymbolr>   r?   c                     y r9    )r@   r>   r?   s      r1   sym_constrain_range_for_sizerC      s     r2   xc                 R    || j                  |      } || j                  |      } | S r9   )	clamp_min	clamp_max)rD   r>   r?   s      r1   clamprH      s/     KK
KKHr2   size
fill_valuekwargsc                     |j                  d      }|.t        t        |            |d<   t        j                  | |fi |S t
        S )Ndtype)getr   typetorchfullr;   )rI   rJ   rK   rM   s       r1   rQ   rQ      sF     JJwE}'Z(89wzz$
5f55r2   alphadimindextensorrS   c                ~    t               s#| j                  t        j                  k(  rt        S t        | |||d|      S )NF)inplacerS   )r   rM   rP   bfloat16r;   r   )rD   rT   rU   rV   rS   s        r1   	index_addrZ      s3     ;177enn4!S%eLLr2   physical_layoutc                     dgt        |       z  }t        |      D ]
  \  }}|||<    t        j                  |D cg c]  }| |   	 c}fi |j	                  |      S c c}w Nr   )len	enumeraterP   emptypermute)rI   r[   rK   permpls         r1   empty_permutedre      se     3T?D/* 1Q;;9AQ9DVDLLTRR9s   Ainputweight
bias_sizesstridepaddingdilation
transposedoutput_paddinggroupsoutput_maskc                 .   |
d   rt        | j                  j                        st        S t        j                  | dgt        t        d| j                                     z         }t        j                  | |||||||||	|
d   |
d   dg      \  }}}|||fS )N   r   r   F)
r   devicerO   r;   atensumr*   rangerT   convolution_backward)r3   rf   rg   rh   ri   rj   rk   rl   rm   rn   ro   	grad_biasgrad_inpgrad_weight_s                  r1   rv   rv      s     q>(:(:(?(?!@qcDq+//:K1L,M&MNI#88	QQ/ Hk1 k9--r2   decimalsc                 H    d|z  }t         j                  | |z        d|z  z  S )Ng      $@g      ?)rs   round)rD   r{   ten_pow_decimalss      r1   	round_decr   	  s,    X~::a**+s5E/EFFr2   selfbatch2r   c                    t         j                  r| j                  j                  dvrkt	        | j
                  d   dk(        st	        |j
                  d   dk(        r5| j                  d      |j                  d      z  j                  d      }|S | j                  j                  dk(  rt	        | j                  d      dk(        ryt	        |j                  d      dk(        r\t        d   dxx   dz  cc<   t        j                  | j                  d      |j                  d      z  dd	
      j                  d      S t        S )Ncpumpsr   rq   rT   r   inductordecompose_bmmTrT   keepdim)r   coordinate_descent_tuningrr   rO   r   shape	unsqueezert   rI   r   rP   squeezer;   )r   r   r   outs       r1   bmmr     s    ''DKK,<,<N,R A!!348MLLOq 9
 >>"%(8(8(;;@@Q@GCJ{{5  1!238MKKOq 9
 Z 1Q6199Q&.."44!Til r2   mat1mat2betac                    | j                   j                  dk(  r7t        |j                  d      dk(        rt        |j                  d      dk(        rgt        d   dxx   dz  cc<   t        j                  |j                  d      |j                  d      z  dd      j                  d      }||z  || z  z   S t        |j                  d      dk(        ryt        |j                  d      d	k        r\t        |j                  d      d	k        r?t        d   dxx   dz  cc<   |j                  |z  j                  dd      }||z  || z  z   S t        S )
Nr   r   r   r   r   decompose_addmmTr      )rr   rO   r   rI   r   rP   rt   r   r   r   Tr;   )r   r   r   r   r   rS   r   s          r1   addmmr   )  s2    {{5  1!238MIIbMQ9
 Z !23q83))Q$,,r"224il  3;,,!$))A,!"34tyy|r12tyy|r12Z !23q8366D=%%!T%:C3;,,r2   input2c                    t         j                  r| j                  j                  dvrit	        | j
                  d   dk(        st	        |j
                  d   dk(        r3| j                  d      |j                  d      z  j                  d      S | j                  j                  dk(  rVt	        | j                  d      dk(        rt	        | j                  d      dkD        rt	        |j                  d      dk(        ri| j                  |j                  k(  rPt        t        j                  |       t        j                  |      z   dk        rt        d	   d
xx   dz  cc<   | |z  S t	        | j                  d      dk(        ryt	        |j                  d      dk(        r\t        d	   d
xx   dz  cc<   t        j                  | j                  d      |j                  d      z  dd      j                  d      S t        S )Nr   r   r   rq   r   r   r       r   decompose_mmTr   )r   r   rr   rO   r   r   r   rt   rI   rM   r   rP   numelr   r   r;   )r   r   r   s      r1   mmr   G  s    ''DKK,<,<N,R A!!348MLLOq 9
 NN1%(8(8(;;@@Q@GG{{5 !$))B-1"45%diilQ&67%fkk!n&9:v||+D 1EKK4G GBNOZ 0A50&=  1!238MKKOq 9
 Z 0A5099Q&.."44!Til r2   tensorsc                    dt         j                  dt        ffd}t        t	        ||             t              dk(  rRt        | dt        j                  id   }d   }||j                  k(  r|j                         S |j                  |      S dt              cxk  rt        |       k  r#n n t        j                  j                        S t              dkD  rt        fdD              rd   }t        |j                         }dk  rt        |j                         z   n|j#                  t                      |j%                        j&                  | j)                  dz         j                         S t*        S )	NrD   r'   c                     t        | j                        dk(  rt        | j                  d   dk(        ryt        | j                        k  rt        | j                     dk(        ryy)Nr   r   FT)r^   r   r   )rD   rT   s    r1   non_empty_tensorzcat.<locals>.non_empty_tensoru  sU    " qww<1
a!@QWW.1B"Cr2   r   type_promotion_kindr   rM   c              3   ,   K   | ]  }|d    u   yw)r   NrB   ).0tfiltered_tensorss     r1   	<genexpr>zcat.<locals>.<genexpr>  s!      )%&a  )s   )rP   Tensorboolr*   filterr^   r   r   DEFAULTrM   clonetors   catdefaultallr   insertr   expandflattenr;   )r   rT   r   promoted_dtype
filtered_tinpr   r   s    `     @r1   r   r   p  s   
ELL T 2 F#3W=>
!+
 ? G G
  &a(
 !1!11 	
 ^4	

 
S!"	1S\	1xx 0#66 q S )*:) & q!SYY&)AgcC		N"3S#./0(s}}S!((%088cAgFLLNN r2   c                 "   | j                         ret        j                  t        j                  | j                        t        d      t        j                  | j                  | j                              S t        | t        j                        \  }}t        j                  t        j                  || j                        }t        j                  | dk  |d      }t        j                  t        j                  |       t        d      |      S )Nnan)r   rM   rr   r   g        )
is_complexrP   whereisnanrealfloatatan2imagr   r   INT_TO_FLOATscalar_tensormathpirr   )rD   rz   rM   r   rets        r1   angler     s    ||~{{KKuu{{166166/J
 	
 "	;HHHAu 
		TWWE!((	CB
++a!eR
%C;;u{{1~uU|S99r2   yc                H   t        j                  |       xr | j                         }t        j                  |      xr |j                         }|r|st        S d}| j                  dk(  r|j                  dk(  rd}| j                  dk(  r| j                  d      } |j                  dk(  r|j                  d      }|}|||z  }t        j                  | j                  |j                        }dt         j                  dt         j                  fd}| dz   } |dz   } || j                  | j                  j                              }	 ||j                  |j                  j                              }
t        j                  |	|
z   d	      j                  |      }|r|d   S |S )
NFr   Tr   rV   r'   c                     | j                   ^ }}|dz  dk7  rt        d      g ||dz  d}| j                  |      }|S )zNReshape tensor from [*initial_dims, last_dim] to *initial_dims, last_dim/2, 2]rq   r   zQThe size of the last dimension must be even to reshape it to [..., last_dim/2, 2])r   AssertionErrorview)rV   initial_dimslast_dim	new_shapereshaped_tensors        r1   reshape_tensor_complexz#add.<locals>.reshape_tensor_complex  s^     #),,x a<1 c 
 6l5HM515	 ++i0r2   )	start_dim)rP   	is_tensorr   r;   ndimreshapepromote_typesrM   r   r   r   r   )rD   r   rS   x_is_complex_tensory_is_complex_tensoroutput_size_zerozcomplex_typer   
x_reshaped
z_reshapedresults               r1   addr     sZ     //!,?//!,?&9vv{qvv{vv{IIaLvv{IIaL	AAI&&qww8Lu||  $ 	
AA	AA'qvv||(<=J'qvv||(<=J]]:
2bAFF|TFayMr2   c                 2    | j                         rt        S | S r9   )r   r;   r   s    r1   conj_physicalr     s    Kr2   c                     | S r9   rB   r   s    r1   liftr     s    Kr2   otherc                 b    t        j                  t        j                  |      || kD  z  | |      S r9   rP   r   r   r   r   s     r1   fminr   	  '    ;;u{{5)UT\:D%HHr2   c                 b    t        j                  t        j                  |      || k  z  | |      S r9   r   r   s     r1   fmaxr     r   r2   Fr   c                 x    | j                   t        j                  k(  rt        j                  | ||      S t        S Nr   )rM   rP   r   anyr;   r   rT   r   s      r1   amaxr     -     zzUZZyy388r2   c                 x    | j                   t        j                  k(  rt        j                  | ||      S t        S r   )rM   rP   r   r   r;   r   s      r1   aminr     r   r2   startlengthc                 N    t        j                  | |||      j                         S r9   )rP   narrowr   )r   rT   r   r   s       r1   narrow_copyr   )  s"     <<c5&17799r2   c                 J    t         j                  | |      j                         S r9   )rs   r   r   )r   rI   s     r1   view_copy_defaultr   3  s    
 99T4 &&((r2   rM   c                 @    | j                  |      j                         S r9   )r   r   )r   rM   s     r1   view_copy_dtyper   ;  s    
 775>!!r2   c                     t        j                  |       }|D cg c]  }| j                  |    }}dgt        |      z  }t	        |      D ]
  \  }}|||<    ||fS c c}w r]   )utils3compute_elementwise_output_logical_to_physical_permr   r^   r_   )r   r[   rd   r   permutationrc   s         r1   _get_shape_permutation_liker  C  ss     OOPTUO$34qTZZ]4E4#E
"K/* 1A ; 5s   A)rM   layoutrr   
pin_memoryrequires_gradmemory_formatr  rr   r  r  r	  c          	         || j                   n|}|| j                  n|}|| j                  n|}|t        j                  k7  r8t        j
                  | j                  ||||||      }|j                  |      S |t        j                  k(  sJ t        |       \  }	}
t        j
                  |	||||||      }|
t        t        t        |
                  k(  r|S |j                  |
      j                         S )N)rM   r  rr   r  r  r	  )rM   r  rr   rP   preserve_formatrQ   r   r   stridedr  r*   ru   r^   ra   r   )r   rJ   rM   r  rr   r  r  r	  r   r   r  s              r1   	full_liker  P  s      -DJJUE"NT[[F"NT[[F---JJ!'
 yy}y55 &&&8>{!'
 $uS%5677M~~k*0022r2   )rM   rr   r	  rand_fn.c                j   ||j                   n|}||j                  n|}|t        j                  k7  r& | |j                  f||d|j                  |      S t        |      \  }} | |f||d|}|t        t        t        |                  k(  r|S |j                  |      j                         S )Nr   r  )rM   rr   rP   r  r   r   r  r*   ru   r^   ra   r   )	r  r   rM   rr   r	  rK   r   r  r   s	            r1   
_rand_liker  }  s      -DJJUE"NT[[F---JJ

 	

 "="
)	* 5T:E; 	F d5[!1233>>+&,,..r2   c                 8    t        t        j                  | fi |S r9   )r  rP   randr   rK   s     r1   	rand_liker    s    ejj$1&11r2   c                 8    t        t        j                  | fi |S r9   )r  rP   randnr  s     r1   
randn_liker    s    ekk42622r2   highc                 v    t        t        j                  t        j                  j
                  d|      | fi |S r]   r  	functoolspartialrs   randintlow)r   r  rK   s      r1   randint_liker     s-    i''(8(8!TBDSFSSr2   r  c                 v    t        t        j                  t        j                  j
                  ||      | fi |S r9   r  )r   r  r  rK   s       r1   randint_like_lowr"    s/     i''(8(8#tDdUfUUr2   c                 F    t        j                  j                  d| |fi |S r]   )rs   r  r  )r  rI   rK   s      r1   r  r    s"     <<AtT4V44r2   biasc                     t         j                  j                  j                  |      }t         j                  j                  j	                  | |||j                         d         S r]   )rP   r&   
_quantized$wrapped_fbgemm_pack_gemm_matrix_fp16!wrapped_fbgemm_linear_fp16_weightrI   )rf   rg   r$  packed_weights       r1   #linear_dynamic_fp16_unpacked_weightr*    sO     II((MMfUM99AA}dFKKM!$4 r2   input_scaleinput_zero_pointweight_scaleweight_zero_point	out_scaleout_zero_pointout_channelc
           	          t         j                  j                  j                  ||||      }
t         j                  j                  j	                  | |||
|||	      S r9   )rP   r&   r&  _wrapped_linear_prepack#_wrapped_quantized_linear_prepacked)rf   r+  r,  rg   r-  r.  r$  r/  r0  r1  r)  s              r1   wrapped_quantized_linearr5    s\     II((@@/M 99CC r2   packedc                     dt         j                  dt         j                  fd} || dddf         } || ddd f         }| dd df   j                  t         j                        |z  |z   S )Nu8r'   c                      fddD        \  }}}}t         j                  dk(  r4||dz  z   |dz  z   |dz  z   j                  t        j                        d   S |dz  |dz  z   |dz  z   |z   j                  t        j                        d   S )Nc              3   f   K   | ](  }d |f   j                  t        j                         * yw.N)r   rP   int32)r   nr8  s     r1   r   zPq_embedding_bag_byte_unpack_decomp.<locals>.bitcast_u8_to_f32.<locals>.<genexpr>  s&     GQbajmmEKK0Gs   .1)r   r   rq      little   r      r;  )sys	byteorderr   rP   float32)r8  rD   r   r   ws   `    r1   bitcast_u8_to_f32z=q_embedding_bag_byte_unpack_decomp.<locals>.bitcast_u8_to_f32  s    G,G
1a==H$aLAG,R8>>u}}MiXX"Wb)Q!V4q8>>u}}MiXXr2   .i)rP   r   r   rD  )r6  rF  scalesoffsetss       r1   "q_embedding_bag_byte_unpack_decomprJ    sz    Yell Yu|| Y vc2b5j12FsBCx 01G#ss(u}}-6@@r2   agridinterpolation_modepadding_modealign_cornersc                     | j                   t        j                   d      k(  xr' |dk(  xr  | j                  t        j                         }t	        | |||||      }|S )Nr   r   r  )rL  rM  rN  rO  _expand_grid)rr   rP   is_contiguouscontiguous_formatdecomp_grid_sampler_2d)rK  rL  rM  rN  rO  rQ  outputs          r1   grid_sampler_2drV    sm     	
ELL'' 	C!#	COO%*A*AOBL $	-!#!F Mr2   left_tensorsright_tensorsscalarc                     t         j                  j                  | t         j                  j                  ||      |      S NrR   )rs   _foreach_addList_foreach_mulr   rW  rX  rY  s       r1   _foreach_addcmul_scalarr`    <     !!d$$\=A "  r2   c                     t         j                  j                  | t         j                  j                  ||      |      S r[  )rs   r\  r]  _foreach_divr_  s       r1   _foreach_addcdiv_scalarrd    ra  r2   start_tensorsend_tensorsc           	          t         j                  j                  | t         j                  j	                  t         j
                  j                  ||       |            S r9   )rs   r\  r]  r^  Scalar_foreach_sub)re  rf  rg   s      r1   _foreach_lerp_scalarrj  (  sL     !!  "";>	
 r2   scalarsc           	          t         j                  j                  | t         j                  j	                  t         j
                  j                  ||       |            S r9   )rs   r\  r]  r^  
ScalarListri  )re  rf  rk  s      r1   _foreach_lerp_scalarlistrn  6  sL     !!$$"";>	
 r2   running_meanrunning_vartrainingexponential_average_factorepsilonc           
          t         j                  | |||||||      \  }}	}
|r||	|
fS ||j                  d      |j                  d      fS )Nr   )rs   native_batch_norm	new_zeros)rf   rg   r$  ro  rp  rq  rr  rs  rK  bcs              r1   miopen_batch_normrz  D  sl     $$"	GAq! 1ay	 r2   c                      i t         t        S r9   )r+   r   rB   r2   r1   fast_random_decompsr|  d  s    5n5 455r2   c                  B    t         j                  rt        S t               S )z"decomps can change based on config)r   fallback_randomr+   r|  rB   r2   r1   select_decomp_tabler  k  s      r2   masksourcec                    ddl m}m}  || j                  |j                        rt
        j                  | |g      \  } }|j                  d      j                  d      dz
  }d | ||fD        \  }}}t
        j                  |||gd      }	t        j                  ||	|      j                  | j                        S t        S )Nr   )BackendFeaturehas_backend_featurer   r   c              3   <   K   | ]  }|j                           y wr9   )r   )r   rD   s     r1   r   z!masked_scatter.<locals>.<genexpr>  s     ,WQQYY[,Ws   )codegen.commonr  r  rr   MASKED_SCATTER_WITH_INDEXrs   broadcast_tensorsr   cumsum_unsafe_masked_indexrP   r   r   r   r;   )
r   r  r  r  r  
source_idx	self_flat	mask_flatsource_flatr   s
             r1   masked_scatterr  r  s     D4;;(P(PQ ++T4L9
d\\"%,,Q/!3
,W4vBV,W)	9k**;	J<QRS{{9fi8==djjIIr2   	quant_min	quant_maxepsc                    t        j                  |       \  }}||z
  t        ||z
        z  }t        j                  |t        j                  |g            }|t        j
                  ||z        j                  t         j                        z
  }t        j                  |||      }|j                  t         j                        |j                  t         j                        fS r9   )rP   aminmaxr   r?   r   r}   r   intrH   float64int64)	rf   r  r  r  rM   min_valmax_valscale
zero_points	            r1   choose_qparams_tensorr    s     }}U+GWw%	I(=">>EIIeU\\3%01EU[[59<<UYYGGJZI>J88EMM"JMM%++$>>>r2   
accumulatec                     | j                         }t        j                  ||g|j                  |j                        |      }|j                  | j                        S r9   )r   rP   	index_putr   r   )r   rU   r  r  	flatteneds        r1   putr    sL     IE7FNN5;;7I TZZ((r2   c                 V    t         j                  | |||      }| j                  |      S )N)r  )rs   r  copy_)r   rU   r  r  r   s        r1   put_r    s(     ((4:(
>C::c?r2   rU  input_dtypec                     | |z  }t        j                  ||d      }t        j                  | ||      }| j                  |k7  r|j                  |      }|j                         S )NTr   )rP   rt   r   fmarM   r   
contiguous)r3   rU  rT   r  new_grad_outputsum_new_grad
grad_inputs          r1   _softmax_backward_datar    sc     "F*O99_#tDL##VG\?KJ K']];/
  ""r2   Tinclude_selfsrcreduction_typer  c                   |dk(  rt        | j                        s| j                  j                  xs | j                  j                  }t	        j
                  |      }|r)| }t	        j
                  |       j                  |||      }	nN| j                  ||d      }t	        j                  |       j                  |||      }	|	j                  |	dk  d      }	|j                  |||      }|r||	z  S ||	z  S t        t        j                  j                  || j                  |j                  |j                  j                  d      rt         S | j"                  |dz   d  j%                         | j"                  d | j%                         z  }
|j%                         g| j"                  |dz   d  | j"                  d | }g t'        | j(                  |z
  | j(                        dt'        d| j(                  |z
        }|j+                  t        j,                        j/                  |
      j1                  |      j3                  |      }| j5                  |||||      S )Nmeanr   r   Tr  )r    rM   is_floating_pointr   rP   	ones_likerZ   
index_fill
zeros_likemasked_fillr!   rs   scatter_reduce_tworr   rO   r;   r   r   ru   r   r   r  repeat_interleaver   ra   scatter_reduce)r   rT   rU   r  r  r  true_divisiononesr   countsrepeatsindex_shaperb   scatter_indexs                 r1   index_reducer    s    (T

) 

44M

8M8Ms#C__T*44S%FF//#ua0C%%d+55c5$GF''
A6FmmC,,sV|?#-?  

		

 jjq#))+djj#.>.D.D.FFG;;=L4::cAgi#8L4::ds;KLKNU499s?DII.NNE!TYY_4MND		7	#				  !   r2   kernel_size	ceil_modec                 2   |dk(  rdg|z  }|dk(  rdg|z  }|s|}t        ||      }t        ||      }t        ||      }t        ||      }t        j                  t        j                  |      }t
        j                  j                  j                  ||      s0|t        j                  t
        j                        j                  kD  rt        S t        j                  | |||||      \  }}	t        j                  |	|| j                   | d  |||      }
||
fS )Nr   r   )n_dim)r   r  reduceoperatormulrP   	_inductorlowering%should_fallback_max_pool_with_indicesiinfoint8r?   r;   prims!_low_memory_max_pool_with_offsets'_low_memory_max_pool_offsets_to_indicesr   )rD   r  ri   rj   rk   r  rT   window_sizevalsrI  r4   s              r1   _max_pool_with_indicesr    s     1}39!|#){C0KHc*H7C(G&#&F""8<<=K 	  FFs 	G 	
 UZZ0444;;	MD' ;;	G =r2   c           	      &    t        | |||||d      S )Nrq   r   r  rD   r  ri   rj   rk   r  s         r1   max_pool2d_with_indicesr  -        "	;9! r2   c           	      &    t        | |||||d      S )Nr>  r   r  r  s         r1   max_pool3d_with_indicesr  ;  r  r2   output_sizec                     | j                   ^ }}}|\  }}|dk(  s|dk(  r:g |||}| j                  |      | j                  |t        j                        fS ||z  dk(  r(||z  dk(  r ||z  ||z  g}t        j                  | |      S t        S )Nr   r   )r   	new_emptyrP   r  rs   r  r;   )	rD   r  batchh_inw_inh_outw_outo_sizer  s	            r1   adaptive_max_pool2dr  I  s     UD$LE5zUaZ'5'%''{{6"AKKekkK$JJJe|qTE\Q.u}dem4++A{;;r2   	out_int32rightsidesortersorted_sequencer  r  r  r  c                ~    t         j                  | t        j                  |g| j                        ||||      d   S )Nrr   r  r   )rs   searchsortedrP   rV   rr   )r  r   r  r  r  r  s         r1   searchsorted_scalarr  [  sK     dVO$:$:;   	 	r2   noiselowerupper	generatorc                    |rS| dk  }t         j                  | |||      }t        j                  || |z  |       }t        j                  ||d      }	||	fS ||z   dz  }
t         j	                  | |
      t        j
                         fS )Nr   )r  r   rq   )rs   uniformrP   r   
leaky_relur   )r   r  r  r  rq  r  not_positiverrU  	noise_outnegative_slopes              r1   rrelu_with_noise_functionalr  o  s     qyLLueyLA\4!8T:KKa3	y  %-1,t^4ellnDDr2   repeatc                    t         j                  j                  rt        S |t	        |      t
        urt        S | j                  j                  dk(  rt        S | j                  t        j                  t        j                  fv sJ | j                  dk(  sJ | j                  d      }t        j                  || j                        }t        j                  ||| j                  t        j                  k(  d      S )Nr   r   r   r  T)r  r  )r   tritonautotune_at_compile_timer;   rO   r  rr   rM   rP   r<  r  r   r  aranger  )r  r  r  poss       r1   repeat_interleave_Tensorr    s    
 }}-- d;/s:}}U"<<EKK5555;;!]]1F
,,{6==
9C ;D r2   )NNru  r9   )Nr   r   )NF)r   r   F)r   )F)Nr   r   F)g      ?gUUUUUU?FN)r  loggingr   r  rB  typingr   r   r   r   r   typing_extensionsr   r	   rP   torch._decomp_decompr.   torch._prims_common_prims_commonr  $torch.ao.quantization.fx._decomposedr
   r   r   torch._decomp.decompositionsr   rT  r   r   r<   r   r   $torch._decomp.decompositions_for_rngr   torch._dynamo.utilsr   torch._environmentr   !torch._higher_order_ops.out_dtyper   torch._inductor.utilsr   r   r   r   %torch.fx.experimental.symbolic_shapesr   r    r   r   r   r    r!   r"   r#   _opsOperatorBaseOpOverloadPacketr$   __annotations__	getLogger__name__r,   r&   rs   r  	quantizedr&  quantized_decomposed_adaptive_avg_pool2d_backwardindex_selectaddmvr   bitwise_and_bitwise_or_
clamp_min_distelu
empty_likeflipgeluhardtanhlcmr  linalg_vector_norm_log_softmax max_pool2d_with_indices_backward_native_batch_norm_legit#_native_batch_norm_legit_functional$_native_batch_norm_legit_no_training_batch_norm_with_update"_batch_norm_with_update_functional_batch_norm_no_updatebatch_norm_backwardrv  native_group_normnative_layer_normnll_loss2d_backwardpermute_copyrrelu_with_noise_backward_softmaxsin_sqrt__to_copytril_indicestriu_indicesunbind_copyr  upsample_bilinear2dvecr*  r5  inductor_decompositionsr+   _unsafe_indexr  #_unsafe_masked_index_put_accumulate+_scaled_dot_product_flash_attention_for_cpur   r  rG   rF   rZ   gluselect_scatterslice_scattersplitr   r   rt   unbindbaddbmmr%   r*   
OpOverloadr/   r   r=   rC   SymInttypesNumberrH   rQ   re   rv   tupler}   r{   r   r   rM   r   r   r   r   r   r   r   detach_r   r   r   r   r   	view_copyr   r   	ShapeType
StrideTyper  r  r  r   r  rr   r	  r  r  r  r   	low_dtyper"  r  embedding_bag_byte_unpackrJ  rV  _foreach_addcmulrh  r`  _foreach_addcdivrd  _foreach_lerprj  rm  rn  rz  py_impl_CDispatchKeyAutogradcachedictr|  r  r  choose_qparamsrV   r  r  r  r  strr  r  r  r  r  r  r  	Generatorr  r  rB   r2   r1   <module>ra     s       
  : : 2   # + 
  F ( ( 7 . 
 X $  T]t_#	JJUZZ888 )  g!yy~~		II	YY!!
yy55 ,+**++ 	

+ 		+
 	+ 	+ 	+ 			+ 	+ 	+ 			+ 			+ 	+ 	+ 	+  	!+" 	#+$ 	--%+& 	%%'+( 	00)+* 	11++, 	$$-+. 	///+0 	""1+2 	  3+4 	5+6 	7+8 	9+: 	  ;+< 	=+> 	&&?+@ 	A+B 			C+D 	

E+F 	G+H 	I+J 	K+L 	M+N 	O+P 	  $$Q+R 	55S+T 	++U+- \ K,.J2IJ
 	,,44<<NNNN!!NNHHJJLLHHKKLL#W Duzz44ejj6Q6QQRS ( n&8 9>	&6!77	8>xB (2r6"223> 6678\\  	
  \\ 9" ::BBCD )-(,	LL 
%++$$	% 
%++$$	%	
 
 E %# )-(,	||		%++$$	%	 
%++$$	%	 \\		 $ &	 $	
uS%,,&'
(	""	 	 \\		 %	 () !"M||M	M <<M LL	M ;;M \\M *M* ,,4456S
uS%,,&'
(S#YS S \\	S 7S 2234..<<. LL. S		.
 #tCy.!. 3S	>". CcN#. . I. . d. 5<<u||34. 5.@ ,,-.G G GU\\ G /G
 
# (,
,,LL $ \\	  $0 %
 (,  !
,,
,, ,, $	
 ++

 ;; \\  &8 	" (, 
,, LL  $  \\	   # N ))*+ :%,,:	: \\: ,:z %:U\\ :ell : &:& 
#
 +/	7||7||7 EKK&&'	7
 \\7 $7t ++,-   . DLL12u||   3 EJJ/0Iu|| IELL IU\\ I 1I EJJ/0Iu|| IELL IU\\ I 1I 		" 
,,	#  \\	 # 		" 
,,	#  \\	 # ))*+:
,,:	: : 	:
 \\: ,: //01)
,,)
uS%,,&'
() \\) 2) --./"
,,";;" \\" 0"
 
,,
 
5??E,,,-
  '
 $(%)%)).)>)>)3
,,)3c5j!)3 EKK 	)3
 U\\")3 U\\")3 )3 )3 &&)3 \\)3 ()3` $(%)).)>)>/c5<<'(/
,,/ EKK 	/
 U\\"/ &&/ / \\/@ '2ELL 2C 2ELL 2 (2 (3U\\ 3S 3U\\ 3 )3 ))112Tu|| T3 T# T%,, T 3T ))334V
,,V V(+V7:V
\\V 5V ,,-5
5
uS%,,&'
(5 5 \\	5 .5 	EEMMN $(<<LL 5<<
  \\	 O 
;;CCD<< ll LL	
 ,, || ,, || LL  \\ E4 		++EEF
Au|| 
A 
A G
A --./  ||
,,  	
  \\  0: --445
 	
u||
u||$ % 	
 
%,, 6 --445
 	
u||
u||$ % 	
 
%,, 6 **112
%
ell#
 KK
 
%,,	
 3
 **556
%
ell#
 %++$$%
 
%,,	
 7
 ''(<(<(E(EF../<<LL //%,,
' //%,,/	
 .  !&  5<<u||34 0 G< 6T#xS'9"9: 6 6!T#xS'9"9: ! ++,
,,
,, LL \\	 -$ ,;;BBC?<<?? ? 
	?
 ;;? 5<<%&? D? !
 	
)
,,
)<<
) LL
) 	
)
 \\
) "
) 		"
 	
,,<< LL 	
 \\ # 33;;<##LL# 
# 	#
 \\#  =#( ))* 1
,,1	1 <<1 
	1
 1 1 \\1 +1h1||1c1 U3S	>*+1 3S	>"	1
 CcN#1 1 
1 5<<%&1h 445 /3%&&'
||
c
 U3S	>*+
 3S	>"	

 CcN#
 
 5<<%&
 6
 445 /3%&&'
||
c
 U3S	>*+
 3S	>"	

 CcN#
 
 5<<%&
 6
 001||"&s)
5<<%& 2" ))001
 %)	\\	
++

	 		
 	 3-	 U\\"	 \\	 2	& 889 %+/E
,,E<<E E 	E
 E (E 5<<%&E :E& ..556 "&LL# \\ 7r2   