
    Vh|\                    bV   U d dl Z d dlZd dlmZ d dlmZ d dlmZmZ d dl	m
Z
mZ d dl	Z	d dlZd dlmc mZ d dlmZ d dlmZ d dlmZ d d	lmZmZmZ d d
lmZmZmZmZm Z m!Z!m"Z"m#Z#m$Z$m%Z%m&Z& d dl'm(Z( d dl)m*Z*m+Z+m,Z,m-Z-m.Z.m/Z/m0Z0m1Z1m2Z2m3Z3m4Z4m5Z5m6Z6m7Z7 d dl8m9Z9m:Z:m;Z;m<Z<m=Z=m>Z>m?Z? d dl@mAZA d dlBZBe j                  j                  e j                  j                  j                  j                  e j                  j                  j                  j                  e j                  j                  j                  j                  e j                  j                  j                  j                  gZHeIeA   eJd<   e j                  j                  e j                  j                  e j                  j                  e j                  j                  j                  j                  e j                  j                  j                  j                  hZOePeQ   eJd<   g  e
j                  eHD  cg c]#  } | j                  D cg c]  } eT| |       c}% c}}       ZUeIeQ   eJd<   eUD cg c]	  }|eOvs| c}ZUi ZVeWeQeXf   eJd<   eHD ]W  ZYeYj                  D ]F  ZZ eTeYeZ      Z[eYj                  j                  dd      j                  dd      Z^e[eVvs=e^ deZ eVe[<   H Y  edd      Z_ G d de      ZCd Z` G d d      Za G d d      Zb G d  d!e      Zc G d" d#      Zd G d$ d%      Zed& Zfd' Zgd( Zhd) Zid* Zjd+ Zkd, Zld- Zmd. Znd/ Zod0 Zpd1 Zqd2 Zrd3 Zsd4 Ztd5 Zud6 Zvd7 Zwd8 Zxd9 Zyd: Zzd; Z{d< Z|d= Z}d> Z~d? Zd@ ZdA ZdB ZdC ZdD ZdE ZdF ZdG ZdH ZdI ZdJ ZdK ZdL ZdM ZdN ZdO ZdP ZdQ ZdR ZdS ZdT ZdU ZdV ZdW ZdX ZdY ZdZ Zd[ Zd\ Zd] Zd^ Zd_ Zd` Zda Zdb Zdc Zdd Zde Zdf Zdg Zdh Zdi Zdj Zdk Zdl Zdm Zdn Zdo Zdp Zdq Zdr Zds Zdt Zdu Zdv Zdw Zdx Zdy Zdz Zd{ Zd| Zd} ZddZd Zd Zd Zd Zd Zd Zd Zd Zd Zd Zd Zd Zd Zd Zd Zd Z e(ej                  ddexr e= d       e(ej                  ddexr e= d       e(ej                  ddexr e= d       e(ej                  ddexr e=e j                  fd       e( e&dg      ddd       e( e&dg      ddd      fZd Zd Zd Zd Zd Zd Ze j                  j                  j                         xr) e j                  j                  j                  dd       Zg  eee j                  j                  ev e(e%      f       eee j                  j                  e<ew e(e%       e(ej                  dd eBj                  d            f       eee j                  j                  e<ex e( ej                  d      dd       e(e%      f       eee j                  j                  ey       eee j                  j                  e<ez       eee j                  j                  e<e{ e( ej                  d      dd       e(e%      f       eee j                  j                  es       eee j                  j                  et e(ej                  dd eBj                  d      d       e(e;de j                  gd      f       eee j                  j                  eue< e( ej                  d      dd       e(e%      f       eee j                  j                  de| e(ej                  dd eBj                  d             e(ej                  dd eBj                  d            f       eee j                  j                  de} e(edd eBj                  d             e(ej                  dd eBj                  d             e(ej                  dd eBj                  d            f       eee j                  j                  de~ e(e%       e(ej                  dd eBj                  d             e(ej                  dd eBj                  d            f       eee j                  j                  e e(ej                  ddde j                  g      f       eee j                  j                   eedd~      e<d e( e!d      dd       e(e"dde j                  g       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd      f       eee j                  j                   eedd~      e<d e( e!d      dd       e(e"dde j                  g       e(ej                  ddde j                  g       e(ej                  ddde j                  e j                  g       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd      f       eee j                  j                   eedd~      e<d e( e!d      dd       e(e"dde j                  g       e(e%d       e(ej                  dd      f e( e#e j                  di      dd      f       eee j                  j                   eedd~d      e<d ee j                         e( e!d      dd       e(e"dde j                  g       e(ej                  dde j                  fd       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd       e( e#e j                  di      dd      fë       eee j                  j                   eedd~d      e<d ee j                         e( e!d      dd       e(e"dde j                  g       e(ej                  dde j                  e j                  e j                  f       e(ej                  ddde j                  e j                  g       e(ej                  ddde j                  e j                  g       e(ej                  dde j                  fd       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd       e( e#e j                  di      dd      fë       eee j                  j                   eedd~d       ee j                        e<d e( e!d      dd       e(e"dde j                  g       e(e%       e(ej                  dd       e(ej                  ddde j                  e j                  ge=ī       e(ej                  dde j                  fd      f e( e#e j                  di      dd       e( e#e j                  di      dd       e( e#e j                  di      dd      fū       eee j                  j                  e e( ej                  d      dd      f       eee j                  j                  e e(ej                  ddde j                  g      f       eee j                  j                  ee< e(e%       e( ej                  d      dd      f       eee j                  j                  ee< e(e%       e( ej                  d      dd      f       eee j                  j                  e e( ej                  d      dd      f       eee j                  j                  e e( ej                  d      dd       e(e:dde j                  gd      f       eee j                  j                   eedd      e<d e( e!d      dd       e(e"dde j                  g       e(e$       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd      f       eee j                  j                    eedd      e<d e( e!d      dd       e(e"dde j                  g       e(e$       e(ej                  ddde j                  g       e(ej                  ddde j                  e j                  g       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd      f       eee j                  j                   eedd      e<d e( e!d      dd       e(e"dde j                  g       e(e$       e(e%       e(ej                  dd      f e( e#e j                  di      dd      f       eee j                  j                   eeddd      e<d e( e!d      dd       e(e"dde j                  g       e(e$       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd      f       eee j                  j                   eeddd      e<d e( e!d      dd       e(e"dde j                  g       e(e$       e(ej                  ddde j                  g       e(ej                  ddde j                  e j                  g       e(e;ddde j                  g       e(e;ddde j                  g      f e( e#e j                  di      dd      f       eee j                  j                   eeddd      e<d e( e!d      dd       e(e"dde j                  g       e(e$       e(e%       e(ej                  dd      f e( e#e j                  di      dd      f       eee j                  j
                  ef e( ej                  d      dd      f       eee j                  j                  eg e( ee j                   e ddƫ      e j                   e ddƫ      i      dddȬ      g e( ej                  d      dd       e(ej                  ddde j                  g      fɫ       eee j                  j                  e e( ej                  d      dd       e( ej                  d      dd      f       eee j                  j                  e e( ej                  d      dd       e( ej                  d      dd       e(ej                  dd eBj                  d      d      f       eee j                  j                  e e( ej                  d      dd       e( ej                  d      dd       e( ej                  d      dd       e(e:d      f       eee j                  j                  e       eee j                  j                  e       eee j                  j                  ee< e(e:d      f       eee j                  j                  eh e( ej                  d      dd       e( ej                  d      dd       e( ej                  d      dd       e( ej                  d      dd      f       eee j                  j                  el e( ej                  d      dd       e(e;ddde j                  g       e(ej                  ddde j                  g      f       eee j                  j                  e e( ej                  d      dd      f       eee j                  j                  e e( ej                  d      dd       e(e:dd       e( ej                  d      dd      f       eee j                  j                   e e( ej                  d      dd       e(e:dd       e( ej                  d      dd      f       eee j                  j"                  e e( ej                  d      dd       e(ej                  ddde j                  g      f       eee j                  j$                  e e( ej                  d      dd      f       eee j                  j&                  ei e( ej                  d      dd       e(ej                  ddde j                  g      f       eee j                  j(                  ej e( ej                  d      dd      f       eee j                  j*                  ek e( ej                  d      dd      f       eee j                  j,                  e e( ej                  d      dd      f       eee j                  j.                  e e( ej                  d      dd       e(ej                  ddde j                  g      f       eee j                  j0                  e e( ej                  d      dd       e(e:de j                  gd      f       eee j                  j2                  e e( ej                  d      dd       e(e:de j                  gd      f       eee j                  j4                  e edd~ʫ       e(ej                  dd       e( ee j                   e dd̬ƫ      i      dde j                  gdȬ       e(ej                  dde j                  gd      fͫ       eee j                  j6                  e e( ej                  d      dd       e(e:dd       e( ej                  d      dd       e( ej                  d      dd       e( ej                  d      dd      f       eee j                  j8                  e e(ej                  ddde j                  g      f       eee j                  j:                  e       eee j                  j<                  e eddΫ       e( ej                  d      dd       e( ee j                   e ddƫ      i      dddȬ       e( ej                  d      ddd       e( ej                  d      ddd       e( ej                  d      dde=d      fϫ       eee j                  j>                  e e(ej                  ddd       e(ej                  ddd       e(ej                  ddd       e(ej                  ddd       e(ej                  ddd      f       eee j                  j@                  eerdn) e(ej                  dd eBj                  d      d      fd~ҫ       eee j                  jB                  e       eee j                  jD                   eedӫ      d e( ej                  d      dd      fԫ       eee j                  jF                   eedӫ      d e( ej                  d      dd      fԫ       eee j                  jH                   eedӫ      d e(edd       e(edd       e(eddǫ       e(edd֫       e(eddѫ       e( ej                  d      dd      fԫ       eee j                  jJ                  e e(edd       e(edd       e(eddǫ       e(eddЫ       e(edd֫       e(eddѫ      f       eee j                  jL                  e e( ej                  d      dd      f       eee j                  jN                  e       eee j                  jP                  de e( ej                  d      dddȬ      g e( ej                  d      dd       e(ej                  dd׫      fث       eee j                  jR                  de e( ee j                   e ddƫ      i      ddde>٫       e( ee j                   e ddڬƫ      i      ddd       e( ej                  d      dddȬ      g e( ej                  d      dd      fث       eee j                  jT                  e e( ej                  d      dddȬ      g e( ej                  d      dd      fɫ       eee j                  jV                  ed e( ej                  d      dddȬ      g e( ej                  d      dd      f۫       eee j                  jX                  de e( ej                  d      dd      f       eee j                  jZ                  e e( ee j                   e ddƫ      i      ddd      g e( ej                  d      dd      fɫ       eee j                  j\                  eerdn) e(ej                  dd eBj                  d      d      f       eee j                  j^                  e       eee j                  j`                  e e(e%      f       eee j                  jb                  e e(e%      f       eee j                  jd                   eedܫ      eҬݫ       eee j                  jf                  eeҬݫ       eee j                  jh                  eeӬݫ       eee j                  jj                  eerdn) e(ej                  dd eBj                  d      d      f       eee j                  jl                  e e(ej                  ddde j                  g      f       eee j                  jn                  e       eee j                  jp                  e       eee j                  jr                  e e( ej                  d      dd       e(ej                  ddde j                  g      f       eee j                  jt                  e e( ej                  d      dd       e(ej                  ddde j                  g      f       eee j                  jv                  e e( ej                  d      dd      f       eee j                  jx                  e e(e%      f       eee j                  jz                  e e(e%      f       eee j                  j|                  e       eee j                  j~                  eerdn) e(ej                  dd eBj                  d      d      f       eee j                  j                  eerdn) e(ej                  dd eBj                  d      d      f       eee j                  j                  e e(e%      f       eee j                  j                  e e(e%      f       eee j                  j                  d eedܫ      eeѬޫ       eee j                  j                  d eed~ܫ      eeѬޫ       eee j                  j                  dee e(e%      feѬ߫       eee j                  j                  e       eee j                  j                  ee< e( ej                  d      ddd       e( ej                  d      ddd      f       eee j                  j                  ee< e( ej                  d      ddd       e( ej                  d      ddd      f       eee j                  j                  eì       eee j                  j                  ee< e( ej                  d      ddd       e( ej                  d      ddd      f       eee j                  j                  ee< e( ej                  d      ddd       e( ej                  d      ddd      f       eee j                  j                  e e(e%      f       eee j                  j                  eƬ       eee j                  j                  e e(ej                  ddd      f       eee j                  j                  e e(ej                  ddd      f       eee j                  j                  eeլݫ       eee j                  j                  ee֬ݫ       eee j                  j                  ee e(ej                  dd      f       eee j                  j                  eɬ       eee j                  j                  e e(ej                  ddd      f       eee j                  j                  e e(ej                  ddd      f      ZVeIee   eJd<   yc c}w c c}} w c c}w )    N)deepcopy)Enum)wrapspartial)chainproduct)pack_padded_sequence)make_tensor)
TEST_CUDNN)floating_typesfloating_and_complex_types_andget_all_fp_dtypes)_TestParametrizer_update_param_kwargsexpectedFailureMPStoleranceOverridetolskipCUDAIfCudnnVersionLessThanskipCUDAIfRocmprecisionOverrideskipMetaskipMPSskipCUDAVersionIn)DecorateInfo)cosineembeddingloss_referencecross_entropy_loss_referencectcloss_referencehingeembeddingloss_referencehuberloss_referencekldivloss_referencemarginrankingloss_referencemultimarginloss_referencemultilabelmarginloss_referencenllloss_referencenlllossNd_referencesmoothl1loss_referencesoftmarginloss_referenceget_reduction)freeze_rng_state	skipIfMPSskipIfMPSOnMacOS13GRADCHECK_NONDET_TOLTEST_WITH_ROCM
IS_WINDOWSskipIfTorchDynamo)
ModuleTypeMODULE_NAMESPACESMODULES_TO_SKIPMODULE_CLASSESMODULE_CLASS_NAMESztorch. z.modules.TrainEvalMode)
train_only	eval_onlytrain_and_evalc                   >    e Zd ZdZdej
                  dfdZd Zd Zy)moduleszQ PROTOTYPE: Decorator for specifying a list of modules over which to run a test. NTc                 h    t        |      | _        |t        |      nd | _        || _        || _        y N)listmodule_info_listsetallowed_dtypestrain_eval_modeskip_if_dynamo)selfmodule_info_iterablerB   rC   rD   s        V/home/dcms/DCMS/lib/python3.12/site-packages/torch/testing/_internal/common_modules.py__init__zmodules.__init__M   s5     $%9 :5C5Oc.1UY.,    c                 X   g }| j                   t        j                  k(  s| j                   t        j                  k(  r|j	                  d       | j                   t        j
                  k(  s| j                   t        j                  k(  r|j	                  d       |j                  s|d d }|S )NTF   )rC   r7   r8   r:   appendr9   train_and_eval_differ)rE   module_infotraining_flagss      rG   _get_training_flagszmodules._get_training_flagsT   s      M$<$<<$$(D(DD!!$'  M$;$;;$$(D(DD!!%( 00+BQ/NrI   c           
   #   P  K   |t        d      | j                  D ]U  }t        |j                  |j                              }| j
                  |j                  | j
                        }| j                  |      }t        ||      D ]  \  }}|j                  }	t        |      dkD  r|	d|rdnd z  }	d|i}
t        |
d|       t        |
d|       	 t              fd	       }| j                  r?t        j                  j                   j"                  j$                  s t'        d
      |      }t)        |j*                  |j,                  j,                  |j                  |      }||	|
|f  X y # t.        $ r#}t1        d|	 d|j2                   d       |d }~ww xY ww)NzThe @modules decorator is only intended to be used in a device-specific context; use it with instantiate_device_type_tests() instead of instantiate_parametrized_tests()rK   _
train_mode	eval_moderN   dtypetrainingc                       | i |S r>    )argskwargstests     rG   test_wrapperz/modules._parametrize_test.<locals>.test_wrapper~   s    #T4V44rI   z/Policy: we don't run ModuleInfo tests w/ DynamozFailed to instantiate z for module !)RuntimeErrorr@   rA   supported_dtypesdevice_typerB   intersectionrP   r   formatted_namelenr   r   rD   torchtesting	_internalcommon_utilsTEST_WITH_TORCHINDUCTORr/   r   get_decorators__name__	Exceptionprintname)rE   r[   generic_cls
device_clsrN   dtypesrO   rV   rU   	test_nameparam_kwargsr\   decorator_fnexs    `            rG   _parametrize_testzmodules._parametrize_testd   s      B C C  00 "	K55j6L6LMNF"".,,T-@-@A!55kBN%,^V%D !5 (66	~&*1X\;$O!PPI !.{;$\7EB$\:xH4[5 !5 **5==3J3J3W3W3o3o'k'89j'klx'y#*;+E+E{G[G[+/==*:P:PRW$YL (L,OO1"	> ! 29+\+JZJZI[[\]^Hs+   CF&BE71F&7	F# FF##F&)	rj   
__module____qualname____doc__r7   r:   rH   rP   ru   rX   rI   rG   r<   r<   J   s"    [<@!.!=!=d- (rI   r<   c                 <    | t         v r	t         |    S | j                  S r>   )r4   rj   )
module_clss    rG   get_module_common_namer{      s"    ''!*--"""rI   c                       e Zd ZdZddgZd Zy)FunctionInputz: Contains args and kwargs to pass as input to a function. rY   rZ   c                      || _         || _        y r>   )rY   rZ   )rE   rY   rZ   s      rG   rH   zFunctionInput.__init__   s    	rI   Nrj   rv   rw   rx   	__slots__rH   rX   rI   rG   r}   r}      s    D"IrI   r}   c                        e Zd ZdZg dZddZy)ModuleInputzA Contains args / kwargs for module instantiation + forward pass. constructor_inputforward_inputdescreference_fnNc                 x    || _         || _        || _        | _        t	              fd       }|| _        y y )Nc                 x    t        |      t        |      }} | t        | j                               g|i |S r>   )r   r?   
parameters)mrY   rZ   r   s      rG   copy_reference_fnz/ModuleInput.__init__.<locals>.copy_reference_fn   s;      (~x/?f $AtALLN';MdMfMMrI   )r   r   r   r   r   )rE   r   r   r   r   r   s       ` rG   rH   zModuleInput.__init__   sP    !2*	(#< N !N !2D $rI   )Nr5   Nr   rX   rI   rG   r   r      s    KNI2rI   r   c                       e Zd ZdZdZdZy)ModuleErrorEnumz7 Enumerates when error is raised when testing modules. r   rK   N)rj   rv   rw   rx   CONSTRUCTION_ERRORFORWARD_ERRORrX   rI   rG   r   r      s    AMrI   r   c                   :    e Zd ZdZg dZej                  eddZy)ErrorModuleInputzw
    A ModuleInput that will cause the operation to throw an error plus information
    about the resulting error.
    module_error_inputerror_on
error_typeerror_regex)r   r   c                <    || _         || _        || _        || _        y r>   r   )rE   r   r   r   r   s        rG   rH   zErrorModuleInput.__init__   s"     #5 $&rI   N)	rj   rv   rw   rx   r   r   r   r^   rH   rX   rI   rG   r   r      s"    
 PI
 *<<(		'rI   r   c                       e Zd ZdZdd e       ej                  ej                  fej                  ej                  fddddddddZ	d	 Z
d
 Zed        Zed        Zy)
ModuleInfoz+ Module information to be used in testing. rX   NT        F)skips
decoratorsrp   dtypesIfMPSdtypesIfHpusupports_gradgradgradcheck_nondet_tolmodule_memformat_affects_outrM   module_error_inputs_funcgradcheck_fast_modec                @   || _         || _        g |r|ng |r|ng | _        || _        || _        || _        || _        |	| _        |
| _        || _	        || _
        || _        t        |t        j                  j                  j                   j"                        | _        y r>   )rz   module_inputs_funcr   rp   r   r   r   r   r   rM   r   r   
issubclassrd   nnr<   lazyLazyModuleMixinis_lazy)rE   rz   r   r   r   rp   r   r   r   r   r   rM   r   r   s                 rG   rH   zModuleInfo.__init__   s    & %"4Z:Z2Z5%VXZ&&!2$8!,H)%:"(@%#6 !*ehh.>.>.C.C.S.STrI   c                     g }| j                   D ]U  }t        |t              r2|j                  |||||      s)|j	                  |j                          E|j                  |       W |S r>   )r   
isinstancer   	is_activeextendrL   )rE   
test_classrq   devicerU   rr   result	decorators           rG   ri   zModuleInfo.get_decorators   s_     	)I)\2&&z9fe\ZMM)"6"67i(	) rI   c                 ^    |dk(  r| j                   S |dk(  r| j                  S | j                  S )Nmpshpu)r   r   rp   )rE   r`   s     rG   r_   zModuleInfo.supported_dtypes   s4    %###E!###;;rI   c                 ,    t        | j                        S r>   )r{   rz   rE   s    rG   rm   zModuleInfo.name  s    %doo66rI   c                 :    | j                   j                  dd      S )Nr6   rR   )rm   replacer   s    rG   rb   zModuleInfo.formatted_name	  s    yy  c**rI   )rj   rv   rw   rx   r   rd   float16float32bfloat16rH   ri   r_   propertyrm   rb   rX   rI   rG   r   r      s~    5  &(#mmU]]<#nnemm=#'&).3',*.%)UB 7 7 + +rI   r   c           
      $   t        t        |||      }t        t        dd      t         |d            d       t        t        ddd	      t         |d            d
d       t        t        dd      t         |d            dd       g}|S )Nr   rU   requires_grad
         r   )inputc                     t        j                  ||d   j                               |d   j                  dd      j	                  dd      z   S )Nr   rK   r   r   )rd   mmtviewexpand)r   pr   s      rG   <lambda>z/module_inputs_torch_nn_Linear.<locals>.<lambda>  sE    UXXeQqTVVX5NQRSTQUQZQZ[\^`QaQhQhijlmQn5n rI   r   r   r   Fbiasno_biasc                 P    t        j                  ||d   j                               S )Nr   )rd   r   r   r   r   is      rG   r   z/module_inputs_torch_nn_Linear.<locals>.<lambda>  s    !QqTVVX1F rI   r         no_batch_dimc                     t        j                  |j                  dd      |d   j                               j                  d      |d   z   S )NrK   r   r   )rd   r   r   r   r   s      rG   r   z/module_inputs_torch_nn_Linear.<locals>.<lambda>  s=    !&&B-11R1W1WXZ1[^_`a^b1b rI   r   r
   r   r}   )rN   r   rU   r   rV   rZ   
make_inputmodule_inputss           rG   module_inputs_torch_nn_Linearr     s    V5P]^J 	mB&:"/j6I"J!n	p 	mB&F"/
70C"D"!F	H 	mAq&9"/
1">'!b	dM rI   c                 b   t        t        |||      }ddt        t        ddd      t         |d       |d                  t        t        dddd	
      t         |d       |d            dfd      t        t        ddd      t         |d       |d            dfd      g}|S )Nr   c                     t        j                  d||d   |      }|rp|j                  d   dk(  r|j                  d      |d   z   }|S ||d   j                  dd      j	                  |j                  d   |d   j                  d         z   }|S )Nzbn,anm,bm->bar   rK   r   )rd   einsumshaper   r   )r   r   x1x2r   r   s         rG   bilinear_reference_fnz>module_inputs_torch_nn_Bilinear.<locals>.bilinear_reference_fn&  s    or1Q4<xx{aR1Q4/   !A$))Ar"2"9"9"((1+qtzzRS}"UUrI      r   r   )r   r   )r   r   r   Fr   r   c                      | |||d      S )NFr   rX   r   r   r   r   r   s       rG   r   z1module_inputs_torch_nn_Bilinear.<locals>.<lambda>6  s    6KAqRTVX_d6e rI   r   r   c           	      Z     | ||j                  dd      |j                  dd            S )NrK   r   )r   r   s       rG   r   z1module_inputs_torch_nn_Bilinear.<locals>.<lambda>:  s3    6KAqRTRYRYZ[]_R`bdbibijkmobp6q rI   )Tr   )	rN   r   rU   r   rV   rZ   r   r   r   s	           @rG   module_inputs_torch_nn_Bilinearr   #  s    V5P]^J 	mAq!&<"/
60BJvDV"W!6	8 	mAq!%&H"/
60BJvDV"W"!e	g 	mAq!&<"/
1z!}"M'!q	sM rI   c           
      b   t        t        |||      }di fdddifdddifddd	ifd
d
difg}g }|D ]  \  }	}
|
fd} |d      j                         }|j                  d
d      r |d      n |d      j                         }|j	                  t        t        di |
t        ||      |	|              |d      j                         }|j                  d
d      r |d      n |d      j                         }|j	                  t        t        di |
t        ||      d|	z   |              |S )Nr   r5   reduction_sum	reductionsumreduction_batchmean	batchmeanreduction_nonenone
log_targetTc                     t        ||fi |S r>   )r    r   r   r   r   constructor_kwargss        rG   r   z6module_inputs_torch_nn_KLDivLoss.<locals>.reference_fnM      &q!B/ABBrI   r   r   Fr   rX   scalar_)r   r
   loggetrL   r   r}   )rN   r   rU   r   rV   rZ   r   casesr   r   r   r   r   targetscalar_inputscalar_targets                   rG    module_inputs_torch_nn_KLDivLossr   @  sh   V5P]^J 
R	;./	k :;	K01	d+,%E M$) 
  8J 	C 8$((*)/L%)HH%jYaNbNfNfNh-*M:L*M&3E6&B!%13	
 ""~))+ %jju=JrN:b>CUCUCW 	 	-*M:L*M&3L,&O&-%13	
%
2 rI   c                 t   |||fd}t        t        ||d      }di fdddifddd	ifd
d
difdd |d      j                         ifd |d      j                         ddfd |d      j                         ddfg}g }	|D ]4  \  }
}|fd}|	j                  t	        t        d i |t         |d      t        j                  d|      j                         j                  d      j                         j                               |
|             |fd}|	j                  t	        t        d i |t         |d      t        j                  ddd|      j                         j                  d      j                         j                               d|
 |             |	j                  t	        t        d i |t         |d      t        j                  ddddd|      j                         j                  d      j                         j                               d|
 |             |	j                  t	        t        d i |t         |d      t        j                  dd|      j                         j                  d      j                         j                               d|
 |             7 |	S )!Nc                 ^    t        | ||d      j                  d      j                  |      S )NFr   rK   dim)r
   log_softmaxrequires_grad_)r   r   rU   r   s       rG   r   z2module_inputs_torch_nn_NLLLoss.<locals>.make_inputi  s/    5u).00;0B>>R_C`	arI   Fr   r5   r   r   r   r   r   ignore_indexr   weightsweightr   weights_ignore_index)r  r  weights_ignore_index_negr   c                     t        ||fi |S r>   )r$   r   s        rG   r   z4module_inputs_torch_nn_NLLLoss.<locals>.reference_fn  s    $Q@-?@@rI   )   r   r  r   r   c                     t        ||fi |S r>   )r%   r   s        rG   nd_reference_fnz7module_inputs_torch_nn_NLLLoss.<locals>.nd_reference_fn  r   rI   )r   r   r   r   r   nd_)r   r   r   r   r   r   higher_dim_)r   r   r   3d_rX   )r   r
   absrL   r   r}   rd   emptyuniform_mulfloorlong)rN   r   rU   r   rV   rZ   r   make_weightr   r   r   r   r   r  s                 rG   module_inputs_torch_nn_NLLLossr  h  s   !'uM a +fEQVWK 
R	;./	K01	.!,-	X{1~11345	KN,>,>,@RS!TU	#A0B0B0DVX%YZ%E M$) )
  8J 	A 	-*M:L*M&3Jw4G49KK64R4[4[4]4a4abc4d4j4j4l4q4q4s'u!%1	3	
 <N 	C 	-*M:L*M&3&|4!KK1a?HHJNNqQWWY^^`'b  #4&\%46	
 	-*M:L*M&3&'9:!KK1aAfENNPTTUVW]]_ddf'h  +4&1%46	
 	-*M:L*M&3&y1!KK1V<EEGKKANTTV[[]'_  #4&\%46	
E)
V rI   c                 >   t        t        |||      }t        t        ||d      }di fdddifdddifd	dd
ifg}g }	|D ][  \  }
}|	j                  t        t	        di |t	         |d       |d       |d      j                               |
t                     ] |	S )Nr   Fr5   r   r   r   reduction_meanmeanr   r   r   rK   r   rX   )r   r
   rL   r   r}   r  no_batch_dim_reference_fn)rN   r   rU   r   rV   rZ   r   make_targetr   r   r   r   s               rG   &module_inputs_torch_nn_GaussianNLLLossr     s    V5P]^J+fEQVWK 
R	;./	K01	K01	%E M$) 
  -*M:L*M&3JqM4?N4>qM4E4E4G'I "%>@	

 rI   c                    t        t        |||      }t        t        ||d      }di fdddifdddifd	dd
ifdddifdddifddddfg}ddg }	|D ]  \  }
}|ffd	}|j                  dd      }|r |d      n$ |d      j                         j	                  d      }|	j                  t        t        di |t        | |d      j                         j                               |
|              |	S )Nr   Fr5   r   r   r   r  r  r   r   fullTno_log_input	log_inputfull_no_log_input)r"  r$  c                    |r#| j                         |j                  |       z
  }n%| |j                  | |z   j                               z
  }|r`||j                  |j                               |z
  ddt        j                  z  |z  j                         z  z   j                  |dk  d      z  }|dk(  r|S |dk(  r!|j                         | j                         z  S |j                         S )N      ?       @rK   r   r   r  )expr  r   mathpimasked_fillr   numel)r   r   r$  r"  r   epsr   s          rG   poissonnllloss_reference_fnzJmodule_inputs_torch_nn_PoissonNLLLoss.<locals>.poissonnllloss_reference_fn  s    UUWquuQx'FC}}//FquuQUUW~)C2<!3C2H2H2J,JJWWXY]^X^`abbFM& ::<!'')++::<rI   c                      ||fi |S r>   rX   )r   r   r   r   r   r/  s        rG   r   z;module_inputs_torch_nn_PoissonNLLLoss.<locals>.reference_fn  s    .q!J7IJJrI   r   r   r   r   MbP?r   )TFr  g:0yE>rX   )
r   r
   r   r  addrL   r   r}   floor_abs_)rN   r   rU   r   rV   rZ   r   r  r   r   r   r   r   r$  r   r/  s                  @rG   %module_inputs_torch_nn_PoissonNLLLossr6    s<   V5P]^J+fEQVWK 
R	;./	K01	K01	&$ 	+u-.	t%@A%E   M$) 
  8J 	K '**;=	,5
<(:l;S;W;W;Y;];]^c;d-*M:L*M&3E4?4M4T4T4V4[4[4]'_!%1	3	

 rI   c                    t        t        |||      }t        t        ||d      }di fdddifdddifd	dd
ifg}dd}	g }
|D ]  \  }}|
j                  t        t	        di |t	         |d       |d            |t        |	fi |             |
j                  t        t	        di |t	         |d       |d            | dt        |	fi |              |
S )Nr   Fr5   r   r   r   r  r  r   r   c                     |dk(  r||z
  j                  d      S |dk(  r3||z
  j                  d      j                         |j                         z  S ||z
  j                  d      j                         S )Nr   r   r  )powr   r-  )r   r   r   r   r   s        rG   mse_loss_reference_fnz=module_inputs_torch_nn_MSELoss.<locals>.mse_loss_reference_fn  se    E;;q>!& E;;q>%%'!'')33E;;q>%%''rI   r1  r   rX   _scalar)r  r   r
   rL   r   r}   )rN   r   rU   r   rV   rZ   r   r  r   r:  r   r   r   s                rG   module_inputs_torch_nn_MSELossr=    s#   V5P]^J+fEQVWK 
R	;./	K01	K01	%E( M$) 
  -*M:L*M&3J|4L4?4M'O!%,-B%YFX%Y	[	
 	-*M:L*M&3JrN4?O'E $vW-%,-B%YFX%Y	[	

  rI   c                    fd} |dd      rdnd} |dd      } |dd	      }|Kt        |t              sJ j                         D ]&  \  }}	||v s|	||   }
|	j                  |
      |<   ( |D cg c]  }|j                  |       }}t	               5   | |i j                  |      }ddd       |r!t        |       }|d
k(  rj                  d      S S c c}w # 1 sw Y   3xY w)a  Reference function for modules supporting no batch dimensions.

    Unbatched inputs are unsqueezed to form a
    single batch input before passing them to the module.
    The output is squeezed to compare with the
    output of unbatched input to the module.

    Currently it only supports modules which return a single Tensor as output.
    You can bind the following kwargs.
    Kwargs:
        batch_first[bool] : If True, all the Tensors in `args` while be unsqueezed at dim `0` .
                        and output will be squeezed at dim `0` else dim `1` for both.
        kwargs_to_batchify[dict] : Dictionary specifying the name of the argument and dimension to unsqueeze.
                               Useful if there are few arguments whose batch dimension are different
                               from the ones selected by `batch_first`.
        is_criterion[bool] : Specify if the module is a criterion and handle the reduction for output accordingly.
    c                 V    j                  | |      }| v rj                  |        |S r>   )r   pop)keydefaultvrZ   s      rG   get_and_popz.no_batch_dim_reference_fn.<locals>.get_and_pop-  s*    JJsG$&=JJsOrI   batch_firstTr   rK   kwargs_to_batchifyNis_criterionFr   )r   dictitems	unsqueezer)   squeezer(   )r   r   rY   rZ   rD  	batch_dimrF  rG  krC  bdimr   single_batch_input_argsoutputr   s      `           rG   r  r    s   $ !51I$%94@~u5L%,d333LLN 	.DAq&&1=)!,KK-q		.
 HLLeuy9LL		 J+6v6>>yIJ !!$	>>!$$M MJ Js   7C C%%C.c                 ~   |j                  dd      rdnd}d|v r|j                  d       d|v r|d   |d   j                  d      |d<   |D cg c]  }|j                  |       }}t               5   | |i |}|d   j	                  |      |d   j	                  d      fcddd       S c c}w # 1 sw Y   yxY w)a  Reference function for MultiheadAttention supporting no batch dimensions.

    Unbatched inputs are unsqueezed to form a
    single batch input before passing them to the module.
    The output is squeezed to compare with the
    output of unbatched input to the module.
    rE  Tr   rK   key_padding_maskN)r   r@  rJ  r)   rK  )r   r   rY   rZ   rL  r   rO  rP  s           rG   no_batch_dim_reference_mharS  I  s     ZZt4!I

=!V#/A(B(N%+,>%?%I%I!%L!"GKLeuy9LL		 D+6v6q	!!),fQi.?.?.BCD D MD Ds   B.40B33B<c                 r   t        |      dk(  r|\  }d}n$t        |      dk(  r|\  }}|j                  d      }|d   rdnd}|j                  d       j                  |      }|f}t               5   | |i |}|d   j	                  |      |d   j	                  d      fcddd       S # 1 sw Y   yxY w)a  Reference function for RNN and GRU supporting no batch dimensions.

    Unbatched inputs are unsqueezed to form a
    single batch input before passing them to the module.
    The output is squeezed to compare with the
    output of unbatched input to the module.
    rK   Nr   rE  r   rc   rJ  r@  r)   rK  	r   r   rY   rZ   inphrL  rO  rP  s	            rG   no_batch_dim_reference_rnn_grurY  \  s     4yA~	TaQKKNM*I
JJ}
--	
"C"Ah		 D+6v6q	!!),fQi.?.?.BCD D Ds   30B--B6c                    t        |      dk(  r|\  }d}n;t        |      dk(  r-|\  }}|d   j                  d      |d   j                  d      f}|d   rdnd}|j                  d       j                  |      }|f}t               5   | |i |}|d   j	                  |      |d   d   j	                  d      |d   d   j	                  d      ffcddd       S # 1 sw Y   yxY w)a  Reference function for LSTM supporting no batch dimensions.

    Unbatched inputs are unsqueezed to form a
    single batch input before passing them to the module.
    The output is squeezed to compare with the
    output of unbatched input to the module.
    rK   Nr   r   rE  rU  rV  s	            rG   no_batch_dim_reference_lstmr[  t  s     4yA~	TaQqT^^A!q 12M*I
JJ}
--	
"C"Ah		 b+6v6q	!!),vay|/C/CA/Fq	RSH\H\]^H_.`ab b bs   
A
CC'c                    |\  }\  }}|j                  d      |j                  d      |j                  d      ff}t               5   | |i |}|d   j                  d      |d   j                  d      fcddd       S # 1 sw Y   yxY w)zReference function for LSTMCell supporting no batch dimensions.

    The module is passed the input and target in batched form with a single item.
    The output is squeezed to compare with the no-batch input.
    r   rK   N)rJ  r)   rK  )	r   r   rY   rZ   rW  rX  crO  rP  s	            rG   no_batch_dim_reference_lstmcellr^    s     KC!Q"}}Q/!++a.!++a.1QR		 <+6v6q	!!!$fQi&7&7&:;< < <s   0B  B	c                     dD cg c]C  }t        t        |      t         | d       | d            t        t        d      d|       E c}S c c}w )	N)r   r  r   )r   r   r   TrG  no_batch_dim_r   r   r   r   )r   r}   r   r  )r   r   s     rG   $generate_regression_criterion_inputsrd    s[     34  	+i@'
5(9:a>J !:N ,		
4 4 4s   AAc                 d   t        t        |||      }t        t        d      t         |d            dt              t        t        d      t         |d                  t        t        d	d	      t         |d            d
      t        t        ddd      t         |d            d      gS )Nr   r   )kernel_size)r      r   r   )r   r   rg  r   r   r   strider   r   r   rK   
stride_padr   r
   r   r}   r  rN   r   rU   r   rV   rZ   r   s          rG    module_inputs_torch_nn_AvgPool1dro    s    V5P]^J 	m&B"/
60B"C'!:	< 	mA&6"/
90E"F	HmD$&?"/
90E"F!	# 	mAq!&<"/
90E"F%	'( (rI   c                 R   t        t        |||      }t        t        d      t         |d            dt              t        t        d      t         |d                  t        t        dd      t         |d            d	      t        t        ddd
      t         |d            d	      t        t        dd      t         |d            d	      t        t        ddd      t         |d            d	      t        t        ddd
d      t         |d            d	      gS )Nr   r   r   r   rg  rg  r   r   r   r   rg  rg  rh  rj  rk  rK   rK   rl  rK   divisor_overridedivisordivisor_stridedivisor_stride_padrm  rn  s          rG    module_inputs_torch_nn_AvgPool2drz    s   V5P]^J 	mF&;"/
90E"F'!:	< 	mF&;"/
<0H"I	KmFF&C"/
<0H"I!	# 	mFFF&K"/
<0H"I%	' 	mFQ&O"/
<0H"I"	$ 	mFFUV&W"/
<0H"I)	+ 	mFFF]^&_"/
<0H"I-	/'0 0rI   c                    t        t        |||      }t        t        d      t         |d            dt              t        t        d      t         |d                  t        t        dd      t         |d	            d
      t        t        ddd      t         |d	            d      t        t        ddd      t         |d	            d      t        t        ddd      t         |d            d      t        t        ddd      t         |d            d      t        t        ddd      t         |d            d      t        t        dd      t         |d            d      t        t        ddd      t         |d	            d      t        t        dddd      t         |d	            d      t        t        dddd      t         |d	            d      t        t        dddd      t         |d            d      t        t        dddd      t         |d            d       t        t        dddd      t         |d            d!      gS )"Nr   r   r   r   r   r   r   r   r   r   r   r   r   r   r   rh  r   r   r   r   r   r   rj  rk  rK   rK   rK   rl  r   )rK   r   rK   stride_pad_gpu_fixedkw_output)r   r   r   rK   )rK   rK   r   )r   r   r   r   r   stride_pad_gpu_general_outputr   r   stride1_pad0_gpu_inputstride_pad_gpu_input_nooverlapru  rw  rx  ry  %divisor_stride_pad_gpu_fixedkw_output%divisor_stride_pad_gpu_general_outputdivisor_stride1_pad0_gpu_input&divisor_stride_pad_gpu_input_nooverlaprm  rn  s          rG    module_inputs_torch_nn_AvgPool3dr    sQ   V5P]^J 	mI&>"/
<0H"I'!:	< 	mI&>"/
?0K"L	NmAy&A"/
?0K"L!	# 	mAq)&D"/
?0K"L%	' 	mAq)&D"/
?0K"L8	: 	mIq)&L"/
?0K"L8	: 	mAq!&<"/
?0K"L1	3 	mAq)&D"/
?0K"L9	; 	mIPQ&R"/
?0K"L"	$ 	mAyST&U"/
?0K"L)	+ 	mAq)VW&X"/
?0K"L-	/ 	mAq)VW&X"/
?0K"L@	B 	mIq)^_&`"/
?0K"L@	B 	mAq!a&P"/
?0K"L9	; 	mAq)VW&X"/
?0K"LA	CW-D -DrI   c           
         t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            t        d      t        t        d	      t         |d            d
      gS )Nr   r   rK   r   r   singlerk  r   r   r   rc  rK   
one_outputrm  rn  s          rG   (module_inputs_torch_nn_AdaptiveAvgPool1dr    s    V5P]^J 	mA&7"/
90E"F!	# 	mA&7"/
60B"C!:'	) 	mA&7"/
90E"F%	'
( 
(rI   c                    t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            t        d      t        t        d	      t         |d            d
      t        t        d      t         |d            d      t        t        d      t         |d            d      gS )Nr   r   rK   r   r   rg  r  rk  r   r   rg  r   rc  rK   single_1x1outputr   r   tupler   N
tuple_nonerm  rn  s          rG   (module_inputs_torch_nn_AdaptiveAvgPool2dr    s    V5P]^J 	mA&7"/
<0H"I!	# 	mA&7"/
90E"F!:'	) 	mA&7"/
<0H"I+	- 	mF&;"/
<0H"I 	" 	mI&>"/
<0H"I%	'( (rI   c                    t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            t        d      t        t        d	      t         |d
            d      t        t        d      t         |d
            d      t        t        d      t         |d            d      gS )Nr   r   )r   r   r   r      r  rk  )r   r   r   r  r   rc  r   r   r   )r   r   r   r   r  r  )Nr   r   r  )r   r   r   )rK   rK   r   r   rg  last_dimrm  rn  s          rG   (module_inputs_torch_nn_AdaptiveAvgPool3dr  *  s    V5P]^J 	mA&7"/
?0K"L!	# 	mA&7"/
<0H"I!:'	) 	mI&>"/
?0K"L 	" 	mL&A"/
?0K"L%	' 	mI&>"/
?0K"L#	%& &rI   c           	          t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            t        d      gS )	Nr   r   r  r  rk  r  r   rc  rm  rn  s          rG   (module_inputs_torch_nn_AdaptiveMaxPool1dr  @  sb    V5P]^J 	mA&7"/
90E"F!	# 	mA&7"/
60B"C!:'	)	* *rI   c                 ^   t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            t        d      t        t        d	      t         |d            d
      t        t        d      t         |d            d      gS )Nr   r   r  r  rk  r  r   rc  r  r  r  r  rm  rn  s          rG   (module_inputs_torch_nn_AdaptiveMaxPool2dr  M  s    V5P]^J 	mA&7"/
<0H"I!	# 	mA&7"/
90E"F!:'	) 	mF&;"/
<0H"I 	" 	mI&>"/
<0H"I%	'( (rI   c                    t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            t        d      t        t        d	      t         |d            d
      t        t        d      t         |d            d      t        t        d      t         |d            d      t        t        d	      t         |d            d      gS )Nr   r   )r   r   r   rg  r  r  rk  )r   r   rg  r  r   rc  r  r  )r   Nr   r  )r   r      	   r   single_nonatomic)r   r   rg  r   r   tuple_nonatomicrm  rn  s          rG   (module_inputs_torch_nn_AdaptiveMaxPool3dr  `  s    V5P]^J 	mA&7"/
?0K"L!	# 	mA&7"/
<0H"I!:'	) 	mI&>"/
?0K"L 	" 	mL&A"/
?0K"L%	' 	mA&6"/
;K0L"M+	- 	mI&>"/
;K0L"M*	,#- -rI   c                 P   t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            d      t        t        dd	d       t         |d            d
      t        t        dd	dd      t         |d            d      t        t        dd	ddd      t         |d            d      t        t        dd	dd      t         |d            d      t        t        dd	dd      t         |d            d      gS )Nr   r   r   affinerk  r   )r   r   r   3d_inputr2  affine_simple_average333333?F
not_affineTnot_tracking_stats3d_input_not_affine)r   r   r  
zero_batchr   rn  s          rG   "module_inputs_torch_nn_BatchNorm1dr  y  s"   V5P]^J 	mB&8"/
70C"D!	# 	mA&7"/
90E"F#	% 	mBd&C"/
70C"D0	2 	mBc5&I"/
70C"D%	' 	mBc4&O"/
70C"D-	/ 	mAtS%&H"/
90E"F.	0 	mAtS%&H"/
90E"F%	''( (rI   c                    t        t        |||      }t        t        d      t         |d                  t        t        ddd       t         |d            d      t        t        ddd      t         |d            d	      t        t        dddd
      t         |d            d      t        t        ddddd
      t         |d            d      t        t        dddd
      t         |d            d      gS )Nr   r   rs  rh  r2  2d_simple_averagerk  g?momentumFr  Tr  r   r  )r   r   r   r   r  r   rn  s          rG   "module_inputs_torch_nn_BatchNorm2dr    s    V5P]^J 	mA&7"/
<0H"I	KmAtT&B"/
<0H"I,	. 	mAtS&A"/
<0H"I#	% 	mAtS%&H"/
<0H"I%	' 	mAtS$&N"/
<0H"I-	/ 	mAtS%&H"/
<0H"I%	'( (rI   c                    t        t        |||      }t        t        d      t         |d                  t        t        ddd       t         |d            d      t        t        ddd      t         |d            d	      t        t        dddd
      t         |d            d      t        t        ddddd
      t         |d            d      t        t        dddd
      t         |d            d      gS )Nr   r   r~  rh  r2  3d_simple_averagerk  ffffff?r  Fr  Tr  r   r  )r   r   r   r   r   r  r   rn  s          rG   "module_inputs_torch_nn_BatchNorm3dr    s    V5P]^J 	mA&7"/
?0K"L	NmAtT&B"/
?0K"L,	. 	mAtS&A"/
?0K"L#	% 	mAtS%&H"/
?0K"L%	' 	mAtS$&N"/
?0K"L-	/ 	mAtS%&H"/
?0K"L%	'( (rI   c                    |d   }|j                  dd      }|j                  dd      }t        t        |||      }	|ri gni ddig}
d\  }}}|ft        d	 t	        |      D              z   }d
|z   }t        j                  ddg|
      D cg c]N  \  }}t        |rt        ||fi |nt        |||fi |t         |	|r|n|            |rdnd|rd nt              P c}}S c c}}w )NNr   F
transposedr   paddingsamer  c              3   &   K   | ]	  }|d z     ywr  rX   ).0r   s     rG   	<genexpr>z0module_inputs_torch_nn_ConvNd.<locals>.<genexpr>  s     *CQ1q5*Cs   ri  Tr5   r   r   )
r   r   r
   r  range	itertoolsr   r   r}   r  )rN   r   rU   r   rV   rZ   r  r   r  r   conv_kwargs_listrf  C_inC_outinput_no_batch_shapeinput_batch_shape
with_batchconv_kwargss                     rG   module_inputs_torch_nn_ConvNdr    s   sA::fe$DL%0JV5P]^J)tY4G/H&Ku 7U*C%(*C%CC33 (1'8'8$HX'Y $J 	[_}UK'W;'W'4T5+']Q\']"/
-7)=Q1S #T *"*4$:S	V  s   AC$c                 J   t        t        |||      }t        t        ||d      }di fdddifdddifd	dd
ifdddifg}g }	|D ]\  \  }
}|fd}|	j                  t        t	        di |t	         |d       |d       |d      j                               |
|             ^ |	S )Nr   Fr5   r   r   r   r  r  r   r   marginr  c                     t        |||fi |S r>   )r   r   r   i1i2r   r   s         rG   r   z@module_inputs_torch_nn_CosineEmbeddingLoss.<locals>.reference_fn  s    0RQ>PQQrI   r  r   )r  r   rX   r   r
   rL   r   r}   signrN   r   rU   r   rV   rZ   r   r  r   r   r   r   r   s                rG   *module_inputs_torch_nn_CosineEmbeddingLossr    s    V5P]^J+fEQVWK 
R	;./	K01	K01	Hc?#%E M$) 

  =O 	R 	-*M:L*M&3Jx4H*U]J^4?4F4K4K4M'O!%1	3	
	

 rI   c                 d   t        t        |||      }t        t        d      t         |d            d       t        t        d      t         |d            d	      t        t               t         |d
            dt              t        t        d      t         |d            d	      gS )Nr   r(  alphar   r   r   c                 ^    t        j                  |dk\  |d|j                         dz
  z        S )Nr   r   rK   rd   wherer)  r   s      rG   r   z,module_inputs_torch_nn_ELU.<locals>.<lambda>  s'    Q!VQQUUWWX[HY1Z rI   r   rX   scalarrk  r   r   r   r   r   r   r   4d_inputrm  rn  s          rG   module_inputs_torch_nn_ELUr    s    V5P]^J 	m"&="/
90E"F!Z	\ 	m"&="/
2"?!	# 	mo"/
40@"A'!:	< 	m"&="/
<0H"I#	%& &rI   c           
          t        t        |||      }t        t        d      t         |d            d       t        t        d      t         |d            d d	
      t        t        d      t         |d            dt              gS )Nr   r(  r  r  c                 d    t        j                  |dk\  |dd|z  j                         dz
  z        S Nr   r(  r'  rK   r  r   s      rG   r   z-module_inputs_torch_nn_CELU.<locals>.<lambda>  -    Q!VQrTUvlln_`N`Ha1b rI   r   rX   c                 d    t        j                  |dk\  |dd|z  j                         dz
  z        S r  r  r   s      rG   r   z-module_inputs_torch_nn_CELU.<locals>.<lambda>  r  rI   r  rc  r  r   r   rm  rn  s          rG   module_inputs_torch_nn_CELUr    s    V5P]^J 	m"&="/
90E"F!b	d 	m"&="/
2"?!b!	# 	m"&="/
40@"A'!:	<= =rI   c           
         t        t        |||      }t        t               t         |d                  t        t        d      t         |d            d      t        t               t         |d            d	t        
      gS )Nr   )r   rg  rh  rK   r   rg  r  r  rk  r`  r   r   rm  rn  s          rG   module_inputs_torch_nn_GLUr    sy    V5P]^J 	mo"/
60B"C	EmA&6"/
90E"F	  	mo"/
40@"A'!:	<	= 	=rI   c           
         t        t        |||      }t        t        d      t         |d            d d      t        t        d      t         |d            d 	      t        t               t         |d
            dt              gS )Nr   r   rX   c                 j    |dz  dt        j                  |t        j                  d      z        z   z  S Nr'        ?r(  rd   erfr*  sqrtr   r   xrR   s       rG   r   z-module_inputs_torch_nn_GELU.<locals>.<lambda>+  0    QWeiiPQTXT]T]^aTbPbFc@c5d rI   r  rc  r  c                 j    |dz  dt        j                  |t        j                  d      z        z   z  S r  r  r  s       rG   r   z-module_inputs_torch_nn_GELU.<locals>.<lambda>/  r  rI   r   r  r   r   rm  rn  s          rG   module_inputs_torch_nn_GELUr  %  s    V5P]^J 	mF&;"/
2"?!d!	# 	mF&;"/
90E"F!d	f 	mo"/
40@"A'!:	<= =rI   c                 V   t        t        |||      }t        t               t         |d            d      t        t               t         |d            t        d      t        t               t         |d            d	      t        t               t         |d
            d      gS Nr   rX   r  rk  r   r   rc  r1  channels_last_mem_format)r   r   r   r   r   channels_last_3d_mem_formatrm  rn  s          rG   module_inputs_torch_nn_ReLUr  6      V5P]^J 	mo"/
2"?!	# 	mo"/
1">!:'	) 	mo"/
<0H"I3	5 	mo"/
?0K"L6	89 9rI   c                 V   t        t        |||      }t        t               t         |d            d      t        t               t         |d            t        d      t        t               t         |d            d	      t        t               t         |d
            d      gS r  rm  rn  s          rG   module_inputs_torch_nn_ReLU6r  I  r  rI   c                    t        t        |||      }t        t               t         |d                  t        t               t         |d            t        d      t        t        d      t         |d            d	      t        t        d
      t         |d            d	      t        t        d      t         |d            d	      gS )Nr   r  rh  r   r   rc  r'  with_negvalrk  r   r   with_zero_negvalrX   with_negval_scalarrm  rn  s          rG    module_inputs_torch_nn_LeakyReLUr  \  s    V5P]^J 	mo"/
90E"F	Hmo"/
1">!:'	) 	mC&8"/
90E"F&	( 	mC&8"/
80D"E+	- 	mC&8"/
2"?-	/0 0rI   c                    t        t        |||      }t        t               t         |d            d      t        t               t         |d            t        d      t        t               t         |d            d	 d
      t        t        d      t         |d            d d      t        t               t         |d            d d      t        t        d      t         |d            d d      t        t               t         |d            d d      t        t        d      t         |d            d d      gS )Nr   rX   r  rk  r   r   rc  r   r   r   c                 r    t        j                  |d      t        j                  |d      |d   d   z  z   S Nr   min)maxrd   clampr   s      rG   r   z.module_inputs_torch_nn_PReLU.<locals>.<lambda>~  5    QA1FUV\]I^abcdaefgahIh1h rI   1dr   c                 r    t        j                  |d      t        j                  |d      |d   d   z  z   S r  r  r   s      rG   r   z.module_inputs_torch_nn_PReLU.<locals>.<lambda>  r  rI   1d_multiparamr1  c                 r    t        j                  |d      t        j                  |d      |d   d   z  z   S r  r  r   s      rG   r   z.module_inputs_torch_nn_PReLU.<locals>.<lambda>  r  rI   2dc                 r    t        j                  |d      t        j                  |d      |d   d   z  z   S r  r  r   s      rG   r   z.module_inputs_torch_nn_PReLU.<locals>.<lambda>  r  rI   2d_multiparam)r   r   r   r   rg  c                 r    t        j                  |d      t        j                  |d      |d   d   z  z   S r  r  r   s      rG   r   z.module_inputs_torch_nn_PReLU.<locals>.<lambda>  r  rI   3dc                 r    t        j                  |d      t        j                  |d      |d   d   z  z   S r  r  r   s      rG   r   z.module_inputs_torch_nn_PReLU.<locals>.<lambda>  r  rI   3d_multiparamrm  rn  s          rG   module_inputs_torch_nn_PReLUr  q  s)   V5P]^J 	mo"/
2"?!	# 	mo"/
1">!:'	) 	mo"/
90E"F!h	 	mA&6"/
90E"F!h(	* 	mo"/
<0H"I!h	 	mA&6"/
<0H"I!h(	* 	mo"/
?0K"L!h	 	mA&6"/
?0K"L!h(	*9+ +rI   c           
         t        t        |||      }t        t               t         |d                  t        t               t         |d            t        d      t        t               t         |d            d	      gS )
Nr   r  rh  r   r   rc  rX   r  rk  rm  rn  s          rG   module_inputs_torch_nn_SELUr    st    V5P]^J 	mo"/
90E"F	Hmo"/
1">!:'	) 	mo"/
2"?!	#	$ 	$rI   c           
         t        t        |||      }t        t               t         |d            d d      t        t               t         |d            t        d      t        t               t         |d            d	 
      gS )Nr   rX   c                 2    |t        j                  |      z  S r>   rd   sigmoidr  s       rG   r   z-module_inputs_torch_nn_SiLU.<locals>.<lambda>      Qq9I5I rI   r  rc  r   r   r  c                 2    |t        j                  |      z  S r>   r  r  s       rG   r   z-module_inputs_torch_nn_SiLU.<locals>.<lambda>  r!  rI   r   rm  rn  s          rG   module_inputs_torch_nn_SiLUr#    s~    V5P]^J 	mo"/
2"?!I!	# 	mo"/
1">!:'	) 	mo"/
90E"F!I	KL LrI   c           
         t        t        |||      }t        t        d      t         |d            d       t        t        d      t         |d            d d	
      t        t        d      t         |d            t        d
      gS )Nr   rK   r      c                     t        j                  |      j                  t        j                  |      j                  dd      j	                  dd            S NrK   Tr   r&  )rd   r)  divr   r   r   s      rG   r   z0module_inputs_torch_nn_Softmax.<locals>.<lambda>  s?    11A1A%))A,BRBRSTVZB[BbBbcegiBj1k rI   r   r   rX   c                     t        j                  |      j                  t        j                  |      j                  dd            S )Nr   Trd   r)  r)  r   r   s      rG   r   z0module_inputs_torch_nn_Softmax.<locals>.<lambda>  s0    11A1A%))A,BRBRSTVZB[1\ rI   r  rc  r   r   r   r   rm  rn  s          rG   module_inputs_torch_nn_Softmaxr-    s    V5P]^J 	mA&6"/
80D"E!k	m 	mA&6"/
2"?!\!	# 	mB&7"/
60B"C!:'	)* *rI   c           	          t        t        |||      }t        t               t         |d            d       t        t               t         |d            t        d      gS )Nr   rK   r   r   r&  c                     t        j                  |      j                  t        j                  |      j                  dd            S NrK   Fr+  r   s      rG   r   z2module_inputs_torch_nn_Softmax2d.<locals>.<lambda>  s0    11A1A%))A,BRBRSTV[B\1] rI   r   r  r   rc  rm  rn  s          rG    module_inputs_torch_nn_Softmax2dr2    s]    V5P]^J 	mo"/
>0J"K!]	_ 	mo"/
90E"F!:'	)	* *rI   c                 h   t        t        |||      }t        t        d      t         |d            d       t        t        d      t         |d            d d	      t        t        d
      t         |d            d d	      t        t        d      t         |d            t        d	      gS )Nr   rK   r%  c                     t        j                  |      j                  t        j                  |      j                  dd      j	                  dd            j                         S r(  )rd   r)  div_r   r   log_r   s      rG   r   z3module_inputs_torch_nn_LogSoftmax.<locals>.<lambda>  sH    11B1B599Q<CSCSTUW[C\CcCcdfhjCk1l1q1q1s rI   r   r/  c                     t        j                  |      j                  t        j                  |      j                  dd            j	                         S r1  rd   r)  r5  r   r6  r   s      rG   r   z3module_inputs_torch_nn_LogSoftmax.<locals>.<lambda>  9    11B1B599Q<CSCSTUW\C]1^1c1c1e rI   
multiparamrc  r   rX   c                     t        j                  |      j                  t        j                  |      j                  dd            j	                         S )Nr   Fr8  r   s      rG   r   z3module_inputs_torch_nn_LogSoftmax.<locals>.<lambda>  r9  rI   multiparam_scalarr   r,  r   rm  rn  s          rG   !module_inputs_torch_nn_LogSoftmaxr=    s    V5P]^J 	mA&6"/
80D"E!s	u 	mA&6"/
>0J"K!e%	' 	mA&6"/
2"?!e,	. 	mB&7"/
60B"C!:'	)* *rI   c                 \   t        t        |||      }t        t        d      t         |d                  t        t        d      t         |d            d      t        t        d      t         |d	            d
      t        t        d      t         |d            t        d      gS )Nr   rK   r%  rh  )r   r   r   r   multidimrk  r   rX   r  r   )r   r   r   r   rc  rm  rn  s          rG   module_inputs_torch_nn_Softminr@    s    V5P]^J 	mA&6"/
80D"E	GmA&6"/
=0I"J#	% 	mA&6"/
2"?!	# 	mB&7"/
:0F"G!:'	)* *rI   c                    t        t        |||      }t        t               t         |d            d       t        t        d      t         |d            d d      t        t        dd	      t         |d            d
 d      t        t        dd	      t         |d            d d      t        t               t         |d            t        d      gS )Nr   r%  c                 R    t        j                  t        j                  |            S r>   rd   log1pr)  r   s      rG   r   z1module_inputs_torch_nn_Softplus.<locals>.<lambda>  s    UYYq\1J rI   r   r   c                 ^    dt        j                  t        j                  d|z              z  S )Nr'  r   rC  r   s      rG   r   z1module_inputs_torch_nn_Softplus.<locals>.<lambda>  s$    5;;uyyQRUVQVGW;X1X rI   betarc  c                     |dz  dkD  j                  |      |z  |dz  dk  j                  |      dz  dz  t        j                  t        j                  d|z              z  z   S Nr   rG  r  r(  type_asrd   rD  r)  r   s      rG   r   z1module_inputs_torch_nn_Softplus.<locals>.<lambda>	  b    !a%4(@(@(Ca(GEd?33A6;b@5;;uyyYZ]^Y^O_C``)a rI   beta_thresholdrX   c                     |dz  dkD  j                  |      |z  |dz  dk  j                  |      dz  dz  t        j                  t        j                  d|z              z  z   S rI  rJ  r   s      rG   r   z1module_inputs_torch_nn_Softplus.<locals>.<lambda>  rL  rI   beta_threshold_scalarr   r   rm  rn  s          rG   module_inputs_torch_nn_SoftplusrP    s    V5P]^J 	mo"/
80D"E!J	L 	mA&6"/
80D"E!X	! 	mAt&<"/
80D"Ea)	+ 	mAt&<"/
2"?a0	2 	mo"/
1">!:'	))* *rI   c                 X   t        t        |||      }t        t               t         |d                  t        t        d      t         |d            d      t        t        d      t         |d            d      t        t               t         |d	            t        d
      gS )Nr   r  rh  rK   lambdark  rX   lambda_scalarr   r   rc  rm  rn  s          rG   !module_inputs_torch_nn_SoftshrinkrT    s    V5P]^J 	mo"/
90E"F	HmA&7"/
90E"F!	# 	mA&7"/
2"?(	* 	mo"/
1">!:'	)* *rI   c           
         t        t        |||      }t        t               t         |d            d       t        t               t         |d            d d      t        t               t         |d	            t        d
      gS )Nr   r  c                 P    |j                  dt        j                  |      z         S NrK   r)  rd   r  r   s      rG   r   z1module_inputs_torch_nn_Softsign.<locals>.<lambda>0      q599Q<7G1H rI   r   rX   c                 P    |j                  dt        j                  |      z         S rW  rX  r   s      rG   r   z1module_inputs_torch_nn_Softsign.<locals>.<lambda>3  rY  rI   r  rc  r   r   rm  rn  s          rG   module_inputs_torch_nn_Softsignr[  *  s|    V5P]^J 	mo"/
90E"F!H	J 	mo"/
2"?!H!	# 	mo"/
1">!:'	)* *rI   c           
         t        t        |||      }t        t               t         |d                  t        t               t         |d            d      t        t               t         |d            t        d	      gS 
Nr   r1  rh  rX   r  rk  r   r   rc  rm  rn  s          rG   module_inputs_torch_nn_Tanhr^  ;  t    V5P]^J 	mo"/
<0H"I	Kmo"/
2"?!	# 	mo"/
1">!:'	)	* 	*rI   c           
         t        t        |||      }t        t               t         |d                  t        t               t         |d            d      t        t               t         |d            t        d	      gS r]  rm  rn  s          rG   !module_inputs_torch_nn_Tanhshrinkra  K  r_  rI   c                 f   t        t        |||      }t        t        dd      t         |d            d      t        t        dd      t         |d            d      t        t        dd      t         |d	            d
      t        t        dd      t         |d            t        d      gS )Nr   r(  r  r1  threshold_valuerk  g      $@large_valuerX   threshold_value_scalarr   r   rc  rm  rn  s          rG    module_inputs_torch_nn_Thresholdrf  Z  s    V5P]^J 	mB&;"/
<0H"I*	, 	mB&<"/
<0H"I&	( 	mB&;"/
2"?1	3 	mB&;"/
1">!:'	)* *rI   c           
         t        t        |||      }t        t               t         |d            d       t        t               t         |d            d d      t        t               t         |d	            t        d
      gS )Nr   r  c                 X    |t        j                  t        j                  |            z  S r>   rd   tanhFsoftplusr   s      rG   r   z-module_inputs_torch_nn_Mish.<locals>.<lambda>s      UZZ

15N1N rI   r   rX   c                 X    |t        j                  t        j                  |            z  S r>   ri  r   s      rG   r   z-module_inputs_torch_nn_Mish.<locals>.<lambda>v  rm  rI   r  rc  r   r   rm  rn  s          rG   module_inputs_torch_nn_Mishro  m  s|    V5P]^J 	mo"/
90E"F!N	P 	mo"/
2"?!N!	# 	mo"/
1">!:'	)* *rI   c           
          t        t        |||      }t        t               t         |d       |d            d       t        t               t         |d       |d            d d      gt	        |      z   S )	Nr   r  c                 b    d|j                         z  t        d t        ||      D              z  S )Nr  c              3   d   K   | ](  \  }}||z
  j                         j                          * y wr>   )r  r   )r  abs      rG   r  zBmodule_inputs_torch_nn_L1Loss.<locals>.<lambda>.<locals>.<genexpr>  s6      I`MQQPQ KLa%IZIZI\ I`s   .0)r-  r   zipr   r   r   r   s       rG   r   z/module_inputs_torch_nn_L1Loss.<locals>.<lambda>  s9    BNS I`UXYZ\]U^I` F` 5` rI   r   rX   c                 l    d|j                         z  ||z
  j                         j                         z  S )Nr  )r-  r  r   rv  s       rG   r   z/module_inputs_torch_nn_L1Loss.<locals>.<lambda>  s(    BNa!e[[]EVEVEX4X rI   r  rc  )r   r
   r   r}   rd  rn  s          rG   module_inputs_torch_nn_L1Lossrx  ~  s    V5P]^J 	mo"/
90E0:90E#G"`	a
 	mo"/
2
2"O!X!	#	$ 'K:&V	W 	WrI   c                 p   t        t        |||      }di fdddifdddifddd	ifg}g }|D ]  \  }	}
|
fd
}|j                  t        t	        di |
t	         |d       |d            |	|             |j                  t        t	        di |
t	         |d       |d            d|	 |              |S )Nr   r5   r   r   r   r  r  r   r   c                     t        ||fi |S r>   )r&   r   s        rG   r   z9module_inputs_torch_nn_SmoothL1Loss.<locals>.reference_fn  s    )!QE2DEErI   r   r   r   rX   r   r<  rN   r   rU   r   rV   rZ   r   r   r   r   r   r   s               rG   #module_inputs_torch_nn_SmoothL1Lossr}    s    V5P]^J 
R	;./	K01	K01	%E M$) 
  8J 	F 	-*M:L*M&3Jw4G4>w4G'I!%1	3	
 	-*M:L*M&3JrN4>rN'D&tf-%1	3	

& rI   c                    t        t        |||      }t        t        ||d      }t        t        ||d      }di fdddifdddifd	dd
ifdd |d      ifg}	dd}
g }|	D ]m  \  }}|j                  t        t	        di |t	         |ddd       |d      j                  d      j                  |            |t        |
fi |             o  |d      }|j                  t        t	        |      t	         |ddd       |d      j                  d      j                  |            dt        |
|                   |S )Nr   Fr5   r   r   r   r  r  r   r   r  r  r   c                     ||j                         z  d|z
  d|z
  j                         z  z    }|||z  }|dk(  r|S |dk(  r!|j                         |j                         z  S |j                         S )NrK   r   r  )r   r   r-  r   r   r   r   r   r  r   s          rG   bce_loss_reference_fnz=module_inputs_torch_nn_BCELoss.<locals>.bce_loss_reference_fn  ss    quuw;!a%AE;;=!889f_FM& ::<!'')++::<rI   r  {Gz?Gz?lowhighr   r   rX   )r  scalar_weightr  Nr   r
   rL   r   r}   gtto)rN   r   rU   r   rV   rZ   r   r  r  r   r  r   r   r   r  s                  rG   module_inputs_torch_nn_BCELossr    sw   V5P]^J+fEQVWK+fEQVWK 
R	;./	K01	K01	X{5123%E  M$) 
  -*M:L*M&3JxTX`4a4?4I4L4LQ4O4R4RSX4Y'[!%,-B%YFX%Y	[	

  OMm=&I"/
24h0W0;B0B0B10E0H0H0O#Q(!()>}!U		W rI   c                    t        t        |||      }t        t        ||d      }t        t        ||d      }di fdddifdddifd	dd
ifdd |d      ifdd |d      ifg}	dd}
g }|	D ]m  \  }}|j                  t        t	        di |t	         |ddd       |d      j                  d      j                  |            |t        |
fi |             o |S )Nr   Fr5   r   r   r   r  r  r   r   r  r  r  scalar_weightsrX   c                    | j                  d      }d|z
  j                  |      j                  |      j                  | j                         j                  | |z
  j                               j	                               }|||z  }|dk(  r|S |dk(  r!|j                         |j                         z  S |j                         S )Nr   r	  rK   r   r  )r  mul_add_exp_r6  r   r-  )r   r   r   r   r   r  max_valr   s           rG   bce_withlogitsloss_reference_fnzQmodule_inputs_torch_nn_BCEWithLogitsLoss.<locals>.bce_withlogitsloss_reference_fn  s    2***#a%a%%g.33gXOO4E4J4JQBQXLK^K^K`4a4f4f4hif_FM& ::<!'')++::<rI   r  r  r  r  r   r   r  r  )rN   r   rU   r   rV   rZ   r   r  r  r   r  r   r   r   s                 rG   (module_inputs_torch_nn_BCEWithLogitsLossr    s    V5P]^J+fEQVWK+fEQVWK 
R	;./	K01	K01	X{5123	Hk"o67%E  M$) 
  -*M:L*M&3JxTX`4a4?4I4L4LQ4O4R4RSX4Y'[!%,-L%cPb%c	e	

 rI   c                    t        t        |||      }t        t        |t        j                  d      }t        t        ||d      }g d}	di fdd |d      ifddd	ifd
d
difdd	ddfg}
g }t	        |	|
      D ]  \  }\  }}||fd}|j                  t        t        d)d|i|t         |d       |ddd            d| d| |             |j                  t        t        d)d|i|t         |d       |ddd            d| d| |             |j                  t        t        d)d|i|t         |d       |ddd            d| d| |             |j                  t        t        d)d|i|t         |d       |ddd            d | d| |             |j                  dd       D|j                  t        t        d)d|i|t         |d!       |d!      j                  d	"            d#| d| |             |j                  t        t        d)d|i|t         |d$       |d$      j                  d	"            d%| d| |             |j                  t        t        d)d|i|t         |d&       |d&      j                  d	"            d'| d| |             |j                  t        t        d)d|i|t         |d       |d      j                  d	"            d(| d| |             |j                  t        t        d)d|i|t         |d       |d)dd            d*| d| t        t        d+,                    |S )-Nr   F)r  r   r   r5   r  r  r  r  rK   label_smoothingg333333?ignore_index_label_smoothing)r  r  c                      t        ||fd|i|S )Nr   )r   )r   r   r   r   r   r   s         rG   r   z=module_inputs_torch_nn_CrossEntropyLoss.<locals>.reference_fn  s    /1`	`M_``rI   r   )r   r   r   r   )r   r   r   r   r   r  4d_rR   r   )r   r   r   )r   r   r  r   r   r   2d_)r   r   r   r   r   r   )r   r   r   r   r   r  )r   r   r   r   r  4d_prob_target_)r   r   r   3d_prob_target_)r   r   2d_prob_target_higher_dim_prob_target_rX   rb  Tra  )r   r
   rd   r  r   rL   r   r}   r   softmaxr  )rN   r   rU   r   rV   rZ   r   r  r  
reductionsr   r   r   r   r   r   s                   rG   'module_inputs_torch_nn_CrossEntropyLossr  
  s(   V5P]^J+fEJJV[\K+fEQVWK3J	R	X{4012	.!,-	.56	'!PT)UV%E M18U1K D-	-D,/8M_ 	a 	-*b)*bOa*b&3J|4L4?	qWX4Y'["4&)5%1	3	
 	-*b)*bOa*b&3Jy4I4?ATU4V'X"4&)5%1	3	
 	-*b)*bOa*b&3Jv4F4?QR4S'U"4&)5%1	3	
 	-*b)*bOa*b&3J?Q4R4?UV]^4_'a*4&)=%1	3	
 !!.$7?  m.fi.fSe.f*7
<8P8B<8P8X8X]^8X8_+a#24&)!E)5	7   m.fi.fSe.f*7
98M8B98M8U8UZ[8U8\+^#24&)!E)5	7   m.fi.fSe.f*7
68J8B68J8R8RWX8R8Y+[#24&)!E)5	7   m.fi.fSe.f*7
CU8V8BCU8V8^8^cd8^8e+g#:4&)!M)5	7   m.fi.fSe.f*7
48H8CBATU8V+X#0a	{!C)01JY])^	`}DL rI   c                    t        t        |||      }t        t        |d      }di fdddifddd	ifd
ddifdddifg}t        j                  t        j                  g}	g }
t        |	|      D ]  \  }\  }}|fd}|j                  dd      }|dk(  rdnd}|dk(  rdnd}|
j                  t        t        di |t         |d      j                  d       |d|||      dd      | d|             |
j                  t        t        di |t         |d      j                  d       |d|||      t        j                  d|      t        j                  d|            | d|             |
j                  t        t        di |t         |d      j                  d       |d|||      dd      | d|             |
j                  t        t        di |t         |d      j                  d       |d|||      t        j                  d|      t        j                  d|            | d|              |
S ) Nr   F)r   r   r5   r   r   r   r  r  r   r   blank   c                      t        ||||fi |S r>   )r   )r   r   r   r   iltlr   s          rG   r   z4module_inputs_torch_nn_CTCLoss.<locals>.reference_fnr  s    $Q2rH5GHHrI   r   rK   r  )2   r   r  r   )r      )rU   r  r  )r  r  r  )r     r&  _lengths_intlistsr   r  _lengths_tensors)K   _1d_target_lengths_intlists_1d_target_lengths_tensorsrX   )r   r
   rd   intr  r   r   rL   r   r}   r  tensor)rN   r   rU   r   rV   rZ   r   r  r   target_dtypesr   target_dtyper   r   r   r  r  r  s                     rG   module_inputs_torch_nn_CTCLossr  c  s   V5P]^J+fEJK 
R	;./	K01	K01	7B- %E YY

+MM4;M54Q -
00t/@R 	I #&&w2B;aAb[rb"/"E2D"E+J{,C,O,OPQ,R,7|Y\cg,h,8,H v./)+	
 	"/"E2D"E+J{,C,O,OPQ,R,7|Y\cg,h,1LLf,U,1LLf,UW v-.)+		
 	"/"E2D"E+J{,C,O,OPQ,R,7|adko,p,8,H v89)+	
 	"/"E2D"E+J{,C,O,OPQ,R,7|adko,p,1LLf,U,1LLf,UW v78)+		
I-
^ rI   c                    t        t        |||      }t        t        ddd      t         |d            d      t        t        ddd      t         |d	            d
      t        t        ddd      t         |d            d      t        t        dddd      t         |d            d      t        t        dddd      t         |d            d      t        t        ddd      t         |d            d      t        t        dddd      t         |d            d      t        t        dddd      t         |d            d      gS )Nr   r   rg  r2  )r   rg  r   	1d_affinerk  r  )r   r  1d_affine_GNrK   )   rg  1d_affine_large_batchr   Fr   r   r   1d_no_affine_INr   r   1d_no_affine_LN)r   rg  r   r   	2d_affine)r   r   r   r   2d_no_affine_IN2d_no_affine_LNr   rn  s          rG    module_inputs_torch_nn_GroupNormr    sU   V5P]^J 	+Aq$7'
9(=>	 	+Ar48'
7(;<	! 	+Aq$7'
8(<=(	* 	+Aq$>'
9(=>"	$ 	+Ar4?'
7(;<"	$ 	+Aq$7'
<(@A	 	+Aq$>'
<(@A"	$ 	+Aq$>'
<(@A"	$;! !rI   c           
         t        t        |||      }t        t        d      t         |d                  t        t        d      t         |d            d      t        t               t         |d            t        d	
      gS )Nr   r(  )r   r   r   r   rh  rX   r  rk  r   r   rc  rm  rn  s          rG   !module_inputs_torch_nn_Hardshrinkr    s~    V5P]^J 	+B/'
<(@A	
 	+B/'
27	

 	+o'
162		
 rI   c           	          t        t        |||      }t        t               t         |d            t        d      t        t               t         |d            d      gS )Nr   r   r   rc  r  r  rk  rm  rn  s          rG    module_inputs_torch_nn_Hardswishr    s]    V5P]^J 	+o'
162		
 	+o'
<(@A	 rI   c           
         t        t        |||      }t        t               t         |d            d       t        t               t         |d            d d      t        t               t         |d	            t        d
      gS )Nr   r  c                 &    |j                  dd      S Nr   rK   r  r   s      rG   r   z1module_inputs_torch_nn_Hardtanh.<locals>.<lambda>      Q rI   r   rX   c                 &    |j                  dd      S r  r  r   s      rG   r   z1module_inputs_torch_nn_Hardtanh.<locals>.<lambda>  r  rI   r  rc  r   r   rm  rn  s          rG   module_inputs_torch_nn_Hardtanhr    s~    V5P]^J 	+o'
9(=>7	

 	+o'
277		
 	+o'
162		
 rI   c                    t        t        |||      }t        t        ||d      }di fdddifdddifd	dd
ifdddifg}g }	|D ]   \  }
}|fd}|	j                  t        t	        di |t	         |d       |d      j                  d      j                  |      j                  d      j                  d            |
|             |	j                  t        t	        di |t	         |d       |d      j                  d      j                  |      j                  d      j                  d            d|
 |              |	S )Nr   Fr5   r   r   r   r  r  r   r   r  r'  c                     t        ||fi |S r>   )r   r   s        rG   r   z?module_inputs_torch_nn_HingeEmbeddingLoss.<locals>.reference_fn  s    /1K8JKKrI   r  r   r   rK   r   rX   r   )	r   r
   rL   r   r}   r  r  r  sub_r  s                rG   )module_inputs_torch_nn_HingeEmbeddingLossr  	  sx   V5P]^J+fEQVWK 
R	;./	K01	K01	Hc?#%E M$) 
  8J 	L 	-*M:L*M&3Ju4E4?4F4I4I!4L4O4OPU4V4[4[\]4^4c4cde4f'h!%1	3	
 	-*M:L*M&3JrN4?O4F4Fq4I4L4LU4S4X4XYZ4[4`4`ab4c'e&tf-%1	3	

& rI   c                     t        t        |||      }di fdddifdddifddd	ifg}g }|D ]G  \  }	}
|
fd
}|j                  t        t	        di |
t	         |d       |d            |	|             I |S )Nr   r5   r   r   r   r  r  r   r   c                     t        ||fi |S r>   )r   r   s        rG   r   z6module_inputs_torch_nn_HuberLoss.<locals>.reference_fn8  r   rI   r{  r   rX   r<  r|  s               rG    module_inputs_torch_nn_HuberLossr  ,  s    V5P]^J 
R	;./	K01	K01	%E M$) 

  8J 	C 	-*M:L*M&3Jw4G4>w4G'I!%1	3	
	

 rI   c                 T   t        t        |||      }|j                  dd      }|d   }d\  }	}
}}}dddd	}||   }d
|z   }t        |rt	        |
|      nt	        |	|
|      t	         ||                  t        |rt	        |
|||      nt	        |	|
|||      t	         ||            d      t        |rt	        |
|      nt	        |	|
|      t	         ||            t
        d      t        |rt	        |
|||      nt	        |	|
|||      t	         ||            t
        d      gS )Nr   r   Fr  )r   r2  r  FT)r   r  rr  r}  rK   r   r   r`  rh  tracking_statsrk  tracking_stats_no_batch_dimrc  r   )r   r
   r   r   r}   r  )rN   r   rU   r   rV   rZ   r   r   r  num_featuresr.  r  r  track_running_statsinput_no_batch_shape_dictr  r  s                    rG   %module_inputs_torch_nn_InstanceNormNdr  F  sQ   V5P]^J::fe$DsA?X<L#x)<$+	l K4Q733 	04c8,-VY[c:d'
3D(EF		H
 	MQc8V5HIlC6CVW'
3D(EF!	# 	04c8,-VY[c:d'
3G(HI2.	0 	MQc8V5HIlC6CVW'
3G(HI2	!) rI   c                 ^   t        t        |||      }t        t        dgd      t         |d            d      t        t        dgd      t         |d            d      t        t        dgdd	      t         |d            d
      t        t        g dd      t         |d            d      t        t        g ddd	      t         |d            d      t        t        dgd      t         |d            d      t        t        g dddd	      t         |d            d      gS )Nr   r   r2  r  1d_elementwise_affinerk     r   r   !1d_elementwise_affine_large_batchF1d_no_elementwise_affiner   r   r   r   r   r   r   3d_elementwise_affine3d_no_elementwise_affiner   r   1d_empty_elementwise_affineT)elementwise_affiner   3d_elementwise_affine_no_biasr   rn  s          rG    module_inputs_torch_nn_LayerNormr  m  s+   V5P]^J 	+QC6'
9(=>(	* 	+QC6'
;(?@4	6 	+QCu='
9(=>+	- 	+It<'
<(@A(	* 	+ItUC'
<(@A+	- 	+QC6'
6(:;.	0 	+ItPT[`a'
<(@A0	23 rI   c                    t        t        |||      }d }t        t        dgd      t         |d            d|      t        t        dgd      t         |d            d	|      t        t        dgdd
      t         |d            d|      t        t        g dd      t         |d            d|      t        t        g ddd
      t         |d            d|      t        t        dgd      t         |d            d|      gS )Nr   c                    | j                   }|)t        j                  |j                        j                   }|j                  }| j
                  }| j                  }t        t        |            D cg c]
  }||z
  dz
   }}j                         }|t        j                  |j                  d      j                  |d      | j                   z         z  }	||	|z  }	|	j                  |      S c c}w )NrK   r   T)r  keepdim)r.  rd   finforU   ndimnormalized_shaper  r  rc   floatrsqrtr9  r  rK  )
r   r   r   r.  r  r  r  dims
upcasted_ir   s
             rG   rms_norm_reference_fnz=module_inputs_torch_nn_RMSNorm.<locals>.rms_norm_reference_fn  s    ee;++agg&**Cvv--&+C0@,A&BCq1CCWWY
ekk*..*;*@*@TSW*@*X[\[`[`*`aafF~~a   Ds   2C0r   r2  r  r  r   r  r  Fr  r  r  r  r  r  r  r   )rN   r   rU   r   rV   rZ   r   r  s           rG   module_inputs_torch_nn_RMSNormr    s   V5P]^J! 	+QC6'
9(=>(.		0
 	+QC6'
;(?@4.		0
 	+QCu='
9(=>+.		0
 	+It<'
<(@A(.		0
 	+ItUC'
<(@A+.		0
 	+QC6'
6(:;..		05 rI   c           
         t        t        |||      }t        t        d      t         |d            d      t        t        d      t         |d            d      t        t        d	d
dd      t         |d            d      gS )Nr   r   )rK   r   r  r  rk  r   )rK   r   r  r  2d_uneven_padrK   r  r'  r(  )rK   r   r  r  r  3d_custom_paramsr   rn  s          rG   (module_inputs_torch_nn_LocalResponseNormr    s    V5P]^J 	+A/'
9(=>	 	+A/'
<(@A 	" 	+Ar3;'
?(CD#	% rI   c           
         t        t        |||      }t        t        dd      t         |d            d      t        t        ddd      t         |d                  t        t        ddd      t         |d	            t        d
      gS )Nr         ?r   )rK   r   r  normrk  r   rh  )r   r  r   rc  rm  rn  s          rG   module_inputs_torch_nn_LPPool1dr     s    V5P]^J 	+C3'
9(=>	 	+Aq!4'
9(=>	@ 	+Aq!4'
6(:;2		! rI   c           
         t        t        |||      }t        t        ddd      t         |d                  t        t        ddd      t         |d            t        d      t        t        dd      t         |d            d	
      gS )Nr   r   rK   r   r  r  rh  r   r  r  r   rc  r  r  rk  rm  rn  s          rG   module_inputs_torch_nn_LPPool2dr    s    V5P]^J 	+Aq!4'
<(@A	C 	+Aq!4'
9(=>2		!
 	+C3'
<(@A	 rI   c           
         t        t        |||      }t        t        ddd      t         |d                  t        t        ddd      t         |d            t        d      t        t        dd      t         |d            d	
      gS )Nr   r   )rK   r   r  r  r  rh  )r   r  r  r  r   rc  r  r  rk  rm  rn  s          rG   module_inputs_torch_nn_LPPool3dr    s    V5P]^J 	+Aq!4'
?(CD	F 	+Aq!4'
<(@A2		!
 	+C3'
?(CD	 rI   c           
         t        t        |||      }t        t        d      t         |d            d      t        t        dd      t         |d            d      t        t        dd      t         |d            d	      gS )
Nr   r   )r   r   r   r  rk  rj  Treturn_indicesr	  r   rn  s          rG    module_inputs_torch_nn_MaxPool1dr
    s    V5P]^J 	+A.'
:(>?	 	+Aq1'
:(>?	 	+AdC'
:(>?!	# rI   c           
         t        t        |||      }t        t        ddd      t         |d            d      t        t        ddd      t         |d            d	      t        t        dddd
      t         |d            d      gS )Nr   r   r   rq  rt  r  r  rk  r  r  Tr  r	  r   rn  s          rG    module_inputs_torch_nn_MaxPool2dr  "  s    V5P]^J 	+FFFC'
9(=>	 	+FFFC'
<(@A	 	+FFFSWX'
<(@A!	# rI   c                 `   t        t        |||      }t        t        d      t         |d                  t        t        dd      t         |d            d      t        t        ddd      t         |d            d	      t        t        dddd
      t         |d            d      gS )Nr   r|  r  rh  r   rj  rk  r  stride_paddingTr  r	  r   rn  s          rG    module_inputs_torch_nn_MaxPool3dr  4  s    V5P]^J 	+I6'
?(CD	F 	+Ay9'
?(CD	 	+Aq)<'
?(CD!	# 	+Aq)DQ'
?(CD!	# rI   c                    t        t        ||      }fd}t        t        dd |             t         |d            d      t        t        d	d
 |             t         |d            d      t        t        dd |       d      t         |d            d      t        t        dd |             t         |d            t        d      t        t        d	d
 |             t         |d            t        d      gS )Nr   c                  l    t        j                  dt         j                         j                         S )N)rK   r   r   rU   r   rd   r  doubler  r  s   rG   make_random_sampleszGmodule_inputs_torch_nn_FractionalMaxPool2d.<locals>.make_random_samplesM  #    {{9ELLHQQSSrI   r   r'  output_ratio_random_samples)rK   r   r   r  ratiork  r  )r   r   output_sizer  )rK   r   r  rg  sizeTr  r  r	  ratio_return_indices)r   r   r  ratio_no_batch_dimrc  )r   r  rg  size_no_batch_dimrm  rN   r   rU   r   rV   rZ   r   r  s    `      rG   *module_inputs_torch_nn_FractionalMaxPool2dr$  J  s   V5P]^JT 	+ACQdQfg'
<(@A	 	+FXkXmn'
<(@A	 	+5H5J[_ (
<(@A'	) 	+ACQdQfg'
9(=>2%		'
 	+FXkXmn'
9(=>2$		&) rI   c                 j   t        t        ||      }fd}t        t        dd |             t         |d            d      t        t        d	d
 |             t         |d            d      t        t        dd |             t         |d            d      t        t        dd |       d      t         |d            d      t        t        dd |             t         |d            t        d      t        t        d	d
 |             t         |d            t        d      gS )Nr   c                  l    t        j                  dt         j                         j                         S )N)r   r   r   r  r  r  s   rG   r  zGmodule_inputs_torch_nn_FractionalMaxPool3d.<locals>.make_random_sampleso  r  rI   r   r'  r  )r   r   r   r   r   r  rk  r|  )r   r   r   r  )r   r   r  r  r  r  )r   r   r   )r   r   r   )r   r      r  r   asymsizeTr  r   )r   r   r   r   r!  rc  )r   r  r  r  r"  rm  r#  s    `      rG   *module_inputs_torch_nn_FractionalMaxPool3dr)  l  s/   V5P]^JT 	+ACQdQfg'
?(CD	 	+I9^q^st'
?(CD	 	+I:_r_tu'
3C(DE	 	+5H5J[_ (
?(CD'	) 	+ACQdQfg'
<(@A2%		'
 	+I9^q^st'
<(@A2$		&1 rI   c                 V   t        t        |||      }t        t               t         |d            d      t        t               t         |d            t        d      t        t               t         |d            d	      t        t               t         |d
            d      gS r  rm  rn  s          rG   module_inputs_torch_nn_Sigmoidr+    s    V5P]^J 	+o'
27	

 	+o'
162		
 	+o'
<(@A+	

 	+o'
?(CD.	
# rI   c           
         t        t        |||      }t        t               t         |d            d d      t        t               t         |d            d       t        t               t         |d	            t        d
      gS )Nr   rX   c                 >    |j                         j                         S r>   r   r   r   s      rG   r   z3module_inputs_torch_nn_LogSigmoid.<locals>.<lambda>      ): rI   r  rc  r  c                 >    |j                         j                         S r>   r.  r   s      rG   r   z3module_inputs_torch_nn_LogSigmoid.<locals>.<lambda>  r/  rI   r   r   r   rm  rn  s          rG   !module_inputs_torch_nn_LogSigmoidr1    s~    V5P]^J 	+o'
27:		
 	+o'
9(=>:	

 	+o'
162		
 rI   c                 f   t        t        |||      }t        t        |t        j                  d      }di fdddifdddifd	dd
ifdddifg}g }	|D ]\  \  }
}|fd}|	j	                  t        t        di |t         |d       |d       |d      j                               |
|             ^ |	S )Nr   Fr5   r   r   r   r  r  r   r   r  r'  c                     t        |||fi |S r>   )r!   r  s         rG   r   z>module_inputs_torch_nn_MarginRankingLoss.<locals>.reference_fn  s    .r2qO<NOOrI   )r  r   rX   )r   r
   rd   r  rL   r   r}   r  r  s                rG   (module_inputs_torch_nn_MarginRankingLossr4    s    V5P]^J+fEJJV[\K 
R	;./	K01	K01	Hc?#%E M$) 

  =O 	P 	-*M:L*M&3Ju4EzRWGX4?4F4K4K4M'O!%1	3	
	

 rI   c                    t        t        |||      }t        t        |t        j                  d      }di fdddifdddifd	dd
ifg}g }	|D ]  \  }
}|fd}|	j	                  t        t        di |t         |d       |ddd            d|
 |             |	j	                  t        t        di |t         |d       |ddd            |
|              |	S )Nr   Fr5   r   r   r   r  r  r   r   c                     t        ||fi |S r>   )r#   r   s        rG   r   zAmodule_inputs_torch_nn_MultiLabelMarginLoss.<locals>.reference_fn  s    1!QM:LMMrI   r  r   r   r  1d_r   r{  rX   r   r
   rd   r  rL   r   r}   r  s                rG   +module_inputs_torch_nn_MultiLabelMarginLossr9    s   V5P]^J+fEJJV[\K 
R	;./	K01	K01	%E M$) 
  8J 	N 	-*M:L*M&3Ju4E4?!RT4U'W"4&\%1	3	
 	-*M:L*M&3Jw4G4?QUW4X'Z!%1	3	

( rI   c                    t        t        |||      }t        t        |t        j                  d      }t        t        ||d      }di fdddifdddifd	dd
ifdddifdddifdd |d      ifg}	g }
|	D ]J  \  }}|fd}|
j	                  t        t        di |t         |d       |ddd            ||             L |
S )Nr   Fr5   r   r   r   r  r  r   r   r   r   r  r'  r  r  r   c                     t        ||fi |S r>   )r"   r   s        rG   r   z<module_inputs_torch_nn_MultiMarginLoss.<locals>.reference_fn	  s    ,QH5GHHrI   r{  r   r   r  r   rX   r8  )rN   r   rU   r   rV   rZ   r   r  r  r   r   r   r   r   s                 rG   &module_inputs_torch_nn_MultiMarginLossr<  	  s   V5P]^J+fEJJV[\K+fEQVWK 
R	;./	K01	K01	sAh	Hc?#	X{2/0%E M$) 

  8J 	I 	-*M:L*M&3Jw4G4?QS4T'V!%1	3	
	

 rI   c                    t        t        |||      }t        t        |t        j                  d      }t        t        ||d      }di fdddifdddifd	dd
ifdd |d      ifg}	dd}
g }|	D ]O  \  }}|j	                  t        t        di |t         |d       |ddd            |t        |
fi |             Q |S )Nr   Fr5   r   r   r   r  r  r   r   r  r   c                 `   ||j                         j                         z  d|z
  | j                         j                         z  z   }|||z  }| j                  |j                         dz
        |j	                  d      z  }|dk(  r|S |dk(  r|j                         S |j                         S )NrK   r   r   r  )r   r   r   r  r  r  r  s          rG   &multilabelsoftmargin_loss_reference_fnz_module_inputs_torch_nn_MultiLabelSoftMarginLoss.<locals>.multilabelsoftmargin_loss_reference_fn1	  s    QYY[__&&!a%QB<<>3E3E3G)GGfF'quuw{+affRj8M& ;;= ::<rI   r{  r   r   r  r   r  rX   r8  )rN   r   rU   r   rV   rZ   r   r  r  r   r?  r   r   r   s                 rG   /module_inputs_torch_nn_MultiLabelSoftMarginLossr@  $	  s    V5P]^J+fEJJV[\K+fEQVWK 
R	;./	K01	K01	Hk"o./%E  M$) 
  -*M:L*M&3Jw4G4?QUV4W'Y!%,-S%jWi%j	l	

 rI   c                 2   t        t        |||      }t        t        ||d      }di fdddifdddifd	dd
ifg}g }	|D ]U  \  }
}|fd}|	j                  t        t	        di |t	         |d       |d      j                               |
|             W |	S )Nr   Fr5   r   r   r   r  r  r   r   c                     t        ||fi |S r>   )r'   r   s        rG   r   z;module_inputs_torch_nn_SoftMarginLoss.<locals>.reference_fnX	  s    +AqG4FGGrI   )r   r   r   rX   r  r  s                rG   %module_inputs_torch_nn_SoftMarginLossrC  K	  s    V5P]^J+fEQVWK 
R	;./	K01	K01	%E M$) 

  8J 	H 	-*M:L*M&3Jv4F4?4G4L4L4N'P!%1	3	
	

 rI   c           	         g }t        d ||||      D ]  }|j                  j                  |j                  j                  }	}||	d<   ||	d<   t	        j
                  j                  |i |	}
d}|j                  }d|j                  v r)|j                  d   |j                  d<   |j                  d= |j                  t        t        |
|      ||j                                |S )Nr   rU   r   src_maskmaskrk  ).module_inputs_torch_nn_TransformerEncoderLayerr   rY   rZ   rd   r   TransformerEncoderLayerr   rL   r   r}   r   )rN   r   rU   r   rV   rZ   sampleslayer_module_inputl_argsl_kwargsencoder_layer
num_layersr   s                rG   )module_inputs_torch_nn_TransformerEncoderrO  f	  s    GL&%:  /@@EE.@@GG #!88&MHM
 +88---+8+?+?
+KM  ($$Z0{+M:F'#((
 	( NrI   c                    t        t        |||      }t        t        dddd      t         |d            d      t        t        ddd	dt        j
                        t         |d            d
      t        t        ddd	dd      t         |d            d      g}d t        j                  g d|t        j                        f}d t        j                  g d|t        j                        j                  d      f}	t        j                  |	|ddd      D ]]  \  }
}}}}|j                  t        t        ddd	d|||      t         |d      |
|      t        t        |ddi      d|              _ d }|ret        j                  dd      D ]L  \  }}|j                  t        t        ddd	dd||      t         |d            |r|nd d| d|              N |S )Nr   r   r   r'  r   r  relu_activationrk  r   gelu_activationFr   r   FFTr   rU   r  TFd_modelnheaddim_feedforwarddropoutrE  
norm_firstr   r  )rE  src_key_padding_maskr\  r   rE  rF  no_batch_dim_batch_first_rc  c                     | j                   sJ | j                  d       t        j                         5   | |i |}d d d        | j                  d       S # 1 sw Y   xY w)NFT)rV   trainrd   no_grad)moduler   rY   rZ   rP  s        rG   fast_path_reference_fnzNmodule_inputs_torch_nn_TransformerEncoderLayer.<locals>.fast_path_reference_fn	  sX    U]]_ 	-T,V,F	-T	- 	-s   	AA!T)rZ  rE  r[  r   	fastpath__norm_first_)r   r
   r   r}   rk  gelurd   r  boolr   r  r   rL   r  )rN   r   rU   r   rV   rZ   r   rI  key_padding_masks
attn_masksrE  r\  r[  rE  r   rc  s                   rG   rG  rG  	  s   V5P]^J 	+Aq"c:'9% #	
 	+Aq!S!&&A'9% #	
 	+Aq!SuE'9% 	
G0 u||,@W\WaWabc%9&PUPZPZ[bbcijkJj*;]M[hiE&
K"/TU8;;ED#R ,v&Pd %%>1<RhjkQln0>
	$  ) 1 1- O 	JNN&31a$:\`' #0"9-# <@!7T$TF,zlC
	 NrI   c                 p   t        t        |||      }t        t        dddd      t         |d       |d            d      t        t        ddd	dt        j
                        t         |d       |d            d
      t        t        ddd	dd      t         |d       |d            d      g}d t        j                  g d|t        j                        f}d t        j                  g d|t        j                        j                  d      f}	t        j                  |	|ddd      D ]  \  }
}}}}|
}|}|j                  t        t        ddd	d|||      t         |d       |d      |
|||      t        t        |ddd      d|               |d       |d      }}|s$|j                  dd      |j                  dd      }}||j                  dd      fdz  \  }}|j                  t        t        ddd	d|||      t        |||
|||      d| d| d|               |S )Nr   r   r   r'  r   r  rQ  rk  r   rR  Fr   r   rS  rT  r  rU  rV  r  )tgt_maskmemory_masktgt_key_padding_maskmemory_key_padding_maskr   )rm  rn  r]  r^  rc  rK   r   norm_first__batch_first__bias_)r   r
   r   r}   rk  rf  rd   r  rg  r   r  r   rL   r  	transpose)rN   r   rU   r   rV   rZ   r   rI  rh  ri  rk  rm  r[  r   rE  rl  rn  srctgts                      rG   .module_inputs_torch_nn_TransformerDecoderLayerru  	  s   V5P]^J 	+Aq"c:'9%z)'< #	
 	+Aq!S!&&A'9%z)'< #	
 	+Aq!SuE'9%z)'< 	
G. u||,@W\WaWabc%9&PUPZPZ[bbcijkJj*;]M[hi"E&
D+ "6"/TU8;;ED#R ,v&
6(:X[f)=Wn %%>1<QRop8qs 1>	 i(*Y*?S}}Q*CMM!Q,?C+=Q=X=XYZ\]=^<`cd<d9#%9"/TU8;;ED#R ,x[)=Wn #:,mK=tfU	
	1"H NrI   c                 D   t        t        |||      }g }d t        j                  g d|t        j                        f}d t        j                  g d|t        j                        j                  d      f}	t        j                  |	|ddd      D ]
  \  }
}}}}|
fdz  \  }}|fdz  \  }}|j                  t        t        dddd	d	d
|||	      t         |d       |d      ||||      t        t        |ddd      d|               |d       |d      }}|s$|j                  dd	      }|j                  dd	      }||j                  dd      fdz  \  }}|j                  t        t        dddd	d	d
|||	      t        ||||||                    |S )Nr   rS  rT  r  rU  r   r   r   rK   r   )	rW  rX  rY  num_encoder_layersnum_decoder_layersrZ  rE  r[  r   r  )rk  rE  rm  r\  r   )rm  r\  r]  r^  rc  r  r   rh  )r   r
   rd   r  rg  r   r  r   rL   r   r}   r  rr  )rN   r   rU   r   rV   rZ   r   rI  rh  ri  rF  rR  r[  r   rE  rE  rk  r\  rm  rs  rt  s                        rG   "module_inputs_torch_nn_Transformerry  
  s   V5P]^JGu||,@W\WaWabc%9&PUPZPZ[bbcijkJj*;]M[hi$=
D+  $gk86F5H15L22"/TUCDYZ8;akrv#x ,v&
6(:XX`)=Th %%>1<QRlm8np 1>	 i(*Y*?S--1%C--1%C':J:Q:QRSUV:W9Y\]9]6 "6"/TUCDYZ8;akrv#x ,x()=Th			7$J NrI   c           
      V   t        t        j                  |t        j                  d      }t	        t        dd      t         |dd      j                  d                  t	        t        dd      t         |dd	      j                  d      j                  d
d	            d      gS )NFr   r   r   )num_embeddingsembedding_dimr   rh  rK   i   r  discontiguousrk  )r   rd   r  r  r   r}   random_r   )rN   r   rU   r   rV   rZ   
make_emptys          rG    module_inputs_torch_nn_Embeddingr  :
  s    V5::UZ[J+1AN'
1a(8(@(@(CD	
 	+1AN'
1c(:(B(B1(E(L(LQPS(TU 	

 
rI   c                    t        t        |||      }g }d}d t        j                  g d|t        j                        f}	d t        j                  g d|t        j                        j                  d      f}
t        j                  ||||	|
      }|D ]  \  }}}}}|j                  t        t        ddd|||      t         |d	       |d	       |d	      ||
      t                     |j                  t        t        ddd|||      t         |d	       |d	       |d	      ||
      t        t        d                    |S )Nr   rU  rS  rT  )r   r   r   r   T)	embed_dim	num_headsrE  r   add_bias_kvadd_zero_attnr  )rR  	attn_maskr   FrE  )r   r
   rd   r  rg  r   r  r   rL   r   r}   rS  )rN   r   rU   r   rV   rZ   r   rI  	bool_valsrh  ri  productsr   r  r  rR  r  s                    rG   )module_inputs_torch_nn_MultiheadAttentionr  I
  sX   V5P]^JGIu||,@W\WaWabc%9&PUPZPZ[bbclmnJ  IyBSU_`HIQ 
Ek=*:I"/!qVZ59{bo#q+Jv,>
6@RT^_eTf=MYbd7	
 	"/!qV[59{bo#q+Jv,>
6@RT^_eTf=MYbd$%?US	

( NrI   c                    t        t        |||      }t        t        dd      t         |d       |d            t              t        t        ddd      t         |d       |d            t              g}|j                  dd      }|rD|j                  t        t        dddd	
      t         |d       |d            t                     |S )Nr   r   r   r   Tr   is_rnnFrelu)r   nonlinearity)r   r
   r   r}   r  r   rL   )	rN   r   rU   r   rV   rZ   r   rI  r  s	            rG   #module_inputs_torch_nn_RNN_GRU_Cellr  h
  s    V5P]^J+Ar2'
1z"~F2	

 	+Ar='
1z"~F2	
G ZZ%(F 	"/2Dv"V+JqM:b>J6	
 NrI   c                    t        t        |||      }t        t        dd      t         |d       |d       |d      f      t              t        t        ddd      t         |d       |d       |d      f      t              f}|S )Nr   r   r   r   Tr   )r   r
   r   r}   r^  rN   r   rU   r   rV   rZ   r   rI  s           rG   module_inputs_torch_nn_LSTMCellr  
  s    V5P]^J+Ar2'
1
2
SU7WX8	

 	+Ar='
1
2
SU7WX8	
G NrI   c                     | j                   }| j                  d       t        | |      }|j                  j                  |       |S )NF)r   r  r	   data)rW  batch_sizesrequired_gradseqs       rG   make_packed_sequencer  
  s>    %%Mu
sK
0CHHM*JrI   Fc                    t        t        |||      }|d   }d}	d}
d}d}g }|rt        |	|
||      }nt        |
||      }|D ]  }|r|\  }}}}n|\  }}}ddd|||d}ddd|||d}|r
|d<   ||d<   |j                  t	        t        di |t         |d	            t        t        |
                   |j                  t	        t        di |t         |d	       ||rdnddf            t        t        |
                   |s|j                  t	        t        di |t        t         |d      t        j                  ddg                  t        t        |
                   |j                  t	        t        di |t        t         |d      t        j                  g d                  t        t        |
                    |S )Nr   r  )r  rj  FTr   )
input_sizehidden_sizerN  rE  r   bidirectionalr   r  r   r   r  r   r   )r   r   r   r   )r   r   r   )r   r   r   r   r   rX   )
r   r
   r   rL   r   r}   rY  r  rd   r  )rN   r   rU   r   rV   with_packed_sequencerZ   r   r  r  r   rE  r  rI  prod_genrY   nlrt  b_fbidir	cons_argscons_args_hiddens                         rG   module_inputs_torch_nn_RNN_GRUr  
  s   V5P]^JHF#LDK!MG<{MJ4m< * $B3 MAsE#$Qa$'UL	*+AQ+.ES (*In%/1^,"/"<)"<+Jv,>?$%CQTU	
 	"/"C2B"C+Jv,>
QVA\]_`Ka@bc$%CQTU	
  NN&3&@i&@"/0DZPYEZ\a\h\hjkmnio\p0q"r!()GUX!Y NN&3&@i&@"/0DZPYEZ\a\h\hix\y0z"{!()GUX!YI*X NrI   c                     t        t        |||      }d}d}d}	d}
g }t        |||	|
      }|D ]  }|\  }}}}d}d|d||||d}d|d||||d}|j                  t	        t        di |t         |d            t        t        |      	             |d
kD  r|n|} ||rdnd|f       ||rdnd|f      f}|j                  t	        t        di |t         |d      |      t        t        |      	              |S )Nr   r  )r   r   r   r   )r  r  rN  	proj_sizerE  r   r  rq  r  r   r   r   r  rX   )r   r
   r   rL   r   r}   r[  )rN   r   rU   r   rV   rZ   r   r   rE  r  
proj_sizesrI  r  rY   rt  r  r  r  r  r  r  h_outhxs                          rG   module_inputs_torch_nn_LSTMr  
  sD   V5P]^JDK!MJGt[-DH 
#' 3y#$[PQ`i$'UL	*+KWXgp+.ES 	"/"<)"<+Jv,>?$%@cR	
 ']	u!!U34ju!RSU`Aa6bc"/"C2B"C+Jv,>C$%@cR	
%
6 NrI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS )Nr   rK   r  r   rK   r   r  rh  rm  rn  s          rG   &module_inputs_torch_nn_ReflectionPad1dr  	  ^    V5P]^J 	+A.'
6(:;2	

 	+F3'
9(=>	

 
rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS Nr   rK   r  r   rK   r   r   r   r   r   r   rg  rh  rm  rn  s          rG   &module_inputs_torch_nn_ReflectionPad2dr    ^    V5P]^J 	+A.'
9(=>2	

 	+L9'
<(@A	

 
rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS )Nr   rK   r1  r   rK   r   rK   r   rK   r   )r   r   r   r   r   rh  rm  rn  s          rG   &module_inputs_torch_nn_ReflectionPad3dr  '  _    V5P]^J 	+A.'
<(@A2	

 	+,>?'
?(CD	

 
rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS Nr   rK   r  r   r  r  rh  rm  rn  s          rG   'module_inputs_torch_nn_ReplicationPad1dr  6  r  rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS r  rm  rn  s          rG   'module_inputs_torch_nn_ReplicationPad2dr  E  r  rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS )Nr   rK   r  r   rK   r   r   r   r   rg  )r   r   r   rg  r  rh  rm  rn  s          rG   'module_inputs_torch_nn_ReplicationPad3dr  T  r  rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS r  rm  rn  s          rG    module_inputs_torch_nn_ZeroPad1dr  c  r  rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS )Nr   rK   r  r   r  rh  rm  rn  s          rG    module_inputs_torch_nn_ZeroPad2dr  r  r  rI   c           	          t        t        |||      }t        t        d      t         |d            t              t        t        d      t         |d                  gS )Nr   rK   r  r   r  )rK   r   r   r   r   rh  rm  rn  s          rG    module_inputs_torch_nn_ZeroPad3dr    r  rI   c           	          t        t        |||      }t        t        dd      t         |d            t              t        t        dd      t         |d            	      gS )
Nr   rK   r   r  r   r  r   r  rh  rm  rn  s          rG   $module_inputs_torch_nn_ConstantPad1dr    sb    V5P]^J 	+Aq1'
6(:;2	

 	+FA6'
9(=>	

 
rI   c           	          t        t        |||      }t        t        dd      t         |d            t              t        t        dd      t         |d                  gS )	Nr   rK   r   r  r   r  r   rh  rm  rn  s          rG   $module_inputs_torch_nn_ConstantPad2dr    sb    V5P]^J 	+Aq1'
9(=>2	

 	+L!<'
<(@A	

 
rI   c           	          t        t        |||      }t        t        dd      t         |d            t              t        t        dd      t         |d            	      gS )
Nr   rK   r   r  r   r  r  )rK   r   rK   r   rK   rh  rm  rn  s          rG   $module_inputs_torch_nn_ConstantPad3dr    sc    V5P]^J 	+Aq1'
<(@A2	

 	+,>B'
?(CD	

 
rI   c                 v   t        t        |||      }d t        t        d      t         |d            t              t        t        d      t         |d            fd      t        t        d	      t         |d            fd
      t        t        d      t         |d            fd      gS )Nr   c           
      t    t        j                  | dddd|d    df   | | ddddd|d   f   gd      S )z input:
                [[[0., 1., 2.],
                  [3., 4., 5.]]]
                pad: (1, 2)
                output:
                    [[[2., 0., 1., 2., 0., 1.],
                      [5., 3., 4., 5., 3., 4.]]]
            Nr   rK   r   r  rd   catrW  pads     rG   padding1d_circular_refzDmodule_inputs_torch_nn_CircularPad1d.<locals>.padding1d_circular_ref  sB     yy#aSVGHn-sC1gs1vg4FGQOOrI   rK   r  r   r  r  c                 *     || j                         S r>   r  r   r   r   r  s      rG   r   z6module_inputs_torch_nn_CircularPad1d.<locals>.<lambda>      )?199)M rI   )r   rK   c                 *     || j                         S r>   r  r  s      rG   r   z6module_inputs_torch_nn_CircularPad1d.<locals>.<lambda>  r  rI   r  c                 *     || j                         S r>   r  r  s      rG   r   z6module_inputs_torch_nn_CircularPad1d.<locals>.<lambda>  r  rI   rm  )rN   r   rU   r   rV   rZ   r   r  s          @rG   $module_inputs_torch_nn_CircularPad1dr    s    V5P]^J	P 	+A.'
6(:;2	

 	+F3'
9(=>M	

 	+F3'
9(=>M	

 	+F3'
9(=>M	
! rI   c                 v   t        t        |||      }d t        t        d      t         |d            t              t        t        d      t         |d            fd      t        t        d	      t         |d            fd
      t        t        d      t         |d            fd      gS )Nr   c                     t        j                  | dddd|d    df   | | ddddd|d   f   gd      } t        j                  | dddddd|d    df   | | ddddddd|d   f   gd      S )aS  input:
                [[[[0., 1., 2],
                   [3., 4., 5.]]]]
                pad: (1, 2, 2, 1)
        output:
            [[[[2., 0., 1., 2., 0., 1.],
               [5., 3., 4., 5., 3., 4.],
               [2., 0., 1., 2., 0., 1.],
               [5., 3., 4., 5., 3., 4.],
               [2., 0., 1., 2., 0., 1.]]]]
        Nr   r   r  r   rK   r  r  s     rG   padding2d_circular_refzDmodule_inputs_torch_nn_CircularPad2d.<locals>.padding2d_circular_ref  s     iiQCF78^,c3q!Wc!fW}3EFANyy#aAAwx/0#s1aGSVG;K7LMSTUUrI   rK   r  r   )rK   r   r   rK   )rK   rK   r   r   c                 *     || j                         S r>   r  r   r   r   r  s      rG   r   z6module_inputs_torch_nn_CircularPad2d.<locals>.<lambda>  r  rI   )r   r   r   r   c                 *     || j                         S r>   r  r  s      rG   r   z6module_inputs_torch_nn_CircularPad2d.<locals>.<lambda>  r  rI   )r   r   r   rK   )rK   rK   r   r   c                 *     || j                         S r>   r  r  s      rG   r   z6module_inputs_torch_nn_CircularPad2d.<locals>.<lambda>  r  rI   rm  )rN   r   rU   r   rV   rZ   r   r  s          @rG   $module_inputs_torch_nn_CircularPad2dr    s    V5P]^JV  	+A.'
9(=>2	

 	+L9'
<(@AM	

 	+L9'
<(@AM	

 	+L9'
<(@AM	
! rI   c                 v   t        t        |||      }d t        t        d      t         |d            t              t        t        d      t         |d            fd      t        t        d	      t         |d            fd
      t        t        d      t         |d            fd      gS )Nr   c                 |   t        j                  | dddd|d    df   | | ddddd|d   f   gd      } t        j                  | dddddd|d    df   | | ddddddd|d   f   gd      } t        j                  | dddddddd|d    df   | | ddddddddd|d   f   gd      S )	aN  input:
                [[[[[ 0.,  1.,  2.],
                    [ 3.,  4.,  5.]],
                   [[ 6.,  7.,  8.],
                    [ 9., 10., 11.]]]]]
            pad: (1, 2, 2, 1, 1, 2)
            output: [[[[[ 8.,  6.,  7.,  8.,  6.,  7.],
                        [11.,  9., 10., 11.,  9., 10.],
                        [ 8.,  6.,  7.,  8.,  6.,  7.],
                        [11.,  9., 10., 11.,  9., 10.],
                        [ 8.,  6.,  7.,  8.,  6.,  7.]],

                       [[ 2.,  0.,  1.,  2.,  0.,  1.],
                        [ 5.,  3.,  4.,  5.,  3.,  4.],
                        [ 2.,  0.,  1.,  2.,  0.,  1.],
                        [ 5.,  3.,  4.,  5.,  3.,  4.],
                        [ 2.,  0.,  1.,  2.,  0.,  1.]],

                       [[ 8.,  6.,  7.,  8.,  6.,  7.],
                        [11.,  9., 10., 11.,  9., 10.],
                        [ 8.,  6.,  7.,  8.,  6.,  7.],
                        [11.,  9., 10., 11.,  9., 10.],
                        [ 8.,  6.,  7.,  8.,  6.,  7.]],

                       [[ 2.,  0.,  1.,  2.,  0.,  1.],
                        [ 5.,  3.,  4.,  5.,  3.,  4.],
                        [ 2.,  0.,  1.,  2.,  0.,  1.],
                        [ 5.,  3.,  4.,  5.,  3.,  4.],
                        [ 2.,  0.,  1.,  2.,  0.,  1.]],

                       [[ 8.,  6.,  7.,  8.,  6.,  7.],
                        [11.,  9., 10., 11.,  9., 10.],
                        [ 8.,  6.,  7.,  8.,  6.,  7.],
                        [11.,  9., 10., 11.,  9., 10.],
                        [ 8.,  6.,  7.,  8.,  6.,  7.]]]]]
        Nr   r   r   r  r   r   rK   r  r  s     rG   padding3d_circular_refzDmodule_inputs_torch_nn_CircularPad3d.<locals>.padding3d_circular_ref  s    J iiQCF78^,c3q!Wc!fW}3EFANiiQ1s1vgh./c!Q7CF7:J6KLRSTyy#aAq3q6'(23S#aAq'3q6'>Q:RSYZ[[rI   rK   r  r   r  )rK   rK   r   r   r   c                 *     || j                         S r>   r  r   r   r   r  s      rG   r   z6module_inputs_torch_nn_CircularPad3d.<locals>.<lambda>A  r  rI   )r   r   r   rK   rK   r   c                 *     || j                         S r>   r  r  s      rG   r   z6module_inputs_torch_nn_CircularPad3d.<locals>.<lambda>F  r  rI   )r   r   r   rK   r   r   c                 *     || j                         S r>   r  r  s      rG   r   z6module_inputs_torch_nn_CircularPad3d.<locals>.<lambda>K  r  rI   rm  )rN   r   rU   r   rV   rZ   r   r  s          @rG   $module_inputs_torch_nn_CircularPad3dr    s    V5P]^J'\T 	+A.'
<(@A2	

 	+,>?'
?(CDM	

 	+,>?'
?(CDM	

 	+,>?'
?(CDM	
! rI   
TestModule	test_gradcuda)	active_ifr`   test_gradgradtest_non_contiguous_tensors)r  rp   r`   )   r  TestExpandedWeightModuletest_module)r`   
TestDecomptest_rnn_decomp_modulec                    t        t        |||      }t        t        t	        dd      t	         |dd       |dd                  t
        j                  t        d      t        t        t	        dd      t	         |dd       |dd	                  t
        j                  t        d
      t        t        t	        dd      t	         |dd       |dd                  t
        j                  t        d      t        t        t	        dd      t	         |dd       |dddd                  t
        j                  t        d      t        t        t	        ddd      t	         |dd       |dd	                  t
        j                  t        d
      t        t        t	        ddd      t	         |dd       |dd	                  t
        j                  t        d
      g}|S )Nr   r   r&  r   r  rh  5input has inconsistent input_size: got 11 expected 10r   r   r      9hidden0 has inconsistent hidden_size: got 21, expected 20r   5Input batch size 3 doesn't match hidden0 batch size 5rK   z.Expected hidden to be 1D or 2D, got 4D insteadr  rj  	r   r
   r   r   r}   r   r   r^   
ValueErrorr  s           rG   )module_error_inputs_torch_nn_RNN_GRU_Cellr   t  s   V5P]^J"/B"7+Jq",=z!R?PQ %22#O	
 	"/B"7+Jq",=z!R?PQ %22#S	
 	"/B"7+Jq",=z!R?PQ %22#O	
 	"/B"7+Jq",=z!QPQSU?VW %22!H	
 	"/B"?+Jq",=z!R?PQ %22#S	
 	"/B"?+Jq",=z!R?PQ %22#S	
]7Gp NrI   c                    t        t        |||      }t        t        t	        dd      t	         |dd       |dd       |dd      f            t
        j                  t        d      t        t        t	        dd      t	         |dd       |dd	       |dd	      f            t
        j                  t        d
      t        t        t	        dd      t	         |dd       |dd       |dd      f            t
        j                  t        d      t        t        t	        dd      t	         |dd       |dddd       |dddd      f            t
        j                  t        d      g}|S )Nr   r   r&  r   r  rh  r  r  r  r  r   r  rK   z/Expected hx\[0\] to be 1D or 2D, got 4D insteadr  r  s           rG   %module_error_inputs_torch_nn_LSTMCellr    s|   V5P]^J"/B"7+Jq",=
1b@QS]^_acSd?ef %22#O	
 	"/B"7+Jq",=
1b@QS]^_acSd?ef %22#S	
 	"/B"7+Jq",=
1b@QS]^_acSd?ef %22#O	
 	"/B"7+Jq",=
1aQRTV@WYcdeghjkmoYp?qr %22!K	
9%GL NrI   c           
          t        t        t        ddd            t        j                  t
        d      t        t        t        ddd            t        j                  t
        d      g}|S )Nr   r   rK   )r   z%hidden_size must be greater than zeror  z$num_layers must be greater than zero)r   r   r}   r   r   r  )rN   r   rU   r   rV   rZ   rI  s          rG   $module_error_inputs_torch_nn_RNN_GRUr    sb    -Aq*AB$77!?		
 	-B*BC$77!>		
G NrI   c           
          t        t        |||      }|j                  dd      }t        t	        |rt        dd      n
t        d      t         |d                  t        j                  t        d	      gS )
Nr   is_constantFrK   r   r1  rh  z(expected 2D or 3D input \(got 4D input\)r  	r   r
   r   r   r   r}   r   r   r  rN   r   rU   r   rV   rZ   r   r  s           rG   "module_error_inputs_torch_nn_Pad1dr	    sq    V5P]^J**]E2K 	9D-1"5-XYJZ+J|,DE %22!C		
 rI   c           
          t        t        |||      }|j                  dd      }t        t	        |rt        dd      n
t        d      t         |d                  t        j                  t        d	      gS )
Nr   r  FrK   r   r  rh  z(expected 3D or 4D input \(got 2D input\)r  r  r  s           rG   "module_error_inputs_torch_nn_Pad2dr    q    V5P]^J**]E2K 	9D-1"5-XYJZ+Jv,>? %22!C		
 rI   c           
          t        t        |||      }|j                  dd      }t        t	        |rt        dd      n
t        d      t         |d                  t        j                  t        d	      gS )
Nr   r  FrK   r   r  rh  z(expected 4D or 5D input \(got 2D input\)r  r  r  s           rG   "module_error_inputs_torch_nn_Pad3dr    r  rI   r  )r   r   test_memory_formatrV   )r  )r   r   r   zSkipped!)r   )r   r   r   )rp   r`   )r   r   r   TTestEagerFusionModuleInfo,test_aot_autograd_symbolic_module_exhaustive#test_aot_autograd_module_exhaustive)rM   r   r   test_check_inplace)r`   rp   rK   )r  r   i  )version)rp   g-C6?)r   r   r   r   r   r   r   iE  )r  r   r  test_cpu_gpu_parityg{Gzt?)r   r   r   rp   r   r   )r`   rp   r  )r   rp   r   r   r   r   )atolrtoltest_forwardcpu)r   r   r   )include_halfinclude_bfloat16gQ?r2  )r   rp   r   )r  r  )r   rp   r   #test_if_train_and_eval_modes_differtest_save_load)r   r   r   )r  )r   rM   r   TestModuleMPStest_non_contiguoustest_factory_kwargs)rM   r   r   r   )r`   r  gMb`?)r   r   r   r   )r  )r   r   )rM   r   r   r   )rM   r   r   r   r   )r   r   r   	module_db)F(W  rd   unittestcopyr   enumr   	functoolsr   r   r  r   r   r*  torch.nn.functionalr   
functionalrk  torch.nn.utils.rnnr	   torch.testingr
   #torch.testing._internal.common_cudar   $torch.testing._internal.common_dtyper   r   r   *torch.testing._internal.common_device_typer   r   r   r   r   r   r   r   r   r   r   2torch.testing._internal.common_methods_invocationsr   !torch.testing._internal.common_nnr   r   r   r   r   r    r!   r"   r#   r$   r%   r&   r'   r(   $torch.testing._internal.common_utilsr)   r*   r+   r,   r-   r.   r/   typesr0   operatorr<   aoqatquantizable	quantizedr1   r?   __annotations__Module	Container	NLLLoss2d	MaxPool2dr2   rA   typefrom_iterable__all__getattrr3   r4   rH  str	namespacemodule_namerz   rj   r   namespace_namer7   r{   r}   r   r   r   r   r   r   r   r  r   r6  r=  r  rS  rY  r[  r^  rd  ro  rz  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r#  r-  r2  r=  r@  rP  rT  r[  r^  ra  rf  ro  rx  r}  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r   r  r  r
  r  r  r$  r)  r+  r1  r4  r9  r<  r@  rC  rO  rG  ru  ry  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  expectedFailurer  #rnn_gru_lstm_module_info_decoratorsr   r  r  r	  r  r  backendsr   is_availableis_macos_or_newer_macos15_or_newerAdaptiveAvgPool1dAdaptiveAvgPool2d
itemgetterAdaptiveAvgPool3dskipAdaptiveMaxPool1dAdaptiveMaxPool2dAdaptiveMaxPool3d	AvgPool1d	AvgPool2dr   	AvgPool3dBatchNorm1dBatchNorm2dBatchNorm3dCELUConv1dr   Conv2dfloat64Conv3dConvTranspose1dchalfConvTranspose2d	complex32	complex64
complex128ConvTranspose3dCosineEmbeddingLossELUFractionalMaxPool2dFractionalMaxPool3dL1LossSmoothL1Loss
LazyConv1d
LazyConv2d
LazyConv3dLazyConvTranspose1dLazyConvTranspose2dLazyConvTranspose3dLinearBilinearLPPool1dLPPool2dLPPool3d	MaxPool1d	MaxPool3d	KLDivLossMSELossMarginRankingLossMultiLabelMarginLossMultiMarginLossSoftMarginLossMultiLabelSoftMarginLossNLLLossGaussianNLLLossPoissonNLLLossHingeEmbeddingLoss	HuberLossBCELossBCEWithLogitsLossCrossEntropyLossCTCLossGELUGLU	GroupNorm
Hardshrink	HardswishHardtanhInstanceNorm1dInstanceNorm2dInstanceNorm3dLocalResponseNorm	LayerNormRMSNormTransformerEncoderrH  TransformerDecoderLayerTransformerMultiheadAttention	EmbeddingReLU	LeakyReLUReLU6PReLURNNCellGRUCellLSTMCellSigmoid
LogSigmoidSiLUSoftmax	Softmax2d
LogSoftmaxSoftminSoftplus
SoftshrinkSoftsignTanh
Tanhshrink	ThresholdMishRNNGRULSTMReflectionPad1dReflectionPad2dReflectionPad3dReplicationPad1dReplicationPad2dReplicationPad3dSELU	ZeroPad1d	ZeroPad2d	ZeroPad3dCircularPad1dCircularPad2dCircularPad3dConstantPad1dConstantPad2dConstantPad3dr!  )r@  rA  clss   000rG   <module>r     s0       $ $     3 % :G G    Lm m m m
     
HH	HHKKOO	HHKK##	HHKK!!	HHKK!!' 4
#  
HHOO	HH	HH	HHKK##	HHKK##T *2u22&4( 9B8I8IJWY$J4(  ) *T
 * "0N#3o3M#N ') DsO (" OI (( OY4
"++33HbAII*VXY //0>/?q-Nz*OO _&STB BJ# 2 2,d 
' '(<+ <+@(:%P@F2-`$N+\D&D0b0
<4($080Dh( (*&,
*(&-2(6(.(.(8&&="=="9&9&0*"+J$L"*"
****$*:*$*"* **&*"WF-`'TUr=@$N,"0 F4%N D0f&(&&&$,D#L808 F>$N62GT@F+\>>$;|&T#J'RBR   ,4n"46   ,4n"46
   ,0M4n"46
   ,0M0.5;;.V\ 7)$&@- 7)$l4L7' #F:x(V"$$& NN&&335e%..:L:L:^:^_acd:e Ouxx))"J  (+O uxx))$8"J  (//#+!4!4!4Z!@			O* uxx))$8"Jj 9<I]^(++O: uxx))"J;O@ uxx))$8"JAOH uxx))$8"Jj 9<I]^(+IOX uxx!!"BYO^ uxx!!"B
  //#+!4!4!4Z!@#)   2L%--fkmp_O~ uxx!!"B$8  j 9<I]^(	+OP uxx##%)"D  //1LE!4!4!4Z!@  //1L<!4!4!4Z!@QOt uxx##%)"D   2LBVbubjbubu  wA  cB  C  //1LE!4!4!4Z!@  //1L<!4!4!4Z!@uO\ uxx##%)"D  (  //1LE!4!4!4Z!@  //1L<!4!4!4Z!@]OD uxx}}"=   8 8,H\,15==/KMEOR uxx")*G1SX"Y$8,0   >t Ll\pq>R\a\i\i[jk   2LBV,15==/K 2LB_,15==/K   15==%2H I<Ymn!SOx uxx")*G1SX"Y$8,0   >t Ll\pq>R\a\i\i[jk   8 8,H\,2EMM?L   8 8,H\,15==%--:XZ   2LBV,15==/K 2LB_,15==/K!(   15==%2H I<Ymn/yOl uxx")*G1SX"Y$8,0   >t Ll\pq>R\a\i\i[jkU;   8 8,H\]
   15==%2H I<YmnmOP uxx''")*G1SXei"j$8,04U[[A   >t Ll\pq>R\a\i\i[jk 8 8,H](-~6K   2LBV,15==/K 2LB_,15==/KM   15==%2H I<Ymn 15;;2F GWkl'QO~ uxx''")*G1SXei"j$8,04U[[A   >t Ll\pq>R\a\i\i[jk 8 8,H\(-%JZJZ'[]   8 8,H\jp(-u7G7G'HJ   8 8,H\,15==%--:XZ   8 8,H](-~6K   2LBV,15==/K 2LB_,15==/K-4   15==%2H I<Ymn 15;;2F GWkl=!OB uxx''")*G1SXei"j4U[[A$8,0   >t Ll\pq>R\a\i\i[jk(   8 8,H\] 8 8,H\jp(-'IUce   8 8,H](-~6K$   15==%2H I<Ymn 15??E2J K\[pq 15;;2F GWkl-COx uxx++"L  j 9<I]^ayOD	 uxx||"<   8 8,H\,15==/KME	OR	 uxx++"L$8  (j 9<I]^aS	Ob	 uxx++"L$8  (j 9<I]^ac	Or	 uxx"?  j 9<I]^as	O~	 uxx$$"E  j 9<I]^  	<9V(-EKM		OR
 uxx""")*G1SW"X$8,0   >t Ll\pq>R\a\i\i[jk  )   2LBV,15==/K 2LB_,15==/K    15==%2H I<Ymn'S
O~
 uxx""")*G1SW"X$8,0   >t Ll\pq>R\a\i\i[jk  )   8 8,H\,2EMM?L   8 8,H\,15==%--:XZ   2LBV,15==/K 2LB_,15==/K'.   15==%2H I<Ymn5
Ox uxx""")*G1SW"X$8,0   >t Ll\pq>R\a\i\i[jk  )(   8 8,H\]   15==%2H I<Ymn%yOb uxx++")*G1SWdh"i$8,0   >t Ll\pq>R\a\i\i[jk  )   2LBV,15==/K 2LB_,15==/K    15==%2H I<Ymn'cON uxx++")*G1SWdh"i$8,0   >t Ll\pq>R\a\i\i[jk  )   8 8,H\jp(-8   8 8,H\,15==%--:XZ   2LBV,15==/K 2LB_,15==/K'.   15==%2H I<Ymn5OOH uxx++")*G1SWdh"i$8,0   >t Ll\pq>R\a\i\i[jk  )(   8 8,H\]   15==%2H I<Ymn%IOr uxx"?  j 9<I]^asO~ uxx  "A( ==#4d*C ==#4d*C*E F $^	H  j 9<I]^ 8 8,,15==/K	MO^ uxx  "Aj 9<Uj 9<Y\_Oj uxx  "Aj 9<Uj 9<Y  //#+!4!4!4Z!@#(kOH uxx  "Aj 9<Uj 9<Yj 9<I]^	u=	@IOX uxx!!"BYO^ uxx!!"B_Od uxx!!"B$8  	u=@eOr uxx!!"B  j 9<I]^j 9<I^_j 9<Uj 9<Y\	sOF uxx"@  j 9<I]^ 2LB_,15==/L   8 8,,15==/KMGO^ uxx))"J  j 9<I]^a_Oj uxx,,"M  j 9<I]^	<UKj 9<Y\	kO~ uxx''"H  j 9<I]^	<UKj 9<Y\	OR uxx&&"G  j 9<I]^ 8 8,,15==/K	MSOd uxx00"Q  j 9<I]^aeOp uxx"@  j 9<I]^ 8 8,,15==/K	MqOB uxx''"H  j 9<I]^abCOL uxx&&"G  j 9<I]^abMOV uxx**"K  j 9<I]^aWOb uxx!!"B  j 9<I]^ 8 8,,15==/K	McOt uxx"@  j 9<I]^	<]bc	fuOD uxx))"J  j 9<I]^	<]bc	fEOT uxx(("I'TER   8 8,H\] 15==#4VZB[2\ ]_k .TY[ 8 8,H]glgtgtfu,246
UOj uxx"@  j 9<I]^	<ULj 9<Uj 9<Yj 9<Ifg	jkOD uxx}}"=   8 8,,15==/KMEOR uxx||"<SOX uxx!!"B'DQ  j 9<I^_ 15==#4VZB[2\ ] ,.BPUW  j 9<I]kqrj 9<I]kpqj 9<*8fN	PYOt uxx"""C   8 8,dij 8 8,Hm  |A  B 8 8,H\jop 8 8,Hesxy 8 8,HXfklo	uOH uxx!!"B.T  //#+!4!4!4Z!@#(	5 "'(IOb uxx  "AcOh uxx&&")*OST"U%)  j 9<I]^aiOv uxx&&")*OST"U%)  j 9<I]^awOD uxx&&")*OST"U%)   2OEYZ 2OEbc 2O^T 2OEZ[ 2OEUVj 9<I]^aEO^ uxx))"J   2LBVW 2LB_` 2L.Q 2LBgh 2LBWX 2LBRSV
_Ot uxx!!"B  j 9<I]^auO@ uxx"@AOH uxx**%)"K  j 9<,13  j 9<I]^   8 8,H]^aIOf uxx//%)"P 15==#4VZB[2\ ] ,.K,1ZI   15==#4VZB[2\ ] ,n,13  j 9<,13
  j 9<I]^agOJ uxx//"P  j 9<,13  j 9<I]^a
KO` uxx##"D $(  j 9<,13  j 9<I]^aaO| uxx**%)"K  j 9<I]^a}OJ uxx!!"B 15==#4VZB[2\ ] ,.K,134
  j 9<I]^aKO\ uxx}}"=.T  //#+!4!4!4Z!@#(	5]Ov uxx!!"BwO| uxx~~">  (+}OJ uxx~~">  (+KOX uxx")*MVZ"[(QYO` uxx"E(QaOh uxx  "A(MiOp uxx"@.T  //#+!4!4!4Z!@#(	5qOJ uxx"""C   8 8,disx  tA  tA  sB  CEKOV uxx}}"=WO\ uxx"@]Ob uxx!!"B  j 9<I]^ 8 8,disx  tA  tA  sB  C	EcOr uxx"""C  j 9<I]^ 8 8,disx  tA  tA  sB  C	EsOB uxx"@  j 9<I]^aCON uxx  "A  (+OO\ uxx"""C  (+]Oh uxx  "AiOn uxx}}"=.T  //#+!4!4!4Z!@#(	5oOH uxx"""C.T  //#+!4!4!4Z!@#(	5IOb uxx!!"B  (+cOp uxx}}"=  (+qO| uxx||%)")*HQU"V(L=	}OH uxx||%)")*HQV"W(L=	?IOR uxx}}%)"=(L  (+ >?SOb uxx''"HcOh uxx''"H$8j 9<I],24j 9<I],135iOz uxx''"H$8j 9<I],24j 9<I],135{OL  uxx(("IM OR  uxx(("I$8j 9<I],24j 9<I],135S Od  uxx(("I$8j 9<I],24j 9<I],135e Ov  uxx}}"=  (+w OD! uxx!!"BE!OJ! uxx!!"B   8 8,H\jopsK!OV! uxx!!"B   8 8,H\jopsW!Ob! uxx%%"F(Jc!Oj! uxx%%"F(Jk!Or! uxx%%"F(J   8 8,H\]`s!O@" uxx%%"FA"OF" uxx%%"F   8 8,H\jopsG"OR" uxx%%"F   8 8,H\jopsS"O	4
 Oeg K4( Os+   Bl&2Bl!Bl&	Bl,&Bl,l!Bl&