
    Αi$1                    	   S SK Jr  S SKJr  S SKJrJr  \(       a  S SKJr  S SK	J
r
  \" \5      rS rS rS rS	 rS
rSr\" \SS5        \" \SS5        \" \SS5        \" \SS5        \" \SS5        \" \SS5        \" \SS5        \" \SS5        \" \SS5        \(       a
   " S S\SS9rSr\" \SS5        \" \S/ 5        \" \S/ 5        \" \S S 5        \" \S!/ 5        \" \S"S5        \(       a   " S# S$\SS9r " S% S&\SS9rS'r\" \SS5        \" \S(S)5        \" \S*S+5        \" \S,S-5        \" \S.S/5        \" \S0S15        \" \S2S35        \" \S4S55        \" \S6S5        \" \S7/ 5        \" \S8/ 5        \" \S9/ 5        \" \S:S5        \" \S;S5        \" \S<S5        \" \S=S5        \(       a
   " S> S?\SS9rS@r\" \SS5        \" \SASB5        \" \SCSD5        \" \SES5        \" \SFSB5        \" \SGSB5        \" \SHSB5        \" \SISB5        \" \SJS5        \" \SKSL5        \" \S"S5        \" \SM/ 5        \" \SNS5        \" \SOSP5        \" \SQS5        \" \SRS5        \(       a
   " SS ST\SS9rSUr\" \SS5        \" \SVSB5        \" \SWS5        \(       a
   " SX SY\SS9rSZr\" \SS5        \" \S[S\5        \" \S]SB5        \" \S^SB5        \" \S_S`5        \" \SaSB5        \" \SbSB5        \" \ScSB5        \" \SdS5        \" \SeSf5        \" \SgSf5        \" \Sh/ SiQ5        \" \SjSf5        \" \SkS5        \" \SlS5        \(       a
   " Sm Sn\SS9rSor\" \SS5        \" \SpS5        \" \SqSD5        \" \SrSD5        \" \SsSt/5        \" \SuS5        \" \SvS5        \(       a
   " Sw Sx\SS9r Syr!\" \!SS5        \" \!SzSB5        \" \!S{SB5        \" \!S|S5        \" \!S}S5        \(       a
   " S~ S\SS9r"Sr#\" \#SS5        \" \#SSB5        \(       a
   " S S\SS9r$Sr%\" \%SS5        \(       a
   " S S\SS9r&Sr'\" \'SS5        \" \'S/ 5        \(       a
   " S S\SS9r(Sr)\" \)SS5        \" \)SS5        \" \)SS5        \" \)SS5        \" \)SS5        \(       a
   " S S\SS9r*Sr+\" \+SS5        \" \+SS5        \" \+SS5        \(       a
   " S S\SS9r,Sr-\" \-SS5        \(       a   " S S\SS9r.gg)    )annotations)defaultdict)TYPE_CHECKING	TypedDict)Tensor)_DTypeLiteralc                    [         U    $ N_g_default_config)categorys    j/var/www/html/banglarbhumi/venv/lib/python3.13/site-packages/paddle/distributed/auto_parallel/constants.pyget_category_default_configr      s    X&&    c                    U[         U '   g r
   r   )r   default_values     r   set_category_default_configr       s    "/hr   c                    [         U    U   $ r
   r   )r   fields     r   get_field_default_configr   $   s    X&u--r   c                    U[         U    U'   g r
   r   )r   r   r   s      r   set_field_default_configr   (   s    )6h&r   	not_foundbase	auto_modesemigradient_scaleT"gradient_scale_using_allreduce_avgF	use_cachereturn_numpy	all_ranks
split_dataseedNreinitc                  p    \ rS rSr% S\S'   S\S'   S\S'   S\S'   S\S'   S\S	'   S\S
'   S\S'   S\S'   Srg)_BaseConfig>   strr   boolr   r   r   r    r!   r"   z
int | Noner#   r$    N__name__
__module____qualname____firstlineno____annotations____static_attributes__r*   r   r   r&   r&   >   s4    ,00r   r&   )total	recomputeenablecheckpointsno_recompute_segmentssrrefined_ops_patternsenable_tuningc                  >    \ rS rSr% S\S'   S\S'   S\S'   S\S'   Srg	)
_RefinedOpsPatternsW   	list[str]main_opsintnumpre_opssuf_opsr*   Nr+   r*   r   r   r;   r;   W   s    r   r;   c                  R    \ rS rSr% S\S'   S\S'   S\S'   S\S	'   S
\S'   S\S'   Srg)_RecomputeConfig]   r)   r4   zlist[Tensor]r5   z	list[int]r6   r?   r7   zlist[_RefinedOpsPatterns]r8   r9   r*   Nr+   r*   r   r   rD   rD   ]   s$    !!((77r   rD   ampdtypefloat16levelo1init_loss_scalingg      @incr_every_n_stepsi  decr_every_n_nan_or_inf   
incr_ratiog       @
decr_ratiog?use_dynamic_loss_scalingcustom_white_listcustom_black_listcustom_black_varnamesuse_fp16_guarduse_bf16_guarduse_master_graduse_promotec                      \ rS rSr% S\S'   S\S'   S\S'   S\S	'   S
\S'   S
\S'   S\S'   S\S'   S\S'   S\S'   S\S'   S\S'   S\S'   S\S'   S\S'   S\S'   Srg)
_AMPConfig}   r)   r4   r   rG   r(   rI   floatrK   r?   rL   rM   rO   rP   rQ   r=   rR   rS   rT   rU   rV   rW   rX   r*   Nr+   r*   r   r   rZ   rZ   }   s`    
  !$$"&&$$$$((r   rZ   shardingstage   degree   enable_overlapparam_comm_stream_numgrad_comm_stream_numparam_bucket_size_numelgrad_bucket_size_numelenable_hierarchical_commpartition_algorgreedy_eventuning_rangerelease_gradientscomm_buffer_size_MB   enable_tensor_fusionsave_unbalanced_paramc                      \ rS rSr% S\S'   S\S'   S\S'   S\S'   S\S'   S\S	'   S\S
'   S\S'   S\S'   S\S'   S\S'   S\S'   Srg)_ShardingConfig   r)   r4   r?   r^   r`   rb   rc   rd   re   rf   rg   r(   rh   r9   zlist[int] | tuple[int, int]rj   r*   Nr+   r*   r   r   rq   rq      sG    
""!!!$$ ##"&&11r   rq   gradient_mergek_stepsavgc                  4    \ rS rSr% S\S'   S\S'   S\S'   Srg)	_GradientMergeConfig   r)   r4   r?   rt   ru   r*   Nr+   r*   r   r   rw   rw      s    	r   rw   pipelineschedule_mode1F1B	pp_degree
vpp_degreevpp_seg_method micro_batch_sizeaccumulate_stepsgeneration_batch_sizeenable_send_recv_overlapjob_schedule_profiler_startjob_schedule_profiler_stopprogram_runtimes)=   H   G   "      memory_limit_timessplit_backward auto_parallel_sync_shared_paramsc                      \ rS rSr% S\S'   S\S'   S\S'   S\S'   S\S	'   S\S
'   S\S'   S\S'   S\S'   S\S'   S\S'   S\S'   S\S'   Srg)_PipelineConfig   r)   r4   r(   rz   r?   r|   r}   r~   r   r   r   r   r   r   r   r   r*   Nr+   r*   r   r   r   r      sM    """&&%(($''*..r   r   qatchannel_wise_abs_maxweight_bitsactivation_bitsnot_quant_pattern
skip_quantalgoonnx_formatc                  \    \ rS rSr% S\S'   S\S'   S\S'   S\S'   S\S	'   S
\S'   S\S'   Srg)
_QATConfig   r)   r4   r   r?   r   r   r=   r   z
str | Noner   r   r*   Nr+   r*   r   r   r   r      s+    ""$$r   r   tuningprofile_start_stepprofile_end_steprun_after_tuningdebugc                  H    \ rS rSr% S\S'   S\S'   S\S'   S\S'   S\S'   S	rg
)_TuningConfigi  r)   r4   r?   r   r   r   r   r*   Nr+   r*   r   r   r   r     s    r   r   dataset
num_shardsc                  *    \ rS rSr% S\S'   S\S'   Srg)_DatasetConfigi"  r)   r4   r?   r   r*   Nr+   r*   r   r   r   r   "  s    r   r   fused_linear_promotionc                       \ rS rSr% S\S'   Srg)_FusedLinearPromotionConfigi/  r)   r4   r*   Nr+   r*   r   r   r   r   /      r   r   fused_passesfused_passes_listc                  *    \ rS rSr% S\S'   S\S'   Srg)_FusedPassesConfigi<  r)   r4   r=   r   r*   Nr+   r*   r   r   r   r   <  s    $$r   r   dp_optimizationfuse_all_reduce_opsfuse_grad_size_in_MB    overlap_comm_caclgradient_sync_after_accumulatec                  H    \ rS rSr% S\S'   S\S'   S\S'   S\S'   S\S'   S	rg
)_DPOptimizationConfigiO  r)   r4   r   r?   r   r   r   r*   Nr+   r*   r   r   r   r   O  s    !!!!(,,r   r   mp_optimization!allreduce_matmul_grad_overlappingreplace_with_c_embedding#replace_with_parallel_cross_entropyc                       \ rS rSr% S\S'   Srg)_MPOptimizationConfigie  r)   r   r*   Nr+   r*   r   r   r   r   e  s    +//r   r   sp_optimizationc                       \ rS rSr% S\S'   Srg)_SPOptimizationConfigiq  r)   r4   r*   Nr+   r*   r   r   r   r   q  r   r   r   )/
__future__r   collectionsr   typingr   r   paddler   paddle._typing.dtype_liker   dictr   r   r   r   r   	NOT_FOUNDBASEr&   	RECOMPUTEr;   rD   AMPrZ   SHARDINGrq   GRADIENT_MERGErw   PIPELINEr   QATr   TUNINGr   DATASETr   FUSEDLINEARPROMOTIONr   FUSED_PASSESr   DP_OPTIMIZATIONr   MP_OPTIMIZATIONr   SP_OPTIMIZATIONr   r*   r   r   <module>r      s0   # # +7  % '0.7 	
  {F 3 / 6 CU K {D 1 ~t 4 {E 2 |T 2 vt , x /	iu 	 	 He 4 M2 6 $;R @ D! , $:B ? OU ;iu 9E   h . gy 1 gt , 17 ; 2D 9 7 ; lC 0 lC 0 8$ ? 12 6 12 6 5r : . 6 . 6 / 7 mT 2Ye ,  8U 3 7A . 8Q / #3U ; #:A > #91 = #<a @ #;Q ? #=u E #4m D ?E : >2 6 #6 > #8# > #95 A #:D A 2)5 2$ " 5 9 A 6  5y   8U 3 ?F ; ; 2 < 3 #3R 8 #5q 9 #5q 9 #:A > #=u E #@" E #? D #57J K #7 < #3U ; #Eu M/)5 /&  h . 4d ; mQ / / 3 1L> B fd + mT 2Ye  
 5 1 !5q 9 !3Q 7 !3T : % 0	   (E 2 , 2%  0  -x ?iu   x 7 ':B ?%Ye % $ (E : *? F *@" E *=t D 5u -	 - $ 8% *De L :E 0	 0 $ (D 9	  r   