
    h1                    X   d Z ddlZddlZddlZddlZddlZddlZddlZddl	Z	ddl
Z
ddlZddlZddlZddlmZmZ ddlmZ ddlmZ ddlmZmZmZmZmZ ddlZddlZddlm Z   ejB                  d      d	k(  r e"d
       ddl#m$Z$m%Z% ddl#m&Z' ddl(m)Z)m*Z*m+Z+m,Z,m-Z-m.Z.m/Z/  e/j`                  e1      Z2 e-       rddl#m3Z3  e.       r
ddl4Z4ddl5m6Z7 dZ8	 ejr                  jO                  d      Z:dZ;ejN                  jy                  e:      ejN                  jy                  e8      k\  Z=ddl>Z>e>j~                  j                  d      dZAndZAej                  j                  d      duxs ej                  j                  d      duZJer3eJr1	 ejr                  jO                  d      ZKe2j                  deK d       ddl#mMZM ddlNmOZOmPZP ddlQmRZRmSZSmTZT ddlUmVZV ddl(mWZWmXZX d ZYd  ZZd! Z[d" Z\d# Z]d$ Z^d% Z_d& Z`d' Zad( Zbd) Zcd* Zdd+ Zed, Zfd- Zgd. Zhd/ Zid0 Zjd1 Zkd2eld3emd4eSfd5Znd2eld3emd4eSfd6Zod2eld3emd4eSfd7Zpd2eld3emd4eSfd8Zqd9 Zrd: Zs G d; d<eP      Ztd=ed>emfd?Zu G d@ dAeme      Zv G dB dCeP      Zw G dD dEeP      Zx G dF dGeP      Zy G dH dIeP      Zz G dJ dKeP      Z{ G dL dMe{      Z| G dN dOe}      Z~ G dP dQeP      Z G dR dSeP      Z G dT dUeP      Z G dV dWeP      Z G dX dYeP      Z G dZ d[eP      Zezeye{eetexeweee|eeed\Zd] Zy# ejr                  j                  eCeDeEeFeGf$ r dZ:dZ;dZ=dZAY w xY w# ejr                  j                  $ rW 	 ejr                  jO                  d      ZKe2j                  deK d       n!# ejr                  j                  $ r dZJY nw xY wY w xY w)^z+
Integrations with other Python libraries.
    N)asdictfields)Enum)Path)TYPE_CHECKINGAnyLiteralOptionalUnion)_is_package_available
WANDB_MODEofflineu%   ⚙️  Running in WANDB offline mode   )PreTrainedModelTrainingArguments)__version__)PushToHubMixinflatten_dictis_datasets_availableis_pandas_availableis_tf_availableis_torch_availablelogging)TFPreTrainedModelz3.43.2comet_mlTzcomet.api_keyFneptunezneptune-clientzNeptune version z available.zNeptune-client version )	modelcard)ProgressCallbackTrainerCallback)PREFIX_CHECKPOINT_DIRBestRunIntervalStrategy)ParallelMode)ENV_VARS_TRUE_VALUESis_torch_xla_availablec                      t        j                  dd      j                         t        v rt        j                  d       yt        j                  j                  d      dd l	} t        | d      S y)NWANDB_DISABLED zUsing the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).Fwandbr   run)osgetenvupperr$   loggerwarning	importlibutil	find_specr)   hasattr)r)   s    i/var/www/html/eduruby.in/venv/lib/python3.12/site-packages/transformers/integrations/integration_utils.pyis_wandb_availabler5   m   sa    	yy!2&,,.2FFt	
 ~~(4 ue$$    c                  D    t         j                  j                  d      d uS )Ntrackior0   r1   r2    r6   r4   is_trackio_availabler;          >>##I.d::r6   c                  D    t         j                  j                  d      d uS )Nclearmlr9   r:   r6   r4   is_clearml_availabler?      r<   r6   c                  &   t        j                  dd      j                         dk(  rt        j	                  d       yt
        du ryt        du r%t        j	                  dt        t        t               yt        du rt        j	                  d       yy)	N
COMET_MODEr(   DISABLEDzUsing the `COMET_MODE=DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).Fzcomet_ml version %s is installed, but version %s or higher is required. Please update comet_ml to the latest version to enable Comet logging with pip install 'comet-ml>=%s'.a#  comet_ml is installed but the Comet API Key is not configured. Please set the `COMET_API_KEY` environment variable to enable Comet logging. Check out the documentation for other ways of configuring it: https://www.comet.com/docs/v2/guides/experiment-management/configure-sdk/#set-the-api-keyT)
r+   r,   r-   r.   r/   _is_comet_installed_is_comet_recent_enough_comet_version_MIN_COMET_VERSION_is_comet_configuredr:   r6   r4   is_comet_availablerH      s    	yyr"((*j8t	
 e#%'t	
 u$h	
 r6   c                      t         j                  j                  d      d uxs! t         j                  j                  d      d uS )NtensorboardtensorboardXr9   r:   r6   r4   is_tensorboard_availablerL      s7    >>##M2$>v)..BZBZ[iBjrvBvvr6   c                  D    t         j                  j                  d      d uS )Noptunar9   r:   r6   r4   is_optuna_availablerO          >>##H-T99r6   c                  D    t         j                  j                  d      d uS )Nrayr9   r:   r6   r4   is_ray_availablerS      s    >>##E*$66r6   c                  Z    t               syt        j                  j                  d      d uS )NFzray.tune)rS   r0   r1   r2   r:   r6   r4   is_ray_tune_availablerU      s%    >>##J/t;;r6   c                  D    t         j                  j                  d      d uS )Nsigoptr9   r:   r6   r4   is_sigopt_availablerX      rP   r6   c                      t         j                  j                  d      yt         j                  j                  d      yt         j                  j                  d      d uS )NazuremlFzazureml.corezazureml.core.runr9   r:   r6   r4   is_azureml_availabler[      sM    ~~	*2~~/7>>##$67tCCr6   c                      t        j                  dd      j                         dk(  ryt        j                  j                  d      d uS )NDISABLE_MLFLOW_INTEGRATIONFALSETRUEFmlflow)r+   r,   r-   r0   r1   r2   r:   r6   r4   is_mlflow_availablera      s<    	yy-w7==?6I>>##H-T99r6   c                      d t         j                  j                  d      t         j                  j                  d      fvS )Ndagshubr`   r9   r:   r6   r4   is_dagshub_availablerd      s1    	00;Y^^=U=UV^=_```r6   c                      t         S N)_has_neptuner:   r6   r4   is_neptune_availablerh      s    r6   c                  D    t         j                  j                  d      d uS )N
codecarbonr9   r:   r6   r4   is_codecarbon_availablerk      s    >>##L1==r6   c                  D    t         j                  j                  d      d uS )Nflytekitr9   r:   r6   r4   is_flytekit_availablern      s    >>##J/t;;r6   c                  Z    t               syt        j                  j                  d      d uS )NFzflytekitplugins.deck)rn   r0   r1   r2   r:   r6   r4    is_flyte_deck_standard_availablerp      s&     ">>##$:;4GGr6   c                  D    t         j                  j                  d      d uS )Ndvcliver9   r:   r6   r4   is_dvclive_availablers      r<   r6   c                  D    t         j                  j                  d      d uS )Nswanlabr9   r:   r6   r4   is_swanlab_availablerv      r<   r6   c                 N   t               r0dd l}t        | |j                  j                        r| j
                  S t               rt        | t              r| S t               rt        | t              r| S t               rt        | t              r| S t        d| j                         )Nr   zUnknown type for trial )rO   rN   
isinstancetrial	BaseTrialparamsrU   dictrX   r5   RuntimeError	__class__)ry   rN   s     r4   	hp_paramsr      s    eV\\334<<eT"LeT"LeT"L
00AB
CCr6   n_trials	directionreturnc                 &    dd l ddlm  j                  j                  dk(  r.ddj
                  f fd}|j                  dd       }|j                  dd      }|j                  dd	      }t        |t              r|nd }|d n|} j                  d||d
|}	|	j                  |||||       |	j                         s@|	j                  }
t        t        |
j                        |
j                   |
j"                        S |	j$                  }|D cg c]6  }t        t        |j                        |j&                  |j"                        8 c}S t)        |      D ]  }d  _        d g} j                  j,                  t.        j0                  k7  rt3        d      t4        j6                  j9                  |d        j;                  d |d          t=         dd        j?                         } jA                  |       _         y c c}w )Nr   )release_memoryry   c                 n   d }|rPt        j                  |      D ]8  }|j                  t              st         j                  j                  ||      }: d 	_        	j                  j                  dkD  r	j                  j                  t        j                  k7  rt        d      	j                  |        j                  j                  | j                   | j"                        }|g}t$        j&                  j)                  |d       	j+                  ||        n	j+                  ||        t-        	dd       &	j/                         }	j1                  |      	_         	j2                  	j4                        \  	_        	_        	j6                  j9                          	j                  S )N   Conly support DDP optuna HPO for ParallelMode.DISTRIBUTED currently.r   srcresume_from_checkpointry   	objective)r+   listdir
startswithr    pathjoinr   args
world_sizeparallel_moder#   DISTRIBUTEDr}   hp_spacery   
FixedTrialr{   numbertorchdistributedbroadcast_object_listtraingetattrevaluatecompute_objectivemodel_wrappedmodelacceleratorclear)
ry   checkpoint_dir
checkpointsubdirfixed_trialtrial_main_rank_listmetricsrN   r   trainers
          r4   
_objectivez(run_hp_search_optuna.<locals>._objective  sk   J jj8 JF(()>?%'WW\\.&%I
J !%G||&&*<<--1I1II&'lmm  '$ll55ellELLQ(3}$!!778LRS7TZuMZuMwT2:!**,$+$=$=g$F! 4B'BWBWY`YfYf3g0G!7=%%'$$$r6   timeoutn_jobsr   gc_after_trialF)r   
directions)r   r   r   r   r   r   r   r   rf   r:   )!rN   accelerate.utils.memoryr   r   process_indexTrialpoprx   listcreate_studyoptimize_is_multi_objective
best_trialr!   strr   valuer{   best_trialsvaluesranger   r   r#   r   r}   r   r   r   r   r   r   r   )r   r   r   kwargsr   r   r   r   r   studyr   r   bestir   r   rN   r   s   `               @@r4   run_hp_search_optunar      s   6||!!Q&	%fll 	%8 **Y-Ha($4e<",Y"=Y4
&2D		###YiJYRXYzHgfest((*))J3z001:3C3CZEVEVWW++KT_`DGC,dkk4;;G``x 
	GA $G$(6 ||))\-E-EE"#hii334Ha3PMM=QRS=TMUwT2:!**,$+$=$=g$F!
	G  as   ;Hc                 4   dd l dd ldt        ffd}| j                  j                  s)ddlm} t        j                  d        |d      | _        | j                  t              }d | _        d	|vrad
di|d	<   | j                  j                  dkD  rd|d	   d<   d| j                  j                  dkD  rdndz   }t        j                  d| d       |d	   j                  dd      }|| j                  _        d|vrddlm}	  |	dg      |d<   d|v rddlm}
m}m}m} t1        |d   |
|||f      rn| j                  j2                  r'| j                  j4                  t6        j8                  k(  r1t;        dj=                  t?        |d         j@                              jB                  jE                  ||       tG        jH                        fd       }tK        d      rjL                  |_&         jB                  jN                  |f| jQ                  d       |d|}|jS                  d|d d | j                  jT                        }tW        |jX                  |jZ                  d   |j\                  |      }|| j_                  |       |S ) Nr   ry   c                 x   	 ddl m} |j                  |      r|j                  t               d |_        j                  j                         }|rld|_        |j                         5 }t        t        |      j                  t         d            j                         }|j                  ||        d d d        n|j                  |        t        |dd       |j!                         }|j#                  |      |_        |j%                  |j                  dd       t'        j(                         5 }|j+                  |	       j                  j,                  j/                  |      }j                  j1                  ||
       d d d        y y # t
        $ r Y qw xY w# 1 sw Y   xY w# 1 sw Y   y xY w)Nr   )NotebookProgressCallbackr   *r   )ry   T)r   done)r   )r   )transformers.utils.notebookr   pop_callbackadd_callbackr   ModuleNotFoundErrorr   r   get_checkpointas_directorynextr   globr    as_posixr   r   r   updatetempfileTemporaryDirectory_tune_save_checkpoint
Checkpointfrom_directoryreport)	ry   local_trainerr   r   r   checkpoint_pathr   temp_checkpoint_dirrR   s	           r4   r   z%run_hp_search_ray.<locals>._objectiveA  s   	L))*BC**+;< #'YY--/
 '2M#((* Yn"&tN';'@'@DYCZZ[A\']"^"g"g"i##?RW#XY Y e, =+t4<#,,.G&3&E&Eg&NM#NN)@)@$OP,,. A2E33CV3W YY11@@ATU
		  Z @A A =+ # 		Y YA As+   ,F )AF$5AF0	F! F!$F-0F9r   )TrainerMemoryTrackerzMemory tracking for your Trainer is currently enabled. Automatically disabling the memory tracker since the memory tracker is not serializable.T)skip_memory_metricsresources_per_trialcpur   gpuz1 CPUz
 and 1 GPUr(   zgNo `resources_per_trial` arg was passed into `hyperparameter_search`. Setting it to a default value of z for each trial.progress_reporter)CLIReporterr   )metric_columns	scheduler)ASHASchedulerHyperBandForBOHBMedianStoppingRulePopulationBasedTraininga  You are using {cls} as a scheduler but you haven't enabled evaluation during training. This means your trials will not report intermediate results to Ray Tune, and can thus not be stopped early or used to exploit other trials parameters. If this is what you want, do not use {cls}. If you would like to use {cls}, make sure you pass `do_eval=True` and `eval_strategy='steps'` in the Trainer `args`.)cls)r   c                     t               rddl}t        j                  j	                  |j
                  j                         d      }t        j                  j                  d|      }t        j                  j                  |      }|t        j                  |j                  <   |j                  j                  |        | i |S )a"  
        Wrapper around `tune.with_parameters` to ensure datasets_modules are loaded on each Actor.

        Without this, an ImportError will be thrown. See https://github.com/huggingface/transformers/issues/11565.

        Assumes that `_objective`, defined above, is a function.
        r   Nz__init__.pydatasets_modules)r   datasets.loadr+   r   r   loadinit_dynamic_modulesr0   r1   spec_from_file_locationmodule_from_specsysmodulesnameloaderexec_module)r   r   datasetsdynamic_modules_pathspecr   	trainables         r4    dynamic_modules_import_trainablez;run_hp_search_ray.<locals>.dynamic_modules_import_trainable  s     !" #%77<<0R0R0TVc#d >>99:LNbcD(~~>>tD%5CKK		"KK##$45$)&))r6   
__mixins__)confignum_samples   )metricmodescope)0rR   	ray.trainr|   _memory_trackerr   trainer_utilsr   r.   r/   r   TensorBoardCallbackr   r   n_gpuinfoget_n_gpuray.tuner   ray.tune.schedulersr   r   r   r   rx   do_evaleval_strategyr"   NOr}   formattype__name__tunewith_parameters	functoolswrapsr3   r   r*   r   get_best_trial	ray_scoper!   trial_idlast_resultr   r   )r   r   r   r   r   r   
_tb_writerresource_msggpus_per_trialr   r   r   r   r   r   analysisr   best_runrR   r   s                     @@r4   run_hp_search_rayr  =  s   $A$ $AL ""668<	

 #74"P %%&9:JGM F*).
$%<<!34F()%0',,2D2Dq2H,bQ/1	
 1266ua@N(GLL &((&1+&O"#ftt ;-1CEUWn!o
<<''7<<+E+EIYI\I\+\"
 #)&T&2E-F-O-O&"P  ((7(KI__Y*  *( y,'6?6J6J(3sxx||(% 	H (()BQ-W^WcWcWmWm(nJz**J,B,B;,OQ[QbQbdlmHZ(Or6   c           	      r   dd l }| j                  j                  dk(  rUt        j                  j                  d      dk\  r |j                  d       |j                  dd| j                  d       d|dd	gd
|      }t        j                  d|j                          |j                         D ]8  }|5  d | _        | j                  j                  d
kD  r| j                  j                  t         j"                  k7  rt%        d      | j'                  |j(                         t*        j,                  j/                  t1        j2                  | j                        d       | j5                  d        n| j5                  d |j(                         t7        | dd       &| j9                         }| j;                  |      | _        |j=                  d| j                         d d d        ; t?        |jA                               d   }tC        |j                  |jD                  d   jF                  |jH                        }	|	S ddl m%}
  |
       }|jM                  dd       }||jO                  |       |jQ                         jS                  d| j                  d       d|dd	gd
|d      }t        j                  d|j                          |jT                  jV                  |jX                  k  r|jQ                  |j                        j[                         jS                         }d | _        | j                  j                  d
kD  r| j                  j                  t         j"                  k7  rt%        d      | j'                  |       t*        j,                  j/                  t1        j2                  | j                        d       | j5                  d        n| j5                  d |       t7        | dd       &| j9                         }| j;                  |      | _        d| j                  dg}|jQ                  |j                        j]                         jS                  |j                  |      }t        j                  d|j                   d|j                   d       |jQ                  |j                        j_                         }|jT                  jV                  |jX                  k  rt?        |jQ                  |j                        ja                         j_                         jc                               d   }tC        |j                  |jF                  |jH                        }	|	S te        |      D ](  }d | _        t?        t1        j2                  | j                              }| j                  j                  t         j"                  k7  rt%        d      t*        j,                  j/                  |d       t1        jf                  ti        |            }tk        |      jm                         D ]"  \  }}|dk7  sto        | j                  ||       $ | j5                  d        t7        | dd       | j9                         }| j;                  |      | _        + y # 1 sw Y   xY w)Nr   rW   z8.0.0huggingfacezhuggingface-tuner   r   r   )r   r   strategyr   )r   r  
parametersr   parallel_bandwidthbudgetz6created experiment: https://app.sigopt.com/experiment/zConly support DDP Sigopt HPO for ParallelMode.DISTRIBUTED currently.r   )r   r   )
Connectionproxies)r   r!  r   r"  observation_budgetprojectr   r   )
suggestionr   z"[suggestion_id, observation_id]: [, ]
local_rank)8rW   r   r   r0   metadataversionset_projectcreate_experimentr   r.   r  idloopr   r   r   r#   r   r}   _hp_search_setupr*   r   r   r   pickledumpsr   r   r   r   
log_metricr   get_best_runsr!   r   r   assignmentsr$  r   set_proxiesexperimentscreateprogressobservation_countr&  suggestionsobservationsfetchbest_assignmentsiterate_pagesr   loadsbytesr   itemssetattr)r   r   r   r   rW   
experimentr*   r   r   r  r$  connr%  r)  r   obsr   args_main_rankr   keyr   s                        r4   run_hp_search_sigoptrL    s   ||!!Q&%%h/7:}-11'"++D1"-IS]^_#$ 2 J KKPQ[Q^Q^P_`a!( C C(,G%||..2"<<559Q9QQ"./t"uu009))??W\\@Z`a?bTBTQwT:B")"2"2"4,3,E,Eg,N)NN;0A0ABC CC" 
0023A6DtwwK(@(F(FHXHXYHT Q *<DjjD1G"  )))+22'"++D1"-IS]^_#$#+% 3 J KKPQ[Q^Q^P_`a%%77*:W:WW!--jmm<HHJQQS
$(!<<**Q.||11\5M5MM*+pqq,,Z8%%;;FLL<V\];^MMM>MMZMP7K6>%..0G(/(A(A'(JG%#.9J9JKL&&z}}5BBDKKWaWdWdmsKt@rRURXRXQYYZ[\!--jmm<BBD
' %%77*:W:WW* ((7HHJPPR``bcdefDtww

D4D4DEHx 	GA $G!&,,w||"<=N||))\-E-EE"#hii33N3J<<n 56D$Tl002 6
U,&GLL#u56 MMM6wT2:!**,$+$=$=g$F!	G YC Cs   6D+Z,,Z6	c                 N    ddl m}  |       st        d      dd ld} j                  j
                  D ]  }t        |t              sd} n |s j                  t                      dg j                  _
        d d d d|j                  d	d       }|j                  d
d       }|j                  dd       }	|j                  dd       }
|j                  dd       j                  d       }|d   d<   |d   d<   |	r|	|d<    fd}|sj                  |||
      }n<dd l|
rj                  j!                  |
       j                  j#                  |       t$        j'                  d|        j)                  |||       t+        d   d   d   |      S )Nr   )r5   z8This function needs wandb installed: `pip install wandb`r   FTr)   )run_idr   hyperparameterssweep_idr'  r   entityr   z	eval/lossgoalc                     	j                   r	j                   n	j                         } | j                  j                  _        | j
                  j                  i d       	j
                  }d _        j                  d t        |      d          t        dd       ^j                         }j                  |      _        t        |      }|vr)t        j                  d d|j!                                 d}d   /d	k(  rj                  d   k  }nd
k(  rj                  d   kD  }|sd   ,| j"                  d<   j                  d<   t%        |      d<   j                  S )N)r8  r   _itemsr   r   zProvided metric zU not found. This might result in unexpected sweeps charts. The available metrics are FrN  minimizemaximizerO  )r*   initr   state
trial_namer   r   r   r   varsr   r   r   rewrite_logsr.   r/   keysr1  r|   )
r*   r   r   format_metrics
best_scorer   r   r   r   r)   s
        r4   r   z'run_hp_search_wandb.<locals>._objectiveB  sk    99eii%**,#&88 

"?@ Tfh9OP7K.6&&(G ' 9 9' BG)'2N^+&vh /$$2$7$7$9#:< 
h+J&$..K1HH
j($..K1HH
H-5#&66Jx &-&7&7J{#,0LJ()   r6   )r'  rQ  zwandb sweep id - )functioncountrN  r   rO  )integrationsr5   ImportErrorr)   callback_handler	callbacksrx   WandbCallbackr   r   	report_tor   r   sweep	wandb.envenv
set_entityr/  r.   r  agentr!   )r   r   r   r   r5   reporting_to_wandbcallbackrP  r'  r   rQ  sweep_configr   r   r   r)   s   ` `          @@@r4   run_hp_search_wandbro  %  s   1TUU ,,66 h.!% ]_-%YGLL tMJzz*d+HjjD)G::fd#DZZ$'FZZ+.F##D)L%.L6"%+L6"#V! !B ;;|WV;LII  (		g&
KK#H:./	KK:XK>:h'K)@*M^B_aijjr6   c                     g } t               rt               s| j                  d       t               r| j                  d       t	               r| j                  d       t               r| j                  d       t               r| j                  d       t               r| j                  d       t               r| j                  d       t               r| j                  d       t               r| j                  d	       t               r| j                  d
       t               r| j                  d       t               r| j                  d       | S )Nazure_mlr   rc   rr   r`   r   rJ   r)   rj   r>   ru   r8   )r[   ra   appendrH   rd   rs   rh   rL   r5   rk   r?   rv   r;   )ra  s    r4   $get_available_reporting_integrationsrs  r  s   L&9&;J'J'I&I&H%I&!M*G$ L)I&I&I&r6   c                     i }d}t        |      }d}t        |      }| j                         D ]G  \  }}|j                  |      r||d||d  z   <   #|j                  |      r||d||d  z   <   @||d|z   <   I |S )Neval_test_eval/ztest/ztrain/)lenrE  r   )dnew_deval_prefixeval_prefix_lentest_prefixtest_prefix_lenkvs           r4   r[  r[    s    EK+&OK+&O	 $1<<$34E'Ao.//0\\+&34E'Ao.//0"#E(Q,$ Lr6   c                   4    e Zd ZdZddZddZd ZddZd Zy)	r  z
    A [`TrainerCallback`] that sends the logs to [TensorBoard](https://www.tensorflow.org/tensorboard).

    Args:
        tb_writer (`SummaryWriter`, *optional*):
            The writer to use. Will instantiate one if not set.
    Nc                     t               }|st        d      |r	 ddlm} || _        || _        y d | _        || _        y # t
        $ r/ 	 ddlm} || _        n# t
        $ r
 d | _        Y nw xY wY || _        y w xY w)NzuTensorBoardCallback requires tensorboard to be installed. Either update your PyTorch version or install tensorboardX.r   )SummaryWriter)rL   r}   torch.utils.tensorboardr  _SummaryWriterrb  rK   	tb_writer)selfr  has_tensorboardr  s       r4   __init__zTensorBoardCallback.__init__  s    24)  
/A&3# # #'D"  //:*7D'" /*.D'/ #/s3   ? 	A7	AA7A*'A7)A**A76A7c                 l    |xs |j                   }| j                  | j                  |      | _        y y )N)log_dir)logging_dirr  r  )r  r   r  s      r4   _init_summary_writerz(TensorBoardCallback._init_summary_writer  s8    -T--*!000ADN +r6   c                    |j                   sy d }|j                  r8|j                  }|*t        j                  j                  |j                  |      }| j                  | j                  ||       | j                  | j                  j                  d|j                                d|v rV|d   }t        |d      rD|j                  7|j                  j                         }| j                  j                  d|       y y y y y )Nr   r   r   model_config)is_world_process_zerois_hyper_param_searchrY  r+   r   r   r  r  r  add_textto_json_stringr3   r   )	r  r   rX  controlr   r  rY  r   model_config_jsons	            r4   on_train_beginz"TensorBoardCallback.on_train_begin  s    **&&))J%'',,t'7'7D>>!%%dG4>>%NN##FD,?,?,AB& w5(+0H(-(C(C(E%NN++N<MN 1I+ ! &r6   c           
      (   |j                   sy | j                  | j                  |       | j                  t        |      }|j	                         D ]  \  }}t        |t        t        f      r(| j                  j                  |||j                         Dt        |t              r(| j                  j                  |||j                         |t        j                  d| dt        |       d| d        | j                  j                          y y )N)Trainer is attempting to log a value of "
" of type 
 for key "zn" as a scalar. This invocation of Tensorboard's writer.add_scalar() is incorrect so we dropped this attribute.)r  r  r  r[  rE  rx   intfloat
add_scalarglobal_stepr   r  r.   r/   r  flushr  r   rX  r  logsr   r  r  s           r4   on_logzTensorBoardCallback.on_log  s    **>>!%%d+>>%%D

 1a#u.NN--aE4E4EF3'NN++Aq%2C2CDNN3ja	A3 ?EE NN  " &r6   c                 `    | j                   r"| j                   j                          d | _         y y rf   )r  closer  r   rX  r  r   s        r4   on_train_endz TensorBoardCallback.on_train_end  s%    >>NN  "!DN r6   rf   )	r  
__module____qualname____doc__r  r  r  r  r  r:   r6   r4   r  r    s"    #.B
O,#."r6   r  r   
output_dirc                    t        | dd      5 t        | t              rt        |        nt	               r(t        | t
              rfd}| j                  |       nMt               rCt        | t        j                  j                  t        f      rt        | d      rt        |        d d d        y # 1 sw Y   y xY w)Nz/model_architecture.txtzw+filec                      t        |        y )Nr  )print)sfs    r4   print_to_filez6save_model_architecture_to_file.<locals>.print_to_file  s    aa r6   )print_fn
base_model)openrx   r   r  r   r   summaryr   r   nnModuler   r3   )r   r  r  r  s      @r4   save_model_architecture_to_filer    s    	34d	; !qe_-%a :e5F#G! MM=M1!uuxx?@WUT`Ea%a ! ! !s   BB88Cc                   L    e Zd ZdZdZdZdZedefd       Z	e
dedd fd       Zy	)
WandbLogModelz)Enum of possible log model values in W&B.r   endfalser   c                 F    | t         j                  t         j                  fv S )zYCheck if the value corresponds to a state where the `WANDB_LOG_MODEL` setting is enabled.)r  
CHECKPOINTENDr  s    r4   
is_enabledzWandbLogModel.is_enabled  s      00-2C2CDDDr6   r   c                    t        |t              st        dt        |             |j	                         t
        v r"t        dt        j                  d       d      t        j                  d| d       t        j                  S )Nz>Expecting to have a string `WANDB_LOG_MODEL` setting, but got zSetting `WANDB_LOG_MODEL` as WANDB_LOG_MODELzn is deprecated and will be removed in version 5 of transformers. Use one of `'end'` or `'checkpoint'` instead.z6Received unrecognized `WANDB_LOG_MODEL` setting value=z ; so disabling `WANDB_LOG_MODEL`)rx   r   	TypeErrorr  r-   r$   DeprecationWarningr+   r,   r.   r  r  r  r/   r^   )r   r   s     r4   	_missing_zWandbLogModel._missing_  s    %%\]abg]h\ijkk;;=00$/		:K0L/M N[ [  	DUGKkl	
 """r6   N)r  r  r  r  r  r  r^   propertyboolr  classmethodr   r  r:   r6   r4   r  r    sR    3J
CEED E E #c #o # #r6   r  c                   F    e Zd ZdZd Zd ZddZddefdZddZ	d	 Z
d
 Zy)re  z{
    A [`TrainerCallback`] that logs metrics, media, model checkpoints to [Weight and Biases](https://www.wandb.com/).
    c                 N   t               }|sat        j                  j                  d      7t	        j
                  dd      j                         t        v }|rt        d      t        d      |rdd l	}|| _
        d| _        t        t	        j
                  dd	            | _        y )
Nr)   r'   r(   a@  You specified `report_to='wandb'` but also set the `WANDB_DISABLED` environment variable.
This disables wandb logging, even though it was explicitly requested.

- To enable wandb logging: unset `WANDB_DISABLED`.
- To disable logging: use `report_to='none'`.

Note: WANDB_DISABLED is deprecated and will be removed in v5.zFWandbCallback requires wandb to be installed. Run `pip install wandb`.r   Fr  r  )r5   r0   r1   r2   r+   r,   r-   r$   r}   r)   _wandb_initializedr  
_log_model)r  	has_wandbwandb_disabledr)   s       r4   r  zWandbCallback.__init__)  s    &(	~~''0<!#+;R!@!F!F!HL`!`!&X  ghhDK!'		2CW(MNr6   c           	      (
   | j                   yd| _        ddlm} |j                  rt
        j                  d       i |j                         }t        |d      rR|j                  Ft        |j                  t              r|j                  n|j                  j                         }i ||}t        |d      r |j                  |j                  }i d|i|}|j                  }	i }
|	#|	|
d<   |j                  xs |j                  |
d	<   nQ|j                  E|j                  |
d<   |j                  |j                  k(  r| j                   j!                  d
d       | j                   j"                  2 | j                   j$                  d*dt'        j(                  dd      i|
 | j                   j                  j+                  |xs i d       t-        | j                   dd      r9| j                   j/                  d       | j                   j/                  ddd       t'        j(                  dd      }t1               s6|dv r2| j                   j3                  ||t5        d|j6                               | j                   j"                  j9                  d       	 |j;                         | j                   j                  d<   | j@                  jB                  rtE        jF                         5 }|j                  |j                  |j                  k(  r#d| j                   j"                  jH                   n"d| j                   j"                  jJ                   }| j                   jM                  |d t        |d      r|j                  j                         nd| j                   j                  jO                  d      dd!"      }tQ        ||       tS        |      jU                  d      D ]X  }|jW                         s|jY                  |jJ                  d#$      5 }|j[                  |j]                                ddd       Z | j                   j"                  j_                  |d%g&       d'| j                   j"                  j`                   d(}tb        xjd                  d)| z  c_2        ddd       yyy# t<        $ r t
        j                  d       Y |$ r t
        j?                  d       Y 3w xY w# 1 sw Y   xY w# 1 sw Y   yxY w)+u  
        Setup the optional Weights & Biases (*wandb*) integration.

        One can subclass and override this method to customize the setup if needed. Find more information
        [here](https://docs.wandb.ai/guides/integrations/huggingface). You can also override the following environment
        variables:

        Environment:
        - **WANDB_LOG_MODEL** (`str`, *optional*, defaults to `"false"`):
            Whether to log model and checkpoints during training. Can be `"end"`, `"checkpoint"` or `"false"`. If set
            to `"end"`, the model will be uploaded at the end of training. If set to `"checkpoint"`, the checkpoint
            will be uploaded every `args.save_steps` . If set to `"false"`, the model will not be uploaded. Use along
            with [`~transformers.TrainingArguments.load_best_model_at_end`] to upload best model.

            <Deprecated version="5.0">

            Setting `WANDB_LOG_MODEL` as `bool` will be deprecated in version 5 of 🤗 Transformers.

            </Deprecated>
        - **WANDB_WATCH** (`str`, *optional* defaults to `"false"`):
            Can be `"gradients"`, `"all"`, `"parameters"`, or `"false"`. Set to `"all"` to log gradients and
            parameters.
        - **WANDB_PROJECT** (`str`, *optional*, defaults to `"huggingface"`):
            Set this to a custom string to store results in a different project.
        - **WANDB_DISABLED** (`bool`, *optional*, defaults to `False`):
            Whether to disable wandb entirely. Set `WANDB_DISABLED=true` to disable.
        NTr   )ConfigErrorz`Automatic Weights & Biases logging enabled, to disable set os.environ["WANDB_DISABLED"] = "true"r   peft_configr   groupzThe `run_name` is currently set to the same value as `TrainingArguments.output_dir`. If this was not intended, please specify a different run name by setting the `TrainingArguments.run_name` parameter.F)repeatr'  WANDB_PROJECTr  allow_val_changedefine_metrictrain/global_stepr   )step_metric	step_syncWANDB_WATCHr  )allr!  	gradientsd   )loglog_freqtransformers_trainer)codemodel/num_parameterszZCould not log the number of model parameters in Weights & Biases due to an AttributeError.zbA ConfigError was raised whilst setting the number of model parameters in Weights & Biases config.model-r   )r  num_parametersinitial_modelr   r  r-  wbr   r  aliasesz[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>]()
r:   )3r  r  wandb.sdk.lib.config_utilr  r  r.   r  to_dictr3   r   rx   r|   r  rY  run_namer  termwarnr*   rW  r+   r,   r   r   r  r%   watchmaxlogging_steps_labelr  AttributeErrorr/   r  r  r   r   r1  r   Artifactr  r  r   r   is_filenew_filewrite
read_byteslog_artifacturlr   AUTOGENERATED_TRAINER_COMMENT)r  r   rX  r   r   WandbConfigErrorcombined_dictr  r  rY  	init_args_watch_modeltemp_dir
model_namemodel_artifactr  fabadge_markdowns                     r4   setupzWandbCallback.setupA  sx   8 ;;  	N&&KKr /t||~.Muh'ELL,D/9%,,/Mu||SXS_S_SgSgSi A< A= Aum,1B1B1N#// QM;#? Q= Q))JI%$.	&!%)]]%Edoo	'"*$(MM	&!==DOO3KK((C$ )  {{&    IIo}E
 KK%%m&9rD%Q t{{OT:))*=>))#;NZ^)_ 99]G<L)+@b0b!!%\CUM`M`Da!bKKOO""(>"?	=B=Q=Q=S""#9: ))002 Uh !MM1T]]doo5U !!3!3 45%dkkoo&:&:%;< 
 &*[[%9%9'$FMeU]F^ELL,@,@,Bdh.2kk.@.@.D.DE[.\-1" &: &N 4E8D!(^005 999;!/!8!8d!8!K 9r " 89 99 KKOO00,0X--1[[__-@-@,AD # ;;NCS?TT;=U U *u '` " p $ x69 9)U UsD   'R: /DT T S;=A2T:S8S87S8;T TTNc                     | j                   y |j                  }|r(| j                   j                          d| _        d |_        | j                  s | j
                  |||fi | y y NF)r  r  finishr  r  r  )r  r   rX  r  r   r   	hp_searchs          r4   r  zWandbCallback.on_train_begin  sa    ;;//	KK  %D DM  DJJtUE4V4 !r6   r   c           	         | j                   y | j                  j                  r| j                  r|j                  ruddlm} t        j                  |      }d |_	        d |_
         ||||dg      }	t        j                         5 }
|	j                  |
       |j                  slt        | j                   j                         j#                         D ci c]3  \  }}t%        |t&        j(                        r|j+                  d      s||5 c}}nKd|j,                   |j.                  d|j0                  d| j                   j2                  j5                  d      i}d	|d
<   t6        j9                  d       |j:                  |j:                  |j<                  k(  r#d| j                   j>                  j@                   n"d| j                   j>                  jB                   }tE        ||
       | j                   jG                  |d|      }tI        |
      jK                  d      D ]X  }|jM                         s|jO                  |jB                  d      5 }|jQ                  |jS                                d d d        Z | j                   j>                  jU                  |d
g       d d d        y y y y c c}}w # 1 sw Y   xY w# 1 sw Y   y xY w)Nr   Trainerfaker   r   processing_classeval_dataset_rw  ztrain/total_flossr  Tfinal_modelzLogging model artifacts. ...r  r   r  r   r  r  r  )+r  r  r  r  r  r   r  copydeepcopy	deepspeeddeepspeed_pluginr   r   
save_modelload_best_model_at_endr|   r  rE  rx   numbersNumberr   metric_for_best_modelbest_metric
total_flosr   r  r.   r  r  r  r*   r1  r   r  r  r   r   r  r  r  r  r  )r  r   rX  r  r   r  r   r  args_for_fakefake_trainerr  r  r  r-  r  artifactr  r	  s                     r4   r  zWandbCallback.on_train_end  s{   ;;??%%$*;*;@[@[) MM$/M&*M#-1M*""%BRbhaiL ,,. P(''1  66 %))<)<$=$C$C$E Aq%a8cAR 1   : :;<e>O>O+U-=-=.0B0B0F0FG]0^  +/':; -$//1Q T[[__//01!$++//"6"6!78  0x@;;//ZgX`/ah,,S1 5Ayy{%..qvvD.A 5RHHQ\\^45 55 ,,X,O=P P A\*;%25 59P Ps>   	AK	8J7D,K	<K	 J=92K	7K	=KK		Kc                    g d}| j                   y | j                  s| j                  |||       |j                  r|j	                         D ]-  \  }}	||v s|	| j                   j
                  j                  |<   / |j	                         D 	ci c]  \  }}	||vs||	 }
}}	t        |
      }
| j                   j                  i |
d|j                  i       y y c c}	}w )Ntrain_runtimetrain_samples_per_secondtrain_steps_per_second
train_lossr#  r  )
r  r  r  r  rE  r*   r  r[  r  r  r  r   rX  r  r   r  r   single_value_scalarsr  r  non_scalar_logss              r4   r  zWandbCallback.on_log  s     
 ;;  JJtUE*&&

 31,,12DKKOO++A.3 15

^1I]@]q!t^O^*?;OKKOOWW0CUEVEVWX ' _s   CCc                 
   | j                   t        j                  k(  r| j                  r|j                  rt        | j                  j                        j                         D ci c]3  \  }}t        |t        j                        r|j                  d      s||5 }}}| j                  j                  j                  d      |d<   d|j                   }t         j"                  j%                  |j&                  |      }	t(        j+                  d| d       |j,                  |j,                  |j&                  k(  r#d| j                  j.                  j0                   n"d| j                  j.                  j2                   }
| j                  j5                  |
d|      }|j7                  |	       | j                  j9                  |d	t;        |j<                  d
       d|j                   g       y y y y c c}}w )Nr  r  checkpoint- Logging checkpoint artifacts in z. ...r  r   r  epoch_r   checkpoint_global_step_r  )r  r  r  r  r  r|   r  r  rE  rx   r  r   r   r   r  r  r+   r   r   r  r.   r  r  r*   r1  r   r  add_dirr  roundepoch)r  r   rX  r  r   r  r  checkpoint_metadatackpt_dirartifact_pathcheckpoint_namer&  s               r4   on_savezWandbCallback.on_save  s   ??m6664;L;LQVQlQl !!4!45;;=#Aqa0c9J 1# #
 ;?++:L:L:P:PQg:h 67$U%6%6$78HGGLL(CMKK:8*EJK MM)T]]doo-M ++,-dkkoo2234 
 {{++wYl+mH]+KK$$VE%++q,A+B#CG^_d_p_p^qEr"s % % Rm;L6#s   )8G?c                     | j                   y | j                  s | j                  ||fi | |j                  r't	        |      }| j                   j                  |       y y rf   )r  r  r  r  r[  r  r  r   rX  r  r   r   s         r4   
on_predictzWandbCallback.on_predict"  sU    ;;  DJJtU-f-&&"7+GKKOOG$ 'r6   rf   NNr  r  r  r  r  r  r  r   r  r  r<  r?  r:   r6   r4   re  re  $  s:    O0|U|	5*P!2 *PXY*.%r6   re  c                   F    e Zd ZdZd Zd ZddZddefdZddZ	d	 Z
d
 Zy)TrackioCallbacka  
    A [`TrainerCallback`] that logs metrics to Trackio.

    It records training metrics, model (and PEFT) configuration, and GPU memory usage.
    If `nvidia-ml-py` is installed, GPU power consumption is also tracked.

    **Requires**:
    ```bash
    pip install trackio
    ```
    c                 Z    t               }|st        d      |rdd l}|| _        d| _        y )NzLTrackioCallback requires trackio to be installed. Run `pip install trackio`.r   F)r;   r}   r8   _trackior  )r  has_trackior8   s      r4   r  zTrackioCallback.__init__9  s.    *,mnn#DM!r6   c                 
   |j                   rDi |j                         }t        |d      rR|j                  Ft	        |j                  t
              r|j                  n|j                  j                         }i ||}t        |d      r |j                  |j                  }i d|i|}| j                  j                  t        j                  dd      |j                  t        j                  dd      d       | j                  j                  j                  |d	
       	 |j                         | j                  j                  d<   d	| _        yd	| _        y# t        $ r t        j!                  d       Y d	| _        yw xY w)a  
        Setup the optional Trackio integration.

        To customize the setup you can also override the following environment variables:

        Environment:
        - **TRACKIO_PROJECT** (`str`, *optional*, defaults to `"huggingface"`):
            The name of the project (can be an existing project to continue tracking or a new project to start tracking
            from scratch).
        - **TRACKIO_SPACE_ID** (`str`, *optional*, defaults to `None`):
            If set, the project will be logged to a Hugging Face Space instead of a local directory. Should be a
            complete Space name like `"username/reponame"` or `"orgname/reponame"`, or just `"reponame" in which case
            the Space will be created in the currently-logged-in Hugging Face user's namespace. If the Space does not
            exist, it will be created. If the Space already exists, the project will be logged to it.
        r   Nr  TRACKIO_PROJECTr  TRACKIO_SPACE_IDallow)r'  r   space_idresumeTr  r  zQCould not log the number of model parameters in Trackio due to an AttributeError.)r  r  r3   r   rx   r|   r  rE  rW  r+   r,   r  r   r  r  r.   r  r  )r  r   rX  r   r   r  r  r  s           r4   r  zTrackioCallback.setupC  sV     &&.t||~.Muh'ELL,D/9%,,/Mu||SXS_S_SgSgSi A< A= Aum,1B1B1N#// QM;#? Q= QMM		"3]C]]#5t<	   MM  '''Mq?D?S?S?U$$%;< !D " qop qs   #'E FFNc                 H    | j                   s | j                  |||fi | y y rf   r  r  r  r   rX  r  r   r   s         r4   r  zTrackioCallback.on_train_beginn  '      DJJtUE4V4 !r6   r   c                 l    |j                   r(| j                  r| j                  j                          y y y rf   )r  r  rE  r  r  r   rX  r  r   r  r   s          r4   r  zTrackioCallback.on_train_endr  s+    &&4+<+<MM  " ,=&r6   c                    g d}t               rRt        j                  j                         r3t        j                  j	                         }t        j                  j                  |      j                  }	t        j                  j                  |      }
d| d|
dz  d| d|
|	z  i}t        d      r+t        j                  j                  |      }|dz  |d| d<   t        j                         rqt        j                         r]d gt        j                         z  }t        j                  ||       |D ci c]  }|j                         D ]  \  }}||
  }}}}ni }| j                  s| j!                  |||       |j"                  ra|j                         D ci c]  \  }}||vs|| }}}t%        |      }| j&                  j)                  i ||d	|j*                  i       y y c c}}}w c c}}w )
Nr(  zgpu/z/allocated_memoryi   @z/memory_usagepynvmli  z/powerr  )r   r   cudais_availablecurrent_deviceget_device_propertiestotal_memorymemory_allocatedr   
power_drawdistis_initializedget_world_sizeall_gather_objectrE  r  r  r  r[  rE  r  r  )r  r   rX  r  r   r  r   r.  
device_idxrY  rZ  gpu_memory_logspowergathered_logsry  r  r  r/  s                     r4   r  zTrackioCallback.on_logv  s    
 EJJ$;$;$=224J ::;;JGTTL$zz:::F zl"346F'6Rzl-02B\2QO %X.

--j9=BT\$zl& 9:  "t':':'<!%)<)<)> >&&}oF1>"U"UA1779"U41a1a4"U1"U"U O  JJtUE*&&04

^1I]@]q!t^O^*?;OMMllOlEXZ_ZkZklm ' #V _s   ;"G1"G8/G8c                      y rf   r:   r  s        r4   r<  zTrackioCallback.on_save  s    r6   c                     | j                   y | j                  s | j                  ||fi | |j                  r't	        |      }| j                   j                  |       y y rf   )rE  r  r  r  r[  r  r>  s         r4   r?  zTrackioCallback.on_predict  sW    ==   DJJtU-f-&&"7+GMMg& 'r6   rf   r@  rA  r:   r6   r4   rC  rC  ,  s5    
")!V5#!2 #!nF'r6   rC  c                   8    e Zd ZdZd Zd Zd	dZd
dZd Zd Z	y)CometCallbackz_
    A [`TrainerCallback`] that sends the logs to [Comet ML](https://www.comet.com/site/).
    c                     t         du st        du rt        dt         dt         d      d| _        d| _        d | _        y )NFz!CometCallback requires comet-ml>=z- to be installed. Run `pip install comet-ml>=z`.)rC   rD   r}   rF   r  _log_assets_experimentr  s    r4   r  zCometCallback.__init__  s`    %'+Be+K34F3GGt  vH  uI  IK  L  " r6   c                    d| _         t        j                  dd      j                         }|dv rd| _        |j
                  rt        j                  d      }d}d}|@|j                         }|dk(  rd}n(|dk(  rd	}n |d
v r|}n|rt        j                  d|       y|j                  r|t        j                  d|       d}ddl
} |j                  |j                        }	 |j                  |||	      | _        | j                  j                  |d       d|j!                         i}
t#        |d      r+|j$                  |j$                  j!                         }||
d<   t#        |d      r|j&                  |j&                  }||
d<   | j                  j)                  |
ddd       |j                  r8t+        |dd      }t+        |dd      }| j                  j-                  ||       yyy)a  
        Setup the optional Comet integration.

        Environment:
        - **COMET_MODE** (`str`, *optional*, default to `get_or_create`):
            Control whether to create and log to a new Comet experiment or append to an existing experiment.
            It accepts the following values:
                * `get_or_create`: Decides automatically depending if
                  `COMET_EXPERIMENT_KEY` is set and whether an Experiment
                  with that key already exists or not.
                * `create`: Always create a new Comet Experiment.
                * `get`: Always try to append to an Existing Comet Experiment.
                  Requires `COMET_EXPERIMENT_KEY` to be set.
                * `ONLINE`: **deprecated**, used to create an online
                  Experiment. Use `COMET_START_ONLINE=1` instead.
                * `OFFLINE`: **deprecated**, used to created an offline
                  Experiment. Use `COMET_START_ONLINE=0` instead.
                * `DISABLED`: **deprecated**, used to disable Comet logging.
                  Use the `--report_to` flag to control the integrations used
                  for logging result instead.
        - **COMET_PROJECT_NAME** (`str`, *optional*):
            Comet project name for experiments.
        - **COMET_LOG_ASSETS** (`str`, *optional*, defaults to `TRUE`):
            Whether or not to log training assets (tf event logs, checkpoints, etc), to Comet. Can be `TRUE`, or
            `FALSE`.

        For a number of configurable items in the environment, see
        [here](https://www.comet.com/docs/v2/guides/experiment-management/configure-sdk/#explore-comet-configuration-options).
        TCOMET_LOG_ASSETSr^   >   1r_   rA   Nonliner   F)r  get_or_creater;  z:Invalid COMET_MODE env value %r, Comet logging is disabledzjHyperparameter Search is enabled, forcing the creation of new experiments, COMET_MODE value %r  is ignoredr;  r   )r   )rn  r   experiment_configtransformers)	frameworkr   r   r  manual)rr  sourceflatten_nestedrY  trial_params)optimization_idr!  )r  r+   r,   r-   ri  r  lowerr.   r/   r  r   ExperimentConfigr  startrj  !__internal_api__set_model_graph__r  r3   r   r   __internal_api__log_parameters__r   log_optimization)r  r   rX  r   
log_assetscomet_old_moder   rn  r   rp  r{   r  r  rw  optimization_paramss                  r4   r  zCometCallback.setup  s   < !YY17;AAC
&#D&&YY|4NDF)!/!5!5!7!X-!F#y0"F#'II)D#NN#_aop **#NN E&   9 9 9t}} M-x~~V$ZklD>>uP^>_dlln-Fuh'ELL,D$||335#/x um,1B1B1N#//(3}%==.RV >  **")%t"D&-e^T&J#  11/^q1r	 +a 'r6   Nc                 D    | j                   s| j                  |||       y y rf   rN  rO  s         r4   r  zCometCallback.on_train_begin         JJtUE* !r6   c                     | j                   s| j                  |||       |j                  rL| j                  ?t	        |      }| j                  j                  ||j                  |j                  d       y y y )Nrq  stepr7  rr  r  r  r  rj  r[  __internal_api__log_metrics__r  r7  )r  r   rX  r  r   r  r   rewritten_logss           r4   r  zCometCallback.on_log  sq      JJtUE*&&+!-d!3  >>"):):%++Yg ?  , 'r6   c                 X   | j                   r|j                  r| j                  V| j                  du rHt        j                  d       | j                  j                  |j                  dd|j                         |j                  r"| j                  j                          d| _         y y y y )NTz(Logging checkpoints. This may take time.)	recursivelog_file_namer  F)r  r  rj  ri  r.   r  log_asset_folderr  r  r  cleanr  s        r4   r  zCometCallback.on_train_end  s    !<!<+##t+KK JK$$554tRWRcRc 6 
 **  &&($)! + "=r6   c                     | j                   s| j                  ||d        |j                  rL| j                  ?t	        |      }| j                  j                  ||j                  |j                  d       y y y )N)r   rq  r  r  )r  r   rX  r  r   r   rewritten_metricss          r4   r?  zCometCallback.on_predict(  sr      JJtU$J/&&4+;+;+G ,W 5::!(9(9Xf ;  ,H&r6   rf   r@  )
r  r  r  r  r  r  r  r  r  r?  r:   r6   r4   rg  rg    s(     Vsp+*r6   rg  c                   &    e Zd ZdZddZd ZddZy)AzureMLCallbackzh
    A [`TrainerCallback`] that sends the logs to [AzureML](https://pypi.org/project/azureml-sdk/).
    Nc                 <    t               st        d      || _        y )NzPAzureMLCallback requires azureml to be installed. Run `pip install azureml-sdk`.)r[   r}   azureml_run)r  r  s     r4   r  zAzureMLCallback.__init__7  s    #%qrr&r6   c                 n    ddl m} | j                  #|j                  r|j	                         | _        y y y )Nr   Run)azureml.core.runr  r  r  get_context)r  r   rX  r  r   r  s         r4   on_init_endzAzureMLCallback.on_init_end<  s1    (#(C(C"0D )D#r6   c                     | j                   r[|j                  rN|j                         D ]:  \  }}t        |t        t
        f      s| j                   j                  |||       < y y y )N)description)r  r  rE  rx   r  r  r  r  s           r4   r  zAzureMLCallback.on_logB  s]     ; ;

 >1a#u.$$((A1(=> !<r6   rf   )r  r  r  r  r  r  r  r:   r6   r4   r  r  2  s    '
1>r6   r  c                   >    e Zd ZdZd Zd Zd
dZd
dZd Zd Z	d	 Z
y)MLflowCallbackz
    A [`TrainerCallback`] that sends the logs to [MLflow](https://www.mlflow.org/). Can be disabled by setting
    environment variable `DISABLE_MLFLOW_INTEGRATION = TRUE`.
    c                    t               st        d      dd l}|j                  j                  j
                  | _        |j                  j                  j                  | _        d| _	        d| _
        d| _        || _        y )NzIMLflowCallback requires mlflow to be installed. Run `pip install mlflow`.r   F)ra   r}   r`   utils
validationMAX_PARAM_VAL_LENGTH_MAX_PARAM_VAL_LENGTHMAX_PARAMS_TAGS_PER_BATCH_MAX_PARAMS_TAGS_PER_BATCHr  _auto_end_run_log_artifacts_ml_flow)r  r`   s     r4   r  zMLflowCallback.__init__O  sf    "$jkk%+\\%<%<%Q%Q"*0,,*A*A*[*['!"#r6   c           
      
   t        j                  dd      j                         t        v | _        t        j                  dd      j                         t        v | _        t        j                  dd      | _        t        j                  dd      | _        t        j                  dd      j                         t        v | _        t        j                  dd      | _	        t        j                  d	d      | _
        t        j                  j                  | j                  j                        t        j                  j                  d
      k\  | _        t"        j%                  d| j                   d|j&                   d| j
                   d| j                          |j(                  r| j                  j+                         sj| j                  rH| j                  j-                  | j                         t"        j%                  d| j                          nFt"        j%                  d       n0t"        j%                  d| j                  j/                                 | j                  j1                         | j
                  s| j                  r| j                  r%| j                  j3                  | j                         | j                  j5                  |j&                  | j
                         t"        j%                  d| j                  j1                         j6                  j8                          d| _        |j=                         }t?        |d      r,|j@                   |j@                  j=                         }i ||}| j                  rtC        |      n|}tE        |jG                               D ]F  \  }}tI        tK        |            | jL                  kD  s(t"        jO                  d| d| d       ||= H tE        |jG                               }| j                  rg| j                  jQ                         rMtS        | j                        }	|	tI        |      k  r*t"        j%                  dtI        |       d|	 d       |d|	 }tU        dtI        |      | jV                        D ]y  }
| j                   r7| j                  jY                  t[        ||
|
| jV                  z          d       F| j                  jY                  t[        ||
|
| jV                  z                 { t        j                  dd      }|r0t]        j^                  |      }| j                  ja                  |       d| _1        y)a  
        Setup the optional MLflow integration.

        Environment:
        - **HF_MLFLOW_LOG_ARTIFACTS** (`str`, *optional*):
            Whether to use MLflow `.log_artifact()` facility to log artifacts. This only makes sense if logging to a
            remote server, e.g. s3 or GCS. If set to `True` or *1*, will copy each saved checkpoint on each save in
            [`TrainingArguments`]'s `output_dir` to the local or remote artifact storage. Using it without a remote
            storage will just copy the files to your artifact location.
        - **MLFLOW_TRACKING_URI** (`str`, *optional*):
            Whether to store runs at a specific path or remote server. Unset by default, which skips setting the
            tracking URI entirely.
        - **MLFLOW_EXPERIMENT_NAME** (`str`, *optional*, defaults to `None`):
            Whether to use an MLflow experiment_name under which to launch the run. Default to `None` which will point
            to the `Default` experiment in MLflow. Otherwise, it is a case sensitive name of the experiment to be
            activated. If an experiment with this name does not exist, a new experiment with this name is created.
        - **MLFLOW_TAGS** (`str`, *optional*):
            A string dump of a dictionary of key/value pair to be added to the MLflow run as tags. Example:
            `os.environ['MLFLOW_TAGS']='{"release.candidate": "RC1", "release.version": "2.2.0"}'`.
        - **MLFLOW_NESTED_RUN** (`str`, *optional*):
            Whether to use MLflow nested runs. If set to `True` or *1*, will create a nested run inside the current
            run.
        - **MLFLOW_RUN_ID** (`str`, *optional*):
            Allow to reattach to an existing run which can be useful when resuming training from a checkpoint. When
            `MLFLOW_RUN_ID` environment variable is set, `start_run` attempts to resume a run with the specified run ID
            and other parameters are ignored.
        - **MLFLOW_FLATTEN_PARAMS** (`str`, *optional*, defaults to `False`):
            Whether to flatten the parameters dictionary before logging.
        - **MLFLOW_MAX_LOG_PARAMS** (`int`, *optional*):
            Set the maximum number of parameters to log in the run.
        HF_MLFLOW_LOG_ARTIFACTSr^   MLFLOW_NESTED_RUNMLFLOW_TRACKING_URINMLFLOW_EXPERIMENT_NAMEMLFLOW_FLATTEN_PARAMSMLFLOW_RUN_IDMLFLOW_MAX_LOG_PARAMSz2.8.0zMLflow experiment_name=z, run_name=z	, nested=z, tracking_uri=zMLflow tracking URI is set to zdEnvironment variable `MLFLOW_TRACKING_URI` is not provided and therefore will not be explicitly set.)r  nestedzMLflow run started with run_id=Tr   r  z" for key "z" as a parameter. MLflow's log_param() only accepts values no longer than 250 characters so we dropped this attribute. You can use `MLFLOW_FLATTEN_PARAMS` environment variable to flatten the parameters and avoid this message.z.Reducing the number of parameters to log from z to .r   F)synchronousMLFLOW_TAGS)2r+   r,   r-   r$   r  _nested_run_tracking_uri_experiment_name_flatten_params_run_id_max_log_params	packagingr.  parser  r   
_async_logr.   debugr  r  is_tracking_uri_setset_tracking_uriget_tracking_uri
active_runset_experiment	start_runr  rN  r  r  r3   r   r   r   rE  rx  r   r  r/   isdigitr  r   r  
log_paramsr|   jsonrC  set_tagsr  )r  r   rX  r   r  r  r   r   combined_dict_itemsmax_log_paramsr   mlflow_tagss               r4   r  zMLflowCallback.setup\  ss   @ !ii(A7KQQSWkk99%8'BHHJNbbYY'<dC "		*BD I!yy)@'JPPRVjjyy$7!yy)@$G
 $++11$--2K2KLPYPaPaPgPghoPpp%d&;&;%<KV_`d`p`p_q r!//02	
 &&==446%%MM2243E3EFLL#A$BTBTAU!VWLL+
 =dmm>\>\>^=_`a}}'')1T5E5E((MM001F1FG''tGWGW'X>t}}?W?W?Y?^?^?e?e>fgh%)" LLNMuh'ELL,D$||335 A< A= A;?;O;OL7UbM#M$7$7$9: 	,es5z?T%?%??NNCE7+VZU[ \/ / &d+	, #'}':':'<"=##(<(<(D(D(F!$T%9%9!:!C(;$<<LLHM`IaHbbfgufvvwx +>o~*N'1c"568W8WX q??MM,,0Q9X9X5XYZhm -  MM,,T2Ea!dNmNmJm2n-opq ))M48K"jj5&&{3 r6   Nc                 D    | j                   s| j                  |||       y y rf   rN  rO  s         r4   r  zMLflowCallback.on_train_begin  r  r6   c           
         | j                   s| j                  |||       |j                  r4i }|j                         D ]  \  }}	t	        |	t
        t        f      r|	||<   "t	        |	t        j                        r'|	j                         dk(  r|	j                         ||<   ct        j                  d|	 dt        |	       d| d        |j                         D 	ci c]  \  }}	t        j                  dd|      |	 }
}}	| j                   r)| j"                  j%                  |
|j&                  d	       y | j"                  j%                  |
|j&                  
       y y c c}	}w )Nr   r  r  r  zc" as a metric. MLflow's log_metric() only accepts float and int types so we dropped this attribute.z[^0-9A-Za-z_\-\.\ :/]r  F)r   r  r  )r   r  )r  r  r  rE  rx   r  r  r   Tensornumelitemr.   r/   r  resubr  r  log_metricsr  )r  r   rX  r  r  r   r   r   r  r  sanitized_metricss              r4   r  zMLflowCallback.on_log  sE     JJtUE*&&G

 	1a#u.!"GAJ5<<0QWWY!^!"GAJNNCA3jQUVWQXPYYcdecf go o	 ZaYfYfYh iQUQRTU(@#q!I1!L i i))2C%J[J[in)o))2C%J[J[)\' ' !js   "E"c                     | j                   rP|j                  rC| j                  r6| j                  j	                         r| j                  j                          y y y y y rf   )r  r  r  r  r  end_runr  s        r4   r  zMLflowCallback.on_train_end  sL    !<!<!!dmm&>&>&@%%' 'A! "=r6   c                    | j                   r|j                  r| j                  rd|j                   }t        j
                  j                  |j                  |      }t        j                  d| d       | j                  j                  j                  |d|i| j                  j                  j                                y y y y )Nr1  r2  z. This may take time.
model_path)	artifactspython_model)r  r  r  r  r+   r   r   r  r.   r  r  pyfunc	log_modelPythonModelr  r   rX  r  r   r9  r:  s          r4   r<  zMLflowCallback.on_save  s    !<!<ATAT$U%6%6$78HGGLL(CMKK:8*DYZ[MM  **'7!]]11==? + 	 BU!<r6   c                     | j                   rWt        t        | j                  dd             r6| j                  j	                         | j                  j                          y y y y )Nr  )r  callabler   r  r  r  r  s    r4   __del__zMLflowCallback.__del__  sU     dCD((*6MM!!# 7 E r6   rf   )r  r  r  r  r  r  r  r  r  r<  r  r:   r6   r4   r  r  I  s-    
i!V+]0(
	$r6   r  c                   2     e Zd ZdZ fdZ fdZd Z xZS )DagsHubCallbackzh
    A [`TrainerCallback`] that logs to [DagsHub](https://dagshub.com/). Extends [`MLflowCallback`]
    c                 f    t         |           t               st        d      ddlm} || _        y )NzLDagsHubCallback requires dagshub to be installed. Run `pip install dagshub`.r   )Repo)superr  rd   rb  dagshub.uploadr  )r  r  r~   s     r4   r  zDagsHubCallback.__init__  s*    #%lmm'	r6   c                 l   t        j                  dd      j                         t        v | _        t        j                  d      xs d| _        t        j                  d      | _        | j                  | j                  j                  t         j                        d   | j                  j                  t         j                        d   j                  d      d	   t        j                  d
      xs d      | _
        t        d      | _        | j                  t        d      t        | <  |i | y)z
        Setup the DagsHub's Logging integration.

        Environment:
        - **HF_DAGSHUB_LOG_ARTIFACTS** (`str`, *optional*):
                Whether to save the data and model artifacts for the experiment. Default to `False`.
        HF_DAGSHUB_LOG_ARTIFACTSr^   HF_DAGSHUB_MODEL_NAMEmainr  r  r   BRANCH)ownerr   branchr  NzpDagsHubCallback requires the `MLFLOW_TRACKING_URI` environment variable to be set. Did you run `dagshub.init()`?)r+   r,   r-   r$   log_artifactsr   remoter  splitseprepor   r   r}   r  r  )r  r   r   r~   s      r4   r  zDagsHubCallback.setup  s      YY'A7KQQSWkkII56@&	ii 56II++##BFF+B/""266*2.44S9!<99X&0&  
	
 %	;;% 
 	t&v&r6   c                 j   | j                   rt        | dd       rRt        j                  | j                  j
                  t        j                  j                  |j                  d             | j                  j                  t        | j                              j                  |j                         y y )Ntrain_dataloaderz
dataset.pt)r  r   r   saver  datasetr+   r   r   r  r  	directoryr   r5  r  s        r4   r  zDagsHubCallback.on_train_end'  st    t/6

40088"'',,tXd:efIIDII/77H	 r6   )r  r  r  r  r  r  r  __classcell__r~   s   @r4   r  r    s    '6Ir6   r  c                        e Zd Z fdZ xZS )NeptuneMissingConfigurationc                 $    t         |   d       y )NaA  
        ------ Unsupported ---- We were not able to create new runs. You provided a custom Neptune run to
        `NeptuneCallback` with the `run` argument. For the integration to work fully, provide your `api_token` and
        `project` by saving them as environment variables or passing them to the callback.
        )r  r  )r  r~   s    r4   r  z$NeptuneMissingConfiguration.__init__0  s    	
r6   )r  r  r  r  r  r  s   @r4   r  r  /  s    
 
r6   r  c                   0   e Zd ZdZdZdZdZdZdZdhZ	dddd	dd
ddde
e   de
e   de
e   dedede
e   fdZd Zd Zd Zd Zd Zed        Zed        Zd Zd Zd Zd Zdedefd Zd! Zd*d"Zd# Zd$ Zd% Zd*d&Z e!d'        Z"d*d(e
e#ee$f      fd)Z%y)+NeptuneCallbacka  TrainerCallback that sends the logs to [Neptune](https://app.neptune.ai).

    Args:
        api_token (`str`, *optional*): Neptune API token obtained upon registration.
            You can leave this argument out if you have saved your token to the `NEPTUNE_API_TOKEN` environment
            variable (strongly recommended). See full setup instructions in the
            [docs](https://docs.neptune.ai/setup/installation).
        project (`str`, *optional*): Name of an existing Neptune project, in the form "workspace-name/project-name".
            You can find and copy the name in Neptune from the project settings -> Properties. If None (default), the
            value of the `NEPTUNE_PROJECT` environment variable is used.
        name (`str`, *optional*): Custom name for the run.
        base_namespace (`str`, *optional*, defaults to "finetuning"): In the Neptune run, the root namespace
            that will contain all of the metadata logged by the callback.
        log_parameters (`bool`, *optional*, defaults to `True`):
            If True, logs all Trainer arguments and model parameters provided by the Trainer.
        log_checkpoints (`str`, *optional*): If "same", uploads checkpoints whenever they are saved by the Trainer.
            If "last", uploads only the most recently saved checkpoint. If "best", uploads the best checkpoint (among
            the ones saved by the Trainer). If `None`, does not upload checkpoints.
        run (`Run`, *optional*): Pass a Neptune run object if you want to continue logging to an existing run.
            Read more about resuming runs in the [docs](https://docs.neptune.ai/logging/to_existing_object).
        **neptune_run_kwargs (*optional*):
            Additional keyword arguments to be passed directly to the
            [`neptune.init_run()`](https://docs.neptune.ai/api/neptune#init_run) function when a new run is created.

    For instructions and examples, see the [Transformers integration
    guide](https://docs.neptune.ai/integrations/transformers) in the Neptune documentation.
    z%source_code/integrations/transformersmodel_parametersry   rv  trainer_parametersztrain/epochN
finetuningT)	api_tokenr'  r   base_namespacer*   log_parameterslog_checkpointsr  r'  r   r  r  r  c                   t               st        d      	 ddlm}	 ddlm}
  |
d|t        t        d       f        |
d|t        t        d       f        |
d|t        t        d       f        |
d|t                |
d	||	t        d       f        |
d
|t                |
d|t        t        d       f       || _        || _        || _        || _        d | _        d| _        d | _        d| _        |||d|| _        d | _        | j                  d u| _        d | _        | j                  dv rd| j                   | _        d| _        y d| _        d| _        y # t        $ r ddlm}
 ddlm}	 Y Lw xY w)NzwNeptuneCallback requires the Neptune client library to be installed. To install the library, run `pip install neptune`.r   r  )verify_typer  r'  r   r  r*   r  r  F)r  r'  r   >   r   lastzcheckpoints/Tcheckpoints)rh   
ValueErrorr   r  neptune.internal.utilsr	  rb  neptune.new.internal.utils#neptune.new.metadata_containers.runr   r  r  _base_namespace_path_log_parameters_log_checkpoints_initial_run_run_is_monitoring_runr  _force_reset_monitoring_run_init_run_kwargs_volatile_checkpoints_dir_should_upload_checkpoint_recent_checkpoint_path_target_checkpoints_namespace*_should_clean_recently_uploaded_checkpoint)r  r  r'  r   r  r*   r  r  neptune_run_kwargsr  r	  s              r4   r  zNeptuneCallback.__init__^  s    $%E 
	@#:
 	KS$t*,=>Iwd4j(9:FD3T
"34$nc:E3d4j 12$nd;%d4j8IJ$2!- /+.	"'+0(.7GUY p]o p)-&)-)>)>d)J&'+$  $443?@U@U?V1WD.>BD;1>D.>CD;A  	@>??	@s   E E0/E0c                 d    | j                   r$| j                   j                          | ` d | _         y y rf   )r  stopr  s    r4   _stop_run_if_existsz#NeptuneCallback._stop_run_if_exists  s(    99IINN	DI r6   c                 f   	 ddl m} ddlm}m} | j                          	 |j                         }|j                  | j                          |di || _        | j                  d   j                         | _        y # t
        $ r ddlm} ddlm}m} Y w xY w# ||f$ r}t               |d }~ww xY w)Nr   )init_run)NeptuneMissingApiTokenException"NeptuneMissingProjectNameExceptionsys/idr:   )r   r"  neptune.exceptionsr#  r$  rb  neptune.newneptune.new.exceptionsr   r  r   r  r  r@  r  r  )r  additional_neptune_kwargsr"  r#  r$  
run_paramses          r4   _initialize_runzNeptuneCallback._initialize_run  s    	s(n
 	  "	72779Jd334 .:.DI99X.446DL  	s,rr	s 34ST 	7-/Q6	7s)   A< AB <BBB0 B++B0c                     | j                   | _        d| _        | j                  d   j                         | _        d | _         y )NTr%  )r  r  r  r@  r  r  s    r4   _use_initial_runz NeptuneCallback._use_initial_run  s8    %%	"&yy*002 r6   c                 .   | j                   | j                          y | j                  s| j                  ry | j                  r<| j                  s0| j                  s$| j                  | j                         d| _        y | j                          d| _        y )N)with_idTF)r  r.  r  r  r  r,  r  r  s    r4   _ensure_run_with_monitoringz+NeptuneCallback._ensure_run_with_monitoring  sv    (!!#338O8Oyy!8!8AaAa$$T\\$:*.'$$&380r6   c                     | j                   | j                          y | j                  s(| j                  | j                  dddd       d| _        y y )NF)r0  capture_stdoutcapture_stderrcapture_hardware_metricscapture_traceback)r  r.  r  r,  r  r  r  s    r4   '_ensure_at_least_run_without_monitoringz7NeptuneCallback._ensure_at_least_run_without_monitoring  sV    (!!#99$$ LL#(#(-2&+ %  +0' r6   c                 R    | j                   | j                          | j                   S rf   )r  r7  r  s    r4   r*   zNeptuneCallback.run  s"    9988:yyr6   c                 4    | j                   | j                     S rf   )r*   r  r  s    r4   _metadata_namespacez#NeptuneCallback._metadata_namespace  s    xx1122r6   c                 F    t         | j                  t        j                  <   y rf   )r.  r*   r   integration_version_keyr  s    r4   _log_integration_versionz(NeptuneCallback._log_integration_version  s    <C889r6   c                 Z    |j                         | j                  t        j                  <   y rf   )to_sanitized_dictr:  r   trainer_parameters_key)r  r   s     r4   _log_trainer_parametersz'NeptuneCallback._log_trainer_parameters  s!    KOKaKaKc  !G!GHr6   c                     ddl m} |rVt        |d      rI|j                  < ||j                  j	                               | j
                  t        j                  <   y y y y )Nr   )stringify_unsupportedr   )neptune.utilsrC  r3   r   r  r:  r   model_parameters_key)r  r   rC  s      r4   _log_model_parametersz%NeptuneCallback._log_model_parameters  sQ    7WUH-%,,2JMb$$&ND$$_%I%IJ 3K-5r6   c                     |r3t        |d      r'|j                  | j                  t        j                  <   |rBt        |d      r5|j
                  (|j
                  | j                  t        j                  <   y y y y )NrY  rv  )r3   rY  r:  r   trial_name_keyrv  trial_params_key)r  rX  s     r4   "_log_hyper_param_search_parametersz2NeptuneCallback._log_hyper_param_search_parameters  sh    WUL1GLGWGWD$$_%C%CDWUN38J8J8VINI[I[D$$_%E%EF 9W35r6   source_directoryr   c                    t         j                  j                  ||      x}}| j                  t         j                  j                  | j                  |      }	 |j	                  dd      j                  t         j                  j                        }t         j                  j                  ||      }t        j                  ||       |}| j                  | j                     j                  |       | j                  r>| j                   2| j                  | j                     j#                  | j                          || _        y # t        $ r#}t        j                  d| d       Y d }~d }~ww xY w)Nz..r(   zONeptuneCallback was unable to made a copy of checkpoint due to I/O exception: 'z'. Could fail trying to upload.)r+   r   r   r  replacelstripr  shutilcopytreeOSErrorr.   r/   r:  r  upload_filesr  r  delete_files)	r  rK  r   target_pathrelative_pathconsistent_checkpoint_path	cpkt_path	copy_pathr+  s	            r4   _log_model_checkpointz%NeptuneCallback._log_model_checkpoint  s1   &(ggll3CZ&PPm))5)+d6T6TV`)a&
)11$;BB277;;O	GGLL)CYO	y98 	  !C!CDQQR]^::t?[?[?g$$T%G%GHUUVZVrVrs'4$  efgeh i3 3 s   A1E 	E1E,,E1c                     d | _         | j                  r;|j                  s|j                  #t	        j
                         j                  | _         | j                  dk(  r|j                  st        d      y y )Nr   zWTo save the best model checkpoint, the load_best_model_at_end argument must be enabled.)	r  r  overwrite_output_dirsave_total_limitr   r   r   r  r  r  s        r4   r  zNeptuneCallback.on_init_end  sh    )-&  d&?&?4CXCXCd-5-H-H-J-O-OD*  F*43N3Nvww 4O*r6   c                    |j                   sy | j                          d| _        | j                          | j                  r"| j                  |       | j                  |       |j                  r| j                  |       y y )NT)	r  r1  r  r=  r  rA  rF  r  rJ  rO  s         r4   r  zNeptuneCallback.on_train_begin  so    **((*+/(%%'((.&&u-&&33E: 'r6   c                 $    | j                          y rf   )r   r  s        r4   r  zNeptuneCallback.on_train_end  s      "r6   c                 ~    | j                   !t        j                  | j                   d       | j                          y )NT)ignore_errors)r  rO  rmtreer   r  s    r4   r  zNeptuneCallback.__del__   s.    ))5MM$88M  "r6   c                 p    | j                   r*| j                  |j                  d|j                          y y )Nr1  )r  rY  r  r  r  s        r4   r<  zNeptuneCallback.on_save&  s2    ))&&t+eFWFWEX8YZ *r6   c                 2   | j                   dk(  r|j                  }|j                  d      sd| }|j                  |      }|j                  rt
        j                  nt
        j                  }|j                  d u xs  |||j                        | _	        y y )Nr   ru  )
r  r!  r   r  greater_is_betternpgreaterlessr"  r  )	r  r   rX  r  r   r   best_metric_namemetric_valueoperators	            r4   on_evaluatezNeptuneCallback.on_evaluate*  s      F*#99#..w7%*+;*<#= ";;'78L%)%;%;rzzH-2->->$-F-s(S_afararJsD* +r6   c                     |j                   j                  D ]  }t        ||       s|j                  c S  t	        d      )Nz6The trainer doesn't have a NeptuneCallback configured.)rc  rd  rx   r*   	Exception)r   r   rm  s      r4   get_runzNeptuneCallback.get_run6  s?    00:: 	$H(C(||#	$ PQQr6   r  c                 ,   |j                   sy |t        |      j                         D ]h  \  }}t        |t        t
        f      s|t        j                  v r|| j                  |<   ?| j                  |   j                  ||j                         j y y )Nr  )r  r[  rE  rx   r  r  r   flat_metricsr:  r  r  )r  r   rX  r  r  r   r   r   s           r4   r  zNeptuneCallback.on_log>  s    **+D1779 Zeec5\2;;;9>006006::5uGXGX:YZ r6   rf   )&r  r  r  r  r<  rE  rH  rI  r@  rq  r
   r   r  r  r   r,  r.  r1  r7  r  r*   r:  r=  rA  rF  rJ  rY  r  r  r  r  r<  rk  r  rn  r|   r  r  r:   r6   r4   r   r   :  s\   8 F-N%1!?L
 $(!%"*#)-5D C=5D #	5D
 sm5D 5D 5D "#5Dn7$!90  
 3 3Dd\5c 5s 50x;##[
t R R
Z$sEz:J1K 
Zr6   r   c                   *    e Zd ZdZd Zd ZddZd Zy)CodeCarbonCallbackzI
    A [`TrainerCallback`] that tracks the CO2 emission of training.
    c                     t               st        d      t        j                  j                  rt        d      dd l}|| _        d | _        y )NzWCodeCarbonCallback requires `codecarbon` to be installed. Run `pip install codecarbon`.aZ  CodeCarbonCallback requires `codecarbon` package, which is not compatible with AMD ROCm (https://github.com/mlco2/codecarbon/pull/490). When using the Trainer, please specify the `report_to` argument (https://huggingface.co/docs/transformers/v4.39.3/en/main_classes/trainer#transformers.TrainingArguments.report_to) to disable CodeCarbonCallback.r   )rk   r}   r   r.  hiprj   _codecarbontracker)r  rj   s     r4   r  zCodeCarbonCallback.__init__P  sN    &(i  ]] m  	%r6   c                     | j                   9|j                  r,| j                  j                  |j                        | _         y y y )N)r  )rw  is_local_process_zerorv  EmissionsTrackerr  r  s        r4   r  zCodeCarbonCallback.on_init_end_  s<    <<E$?$?++<<<XDL %@r6   Nc                 l    | j                   r(|j                  r| j                   j                          y y y rf   )rw  ry  rz  rO  s         r4   r  z!CodeCarbonCallback.on_train_begind  s(    <<E77LL  8<r6   c                 l    | j                   r(|j                  r| j                   j                          y y y rf   )rw  ry  r  r  s        r4   r  zCodeCarbonCallback.on_train_endh  s(    <<E77LL 8<r6   rf   )r  r  r  r  r  r  r  r  r:   r6   r4   rs  rs  K  s    Y
! r6   rs  c                   j    e Zd ZdZdZdZdZdZdZdZ	dZ
d	Zd	Zd
ZdZd Zd ZddZd ZddZd Zd Zy)ClearMLCallbacka  
    A [`TrainerCallback`] that sends the logs to [ClearML](https://clear.ml/).

    Environment:
    - **CLEARML_PROJECT** (`str`, *optional*, defaults to `HuggingFace Transformers`):
        ClearML project name.
    - **CLEARML_TASK** (`str`, *optional*, defaults to `Trainer`):
        ClearML task name.
    - **CLEARML_LOG_MODEL** (`bool`, *optional*, defaults to `False`):
        Whether to log models as artifacts during training.
    r(   TransformerszModel Configuration_ignore_hparams_ui_overrides_"_ignore_model_config_ui_overrides_z%The configuration of model number {}.zNote that, when cloning this task and running it remotely, the configuration might be applied to another model instead of this one. To avoid this, initialize the task externally by calling `Task.init` before the `ClearMLCallback` is instantiated.r   FNc                 ~    t               rdd l}|| _        nt        d      d| _        d | _        d| _        g | _        y )Nr   zNClearMLCallback requires 'clearml' to be installed. Run `pip install clearml`.F)r?   r>   _clearmlr}   r  _clearml_taskr  _checkpoints_saved)r  r>   s     r4   r  zClearMLCallback.__init__  s=    !#DMopp!!"$r6   c                 Z   | j                   y | j                  ry t        xj                  dz  c_        t        xj                  dz  c_        t        j                  dk(  rdndt        t        j                        z   t        _        |j                  rt        j                  d       | j                  t        j                  _| j                   j                  j                         r$| j                   j                  j                         rdt        _        ndt        _        | j                   j                  j                         r| j                   j                  j                         r| j                   j                  j                         | _
        t        j                   dt        j"                  sdnd	      j%                         t'        j(                  d	h      v | _        t        j                  d
       n| j                   j                  j-                  t        j                   dd      t        j                   dd      dddd      | _
        t        j                   dd	      j%                         t'        j(                  d	h      v | _        dt        _        t        j                  d       d| _        t        j.                  t        j                  z   }|dz   t        j0                  z   }| j                   j                  j                         r6| j3                  ||       | j                  j5                  |dt6        d       nl| j                  j9                  |dd      s| j                  j;                  ||       n1| j3                  |t        j.                  t        j                  z          t=        |dd       |dz   t        j>                  z   }t        j@                  jC                  t        j                        }	t        j                  t        j                  k7  r|	dt        jD                  z   z  }	| j                   j                  j                         ry| j                  j5                  |dt6        d       | j                  jG                  t        jH                  t        j                  z   |jJ                  jM                         |	       y | j                  j9                  |dd      sY|jJ                  jO                  | j                  jQ                  t        jH                  t        j                  z               |_%        y | j                  jG                  t        jH                  t        j                  z   |jJ                  jM                         |	       y y y )Nr   r(   r  z"Automatic ClearML logging enabled.FTCLEARML_LOG_MODELr^   r_   z)External ClearML Task has been connected.CLEARML_PROJECTzHuggingFace TransformersCLEARML_TASKr  )rJ   pytorch)project_name	task_nameauto_connect_frameworks
output_uriz"ClearML Task has been initialized./zIf True, ignore Transformers hyperparameters overrides done in the UI/backend when running remotely. Otherwise, the overrides will be applied when running remotely)r   r   
value_typer  )defaultcastr    zIf True, ignore Transformers model configuration overrides done in the UI/backend when running remotely. Otherwise, the overrides will be applied when running remotely)r   config_dictr  ))r  r  r~  _train_run_counter_model_connect_counterr   
log_suffixr  r.   r  r  _should_close_on_train_endTaskrunning_locallycurrent_taskr+   r,   _task_created_in_callbackr-   r$   unionr  rW  _hparams_section_ignore_hparams_overrides_copy_training_args_as_hparamsset_parameterr  get_parameterconnectr   _ignoge_model_config_overrides_model_config_descriptionr  _model_config_description_noteset_configuration_object_model_config_sectionr   r  	from_dict get_configuration_object_as_dict)
r  r   rX  r   r  r   suffixed_hparams_sectionignore_hparams_config_sectionignore_model_config_section configuration_object_descriptions
             r4   r  zClearMLCallback.setup  s   == **a/*..!3.!449BsSIkIkEl?l 	" &&KK<=!!)"==E==--==?4==CUCUCbCbCdEJBEIB ==%%557DMM<N<N<[<[<])-););)H)H)JD&&(ii+'6'P'PV\' eg!5!;!;VH!E'FDO KK KL)-););)@)@%'YY/@B\%]"$))NI"F@ERW0X#'	 *A *D& ')ii0CV&L&R&R&TXlXrXrY 'DO AEO=KK DE$(!'6'G'G/JdJd'd$,Ds,J_MvMv,v)}}!!11333D:RS""006#r 1  ''556S]ahl5m""**41IJ33/::_=W=WW uh-9,s2_5c5cc , 4C3\3\3c3c#::40 #99_=_=__4o>l>l8ll4==%%557&&448"#'v 5  &&??,BB_E_E__$)LL$8$8$:$D @ 
 ++99:U_cjn9o#(<<#9#9**KK+AAOD^D^^$EL &&??,BB_E_E__$)LL$8$8$:$D @ ? :i 'r6   c                     | j                   y g | _        |j                  rd| _        | j                  s | j                  ||||fi | y y r  )r  r  r  r  r  rR  s          r4   r  zClearMLCallback.on_train_begin  sP    == "$&& %D  DJJtUE+;FvF !r6   c                 p    t         j                  r&| j                  j                          dt         _        y y )Nr   )r~  r  r  r  r  r  s        r4   r  zClearMLCallback.on_train_end  s*    55$$&12O. 6r6   c           
         | j                   y | j                  s | j                  ||||fi | |j                  rd}t	        |      }	d}
t	        |
      }g d}|j                         D ]  \  }}t        |t        t        f      rF||v r=| j                  j                         j                  |t        j                  z   |       _|j                  |      rL| j                  j                         j                  dt        j                  z   ||	d  ||j                          |j                  |
      rM| j                  j                         j                  dt        j                  z   ||d  ||j                          | j                  j                         j                  dt        j                  z   |||j                          dt"        j%                  d	| d
t'        |       d| d        y y )Nru  rv  )r)  r*  r+  r,  r#  r7  r(  eval)titleseriesr   	iterationtestr   r  r  r  zn" as a scalar. This invocation of ClearML logger's  report_scalar() is incorrect so we dropped this attribute.)r  r  r  r  rx  rE  rx   r  r  r  
get_loggerreport_single_valuer~  r  r   report_scalarr  r.   r/   r  )r  r   rX  r  r   r  r  r   r{  r|  r}  r~  r.  r  r  s                  r4   r  zClearMLCallback.on_log  s   ==   DJJtUE+;FvF&&!K!+.O!K!+.O$  

 !1a#u.00**557KK!"_%?%?!?q L  k2**557EE"(?+E+E"E#$_%5#6"#&+&7&7	 F  k2**557EE"(?+E+E"E#$_%5#6"#&+&7&7	 F  **557EE")O,F,F"F#$"#&+&7&7	 F  NN3ja	A3 ?EE9! 'r6   c                    | j                   r| j                  r|j                  rd|j                   }t        j
                  j                  |j                  |      }|t        j                  z   }t        j                  d| d       | j                  j                  | j                  |      }|j                  | j                  |       |j                  |||j                  d       | j                   j#                  |       |j$                  r|j$                  t'        | j                         k  r	 | j                  j(                  j*                  j-                  | j                   d   ddd	       | j                   dd  | _        |j$                  r$|j$                  t'        | j                         k  ry y y y y y y # t.        $ r<}	t        j1                  d
| j                   d   j2                   d|	        Y d }	~	y d }	~	ww xY w)Nr1  zLogging checkpoint artifact `z`. This may take some time.)taskr   F)weights_pathtarget_filenamer  auto_delete_filer   T)delete_weights_fileforceraise_on_errorszCould not remove checkpoint `z5` after going over the `save_total_limit`. Error is: r   )r  r  r  r  r+   r   r   r  r~  r  r.   r  r  OutputModelr  update_weights_packager  rr  r\  rx  r   Modelremoverm  r/   r   )
r  r   rX  r  r   r9  r:  r   output_modelr+  s
             r4   r<  zClearMLCallback.on_save@  s   ??t11e6Q6Q$U%6%6$78HGGLL(CMo888DKK7v=XYZ==44$:L:LSW4XL  d&8&8t D//* (++!&	 0  ##**<8''D,A,ACH_H_D`,`MM''--44//2,0"(,	 5  +/*A*A!"*E' ''D,A,ACH_H_D`,`',`' 7R1?, ! NN78O8OPQ8R8W8W7X  YN  OP  NQ  R 	s   :A G 	H	2HH	c                    t        |      D ci c]J  }|j                  r<|j                  j                  d      s!|j                  t	        ||j                        L }}| j
                  j                  j                  j                  |      j                         D ci c]  \  }}t        |      | }}}| j                  j                  j                  ||       y c c}w c c}}w )N_token)prefix)r   rW  r   endswithr   r  	utilitiesproxy_objectflatten_dictionaryrE  r   r  
_argumentscopy_from_dict)r  training_argsr  fieldas_dictr  r  	flat_dicts           r4   r  z.ClearMLCallback._copy_training_args_as_hparams^  s      .
zz%**"5"5h"? JJuzz::
 

 ,0==+B+B+O+O+b+bcj+k+q+q+st41aSVQYt	t%%44Yv4N

 us   AC C%r@  )NNN)r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r<  r  r:   r6   r4   r~  r~  m  sy    
 J%1 ?%I" G	9 #  %!%%aFG3
3jF<Or6   r~  c                   :     e Zd ZdZddedef fdZd Zd Z xZS )FlyteCallbacka^  A [`TrainerCallback`] that sends the logs to [Flyte](https://flyte.org/).
    NOTE: This callback only works within a Flyte task.

    Args:
        save_log_history (`bool`, *optional*, defaults to `True`):
            When set to True, the training logs are saved as a Flyte Deck.

        sync_checkpoints (`bool`, *optional*, defaults to `True`):
            When set to True, checkpoints are synced with Flyte and can be used to resume training in the case of an
            interruption.

    Example:

    ```python
    # Note: This example skips over some setup steps for brevity.
    from flytekit import current_context, task


    @task
    def train_hf_transformer():
        cp = current_context().checkpoint
        trainer = Trainer(..., callbacks=[FlyteCallback()])
        output = trainer.train(resume_from_checkpoint=cp.restore())
    ```
    save_log_historysync_checkpointsc                     t         |           t               st        d      t	               r
t               st        j                  d       d}ddlm	}  |       j                  | _        || _        || _        y )NzLFlyteCallback requires flytekit to be installed. Run `pip install flytekit`.zSyncing log history requires both flytekitplugins-deck-standard and pandas to be installed. Run `pip install flytekitplugins-deck-standard pandas` to enable this feature.Fr   )current_context)r  r  rn   rb  rp   r   r.   r/   rm   r  r   cpr  r  )r  r  r  r  r~   s       r4   r  zFlyteCallback.__init__  si    $&lmm/19L9NNNa  %,!#.. 0 0r6   c                    | j                   r{|j                  rnd|j                   }t        j                  j                  |j                  |      }t        j                  d| d       | j                  j                  |       y y y )Nr1  zSyncing checkpoint in z to Flyte. This may take time.)r  r  r  r+   r   r   r  r.   r  r  r  r  s          r4   r<  zFlyteCallback.on_save  sn      U%@%@$U%6%6$78HGGLL(CMKK0
:XYZGGLL' &A r6   c                     | j                   rIdd l}ddlm} ddlm} |j                  |j                        } |d |       j                  |             y y )Nr   )Deck)TableRendererzLog History)	r  pandasrm   r  flytekitplugins.deck.rendererr  	DataFramelog_historyto_html)	r  r   rX  r  r   pdr  r  log_history_dfs	            r4   r  zFlyteCallback.on_train_end  sD      %C\\%*;*;<N 7 7 GH !r6   )TT)	r  r  r  r  r  r  r<  r  r  r  s   @r4   r  r  h  s&    41 1 1$(Ir6   r  c                   d    e Zd ZdZ	 	 ddee   deeed   ef      fdZ	d Z
ddZdd	Zd
 Zd Zy)DVCLiveCallbackaW  
    A [`TrainerCallback`] that sends the logs to [DVCLive](https://www.dvc.org/doc/dvclive).

    Use the environment variables below in `setup` to configure the integration. To customize this callback beyond
    those environment variables, see [here](https://dvc.org/doc/dvclive/ml-frameworks/huggingface).

    Args:
        live (`dvclive.Live`, *optional*, defaults to `None`):
            Optional Live instance. If None, a new instance will be created using **kwargs.
        log_model (Union[Literal["all"], bool], *optional*, defaults to `None`):
            Whether to use `dvclive.Live.log_artifact()` to log checkpoints created by [`Trainer`]. If set to `True`,
            the final checkpoint is logged at the end of training. If set to `"all"`, the entire
            [`TrainingArguments`]'s `output_dir` is logged at each checkpoint.
    Nliver  r  c                 z   t               st        d      ddlm} d| _        d | _        t        ||      r|| _        n|t        d|j                   d      || _        | j                  Pt        j                  dd      }|j                         t        v rd	| _        y |j                         d
k(  rd
| _        y y y )NzLDVCLiveCallback requires dvclive to be installed. Run `pip install dvclive`.r   LiveFzFound class z  for live, expected dvclive.LiveHF_DVCLIVE_LOG_MODELr^   Tr  )rs   r}   rr   r  r  r  rx   r~   r  r+   r,   r-   r$   rx  )r  r  r  r   r  log_model_envs         r4   r  zDVCLiveCallback.__init__  s     $%mnn !	dD!DIdnn-==]^__#??"II&<gFM""$(<<"&$$&%/"' 0	 #r6   c                     ddl m} d| _        |j                  rB| j                  s |       | _        | j                  j                  |j                                yy)a@  
        Setup the optional DVCLive integration. To customize this callback beyond the environment variables below, see
        [here](https://dvc.org/doc/dvclive/ml-frameworks/huggingface).

        Environment:
        - **HF_DVCLIVE_LOG_MODEL** (`str`, *optional*):
            Whether to use `dvclive.Live.log_artifact()` to log checkpoints created by [`Trainer`]. If set to `True` or
            *1*, the final checkpoint is logged at the end of training. If set to `all`, the entire
            [`TrainingArguments`]'s `output_dir` is logged at each checkpoint.
        r   r  TN)rr   r  r  r  r  r  r  )r  r   rX  r   r  s        r4   r  zDVCLiveCallback.setup  sE     	! &&99 F	II  0 'r6   c                 D    | j                   s| j                  |||       y y rf   rN  rO  s         r4   r  zDVCLiveCallback.on_train_begin  r  r6   c           
         | j                   s| j                  |||       |j                  rddlm} ddlm} |j                         D ]b  \  }	}
|j                  |
      r$| j                  j                   ||	d      |
       ;t        j                  d|
 dt        |
       d|	 d       d | j                  j                          y y )	Nr   )Metric)standardize_metric_namezdvclive.huggingfacer  r  r  zh" as a scalar. This invocation of DVCLive's Live.log_metric() is incorrect so we dropped this attribute.)r  r  r  dvclive.plotsr  dvclive.utilsr  rE  	could_logr  r6  r.   r/   r  	next_step)r  r   rX  r  r   r  r   r  r  rK  r   s              r4   r  zDVCLiveCallback.on_log  s      JJtUE*&&,="jjl 	
U##E*II(()@F[)\^cdNN!7*T%[MC5 IEE		 II! 'r6   c                     | j                   dk(  r@| j                  r3|j                  r&| j                  j	                  |j
                         y y y y )Nr  )r  r  r  r  r  r  r  s        r4   r<  zDVCLiveCallback.on_save  s@    ??e#(9(9e>Y>YII""4??3 ?Z(9#r6   c                    | j                   r|j                  rddlm} | j                  du r |||j                  d      |j                  d      dg      }|j                  rdnd	}t        j                  j                  |j                  |      }|j                  |       | j                  j                  ||dd
       | j                  j                          y y y )Nr   r  Tr   r  r  r  r   r
  )r   r  r  )r  r  transformers.trainerr  r  r  r  r+   r   r   r  r  r  r  r  )	r  r   rX  r  r   r  r%  r   r  s	            r4   r  zDVCLiveCallback.on_train_end  s    !<!<4$&& **W-%+ZZ0B%C"(	  "&!<!<v&WW\\$//4@
''
3		&&z7QU&VIIMMO "=r6   r@  rf   )r  r  r  r  r
   r   r   r	   r  r  r  r  r  r<  r  r:   r6   r4   r  r    sV    " #;?(sm( E'%.$"678(21&+"&4r6   r  c                   @    e Zd ZdZd Zd Zd
dZddZddZd Z	d	 Z
y)SwanLabCallbackzn
    A [`TrainerCallback`] that logs metrics, media, model checkpoints to [SwanLab](https://swanlab.cn/).
    c                     t               st        d      dd l}|| _        d| _        t        j                  dd       | _        y )NzLSwanLabCallback requires swanlab to be installed. Run `pip install swanlab`.r   FSWANLAB_LOG_MODEL)rv   r}   ru   _swanlabr  r+   r,   r  )r  ru   s     r4   r  zSwanLabCallback.__init__	  s9    #%mnn!))$7>r6   c                    d| _         |j                  rt        j                  d       i |j	                         }t        |d      rR|j                  Ft        |j                  t              r|j                  n|j                  j	                         }i ||}t        |d      r |j                  |j                  }i d|i|}|j                  }i }	|!|j                  |j                   d| |	d<   n#|j                  |j                  |	d<   n|||	d<   t        j                  dd      |	d	<   | j                  j                          | j                  j                   di |	 d
| j                  j                  d<   | j                  j                  j#                  |       	 | j                  j                  j#                  d|j%                         i       t'        |      j(                  dk(  st'        |      j(                  dk(  ra|j+                         \  }
}| j                  j                  j#                  d|
i       | j                  j                  j#                  d|i       | j.                  nt        j1                  d       d| j                  j                         j2                  j4                  j6                   d}t8        xj:                  d| z  c_        yyy# t,        $ r t        j                  d       Y w xY w)a	  
        Setup the optional SwanLab (*swanlab*) integration.

        One can subclass and override this method to customize the setup if needed. Find more information
        [here](https://docs.swanlab.cn/guide_cloud/integration/integration-huggingface-transformers.html).

        You can also override the following environment variables. Find more information about environment
        variables [here](https://docs.swanlab.cn/en/api/environment-variable.html#environment-variables)

        Environment:
        - **SWANLAB_API_KEY** (`str`, *optional*, defaults to `None`):
            Cloud API Key. During login, this environment variable is checked first. If it doesn't exist, the system
            checks if the user is already logged in. If not, the login process is initiated.

                - If a string is passed to the login interface, this environment variable is ignored.
                - If the user is already logged in, this environment variable takes precedence over locally stored
                login information.

        - **SWANLAB_PROJECT** (`str`, *optional*, defaults to `None`):
            Set this to a custom string to store results in a different project. If not specified, the name of the current
            running directory is used.

        - **SWANLAB_LOG_DIR** (`str`, *optional*, defaults to `swanlog`):
            This environment variable specifies the storage path for log files when running in local mode.
            By default, logs are saved in a folder named swanlog under the working directory.

        - **SWANLAB_MODE** (`Literal["local", "cloud", "disabled"]`, *optional*, defaults to `cloud`):
            SwanLab's parsing mode, which involves callbacks registered by the operator. Currently, there are three modes:
            local, cloud, and disabled. Note: Case-sensitive. Find more information
            [here](https://docs.swanlab.cn/en/api/py-init.html#swanlab-init)

        - **SWANLAB_LOG_MODEL** (`str`, *optional*, defaults to `None`):
            SwanLab does not currently support the save mode functionality.This feature will be available in a future
            release

        - **SWANLAB_WEB_HOST** (`str`, *optional*, defaults to `None`):
            Web address for the SwanLab cloud environment for private version (its free)

        - **SWANLAB_API_HOST** (`str`, *optional*, defaults to `None`):
            API address for the SwanLab cloud environment for private version (its free)

        TzYAutomatic SwanLab logging enabled, to disable set os.environ["SWANLAB_MODE"] = "disabled"r   Nr  -experiment_nameSWANLAB_PROJECTr'  u   🤗transformers	FRAMEWORKmodel_num_parameters	PeftModelPeftMixedModelpeft_model_trainable_paramspeft_model_all_paramzQCould not log the number of model parameters in SwanLab due to an AttributeError.sSwanLab does not currently support the save mode functionality. This feature will be available in a future release.z[<img src="https://raw.githubusercontent.com/SwanHubX/assets/main/badge1.svg" alt="Visualize in SwanLab" height="280" height="32"/>](r  r  r:   )r  r  r.   r  r  r3   r   rx   r|   r  rY  r  r+   r,   r  rn  rW  r   r  r  r  get_nb_trainable_parametersr  r  r/   publiccloudexp_urlr   r  )r  r   rX  r   r   r  r  r  rY  r  trainable_params	all_paramr
  s                r4   r  zSwanLabCallback.setup	  s   V !&&KKst.t||~.Muh'ELL,D/9%,,/Mu||SXS_S_SgSgSi A< A= Aum,1B1B1N#// QM;#? Q= Q))JI%$--*C26--*/N	+,*/3}}	+,'/9	+,#%99->#EIi }}$$&."""  1CDMM  -MM  ''6q$$++-CUEYEYE[,\];'';6$u+:N:NRb:b272S2S2U/$iMM((//1NP`0abMM((//1G0ST
 *J
))-)>)>)@)G)G)M)M)U)U(VVWY  77R?O;PP7 +S 'J " qopqs   (CK* *L
LNc                 H    | j                   s | j                  |||fi | y y rf   rN  rO  s         r4   r  zSwanLabCallback.on_train_begin	  rP  r6   c                 |    | j                   0| j                  r#|j                  rt        j	                  d       y y y y Nr	  r  r  r  r.   r/   rR  s          r4   r  zSwanLabCallback.on_train_end	  ;    ??&4+<+<A\A\NNF B]+<&r6   c                    g d}| j                   s| j                  |||       |j                  r|j                         D ]6  \  }}	||v s| j                  j                  d| |	i|j                         8 |j                         D 	ci c]  \  }}	||vs||	 }
}}	t        |
      }
| j                  j                  i |
d|j                  i|j                         y y c c}	}w )Nr(  zsingle_value/rp  r  )r  r  r  rE  r  r  r  r[  r-  s              r4   r  zSwanLabCallback.on_log	  s     
   JJtUE*&&

 X1,,MM%%qc':A&>UEVEV%WX 15

^1I]@]q!t^O^*?;OMMYY2EuGXGXY`e`q`qr ' _s   C%C%c                 |    | j                   0| j                  r#|j                  rt        j	                  d       y y y y r  r  r  s        r4   r<  zSwanLabCallback.on_save	  r  r6   c                     | j                   s | j                  ||fi | |j                  r't        |      }| j                  j                  |       y y rf   )r  r  r  r[  r  r  r>  s         r4   r?  zSwanLabCallback.on_predict	  sJ      DJJtU-f-&&"7+GMMg& 'r6   rf   r@  )r  r  r  r  r  r  r  r  r  r<  r?  r:   r6   r4   r  r  	  s.    ?aQF5s&'r6   r  )rq  r   r`   r   rJ   r8   r)   rj   r>   rc   flyterr   ru   c           	         | g S t        | t              rd| k(  rg S d| k(  rt               } n| g} | D ]<  }|t        vst	        | ddj                  t        j                                d       | D cg c]  }t        |    c}S c c}w )Nnoner  z is not supported, only r*  z are supported.)rx   r   rs  INTEGRATION_TO_CALLBACKr  r   r\  )rf  integrations     r4   #get_reporting_integration_callbacksr  	  s    	)S!YIi<>I"I  55-7		BYB^B^B`8a7bbqr  ENN[#K0NNNs   4B)r  r  r  importlib.metadatar0   importlib.utilr  r  r+   r4  r  rO  r   r   dataclassesr   r   enumr   pathlibr   typingr   r   r	   r
   r   numpyre  packaging.versionr  transformers.utils.import_utilsr   r,   r  r(   r   r   r   r.  r  r   r   r   r   r   r   r   r  r  r.   r   r   torch.distributedr   r\  rF   r-  rE   rC   r  rD   r   r   
get_configrG   PackageNotFoundErrorrb  r  r  r  KeyErrorr1   r2   rg   _neptune_versionr  r   trainer_callbackr   r   r  r    r!   r"   r  r#   r$   r%   r5   r;   r?   rH   rL   rO   rS   rU   rX   r[   ra   rd   rh   rk   rn   rp   rs   rv   r   r  r   r   r  rL  ro  rs  r[  r  r  r  re  rC  rg  r  r  r  rm  r  r   rs  r~  r  r  r  r  r  r:   r6   r4   <module>r-     sp         	  	  
  &   ? ?   A 299\i'	
12 1 %   
		H	%$$  !''//
;N'//55nEIZIZI`I`asItt !!/2>#$ NNY't3my~~7O7OP`7aim7m  \!$--55i@&'7&8DE  @ L L ( @$;;Bw:7<:D:a><H;;D*;C ;C ;g ;|C C C7 CL_C _C _g _DJk3 Jk3 JkW JkZ: U"/ U"p!3 !C ! #C #:E%O E%Pw'o w'tIO IX>o >.r$_ r$j.In .Ib
) 
NZo NZb   DxOo xOv<IO <I~fo fR['o ['~  &$ "O]K 	//j)Ucemn !N# 	! 22 !	!(1199:JKKK12B1C;OP!!66 	! L	!	!sI   A8L 0L9 'L65L69N)0NN)N"N)!N""N)(N)