aboutsummaryrefslogtreecommitdiffstatshomepage
path: root/models/trpg-final/training_args.bin
blob: 6f17593be54c8b342061599bac7e0e6cf7045203 (plain)
ofshex dumpascii
0000 50 4b 03 04 00 00 08 08 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 16 00 0c 00 74 72 PK............................tr
0020 61 69 6e 69 6e 67 5f 61 72 67 73 2f 64 61 74 61 2e 70 6b 6c 46 42 08 00 5a 5a 5a 5a 5a 5a 5a 5a aining_args/data.pklFB..ZZZZZZZZ
0040 80 02 63 74 72 61 6e 73 66 6f 72 6d 65 72 73 2e 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 0a 54 72 ..ctransformers.training_args.Tr
0060 61 69 6e 69 6e 67 41 72 67 75 6d 65 6e 74 73 0a 71 00 29 81 71 01 7d 71 02 28 58 0a 00 00 00 6f ainingArguments.q.).q.}q.(X....o
0080 75 74 70 75 74 5f 64 69 72 71 03 58 13 00 00 00 2e 2f 6d 6f 64 65 6c 73 2f 74 72 70 67 2d 66 69 utput_dirq.X...../models/trpg-fi
00a0 6e 61 6c 71 04 58 14 00 00 00 6f 76 65 72 77 72 69 74 65 5f 6f 75 74 70 75 74 5f 64 69 72 71 05 nalq.X....overwrite_output_dirq.
00c0 89 58 08 00 00 00 64 6f 5f 74 72 61 69 6e 71 06 89 58 07 00 00 00 64 6f 5f 65 76 61 6c 71 07 89 .X....do_trainq..X....do_evalq..
00e0 58 0a 00 00 00 64 6f 5f 70 72 65 64 69 63 74 71 08 89 58 0d 00 00 00 65 76 61 6c 5f 73 74 72 61 X....do_predictq..X....eval_stra
0100 74 65 67 79 71 09 63 74 72 61 6e 73 66 6f 72 6d 65 72 73 2e 74 72 61 69 6e 65 72 5f 75 74 69 6c tegyq.ctransformers.trainer_util
0120 73 0a 49 6e 74 65 72 76 61 6c 53 74 72 61 74 65 67 79 0a 71 0a 58 02 00 00 00 6e 6f 71 0b 85 71 s.IntervalStrategy.q.X....noq..q
0140 0c 52 71 0d 58 14 00 00 00 70 72 65 64 69 63 74 69 6f 6e 5f 6c 6f 73 73 5f 6f 6e 6c 79 71 0e 89 .Rq.X....prediction_loss_onlyq..
0160 58 1b 00 00 00 70 65 72 5f 64 65 76 69 63 65 5f 74 72 61 69 6e 5f 62 61 74 63 68 5f 73 69 7a 65 X....per_device_train_batch_size
0180 71 0f 4b 04 58 1a 00 00 00 70 65 72 5f 64 65 76 69 63 65 5f 65 76 61 6c 5f 62 61 74 63 68 5f 73 q.K.X....per_device_eval_batch_s
01a0 69 7a 65 71 10 4b 08 58 18 00 00 00 70 65 72 5f 67 70 75 5f 74 72 61 69 6e 5f 62 61 74 63 68 5f izeq.K.X....per_gpu_train_batch_
01c0 73 69 7a 65 71 11 4e 58 17 00 00 00 70 65 72 5f 67 70 75 5f 65 76 61 6c 5f 62 61 74 63 68 5f 73 sizeq.NX....per_gpu_eval_batch_s
01e0 69 7a 65 71 12 4e 58 1b 00 00 00 67 72 61 64 69 65 6e 74 5f 61 63 63 75 6d 75 6c 61 74 69 6f 6e izeq.NX....gradient_accumulation
0200 5f 73 74 65 70 73 71 13 4b 01 58 17 00 00 00 65 76 61 6c 5f 61 63 63 75 6d 75 6c 61 74 69 6f 6e _stepsq.K.X....eval_accumulation
0220 5f 73 74 65 70 73 71 14 4e 58 0a 00 00 00 65 76 61 6c 5f 64 65 6c 61 79 71 15 4b 00 58 17 00 00 _stepsq.NX....eval_delayq.K.X...
0240 00 74 6f 72 63 68 5f 65 6d 70 74 79 5f 63 61 63 68 65 5f 73 74 65 70 73 71 16 4e 58 0d 00 00 00 .torch_empty_cache_stepsq.NX....
0260 6c 65 61 72 6e 69 6e 67 5f 72 61 74 65 71 17 47 3f 0a 36 e2 eb 1c 43 2d 58 0c 00 00 00 77 65 69 learning_rateq.G?.6...C-X....wei
0280 67 68 74 5f 64 65 63 61 79 71 18 47 00 00 00 00 00 00 00 00 58 0a 00 00 00 61 64 61 6d 5f 62 65 ght_decayq.G........X....adam_be
02a0 74 61 31 71 19 47 3f ec cc cc cc cc cc cd 58 0a 00 00 00 61 64 61 6d 5f 62 65 74 61 32 71 1a 47 ta1q.G?.......X....adam_beta2q.G
02c0 3f ef f7 ce d9 16 87 2b 58 0c 00 00 00 61 64 61 6d 5f 65 70 73 69 6c 6f 6e 71 1b 47 3e 45 79 8e ?......+X....adam_epsilonq.G>Ey.
02e0 e2 30 8c 3a 58 0d 00 00 00 6d 61 78 5f 67 72 61 64 5f 6e 6f 72 6d 71 1c 47 3f f0 00 00 00 00 00 .0.:X....max_grad_normq.G?......
0300 00 58 10 00 00 00 6e 75 6d 5f 74 72 61 69 6e 5f 65 70 6f 63 68 73 71 1d 4b 14 58 09 00 00 00 6d .X....num_train_epochsq.K.X....m
0320 61 78 5f 73 74 65 70 73 71 1e 4a ff ff ff ff 58 11 00 00 00 6c 72 5f 73 63 68 65 64 75 6c 65 72 ax_stepsq.J....X....lr_scheduler
0340 5f 74 79 70 65 71 1f 63 74 72 61 6e 73 66 6f 72 6d 65 72 73 2e 74 72 61 69 6e 65 72 5f 75 74 69 _typeq.ctransformers.trainer_uti
0360 6c 73 0a 53 63 68 65 64 75 6c 65 72 54 79 70 65 0a 71 20 58 06 00 00 00 6c 69 6e 65 61 72 71 21 ls.SchedulerType.q.X....linearq!
0380 85 71 22 52 71 23 58 13 00 00 00 6c 72 5f 73 63 68 65 64 75 6c 65 72 5f 6b 77 61 72 67 73 71 24 .q"Rq#X....lr_scheduler_kwargsq$
03a0 7d 71 25 58 0c 00 00 00 77 61 72 6d 75 70 5f 72 61 74 69 6f 71 26 47 00 00 00 00 00 00 00 00 58 }q%X....warmup_ratioq&G........X
03c0 0c 00 00 00 77 61 72 6d 75 70 5f 73 74 65 70 73 71 27 4b 00 58 09 00 00 00 6c 6f 67 5f 6c 65 76 ....warmup_stepsq'K.X....log_lev
03e0 65 6c 71 28 58 07 00 00 00 70 61 73 73 69 76 65 71 29 58 11 00 00 00 6c 6f 67 5f 6c 65 76 65 6c elq(X....passiveq)X....log_level
0400 5f 72 65 70 6c 69 63 61 71 2a 58 07 00 00 00 77 61 72 6e 69 6e 67 71 2b 58 10 00 00 00 6c 6f 67 _replicaq*X....warningq+X....log
0420 5f 6f 6e 5f 65 61 63 68 5f 6e 6f 64 65 71 2c 88 58 0b 00 00 00 6c 6f 67 67 69 6e 67 5f 64 69 72 _on_each_nodeq,.X....logging_dir
0440 71 2d 58 31 00 00 00 2e 2f 6d 6f 64 65 6c 73 2f 74 72 70 67 2d 66 69 6e 61 6c 2f 72 75 6e 73 2f q-X1..../models/trpg-final/runs/
0460 44 65 63 33 30 5f 32 30 2d 32 32 2d 35 39 5f 61 72 63 68 6c 69 6e 75 78 71 2e 58 10 00 00 00 6c Dec30_20-22-59_archlinuxq.X....l
0480 6f 67 67 69 6e 67 5f 73 74 72 61 74 65 67 79 71 2f 68 0a 58 05 00 00 00 73 74 65 70 73 71 30 85 ogging_strategyq/h.X....stepsq0.
04a0 71 31 52 71 32 58 12 00 00 00 6c 6f 67 67 69 6e 67 5f 66 69 72 73 74 5f 73 74 65 70 71 33 89 58 q1Rq2X....logging_first_stepq3.X
04c0 0d 00 00 00 6c 6f 67 67 69 6e 67 5f 73 74 65 70 73 71 34 4b 05 58 16 00 00 00 6c 6f 67 67 69 6e ....logging_stepsq4K.X....loggin
04e0 67 5f 6e 61 6e 5f 69 6e 66 5f 66 69 6c 74 65 72 71 35 88 58 0d 00 00 00 73 61 76 65 5f 73 74 72 g_nan_inf_filterq5.X....save_str
0500 61 74 65 67 79 71 36 63 74 72 61 6e 73 66 6f 72 6d 65 72 73 2e 74 72 61 69 6e 65 72 5f 75 74 69 ategyq6ctransformers.trainer_uti
0520 6c 73 0a 53 61 76 65 53 74 72 61 74 65 67 79 0a 71 37 68 30 85 71 38 52 71 39 58 0a 00 00 00 73 ls.SaveStrategy.q7h0.q8Rq9X....s
0540 61 76 65 5f 73 74 65 70 73 71 3a 4b c8 58 10 00 00 00 73 61 76 65 5f 74 6f 74 61 6c 5f 6c 69 6d ave_stepsq:K.X....save_total_lim
0560 69 74 71 3b 4b 02 58 10 00 00 00 73 61 76 65 5f 73 61 66 65 74 65 6e 73 6f 72 73 71 3c 88 58 11 itq;K.X....save_safetensorsq<.X.
0580 00 00 00 73 61 76 65 5f 6f 6e 5f 65 61 63 68 5f 6e 6f 64 65 71 3d 89 58 0f 00 00 00 73 61 76 65 ...save_on_each_nodeq=.X....save
05a0 5f 6f 6e 6c 79 5f 6d 6f 64 65 6c 71 3e 89 58 27 00 00 00 72 65 73 74 6f 72 65 5f 63 61 6c 6c 62 _only_modelq>.X'...restore_callb
05c0 61 63 6b 5f 73 74 61 74 65 73 5f 66 72 6f 6d 5f 63 68 65 63 6b 70 6f 69 6e 74 71 3f 89 58 07 00 ack_states_from_checkpointq?.X..
05e0 00 00 6e 6f 5f 63 75 64 61 71 40 89 58 07 00 00 00 75 73 65 5f 63 70 75 71 41 89 58 0e 00 00 00 ..no_cudaq@.X....use_cpuqA.X....
0600 75 73 65 5f 6d 70 73 5f 64 65 76 69 63 65 71 42 89 58 04 00 00 00 73 65 65 64 71 43 4b 2a 58 09 use_mps_deviceqB.X....seedqCK*X.
0620 00 00 00 64 61 74 61 5f 73 65 65 64 71 44 4e 58 0d 00 00 00 6a 69 74 5f 6d 6f 64 65 5f 65 76 61 ...data_seedqDNX....jit_mode_eva
0640 6c 71 45 89 58 04 00 00 00 62 66 31 36 71 46 89 58 04 00 00 00 66 70 31 36 71 47 88 58 0e 00 00 lqE.X....bf16qF.X....fp16qG.X...
0660 00 66 70 31 36 5f 6f 70 74 5f 6c 65 76 65 6c 71 48 58 02 00 00 00 4f 31 71 49 58 16 00 00 00 68 .fp16_opt_levelqHX....O1qIX....h
0680 61 6c 66 5f 70 72 65 63 69 73 69 6f 6e 5f 62 61 63 6b 65 6e 64 71 4a 58 04 00 00 00 61 75 74 6f alf_precision_backendqJX....auto
06a0 71 4b 58 0e 00 00 00 62 66 31 36 5f 66 75 6c 6c 5f 65 76 61 6c 71 4c 89 58 0e 00 00 00 66 70 31 qKX....bf16_full_evalqL.X....fp1
06c0 36 5f 66 75 6c 6c 5f 65 76 61 6c 71 4d 89 58 04 00 00 00 74 66 33 32 71 4e 4e 58 0a 00 00 00 6c 6_full_evalqM.X....tf32qNNX....l
06e0 6f 63 61 6c 5f 72 61 6e 6b 71 4f 4b 00 58 0b 00 00 00 64 64 70 5f 62 61 63 6b 65 6e 64 71 50 4e ocal_rankqOK.X....ddp_backendqPN
0700 58 0d 00 00 00 74 70 75 5f 6e 75 6d 5f 63 6f 72 65 73 71 51 4e 58 11 00 00 00 74 70 75 5f 6d 65 X....tpu_num_coresqQNX....tpu_me
0720 74 72 69 63 73 5f 64 65 62 75 67 71 52 89 58 05 00 00 00 64 65 62 75 67 71 53 5d 71 54 58 14 00 trics_debugqR.X....debugqS]qTX..
0740 00 00 64 61 74 61 6c 6f 61 64 65 72 5f 64 72 6f 70 5f 6c 61 73 74 71 55 89 58 0a 00 00 00 65 76 ..dataloader_drop_lastqU.X....ev
0760 61 6c 5f 73 74 65 70 73 71 56 4e 58 16 00 00 00 64 61 74 61 6c 6f 61 64 65 72 5f 6e 75 6d 5f 77 al_stepsqVNX....dataloader_num_w
0780 6f 72 6b 65 72 73 71 57 4b 00 58 1a 00 00 00 64 61 74 61 6c 6f 61 64 65 72 5f 70 72 65 66 65 74 orkersqWK.X....dataloader_prefet
07a0 63 68 5f 66 61 63 74 6f 72 71 58 4e 58 0a 00 00 00 70 61 73 74 5f 69 6e 64 65 78 71 59 4a ff ff ch_factorqXNX....past_indexqYJ..
07c0 ff ff 58 08 00 00 00 72 75 6e 5f 6e 61 6d 65 71 5a 4e 58 0c 00 00 00 64 69 73 61 62 6c 65 5f 74 ..X....run_nameqZNX....disable_t
07e0 71 64 6d 71 5b 88 58 15 00 00 00 72 65 6d 6f 76 65 5f 75 6e 75 73 65 64 5f 63 6f 6c 75 6d 6e 73 qdmq[.X....remove_unused_columns
0800 71 5c 88 58 0b 00 00 00 6c 61 62 65 6c 5f 6e 61 6d 65 73 71 5d 4e 58 16 00 00 00 6c 6f 61 64 5f q\.X....label_namesq]NX....load_
0820 62 65 73 74 5f 6d 6f 64 65 6c 5f 61 74 5f 65 6e 64 71 5e 89 58 15 00 00 00 6d 65 74 72 69 63 5f best_model_at_endq^.X....metric_
0840 66 6f 72 5f 62 65 73 74 5f 6d 6f 64 65 6c 71 5f 4e 58 11 00 00 00 67 72 65 61 74 65 72 5f 69 73 for_best_modelq_NX....greater_is
0860 5f 62 65 74 74 65 72 71 60 4e 58 10 00 00 00 69 67 6e 6f 72 65 5f 64 61 74 61 5f 73 6b 69 70 71 _betterq`NX....ignore_data_skipq
0880 61 89 58 04 00 00 00 66 73 64 70 71 62 5d 71 63 58 13 00 00 00 66 73 64 70 5f 6d 69 6e 5f 6e 75 a.X....fsdpqb]qcX....fsdp_min_nu
08a0 6d 5f 70 61 72 61 6d 73 71 64 4b 00 58 0b 00 00 00 66 73 64 70 5f 63 6f 6e 66 69 67 71 65 7d 71 m_paramsqdK.X....fsdp_configqe}q
08c0 66 28 58 0e 00 00 00 6d 69 6e 5f 6e 75 6d 5f 70 61 72 61 6d 73 71 67 4b 00 58 03 00 00 00 78 6c f(X....min_num_paramsqgK.X....xl
08e0 61 71 68 89 58 0b 00 00 00 78 6c 61 5f 66 73 64 70 5f 76 32 71 69 89 58 12 00 00 00 78 6c 61 5f aqh.X....xla_fsdp_v2qi.X....xla_
0900 66 73 64 70 5f 67 72 61 64 5f 63 6b 70 74 71 6a 89 75 58 22 00 00 00 66 73 64 70 5f 74 72 61 6e fsdp_grad_ckptqj.uX"...fsdp_tran
0920 73 66 6f 72 6d 65 72 5f 6c 61 79 65 72 5f 63 6c 73 5f 74 6f 5f 77 72 61 70 71 6b 4e 58 12 00 00 sformer_layer_cls_to_wrapqkNX...
0940 00 61 63 63 65 6c 65 72 61 74 6f 72 5f 63 6f 6e 66 69 67 71 6c 63 74 72 61 6e 73 66 6f 72 6d 65 .accelerator_configqlctransforme
0960 72 73 2e 74 72 61 69 6e 65 72 5f 70 74 5f 75 74 69 6c 73 0a 41 63 63 65 6c 65 72 61 74 6f 72 43 rs.trainer_pt_utils.AcceleratorC
0980 6f 6e 66 69 67 0a 71 6d 29 81 71 6e 7d 71 6f 28 58 0d 00 00 00 73 70 6c 69 74 5f 62 61 74 63 68 onfig.qm).qn}qo(X....split_batch
09a0 65 73 71 70 89 58 10 00 00 00 64 69 73 70 61 74 63 68 5f 62 61 74 63 68 65 73 71 71 4e 58 0c 00 esqp.X....dispatch_batchesqqNX..
09c0 00 00 65 76 65 6e 5f 62 61 74 63 68 65 73 71 72 88 58 14 00 00 00 75 73 65 5f 73 65 65 64 61 62 ..even_batchesqr.X....use_seedab
09e0 6c 65 5f 73 61 6d 70 6c 65 72 71 73 88 58 0c 00 00 00 6e 6f 6e 5f 62 6c 6f 63 6b 69 6e 67 71 74 le_samplerqs.X....non_blockingqt
0a00 89 58 1c 00 00 00 67 72 61 64 69 65 6e 74 5f 61 63 63 75 6d 75 6c 61 74 69 6f 6e 5f 6b 77 61 72 .X....gradient_accumulation_kwar
0a20 67 73 71 75 4e 75 62 58 12 00 00 00 70 61 72 61 6c 6c 65 6c 69 73 6d 5f 63 6f 6e 66 69 67 71 76 gsquNubX....parallelism_configqv
0a40 4e 58 09 00 00 00 64 65 65 70 73 70 65 65 64 71 77 4e 58 16 00 00 00 6c 61 62 65 6c 5f 73 6d 6f NX....deepspeedqwNX....label_smo
0a60 6f 74 68 69 6e 67 5f 66 61 63 74 6f 72 71 78 47 00 00 00 00 00 00 00 00 58 05 00 00 00 6f 70 74 othing_factorqxG........X....opt
0a80 69 6d 71 79 63 74 72 61 6e 73 66 6f 72 6d 65 72 73 2e 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 0a imqyctransformers.training_args.
0aa0 4f 70 74 69 6d 69 7a 65 72 4e 61 6d 65 73 0a 71 7a 58 11 00 00 00 61 64 61 6d 77 5f 74 6f 72 63 OptimizerNames.qzX....adamw_torc
0ac0 68 5f 66 75 73 65 64 71 7b 85 71 7c 52 71 7d 58 0a 00 00 00 6f 70 74 69 6d 5f 61 72 67 73 71 7e h_fusedq{.q|Rq}X....optim_argsq~
0ae0 4e 58 09 00 00 00 61 64 61 66 61 63 74 6f 72 71 7f 89 58 0f 00 00 00 67 72 6f 75 70 5f 62 79 5f NX....adafactorq..X....group_by_
0b00 6c 65 6e 67 74 68 71 80 89 58 12 00 00 00 6c 65 6e 67 74 68 5f 63 6f 6c 75 6d 6e 5f 6e 61 6d 65 lengthq..X....length_column_name
0b20 71 81 58 06 00 00 00 6c 65 6e 67 74 68 71 82 58 09 00 00 00 72 65 70 6f 72 74 5f 74 6f 71 83 5d q.X....lengthq.X....report_toq.]
0b40 71 84 58 07 00 00 00 70 72 6f 6a 65 63 74 71 85 58 0b 00 00 00 68 75 67 67 69 6e 67 66 61 63 65 q.X....projectq.X....huggingface
0b60 71 86 58 10 00 00 00 74 72 61 63 6b 69 6f 5f 73 70 61 63 65 5f 69 64 71 87 58 07 00 00 00 74 72 q.X....trackio_space_idq.X....tr
0b80 61 63 6b 69 6f 71 88 58 1a 00 00 00 64 64 70 5f 66 69 6e 64 5f 75 6e 75 73 65 64 5f 70 61 72 61 ackioq.X....ddp_find_unused_para
0ba0 6d 65 74 65 72 73 71 89 4e 58 11 00 00 00 64 64 70 5f 62 75 63 6b 65 74 5f 63 61 70 5f 6d 62 71 metersq.NX....ddp_bucket_cap_mbq
0bc0 8a 4e 58 15 00 00 00 64 64 70 5f 62 72 6f 61 64 63 61 73 74 5f 62 75 66 66 65 72 73 71 8b 4e 58 .NX....ddp_broadcast_buffersq.NX
0be0 15 00 00 00 64 61 74 61 6c 6f 61 64 65 72 5f 70 69 6e 5f 6d 65 6d 6f 72 79 71 8c 88 58 1d 00 00 ....dataloader_pin_memoryq..X...
0c00 00 64 61 74 61 6c 6f 61 64 65 72 5f 70 65 72 73 69 73 74 65 6e 74 5f 77 6f 72 6b 65 72 73 71 8d .dataloader_persistent_workersq.
0c20 89 58 13 00 00 00 73 6b 69 70 5f 6d 65 6d 6f 72 79 5f 6d 65 74 72 69 63 73 71 8e 88 58 1a 00 00 .X....skip_memory_metricsq..X...
0c40 00 75 73 65 5f 6c 65 67 61 63 79 5f 70 72 65 64 69 63 74 69 6f 6e 5f 6c 6f 6f 70 71 8f 89 58 0b .use_legacy_prediction_loopq..X.
0c60 00 00 00 70 75 73 68 5f 74 6f 5f 68 75 62 71 90 89 58 16 00 00 00 72 65 73 75 6d 65 5f 66 72 6f ...push_to_hubq..X....resume_fro
0c80 6d 5f 63 68 65 63 6b 70 6f 69 6e 74 71 91 4e 58 0c 00 00 00 68 75 62 5f 6d 6f 64 65 6c 5f 69 64 m_checkpointq.NX....hub_model_id
0ca0 71 92 4e 58 0c 00 00 00 68 75 62 5f 73 74 72 61 74 65 67 79 71 93 63 74 72 61 6e 73 66 6f 72 6d q.NX....hub_strategyq.ctransform
0cc0 65 72 73 2e 74 72 61 69 6e 65 72 5f 75 74 69 6c 73 0a 48 75 62 53 74 72 61 74 65 67 79 0a 71 94 ers.trainer_utils.HubStrategy.q.
0ce0 58 0a 00 00 00 65 76 65 72 79 5f 73 61 76 65 71 95 85 71 96 52 71 97 58 09 00 00 00 68 75 62 5f X....every_saveq..q.Rq.X....hub_
0d00 74 6f 6b 65 6e 71 98 4e 58 10 00 00 00 68 75 62 5f 70 72 69 76 61 74 65 5f 72 65 70 6f 71 99 4e tokenq.NX....hub_private_repoq.N
0d20 58 0f 00 00 00 68 75 62 5f 61 6c 77 61 79 73 5f 70 75 73 68 71 9a 89 58 0c 00 00 00 68 75 62 5f X....hub_always_pushq..X....hub_
0d40 72 65 76 69 73 69 6f 6e 71 9b 4e 58 16 00 00 00 67 72 61 64 69 65 6e 74 5f 63 68 65 63 6b 70 6f revisionq.NX....gradient_checkpo
0d60 69 6e 74 69 6e 67 71 9c 89 58 1d 00 00 00 67 72 61 64 69 65 6e 74 5f 63 68 65 63 6b 70 6f 69 6e intingq..X....gradient_checkpoin
0d80 74 69 6e 67 5f 6b 77 61 72 67 73 71 9d 4e 58 1a 00 00 00 69 6e 63 6c 75 64 65 5f 69 6e 70 75 74 ting_kwargsq.NX....include_input
0da0 73 5f 66 6f 72 5f 6d 65 74 72 69 63 73 71 9e 89 58 13 00 00 00 69 6e 63 6c 75 64 65 5f 66 6f 72 s_for_metricsq..X....include_for
0dc0 5f 6d 65 74 72 69 63 73 71 9f 5d 71 a0 58 16 00 00 00 65 76 61 6c 5f 64 6f 5f 63 6f 6e 63 61 74 _metricsq.]q.X....eval_do_concat
0de0 5f 62 61 74 63 68 65 73 71 a1 88 58 0c 00 00 00 66 70 31 36 5f 62 61 63 6b 65 6e 64 71 a2 68 4b _batchesq..X....fp16_backendq.hK
0e00 58 14 00 00 00 70 75 73 68 5f 74 6f 5f 68 75 62 5f 6d 6f 64 65 6c 5f 69 64 71 a3 4e 58 18 00 00 X....push_to_hub_model_idq.NX...
0e20 00 70 75 73 68 5f 74 6f 5f 68 75 62 5f 6f 72 67 61 6e 69 7a 61 74 69 6f 6e 71 a4 4e 58 11 00 00 .push_to_hub_organizationq.NX...
0e40 00 70 75 73 68 5f 74 6f 5f 68 75 62 5f 74 6f 6b 65 6e 71 a5 4e 58 0d 00 00 00 6d 70 5f 70 61 72 .push_to_hub_tokenq.NX....mp_par
0e60 61 6d 65 74 65 72 73 71 a6 58 00 00 00 00 71 a7 58 14 00 00 00 61 75 74 6f 5f 66 69 6e 64 5f 62 ametersq.X....q.X....auto_find_b
0e80 61 74 63 68 5f 73 69 7a 65 71 a8 89 58 10 00 00 00 66 75 6c 6c 5f 64 65 74 65 72 6d 69 6e 69 73 atch_sizeq..X....full_determinis
0ea0 6d 71 a9 89 58 0b 00 00 00 74 6f 72 63 68 64 79 6e 61 6d 6f 71 aa 4e 58 09 00 00 00 72 61 79 5f mq..X....torchdynamoq.NX....ray_
0ec0 73 63 6f 70 65 71 ab 58 04 00 00 00 6c 61 73 74 71 ac 58 0b 00 00 00 64 64 70 5f 74 69 6d 65 6f scopeq.X....lastq.X....ddp_timeo
0ee0 75 74 71 ad 4d 08 07 58 0d 00 00 00 74 6f 72 63 68 5f 63 6f 6d 70 69 6c 65 71 ae 89 58 15 00 00 utq.M..X....torch_compileq..X...
0f00 00 74 6f 72 63 68 5f 63 6f 6d 70 69 6c 65 5f 62 61 63 6b 65 6e 64 71 af 4e 58 12 00 00 00 74 6f .torch_compile_backendq.NX....to
0f20 72 63 68 5f 63 6f 6d 70 69 6c 65 5f 6d 6f 64 65 71 b0 4e 58 19 00 00 00 69 6e 63 6c 75 64 65 5f rch_compile_modeq.NX....include_
0f40 74 6f 6b 65 6e 73 5f 70 65 72 5f 73 65 63 6f 6e 64 71 b1 89 58 1d 00 00 00 69 6e 63 6c 75 64 65 tokens_per_secondq..X....include
0f60 5f 6e 75 6d 5f 69 6e 70 75 74 5f 74 6f 6b 65 6e 73 5f 73 65 65 6e 71 b2 68 0b 58 13 00 00 00 6e _num_input_tokens_seenq.h.X....n
0f80 65 66 74 75 6e 65 5f 6e 6f 69 73 65 5f 61 6c 70 68 61 71 b3 4e 58 14 00 00 00 6f 70 74 69 6d 5f eftune_noise_alphaq.NX....optim_
0fa0 74 61 72 67 65 74 5f 6d 6f 64 75 6c 65 73 71 b4 4e 58 12 00 00 00 62 61 74 63 68 5f 65 76 61 6c target_modulesq.NX....batch_eval
0fc0 5f 6d 65 74 72 69 63 73 71 b5 89 58 0d 00 00 00 65 76 61 6c 5f 6f 6e 5f 73 74 61 72 74 71 b6 89 _metricsq..X....eval_on_startq..
0fe0 58 10 00 00 00 75 73 65 5f 6c 69 67 65 72 5f 6b 65 72 6e 65 6c 71 b7 89 58 13 00 00 00 6c 69 67 X....use_liger_kernelq..X....lig
1000 65 72 5f 6b 65 72 6e 65 6c 5f 63 6f 6e 66 69 67 71 b8 4e 58 16 00 00 00 65 76 61 6c 5f 75 73 65 er_kernel_configq.NX....eval_use
1020 5f 67 61 74 68 65 72 5f 6f 62 6a 65 63 74 71 b9 89 58 1d 00 00 00 61 76 65 72 61 67 65 5f 74 6f _gather_objectq..X....average_to
1040 6b 65 6e 73 5f 61 63 72 6f 73 73 5f 64 65 76 69 63 65 73 71 ba 88 58 11 00 00 00 64 69 73 74 72 kens_across_devicesq..X....distr
1060 69 62 75 74 65 64 5f 73 74 61 74 65 71 bb 63 61 63 63 65 6c 65 72 61 74 65 2e 73 74 61 74 65 0a ibuted_stateq.caccelerate.state.
1080 50 61 72 74 69 61 6c 53 74 61 74 65 0a 71 bc 29 81 71 bd 7d 71 be 28 58 04 00 00 00 5f 63 70 75 PartialState.q.).q.}q.(X...._cpu
10a0 71 bf 89 58 07 00 00 00 62 61 63 6b 65 6e 64 71 c0 4e 58 06 00 00 00 64 65 76 69 63 65 71 c1 63 q..X....backendq.NX....deviceq.c
10c0 74 6f 72 63 68 0a 64 65 76 69 63 65 0a 71 c2 58 04 00 00 00 63 75 64 61 71 c3 85 71 c4 52 71 c5 torch.device.q.X....cudaq..q.Rq.
10e0 68 53 89 58 10 00 00 00 64 69 73 74 72 69 62 75 74 65 64 5f 74 79 70 65 71 c6 63 61 63 63 65 6c hS.X....distributed_typeq.caccel
1100 65 72 61 74 65 2e 75 74 69 6c 73 2e 64 61 74 61 63 6c 61 73 73 65 73 0a 44 69 73 74 72 69 62 75 erate.utils.dataclasses.Distribu
1120 74 65 64 54 79 70 65 0a 71 c7 58 02 00 00 00 4e 4f 71 c8 85 71 c9 52 71 ca 58 0d 00 00 00 6e 75 tedType.q.X....NOq..q.Rq.X....nu
1140 6d 5f 70 72 6f 63 65 73 73 65 73 71 cb 4b 01 58 0d 00 00 00 70 72 6f 63 65 73 73 5f 69 6e 64 65 m_processesq.K.X....process_inde
1160 78 71 cc 4b 00 58 13 00 00 00 6c 6f 63 61 6c 5f 70 72 6f 63 65 73 73 5f 69 6e 64 65 78 71 cd 4b xq.K.X....local_process_indexq.K
1180 00 58 0d 00 00 00 66 6f 72 6b 5f 6c 61 75 6e 63 68 65 64 71 ce 89 75 62 58 06 00 00 00 5f 6e 5f .X....fork_launchedq..ubX...._n_
11a0 67 70 75 71 cf 4b 01 58 0e 00 00 00 5f 73 65 74 75 70 5f 64 65 76 69 63 65 73 71 d0 68 c2 58 04 gpuq.K.X...._setup_devicesq.h.X.
11c0 00 00 00 63 75 64 61 71 d1 4b 00 86 71 d2 52 71 d3 58 10 00 00 00 64 65 65 70 73 70 65 65 64 5f ...cudaq.K..q.Rq.X....deepspeed_
11e0 70 6c 75 67 69 6e 71 d4 4e 75 62 2e 50 4b 07 08 ca 9a a6 3b ac 11 00 00 ac 11 00 00 50 4b 03 04 pluginq.Nub.PK.....;........PK..
1200 00 00 08 08 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 1d 00 09 00 74 72 61 69 6e 69 ..........................traini
1220 6e 67 5f 61 72 67 73 2f 2e 66 6f 72 6d 61 74 5f 76 65 72 73 69 6f 6e 46 42 05 00 5a 5a 5a 5a 5a ng_args/.format_versionFB..ZZZZZ
1240 31 50 4b 07 08 b7 ef dc 83 01 00 00 00 01 00 00 00 50 4b 03 04 00 00 08 08 00 00 00 00 00 00 00 1PK..............PK.............
1260 00 00 00 00 00 00 00 00 00 00 00 20 00 31 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 2e 73 74 .............1.training_args/.st
1280 6f 72 61 67 65 5f 61 6c 69 67 6e 6d 65 6e 74 46 42 2d 00 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a orage_alignmentFB-.ZZZZZZZZZZZZZ
12a0 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a ZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZ
12c0 36 34 50 4b 07 08 3f 77 71 e9 02 00 00 00 02 00 00 00 50 4b 03 04 00 00 08 08 00 00 00 00 00 00 64PK..?wq.........PK............
12e0 00 00 00 00 00 00 00 00 00 00 00 00 17 00 39 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 62 79 ..............9.training_args/by
1300 74 65 6f 72 64 65 72 46 42 35 00 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a teorderFB5.ZZZZZZZZZZZZZZZZZZZZZ
1320 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a ZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZ
1340 6c 69 74 74 6c 65 50 4b 07 08 85 3d e3 19 06 00 00 00 06 00 00 00 50 4b 03 04 00 00 08 08 00 00 littlePK...=..........PK........
1360 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 15 00 37 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 ..................7.training_arg
1380 73 2f 76 65 72 73 69 6f 6e 46 42 33 00 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a s/versionFB3.ZZZZZZZZZZZZZZZZZZZ
13a0 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a ZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZ
13c0 33 0a 50 4b 07 08 d1 9e 67 55 02 00 00 00 02 00 00 00 50 4b 03 04 00 00 08 08 00 00 00 00 00 00 3.PK....gU........PK............
13e0 00 00 00 00 00 00 00 00 00 00 00 00 24 00 2c 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 2e 64 ............$.,.training_args/.d
1400 61 74 61 2f 73 65 72 69 61 6c 69 7a 61 74 69 6f 6e 5f 69 64 46 42 28 00 5a 5a 5a 5a 5a 5a 5a 5a ata/serialization_idFB(.ZZZZZZZZ
1420 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a 5a ZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZZ
1440 30 32 39 30 38 34 36 38 36 37 37 37 36 32 39 32 33 31 30 34 30 30 30 36 32 36 32 34 32 31 30 35 02908468677762923104000626242105
1460 36 32 31 30 30 38 31 36 50 4b 07 08 4c 33 94 53 28 00 00 00 28 00 00 00 50 4b 01 02 00 00 00 00 62100816PK..L3.S(...(...PK......
1480 08 08 00 00 00 00 00 00 ca 9a a6 3b ac 11 00 00 ac 11 00 00 16 00 00 00 00 00 00 00 00 00 00 00 ...........;....................
14a0 00 00 00 00 00 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 64 61 74 61 2e 70 6b 6c 50 4b 01 02 ......training_args/data.pklPK..
14c0 00 00 00 00 08 08 00 00 00 00 00 00 b7 ef dc 83 01 00 00 00 01 00 00 00 1d 00 00 00 00 00 00 00 ................................
14e0 00 00 00 00 00 00 fc 11 00 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 2e 66 6f 72 6d 61 74 5f ..........training_args/.format_
1500 76 65 72 73 69 6f 6e 50 4b 01 02 00 00 00 00 08 08 00 00 00 00 00 00 3f 77 71 e9 02 00 00 00 02 versionPK..............?wq......
1520 00 00 00 20 00 00 00 00 00 00 00 00 00 00 00 00 00 51 12 00 00 74 72 61 69 6e 69 6e 67 5f 61 72 .................Q...training_ar
1540 67 73 2f 2e 73 74 6f 72 61 67 65 5f 61 6c 69 67 6e 6d 65 6e 74 50 4b 01 02 00 00 00 00 08 08 00 gs/.storage_alignmentPK.........
1560 00 00 00 00 00 85 3d e3 19 06 00 00 00 06 00 00 00 17 00 00 00 00 00 00 00 00 00 00 00 00 00 d2 ......=.........................
1580 12 00 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 62 79 74 65 6f 72 64 65 72 50 4b 01 02 00 00 ...training_args/byteorderPK....
15a0 00 00 08 08 00 00 00 00 00 00 d1 9e 67 55 02 00 00 00 02 00 00 00 15 00 00 00 00 00 00 00 00 00 ............gU..................
15c0 00 00 00 00 56 13 00 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 76 65 72 73 69 6f 6e 50 4b 01 ....V...training_args/versionPK.
15e0 02 00 00 00 00 08 08 00 00 00 00 00 00 4c 33 94 53 28 00 00 00 28 00 00 00 24 00 00 00 00 00 00 .............L3.S(...(...$......
1600 00 00 00 00 00 00 00 d2 13 00 00 74 72 61 69 6e 69 6e 67 5f 61 72 67 73 2f 2e 64 61 74 61 2f 73 ...........training_args/.data/s
1620 65 72 69 61 6c 69 7a 61 74 69 6f 6e 5f 69 64 50 4b 06 06 2c 00 00 00 00 00 00 00 1e 03 2d 00 00 erialization_idPK..,.........-..
1640 00 00 00 00 00 00 00 06 00 00 00 00 00 00 00 06 00 00 00 00 00 00 00 b7 01 00 00 00 00 00 00 78 ...............................x
1660 14 00 00 00 00 00 00 50 4b 06 07 00 00 00 00 2f 16 00 00 00 00 00 00 01 00 00 00 50 4b 05 06 00 .......PK....../...........PK...
1680 00 00 00 06 00 06 00 b7 01 00 00 78 14 00 00 00 00 ...........x.....