Repository Analysis

huggingface/trl

Train transformer language models with reinforcement learning.

19.3 — Moderate AI signal · View on GitHub
19.3
Adjusted Score
19.3
Raw Score
100%
Time Factor
2026-05-30
Last Push
18,494
Stars
Python
Language
113,748
Lines of Code
454
Files
1723
Pattern Hits
2026-05-31
Scan Date

Score History

Severity Breakdown

CRITICAL 5 · HIGH 71 · MEDIUM 136 · LOW 1511

Pattern Findings

1723 matches across 15 categories. Click a row to expand file-level details.

Hyper-Verbose Identifiers — 752 hits · 684 pts
Severity | File | Line | Snippet
LOWtests/test_skills_cli.py26 def test_cmd_list_without_target(self, capsys):
LOWtests/test_skills_cli.py38 def test_cmd_list_with_target(self, tmp_path, capsys):
LOWtests/test_skills_cli.py51 def test_cmd_list_empty_target(self, tmp_path, capsys):
LOWtests/test_skills_cli.py61 def test_cmd_install_single_skill(self, tmp_path, capsys):
LOWtests/test_skills_cli.py73 def test_cmd_install_all_skills(self, tmp_path, capsys):
LOWtests/test_skills_cli.py85 def test_cmd_install_no_skill_or_all(self, capsys):
LOWtests/test_skills_cli.py95 def test_cmd_install_both_skill_and_all(self, capsys):
LOWtests/test_skills_cli.py105 def test_cmd_install_nonexistent_skill(self, tmp_path, capsys):
LOWtests/test_skills_cli.py116 def test_cmd_install_already_exists(self, tmp_path, capsys):
LOWtests/test_skills_cli.py130 def test_cmd_install_with_force(self, tmp_path, capsys):
LOWtests/test_skills_cli.py144 def test_cmd_uninstall_success(self, tmp_path, capsys):
LOWtests/test_skills_cli.py159 def test_cmd_uninstall_not_installed(self, tmp_path, capsys):
LOWtests/test_skills_cli.py170 def test_cmd_install_creates_target_directory(self, tmp_path, capsys):
LOWtests/test_skills_cli.py187 def test_cmd_uninstall_invalid_target(self, capsys):
LOWtests/test_skills_cli.py201 def test_add_skills_subcommands_creates_parsers(self):
LOWtests/test_skills_cli.py222 def test_list_command_optional_target(self):
LOWtests/test_skills_cli.py236 def test_install_command_requires_target(self):
LOWtests/test_skills_cli.py282 def test_default_scope_is_project(self):
LOWtests/test_rloo_trainer.py102 def test_train_with_num_generations_eval(self):
LOWtests/test_rloo_trainer.py126 def test_train_multiple_iterations(self):
LOWtests/test_rloo_trainer.py233 def test_train_peft_with_gradient_checkpointing(self):
LOWtests/test_rloo_trainer.py269 def test_train_different_reward_model(self):
LOWtests/test_rloo_trainer.py308 def test_train_reward_func_standard(self):
LOWtests/test_rloo_trainer.py342 def test_train_reward_func_conversational(self):
LOWtests/test_rloo_trainer.py377 def test_train_multiple_reward_funcs(self):
LOWtests/test_rloo_trainer.py415 def test_train_sync_and_async_reward_funcs(self):
LOWtests/test_rloo_trainer.py464 def non_applicable_reward_func(completions, **kwargs):
LOWtests/test_rloo_trainer.py500 def test_train_multiple_reward_funcs_with_weights(self):
LOWtests/test_rloo_trainer.py544 def test_reward_metric_reflects_reward_weights(self):
LOWtests/test_rloo_trainer.py581 def test_train_multiple_mixed_reward_funcs(self):
LOWtests/test_rloo_trainer.py615 def test_train_reward_func_additional_column(self):
LOWtests/test_rloo_trainer.py655 def test_train_with_sync_ref_model(self):
LOWtests/test_rloo_trainer.py720 def test_train_with_pad_to_multiple_of(self):
LOWtests/test_rloo_trainer.py800 def test_train_vllm_structured_outputs(self):
LOWtests/test_rloo_trainer.py832 def test_train_with_additional_generation_kwargs(self):
LOWtests/test_rloo_trainer.py869 def test_train_vllm_with_additional_generation_kwargs(self):
LOWtests/test_rloo_trainer.py905 def test_train_with_normalized_advantages(self):
LOWtests/test_rloo_trainer.py935 def test_train_with_clipped_rewards(self):
LOWtests/test_rloo_trainer.py966 def test_train_with_mask_truncated_completions(self, mock_generate):
LOWtests/test_rloo_trainer.py1015 def test_train_with_mask_truncated_completions_all_masked(self):
LOWtests/test_rloo_trainer.py1053 def test_warning_raised_all_rewards_none(self, caplog):
LOWtests/test_rloo_trainer.py1082 def test_train_num_generations_larger_than_batch_size(self):
LOWtests/test_rloo_trainer.py1112 def test_train_multiple_dataloader_workers(self):
LOWtests/test_rloo_trainer.py1153 def test_train_with_generation_kwargs(self):
LOWtests/test_rloo_trainer.py1184 def test_train_with_reward_func_accessing_trainer_state(self):
LOWtests/test_rloo_trainer.py1209 def test_train_reward_func_with_log_extra(self):
LOWtests/test_rloo_trainer.py1235 def test_train_reward_func_with_log_metric(self):
LOWtests/test_rloo_trainer.py1262 def test_prepare_input_called_with_correct_data(self):
LOWtests/test_rloo_trainer.py1389 def test_train_vlm_with_pad_to_multiple_of(self):
LOWtests/test_rloo_trainer.py1433 def test_train_vlm_beta_non_zero(self, model_id):
LOWtests/test_rloo_trainer.py1575 def test_train_vlm_multi_image(self, model_id):
LOWtests/test_rloo_trainer.py1608 def test_train_with_chat_template_kwargs(self):
LOWtests/test_rloo_trainer.py1638 def test_mismatched_reward_processing_classes_length(self):
LOWtests/test_rloo_trainer.py1664 def test_correct_reward_processing_classes_list(self):
LOWtests/test_rloo_trainer.py1695 def test_single_reward_model_with_single_processing_class(self):
LOWtests/test_utils.py181 def test_pad_to_multiple_of_side_left(self):
LOWtests/test_utils.py189 def test_pad_to_multiple_of_no_extra_padding(self):
LOWtests/test_utils.py199 def test_hash_module_deterministic_across_order(self):
LOWtests/test_utils.py216 def test_hash_module_changes_with_value(self):
LOWtests/test_utils.py224 def test_hash_module_includes_dtype(self):
692 more matches not shown…
Over-Commented Block — 336 hits · 330 pts
Severity | File | Line | Snippet
LOWtests/test_skills_cli.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_rloo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_utils.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/conftest.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_callbacks.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_sft_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/testing_constants.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_chat_template_utils.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_grpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_model_utils.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/testing_utils.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_data_utils.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/__init__.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_vllm_client_server.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_rich_progress_callback.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_activation_offloading.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_rewards.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_cli_utils.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_skills.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_dpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_cli.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/test_reward_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/_openreward_echo_env.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_utils.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_gkd_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_nash_md_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_minillm_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_tpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_gspo_token_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_sdft_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/__init__.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_sdpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_xpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_gold_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_prm_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_online_dpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_openreward.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_openreward.py201 # If a task spec ever shipped a `prompt` key, the metadata loop must
LOWtests/experimental/test_async_grpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_ssd_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_orpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_kto_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOW…s/experimental/test_grpo_with_replay_buffer_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_bco_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_cpo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_distillation_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_modeling_value_head.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_dppo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_ppo_trainer.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/experimental/test_merge_model_callback.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/invariant/__init__.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/invariant/test_invariant.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/distributed/__init__.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWtests/distributed/test_distributed.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWexamples/accelerate_configs/alst_ulysses_4gpu.yaml1# ALST/Ulysses Sequence Parallelism with 2D Parallelism (DP + SP) for 4 GPUs
LOWexamples/datasets/tldr.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWexamples/datasets/deepmath_103k.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWexamples/datasets/ultrafeedback.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWexamples/datasets/lm-human-preferences-sentiment.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
LOWexamples/datasets/prm800k.py1# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
276 more matches not shown…
Cross-File Repetition — 51 hits · 255 pts
Severity | File | Line | Snippet
HIGHAGENTS.md0brief one-line description of what this does. args: param1 (`str`): description of required param. param2 (`int`, *optio
HIGHCLAUDE.md0brief one-line description of what this does. args: param1 (`str`): description of required param. param2 (`int`, *optio
HIGH.cursor/BUGBOT.md0brief one-line description of what this does. args: param1 (`str`): description of required param. param2 (`int`, *optio
HIGH.ai/AGENTS.md0brief one-line description of what this does. args: param1 (`str`): description of required param. param2 (`int`, *optio
HIGHtests/test_rloo_trainer.py0reward function that rewards completions with more unique letters.
HIGHtests/test_rloo_trainer.py0reward function that rewards completions with more unique letters.
HIGHtests/test_grpo_trainer.py0reward function that rewards completions with more unique letters.
HIGHtests/test_grpo_trainer.py0reward function that rewards completions with more unique letters.
HIGHtests/test_grpo_trainer.py0reward function that rewards completions with more unique letters.
HIGHtests/test_rloo_trainer.py0test that training works with vllm for generation with structured outputs.
HIGHtests/test_grpo_trainer.py0test that training works with vllm for generation with structured outputs.
HIGHtests/test_grpo_trainer.py0test that training works with vllm for generation with structured outputs.
HIGHtests/test_callbacks.py0test that bema callback respects the update frequency.
HIGHtests/test_callbacks.py0test that bema callback respects the update frequency.
HIGHtests/test_callbacks.py0test that bema callback respects the update frequency.
HIGHtests/test_grpo_trainer.py0multiplies two integers. args: a: the first integer. b: the second integer. returns: the product of the two integers.
HIGHtests/test_vllm_client_server.py0multiplies two integers. args: a: the first integer. b: the second integer. returns: the product of the two integers.
HIGHtests/test_vllm_client_server.py0multiplies two integers. args: a: the first integer. b: the second integer. returns: the product of the two integers.
HIGHtests/test_vllm_client_server.py0multiplies two integers. args: a: the first integer. b: the second integer. returns: the product of the two integers.
HIGHtests/test_vllm_client_server.py0multiplies two integers. args: a: the first integer. b: the second integer. returns: the product of the two integers.
HIGHdocs/source/grpo_trainer.md0multiplies two integers. args: a: the first integer. b: the second integer. returns: the product of the two integers.
HIGHtests/test_data_utils.py0\ <|start|>system<|message|>you are hugginggpt. knowledge cutoff: 2024-06 current date: {strftime("%y-%m-%d")} reasoning
HIGHtests/test_data_utils.py0\ <|start|>system<|message|>you are hugginggpt. knowledge cutoff: 2024-06 current date: {strftime("%y-%m-%d")} reasoning
HIGHtests/test_data_utils.py0\ <|start|>system<|message|>you are hugginggpt. knowledge cutoff: 2024-06 current date: {strftime("%y-%m-%d")} reasoning
HIGHtests/test_data_utils.py0\ <|start|>system<|message|>you are hugginggpt. knowledge cutoff: 2024-06 current date: {strftime("%y-%m-%d")} reasoning
HIGHtests/test_cli_utils.py0test that config defaults are applied to all subparsers.
HIGHtests/test_cli_utils.py0test that config defaults are applied to all subparsers.
HIGHtests/test_cli_utils.py0test that config defaults are applied to all subparsers.
HIGHtests/test_cli_utils.py0test that config defaults are applied to all subparsers.
HIGHtests/experimental/test_ppo_trainer.py0test if we instantiate a model by adding `summary_drop_prob` to the config it will be added to the v_head
HIGHtests/experimental/test_ppo_trainer.py0test if we instantiate a model by adding `summary_drop_prob` to the config it will be added to the v_head
HIGHtests/experimental/test_ppo_trainer.py0test if we instantiate a model by adding `summary_drop_prob` to the config it will be added to the v_head
HIGHtests/experimental/test_ppo_trainer.py0test if we instantiate a model by adding `summary_drop_prob` to the config it will be added to the v_head
HIGHtests/experimental/test_ppo_trainer.py0simply creates a peft model and checks that it can be loaded.
HIGHtests/experimental/test_ppo_trainer.py0simply creates a peft model and checks that it can be loaded.
HIGHtests/experimental/test_ppo_trainer.py0simply creates a peft model and checks that it can be loaded.
HIGHdocs/source/openenv.md0make a guess in the wordle environment. args: guess: the guessed word, formatted as '[abcde]' returns: the feedback mess
HIGHexamples/scripts/openenv/multi_env.py0make a guess in the wordle environment. args: guess: the guessed word, formatted as '[abcde]' returns: the feedback mess
HIGHexamples/scripts/openenv/wordle.py0make a guess in the wordle environment. args: guess: the guessed word, formatted as '[abcde]' returns: the feedback mess
HIGHtrl/experimental/cpo/cpo_trainer.py0generate samples from the model and reference model for the given batch of inputs.
HIGHtrl/experimental/bco/bco_trainer.py0generate samples from the model and reference model for the given batch of inputs.
HIGHtrl/experimental/orpo/orpo_trainer.py0generate samples from the model and reference model for the given batch of inputs.
HIGHtrl/experimental/cpo/cpo_trainer.py0overriding built-in evaluation loop to store metrics for each batch. prediction/evaluation loop, shared by `trainer.eval
HIGHtrl/experimental/bco/bco_trainer.py0overriding built-in evaluation loop to store metrics for each batch. prediction/evaluation loop, shared by `trainer.eval
HIGHtrl/experimental/orpo/orpo_trainer.py0overriding built-in evaluation loop to store metrics for each batch. prediction/evaluation loop, shared by `trainer.eval
HIGHtrl/experimental/cpo/cpo_trainer.py0log `logs` on the various objects watching training, including stored metrics. args: logs (`dict[str, float]`): the valu
HIGHtrl/experimental/bco/bco_trainer.py0log `logs` on the various objects watching training, including stored metrics. args: logs (`dict[str, float]`): the valu
HIGHtrl/experimental/orpo/orpo_trainer.py0log `logs` on the various objects watching training, including stored metrics. args: logs (`dict[str, float]`): the valu
HIGHtrl/experimental/dppo/dppo_trainer.py0tokenize prompts and extract images/multimodal fields for generation.
HIGHtrl/trainer/rloo_trainer.py0tokenize prompts and extract images/multimodal fields for generation.
HIGHtrl/trainer/grpo_trainer.py0tokenize prompts and extract images/multimodal fields for generation.
Decorative Section Separators — 60 hits · 176 pts
Severity | File | Line | Snippet
MEDIUMtests/conftest.py54# ============================================================================
MEDIUMtests/conftest.py56# ============================================================================
MEDIUMtests/conftest.py68# ============================================================================
MEDIUMexamples/scripts/grpo_agent.py184# ------------------------
MEDIUMexamples/scripts/grpo_agent.py186# ------------------------
MEDIUMexamples/scripts/grpo_agent.py231# ------------------------
MEDIUMexamples/scripts/grpo_agent.py233# ------------------------
MEDIUMexamples/scripts/grpo_agent.py260# ------------------------
MEDIUMexamples/scripts/grpo_agent.py262# ------------------------
MEDIUMexamples/scripts/grpo_agent.py267 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py269 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py284 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py286 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py298 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py300 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py310 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py312 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py315 # ------------------------
MEDIUMexamples/scripts/grpo_agent.py317 # ------------------------
MEDIUMexamples/scripts/openenv/browsergym_llm.py234# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/browsergym_llm.py236# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/browsergym_llm.py253# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/browsergym_llm.py255# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/browsergym_llm.py263# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/browsergym_llm.py265# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py105# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py107# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py187# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py189# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py339# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py341# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py369# ---------------------------------------------------------------------------
MEDIUMexamples/scripts/openenv/sudoku.py371# ---------------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py269 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py271 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py319 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py321 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py338 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py340 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py421 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py423 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py472 # ------------------------------------------------------------------
MEDIUMtrl/experimental/ssd/ssd_trainer.py474 # ------------------------------------------------------------------
MEDIUMtrl/experimental/distillation/distillation_trainer.py702 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/distillation/distillation_trainer.py704 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/distillation/distillation_trainer.py764 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/distillation/distillation_trainer.py766 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/distillation/distillation_trainer.py1022 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/distillation/distillation_trainer.py1024 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/distillation/distillation_trainer.py1576 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/distillation/distillation_trainer.py1578 # ──────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/openreward/_spec.py144 # ── public surface ──────────────────────────────────────────────
MEDIUMtrl/experimental/openreward/_spec.py251 # ── internals ───────────────────────────────────────────────────
MEDIUMtrl/experimental/openreward/environment.py101# ────────────────────────────────────────────────────────────────────
MEDIUMtrl/experimental/openreward/environment.py204 # ── TRL contract ─────────────────────────────────────────────────
MEDIUMtrl/experimental/openreward/environment.py252 # ── helpers ──────────────────────────────────────────────────────
MEDIUMtrl/experimental/openreward/environment.py299# ── dynamic tool binding ─────────────────────────────────────────────
MEDIUMtrl/experimental/openreward/environment.py366# ── small utilities ──────────────────────────────────────────────────
MEDIUMtrl/trainer/rloo_trainer.py645 # <-───────> per_device_train_batch_size=3
MEDIUMtrl/trainer/grpo_trainer.py930 # <-───────> per_device_train_batch_size=3
Self-Referential Comments — 60 hits · 174 pts
Severity | File | Line | Snippet
MEDIUMtests/test_rloo_trainer.py1648 # Create a single processing class (tokenizer)
MEDIUMtests/test_rloo_trainer.py1702 # Create a single processing class (tokenizer)
MEDIUMtests/test_grpo_trainer.py93 # Create a mock trainer with minimal setup
MEDIUMtests/test_grpo_trainer.py96 # Create a mock accelerator
MEDIUMtests/test_grpo_trainer.py100 # Create a minimal trainer instance just to access the method
MEDIUMtests/test_grpo_trainer.py2704 # Create a single processing class (tokenizer)
MEDIUMtests/test_grpo_trainer.py2758 # Create a single processing class (tokenizer)
MEDIUMtests/test_grpo_trainer.py3146 # Create a VLM processor
MEDIUMtests/test_cli_utils.py176 # Create the main parser
MEDIUMtests/test_cli_utils.py182 # Create a subparser for a specific command
MEDIUMtests/test_cli_utils.py202 # Create the main parser
MEDIUMtests/test_cli_utils.py208 # Create a subparser for a specific command
MEDIUMtests/test_cli_utils.py225 # Create the main parser
MEDIUMtests/test_cli_utils.py231 # Create a subparser for a specific command
MEDIUMtests/test_cli_utils.py247 # Create the main parser
MEDIUMtests/test_cli_utils.py253 # Create a subparser for a specific command
MEDIUMtests/test_skills.py188 # Create a file instead of directory
MEDIUMtests/test_skills.py199 # Create a skill with subdirectories
MEDIUMtests/test_skills.py264 # Create a skill with multiple files
MEDIUMtests/test_skills.py171 # Create a symlink
MEDIUMtests/test_skills.py217 # Create a skill
MEDIUMtests/test_skills.py435 # Create a real skill
MEDIUMtests/test_cli.py101 # Create a temporary config file
MEDIUMtests/experimental/test_prm_trainer.py126 # Define the input features
MEDIUMtests/experimental/test_prm_trainer.py150 # Define the input features
MEDIUMtests/experimental/test_prm_trainer.py173 # Define the input features
MEDIUMtests/experimental/test_prm_trainer.py197 # Define the input features
MEDIUMtests/experimental/test_prm_trainer.py221 # Define the input features
MEDIUMscripts/generate_zen_multi_image_dataset.py76 # Create the images
MEDIUMscripts/generate_zen_multi_image_dataset.py106 # Create the images
MEDIUMscripts/generate_zen_multi_image_dataset.py157 # Create the images
MEDIUMscripts/generate_zen_multi_image_dataset.py229 # Create the images
MEDIUMtrl/data_utils.py741 # Create a new bin
MEDIUMtrl/experimental/merge_model_callback.py37 # Create the repository if it doesn't exist
MEDIUMtrl/experimental/merge_model_callback.py118 # Create the merge configuration dictionary
MEDIUMtrl/experimental/merge_model_callback.py128 # Create the MergeConfiguration from the dictionary
MEDIUMtrl/experimental/merge_model_callback.py137 # Create the TIES merge configuration dictionary
MEDIUMtrl/experimental/merge_model_callback.py172 # Create the MergeConfiguration from the dictionary
MEDIUMtrl/experimental/merge_model_callback.py181 # Create the DARE TIES merge configuration dictionary
MEDIUMtrl/experimental/merge_model_callback.py216 # Create the MergeConfiguration from the dictionary
MEDIUMtrl/experimental/merge_model_callback.py226 # Create the SLERP merge configuration dictionary
MEDIUMtrl/experimental/merge_model_callback.py255 # Create the MergeConfiguration from the dictionary
MEDIUMtrl/experimental/utils.py15# This file contains utility classes and functions that are used across more than one experimental trainer or feature.
MEDIUMtrl/experimental/cpo/cpo_trainer.py174 # Initialize this variable to False. This helps tracking the case when `peft_module_casting_to_bf16`
MEDIUMtrl/experimental/bco/bco_trainer.py473 # Initialize this variable to False. This helps tracking the case when `peft_module_casting_to_bf16`
MEDIUMtrl/experimental/orpo/orpo_trainer.py183 # Initialize this variable to False. This helps tracking the case when `peft_module_casting_to_bf16`
MEDIUMtrl/experimental/online_dpo/online_dpo_trainer.py382 # Define the collator if not provided
MEDIUMtrl/experimental/online_dpo/online_dpo_trainer.py886 # Create the output dict with required fields
MEDIUMtrl/experimental/gold/gold_trainer.py1465 # Create a completion mask
MEDIUMtrl/experimental/prm/prm_trainer.py337 # Create the label
MEDIUMtrl/experimental/ppo/ppo_trainer.py394 # Define the collator if not provided
MEDIUMtrl/scripts/vllm_serve.py109 # Create a stateless process group to manage communication between training processes and vLLM workers.
MEDIUMtrl/scripts/vllm_serve.py491 # Define the endpoints for the model server
MEDIUMtrl/trainer/utils.py160 # Create an output tensor filled with the padding value
MEDIUMtrl/trainer/utils.py171 # Define the slices
MEDIUMtrl/trainer/utils.py719 self.generator = torch.Generator() # Create a local random generator
MEDIUMtrl/trainer/utils.py950# This function is intentionally not used internally. It is provided as a utility for users whose datasets contain
MEDIUMtrl/trainer/callbacks.py218 # Create a table per group
MEDIUMtrl/trainer/callbacks.py693 # Create a new instance and load state_dict
MEDIUMtrl/trainer/grpo_trainer.py494 # Create the environments and extract their methods to be used as tools. We create one environment per rollout
Unused Imports — 182 hits · 166 pts
Severity | File | Line | Snippet
LOWexamples/scripts/openenv/browsergym_llm.py64
LOWexamples/scripts/openenv/sudoku.py84
LOWexamples/scripts/openenv/browsergym.py50
LOWtrl/__init__.py19
LOWtrl/__init__.py77
LOWtrl/__init__.py77
LOWtrl/__init__.py77
LOWtrl/__init__.py77
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py83
LOWtrl/__init__.py97
LOWtrl/__init__.py98
LOWtrl/__init__.py98
LOWtrl/__init__.py98
LOWtrl/__init__.py98
LOWtrl/__init__.py98
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/__init__.py99
LOWtrl/experimental/utils.py47
LOWtrl/experimental/ssd/__init__.py15
LOWtrl/experimental/ssd/__init__.py16
LOWtrl/experimental/ssd/ssd_eval.py59
LOWtrl/experimental/ssd/ssd_trainer.py23
LOWtrl/experimental/gfpo/__init__.py15
LOWtrl/experimental/gfpo/__init__.py16
LOWtrl/experimental/sdpo/__init__.py15
LOWtrl/experimental/sdpo/__init__.py16
LOWtrl/experimental/cpo/__init__.py15
LOWtrl/experimental/cpo/__init__.py16
LOWtrl/experimental/papo/__init__.py16
LOWtrl/experimental/papo/__init__.py17
122 more matches not shown…
Deep Nesting — 145 hits · 138 pts
Severity | File | Line | Snippet
LOWtests/test_utils.py809
LOWtests/test_utils.py840
LOWtests/test_grpo_trainer.py3002
LOWtests/test_grpo_trainer.py3118
LOWtests/test_grpo_trainer.py3266
LOWexamples/datasets/math_shepherd.py52
LOWexamples/scripts/sft_vlm_gemma3.py78
LOWexamples/scripts/sft_vlm_gemma3.py97
LOWexamples/scripts/grpo_agent.py50
LOWexamples/scripts/grpo_agent.py145
LOWexamples/scripts/sft_video_llm.py68
LOWexamples/scripts/openenv/multi_env.py127
LOWexamples/scripts/openenv/catch.py205
LOWexamples/scripts/openenv/sudoku.py208
LOWexamples/scripts/openenv/sudoku.py290
LOWexamples/scripts/openenv/sudoku.py374
LOWexamples/scripts/openenv/sudoku.py543
LOWscripts/log_reports.py34
LOWscripts/generate_tiny_models/_common.py256
LOWtrl/chat_template_utils.py355
LOWtrl/data_utils.py33
LOWtrl/data_utils.py127
LOWtrl/data_utils.py922
LOWtrl/_compat.py86
LOWtrl/import_utils.py29
LOWtrl/experimental/merge_model_callback.py82
LOWtrl/experimental/merge_model_callback.py260
LOWtrl/experimental/utils.py537
LOWtrl/experimental/utils.py557
LOWtrl/experimental/utils.py65
LOWtrl/experimental/utils.py150
LOWtrl/experimental/gfpo/gfpo_trainer.py69
LOWtrl/experimental/sdpo/sdpo_trainer.py96
LOWtrl/experimental/sdpo/sdpo.py163
LOWtrl/experimental/cpo/cpo_trainer.py130
LOWtrl/experimental/cpo/cpo_trainer.py446
LOWtrl/experimental/cpo/cpo_trainer.py579
LOWtrl/experimental/cpo/cpo_trainer.py643
LOWtrl/experimental/papo/papo_trainer.py154
LOWtrl/experimental/bco/bco_trainer.py407
LOWtrl/experimental/bco/bco_trainer.py1030
LOWtrl/experimental/bco/bco_trainer.py1233
LOWtrl/experimental/bco/bco_trainer.py1362
LOWtrl/experimental/orpo/orpo_trainer.py139
LOWtrl/experimental/orpo/orpo_trainer.py431
LOWtrl/experimental/orpo/orpo_trainer.py574
LOWtrl/experimental/online_dpo/online_dpo_trainer.py169
LOWtrl/experimental/online_dpo/online_dpo_trainer.py764
LOWtrl/experimental/online_dpo/online_dpo_trainer.py840
LOWtrl/experimental/online_dpo/online_dpo_trainer.py902
LOWtrl/experimental/online_dpo/online_dpo_trainer.py1096
LOWtrl/experimental/bema_for_ref_model/callback.py202
LOWtrl/experimental/sdft/sdft.py133
LOWtrl/experimental/sdft/sdft_trainer.py160
LOWtrl/experimental/distillation/distillation_trainer.py233
LOWtrl/experimental/distillation/distillation_trainer.py385
LOWtrl/experimental/distillation/distillation_trainer.py671
LOWtrl/experimental/distillation/distillation_trainer.py823
LOWtrl/experimental/distillation/distillation_trainer.py865
LOWtrl/experimental/distillation/distillation_trainer.py1049
85 more matches not shown…
Docstring Block Structure18 hits · 90 pts
SeverityFileLineSnippet
HIGHCONTRIBUTING.md268 Replicate a string `n` times with a separator. Args: string (`str`): String to replicate.
HIGHAGENTS.md71 Brief one-line description of what this does. Args: param1 (`str`): Description of require
HIGHCLAUDE.md71 Brief one-line description of what this does. Args: param1 (`str`): Description of require
HIGH.cursor/BUGBOT.md71 Brief one-line description of what this does. Args: param1 (`str`): Description of require
HIGHtrl/chat_template_utils.py356 Adds the appropriate response schema to the given tokenizer based on its chat template. At the time of initial
HIGHtrl/data_utils.py35 Convert messages into a structured multimodal format and inject the provided images into the message contents.
HIGHtrl/data_utils.py161 Check if the example is in a conversational format. Args: example (`dict[str, Any]`): A si
HIGHtrl/data_utils.py341 If the example is in a conversational format, apply a chat template to it. Args: example (`dict[str, l
HIGHtrl/data_utils.py505 Extracts the shared prompt from a preference data example, where the prompt is implicit within both the chosen and
HIGHtrl/data_utils.py883 Check if the example is in a conversational format (from/value). Note that this format isn't recommended. Prefer
HIGHtrl/experimental/gold/gold_trainer.py520 Merge probabilities based on alignment groups with corrected conditional probability handling. For a g
HIGHtrl/skills/skills.py73 Resolve target to a concrete directory path. Converts semantic agent names (e.g., 'claude') with scope to actu
HIGHtrl/skills/skills.py184 Install a skill to target directory. Args: skill_name (`str`): Name of skill to install. targe
HIGHtrl/skills/skills.py251 Install a skill. Args: skill_name (`str`): Name of skill to install. target (`str | Path`): Ag
HIGHtrl/skills/skills.py295 Uninstall a skill from target directory. Args: skill_name (`str`): Name of skill to uninstall.
HIGHtrl/skills/skills.py327 Uninstall a skill. Args: skill_name (`str`): Name of skill to uninstall. target (`str | Path`)
HIGHtrl/trainer/utils.py119 Pads a list of tensors to the same shape along the first dimension. Args: tensors (`list[torch.Tensor]
HIGH.ai/AGENTS.md71 Brief one-line description of what this does. Args: param1 (`str`): Description of require
Redundant / Tautological Comments54 hits · 70 pts
SeverityFileLineSnippet
LOWtests/test_chat_template_utils.py45 # Check if special tokens are correctly set
LOWtests/test_chat_template_utils.py112 # Check if special tokens are correctly set
LOWtests/test_grpo_trainer.py3213 # Check if signature columns were set properly
LOWtests/experimental/test_gkd_trainer.py52 # Set temperature to 0 for deterministic output
LOWtests/experimental/test_gkd_trainer.py71 # Check if the generated texts start with the original prompts
LOWtests/experimental/test_gkd_trainer.py84 # Check if the two generations are identical
LOWtests/experimental/test_online_dpo_trainer.py228 # Check if training loss is available
LOW…s/experimental/test_grpo_with_replay_buffer_trainer.py45 # Check if the buffer contains the correct number of elements
LOW…s/experimental/test_grpo_with_replay_buffer_trainer.py48 # Check if the buffer maintains the min-heap property
LOW…s/experimental/test_grpo_with_replay_buffer_trainer.py67 # Check if the buffer contains the correct number of elements
LOW…s/experimental/test_grpo_with_replay_buffer_trainer.py70 # Check if the buffer maintains the min-heap property
LOW…s/experimental/test_grpo_with_replay_buffer_trainer.py90 # Check if the sampled elements are from the buffer
LOWtests/experimental/test_ppo_trainer.py750 # Check if critic weights have been updated
LOWtests/experimental/test_ppo_trainer.py757 # Check if policy weights have been updated
LOWtests/experimental/test_ppo_trainer.py812 # Check if critic weights have been updated
LOWtests/experimental/test_ppo_trainer.py819 # Check if policy weights have been updated - for PEFT we check the LoRA weights
LOWtests/experimental/test_ppo_trainer.py191 # Check if the weights are the same
LOWtests/experimental/test_ppo_trainer.py206 # Check if the weights are the same
LOWtests/experimental/test_ppo_trainer.py224 # Check if the weights are the same
LOWtests/experimental/test_ppo_trainer.py245 # Check if the weights are the same
LOWtests/experimental/test_ppo_trainer.py251 # Check if the trl model has the same keys as the transformers model
LOWtests/experimental/test_ppo_trainer.py290 # Check if the outputs are of the right size - here
LOWtests/experimental/test_ppo_trainer.py303 # Check if v head of the model has the same dropout as the config
LOWtests/experimental/test_ppo_trainer.py315 # Check if v head of the model has the same dropout as the config
LOWtests/experimental/test_ppo_trainer.py320 # Check if v head of the model has the same dropout as the config
LOWtests/experimental/test_ppo_trainer.py405 # Check if the outputs are of the right size - here
LOWtests/experimental/test_ppo_trainer.py418 # Check if v head of the model has the same dropout as the config
LOWtests/experimental/test_ppo_trainer.py430 # Check if v head of the model has the same dropout as the config
LOWtests/experimental/test_ppo_trainer.py435 # Check if v head of the model has the same dropout as the config
LOWscripts/add_copyrights.py61 # Check if the exact copyright header exists
LOW.github/workflows/tests.yml90 if: github.ref == 'refs/heads/main' && always() # Check if the branch is main
LOW.github/workflows/tests.yml146 if: github.ref == 'refs/heads/main' && always() # Check if the branch is main
LOW.github/workflows/tests.yml197 if: github.ref == 'refs/heads/main' && always() # Check if the branch is main
LOW.github/workflows/tests.yml252 if: github.ref == 'refs/heads/main' && always() # Check if the branch is main
LOW.github/workflows/tests.yml305 if: github.ref == 'refs/heads/main' && always() # Check if the branch is main
LOWtrl/experimental/utils.py486 # Check if model is sharded (FSDP/DS-Zero3)
LOWtrl/experimental/gold/gold_trainer.py1456 # Check if the tokenized prompt starts with the tokenized prompt+completion
LOWtrl/experimental/tpo/tpo_trainer.py569 # Check if the tokenized prompt starts with the tokenized prompt+completion
LOWtrl/models/activation_offloading.py221 # Check if tensor is on CPU (skip offloading)
LOWtrl/models/activation_offloading.py226 # Check if tensor is too small
LOWtrl/models/activation_offloading.py231 # Check if tensor is a parameter or buffer
LOWtrl/models/activation_offloading.py238 # Check if tensor is an FP8 tensor (TorchAO) - skip offloading as they're already compressed
LOWtrl/models/activation_offloading.py244 # Check if tensor storage is a model parameter (for FSDP compatibility)
LOWtrl/models/activation_offloading.py286 # Check if tensor has broadcast dimensions (stride == 0)
LOWtrl/models/activation_offloading.py495 # Check if tensor still exists (might have been cleaned up by a previous node)
LOWtrl/models/utils.py275 # Check if the model is already a FSDP model due to `Manual Wrapping` and if so, don't wrap it again
LOWtrl/scripts/vllm_serve.py733 # Check if adding this item would exceed the token budget
LOWtrl/skills/skills.py105 # Check if it's a predefined agent
LOWtrl/skills/skills.py205 # Check if source skill exists
LOWtrl/skills/skills.py218 # Check if already exists
LOWtrl/trainer/sft_trainer.py1478 # Check if the tokenized prompt starts with the tokenized prompt+completion
LOWtrl/trainer/dpo_trainer.py960 # Check if the tokenized prompt starts with the tokenized prompt+completion
LOWtrl/generation/vllm_client.py186 # Check if the total timeout duration has passed
LOWtrl/extras/profiling.py199 # Check if self is a Trainer-like object with required attributes
Excessive Try-Catch Wrapping51 hits · 60 pts
SeverityFileLineSnippet
LOWtests/test_sft_trainer.py2186 except Exception:
LOWtests/test_grpo_trainer.py3106 except Exception as e:
LOWtests/test_grpo_trainer.py3233 except Exception as e:
LOWtests/test_grpo_trainer.py3300 except Exception as e:
LOWtests/test_rewards.py143 except Exception as e:
MEDIUMtests/test_rewards.py140def target():
MEDIUMtests/experimental/test_gold_trainer.py28def openr1_examples():
MEDIUMtests/experimental/test_gold_trainer.py41def countdown_examples():
LOWtests/experimental/test_gold_trainer.py35 except Exception as exc: # pragma: no cover - network/environment dependent
LOWtests/experimental/test_gold_trainer.py48 except Exception as exc: # pragma: no cover - network/environment dependent
LOWtests/experimental/test_online_dpo_trainer.py199 except Exception:
LOWdocs/source/openenv.md398 except Exception:
LOWdocs/source/openenv.md409 except Exception:
LOWexamples/scripts/sft_vlm_gemma3.py107 except Exception as e:
MEDIUMexamples/scripts/sft_vlm_gemma3.py108 print(f"Error processing image {img_path}: {e}")
LOWexamples/scripts/sft_video_llm.py137 except Exception as e:
LOWexamples/scripts/openenv/multi_env.py136 except Exception:
LOWexamples/scripts/openenv/multi_env.py147 except Exception:
LOWexamples/scripts/openenv/carla_vlm_gemma.py165 except Exception as e:
LOWexamples/scripts/openenv/catch.py162 except Exception as e:
LOWscripts/log_reports.py59 except Exception as e:
MEDIUMscripts/add_copyrights.py48 print(f"Error fetching tracked files: {e}")
LOWtrl/_lazy_module.py72 except Exception as e:
LOWtrl/_compat.py45 except Exception as e:
LOWtrl/_compat.py69 except Exception as e:
LOWtrl/_compat.py126 except Exception as e:
LOWtrl/_compat.py155 except Exception as e:
LOWtrl/experimental/sdft/sdft.py213 except Exception:
LOWtrl/experimental/openreward/_spec.py175 except Exception: # noqa: BLE001
LOWtrl/experimental/openreward/_spec.py282 except Exception as e: # noqa: BLE001
LOWtrl/experimental/openreward/_spec.py312 except Exception as e: # noqa: BLE001
LOWtrl/experimental/openreward/environment.py261 except Exception as e: # noqa: BLE001
LOWtrl/experimental/openreward/environment.py273 except Exception as e: # noqa: BLE001
LOWtrl/experimental/async_grpo/async_rollout_worker.py646 except Exception as error:
LOWtrl/experimental/dppo/dppo_trainer.py463 except Exception as err:
LOWtrl/experimental/ppo/modeling_value_head.py459 except Exception:
LOWtrl/experimental/ppo/modeling_value_head.py469 except Exception as exc:
MEDIUMtrl/cli/commands/skills.py37 print("Error: Unknown skills command")
LOWtrl/scripts/vllm_serve.py784 except Exception as e:
LOWtrl/scripts/vllm_serve.py789 except Exception as e:
LOWtrl/scripts/utils.py400 except Exception as e:
MEDIUMtrl/scripts/utils.py381def get_git_commit_hash(package_name):
MEDIUMtrl/skills/cli.py94 print("Error: Either provide a skill name or use --all to install all skills")
MEDIUMtrl/skills/cli.py100 print("Error: Cannot specify both a skill name and --all")
MEDIUMtrl/skills/cli.py158 print(f"Error: {e}")
MEDIUMtrl/skills/cli.py193 print(f"Error: {e}")
LOWtrl/trainer/callbacks.py541 except Exception as scorer_e:
LOWtrl/trainer/callbacks.py547 except Exception as pred_e:
LOWtrl/trainer/callbacks.py564 except Exception as summary_e:
LOWtrl/trainer/callbacks.py569 except Exception as finish_e:
LOWtrl/trainer/grpo_trainer.py1527 except Exception as e:
Hallucination Indicators5 hits · 35 pts
SeverityFileLineSnippet
CRITICALtrl/experimental/ppo/modeling_value_head.py700 self.v_head.summary.weight.data.normal_(mean=0.0, std=initializer_range)
CRITICALtrl/experimental/ppo/modeling_value_head.py701 self.v_head.summary.bias.data.zero_()
CRITICALtrl/experimental/ppo/modeling_value_head.py966 self.v_head.summary.weight.data.normal_(mean=0.0, std=initializer_range)
CRITICALtrl/experimental/ppo/modeling_value_head.py967 self.v_head.summary.bias.data.zero_()
CRITICALtrl/models/activation_offloading.py397 torch.autograd.variable.Variable._execution_engine.queue_callback(wait_and_del_remaining_references)
AI Slop Vocabulary5 hits · 14 pts
SeverityFileLineSnippet
LOWtests/test_dpo_trainer.py415 # purposes we will just just use the same checkpoint
MEDIUMtrl/experimental/cpo/cpo_trainer.py464 # 2. https://github.com/EleutherAI/lm-evaluation-harness/pull/531#issuecomment-1595586257
MEDIUMtrl/experimental/bco/bco_trainer.py258 # 2. https://github.com/EleutherAI/lm-evaluation-harness/pull/531#issuecomment-1595586257
MEDIUMtrl/experimental/orpo/orpo_trainer.py449 # 2. https://github.com/EleutherAI/lm-evaluation-harness/pull/531#issuecomment-1595586257
MEDIUMtrl/generation/vllm_client.py138 # This is not strictly required for correctness, but it helps make training more robust to rare, transient
Cross-Language Confusion2 hits · 5 pts
SeverityFileLineSnippet
HIGHexamples/scripts/openenv/wordle.py77uv venv && source .venv/bin/activate
HIGHtrl/data_utils.py637 elif not first_column_offsets.equals(column.offsets):
Slop Phrases1 hit · 3 pts
SeverityFileLineSnippet
MEDIUMexamples/cli_configs/example_config.yaml1# This is an example configuration file of TRL CLI, you can use it for
Example Usage Blocks1 hit · 2 pts
SeverityFileLineSnippet
LOWtrl/generation/vllm_client.py748# Example usage