PaddleFormers is an easy-to-use library and model zoo of pre-trained large language models, built on PaddlePaddle.
6121 matches across 18 categories. Click a row to expand file-level details.
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/testing_utils.py | 82 | def softmax_with_cross_entropy(logits, label, soft_label=False, axis=-1, ignore_index=-1): |
| LOW | tests/testing_utils.py | 467 | def require_paddle_non_multi_gpu(test_case): |
| LOW | tests/mergekit/test_merge_model.py | 128 | def test_fuse_qkv_lora_merge_torch(self): |
| LOW | tests/nn/test_mlp.py | 39 | def test_initialization_default(self): |
| LOW | tests/nn/test_mlp.py | 52 | def test_initialization_fuse_ffn(self): |
| LOW | tests/nn/test_mlp.py | 63 | def test_initialization_non_fuse_ffn(self): |
| LOW | tests/nn/test_criterion.py | 38 | def test_forward_non_fuse_subbatch_sft(self): |
| LOW | tests/nn/test_criterion.py | 45 | def test_forward_with_loss_mask(self): |
| LOW | tests/nn/test_criterion.py | 50 | def test_forward_with_recompute(self): |
| LOW | tests/nn/test_norm.py | 30 | def test_layer_norm_initialization(self): |
| LOW | tests/nn/test_norm.py | 40 | def test_layer_norm_sequence_parallel(self): |
| LOW | tests/nn/test_norm.py | 50 | def test_rms_norm_initialization(self): |
| LOW | tests/nn/test_norm.py | 59 | def test_rms_norm_sequence_parallel(self): |
| LOW | tests/nn/test_lm_head.py | 24 | def test_initialization_default(self): |
| LOW | tests/nn/test_lm_head.py | 35 | def test_initialization_with_tie_word_embeddings(self): |
| LOW | tests/nn/test_lm_head.py | 50 | def test_forward_fused_head_loss(self): |
| LOW | tests/nn/test_attention.py | 203 | def test_forward_calls_correct_function(self): |
| LOW | tests/ai_edited_test/nn/test_ai_dpo_loss.py | 114 | def test_loss_impl_calls_loss_func(self): |
| LOW | tests/ai_edited_test/nn/test_ai_dpo_loss.py | 274 | def test_invalid_loss_type_raises(self): |
| LOW | tests/ai_edited_test/nn/test_ai_dpo_loss.py | 289 | def test_sigmoid_with_offset_alpha(self): |
| LOW | tests/ai_edited_test/nn/test_ai_dpo_loss.py | 305 | def test_pref_loss_ratio_applied(self): |
| LOW | tests/ai_edited_test/nn/test_ai_dpo_loss.py | 322 | def test_label_smoothing_applied(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 17 | def test_single_eos_token_not_finished(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 26 | def test_single_eos_token_finished(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 35 | def test_already_finished_stays_finished(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 54 | def test_list_eos_tokens_none_match(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 63 | def test_nested_list_eos_tokens(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 73 | def test_nested_list_eos_none_match(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 139 | def test_add_better_than_worst(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 152 | def test_is_done_not_enough_beams(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 159 | def test_is_done_early_stopping(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 168 | def test_is_done_no_early_stopping_better_available(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 187 | def test_is_done_with_origin_len(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 207 | def test_with_past_key_values(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 233 | def test_window_size_larger_than_seq(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 247 | def test_init_validation_num_beams(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 254 | def test_init_validation_beam_groups(self): |
| LOW | tests/ai_edited_test/nn/test_ai_generation_utils.py | 270 | def test_init_with_beam_groups(self): |
| LOW | tests/ai_edited_test/nn/test_ai_sdpa_attention.py | 58 | def test_is_causal_inferred_multi_token(self, mock_sdpa): |
| LOW | tests/ai_edited_test/nn/test_ai_sdpa_attention.py | 72 | def test_is_causal_single_token(self, mock_sdpa): |
| LOW | tests/ai_edited_test/nn/test_ai_sdpa_attention.py | 87 | def test_explicit_is_causal_false(self, mock_sdpa): |
| LOW | tests/ai_edited_test/nn/test_ai_sdpa_attention.py | 151 | def test_dropout_passed_through(self, mock_sdpa): |
| LOW | tests/ai_edited_test/nn/test_ai_sdpa_attention.py | 166 | def test_training_passed_through(self, mock_sdpa): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 19 | def test_subbatch_small_input_no_split(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 31 | def test_subbatch_splits_and_concatenates(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 44 | def test_subbatch_multiple_args(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 57 | def test_subbatch_same_arg_idx(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 74 | def test_subbatch_preserves_function_name(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 84 | def test_subbatch_axis_width_mismatch_raises(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 97 | def test_subbatch_same_arg_idx_invalid_raises(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 111 | def test_subbatch_with_recompute(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 141 | def test_calc_lm_head_logits_basic(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 153 | def test_calc_lm_head_logits_with_bias(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 167 | def test_calc_lm_head_logits_sequence_parallel(self): |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 181 | def test_calc_lm_head_logits_tensor_parallel_output_override(self): |
| LOW | tests/ai_edited_test/nn/test_ai_moe_all_gather.py | 36 | def test_single_rank_returns_clone(self, mock_fleet): |
| LOW | tests/ai_edited_test/nn/test_ai_moe_all_gather.py | 51 | def test_group_none_uses_model_parallel(self, mock_fleet): |
| LOW | tests/ai_edited_test/nn/test_ai_moe_all_gather.py | 66 | def test_multi_rank_returns_correct_shape(self, mock_fleet, mock_all_gather): |
| LOW | tests/ai_edited_test/nn/test_ai_moe_all_gather.py | 95 | def test_single_rank_returns_clone(self, mock_fleet): |
| LOW | tests/ai_edited_test/nn/test_ai_moe_all_gather.py | 110 | def test_group_none_uses_model_parallel(self, mock_fleet): |
| 2964 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| HIGH | tests/ai_edited_test/cli/test_ai_load_hf_ckpt.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | tests/ai_edited_test/cli/test_ai_deepseek_v3_fp8.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | tests/ai_edited_test/cli/test_ai_convert_ckpt_sft.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | …ts/ai_edited_test/cli/test_ai_deepseek_v3_moe_utils.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | tests/ai_edited_test/cli/test_ai_deepseek_v3_config.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | tests/ai_edited_test/cli/test_ai_deepseek_v3_kernel.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | …ts/ai_edited_test/cli/test_ai_deepseek_v3_moe_layer.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | …sts/ai_edited_test/cli/test_ai_deepseek_v3_workflow.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | …s/ai_edited_test/cli/test_ai_deepseek_v3_token_disp.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | …sts/ai_edited_test/cli/test_ai_deepseek_v3_moe_gate.py | 0 | load a module directly from file path without going through __init__.py. |
| HIGH | tests/transformers/test_processing_common.py | 0 | we use do_rescale=true, rescale_factor=-1.0 to ensure that image_processor kwargs are preserved in the processor. we the |
| HIGH | tests/transformers/test_processing_common.py | 0 | we use do_rescale=true, rescale_factor=-1.0 to ensure that image_processor kwargs are preserved in the processor. we the |
| HIGH | tests/transformers/ernie4_5_moe_vl/test_processor.py | 0 | we use do_rescale=true, rescale_factor=-1.0 to ensure that image_processor kwargs are preserved in the processor. we the |
| HIGH | tests/transformers/kimi_k25/test_processor.py | 0 | tests that special vision tokens do not get truncated when `truncation=true` is set. |
| HIGH | tests/transformers/qwen2_5_vl/test_processor.py | 0 | tests that special vision tokens do not get truncated when `truncation=true` is set. |
| HIGH | tests/transformers/qwen2_vl/test_processor.py | 0 | tests that special vision tokens do not get truncated when `truncation=true` is set. |
| HIGH | tests/transformers/qwen3_vl/test_processor.py | 0 | tests that special vision tokens do not get truncated when `truncation=true` is set. |
| HIGH | tests/transformers/qwen2_5_vl/test_modeling.py | 0 | tests that vlms through an error with explicit message saying what is wrong when number of images don't match number of |
| HIGH | tests/transformers/qwen3_vl_moe/test_modeling.py | 0 | tests that vlms through an error with explicit message saying what is wrong when number of images don't match number of |
| HIGH | tests/transformers/qwen3_vl/test_modeling.py | 0 | tests that vlms through an error with explicit message saying what is wrong when number of images don't match number of |
| HIGH | examples/experiments/paddlefleet/run_pretrain.py | 0 | arguments pertaining to what data we are going to input our model for training and evaluating. using `pdargumentparser` |
| HIGH | …mples/experiments/deepseek_v3_pretrain/run_pretrain.py | 0 | arguments pertaining to what data we are going to input our model for training and evaluating. using `pdargumentparser` |
| HIGH | …ddleformers/cli/train/deepseek_v3_pretrain/workflow.py | 0 | arguments pertaining to what data we are going to input our model for training and evaluating. using `pdargumentparser` |
| HIGH | examples/experiments/paddlefleet/run_pretrain.py | 0 | arguments pertaining to which model/config/tokenizer we are going to pre-train from. |
| HIGH | …mples/experiments/deepseek_v3_pretrain/run_pretrain.py | 0 | arguments pertaining to which model/config/tokenizer we are going to pre-train from. |
| HIGH | …ddleformers/cli/train/deepseek_v3_pretrain/workflow.py | 0 | arguments pertaining to which model/config/tokenizer we are going to pre-train from. |
| HIGH | examples/experiments/paddlefleet/glm45_provider.py | 0 | provider for glm 4.5 air 106b-a12b: https://huggingface.co/zai-org/glm-4.5-air |
| HIGH | examples/experiments/paddlefleet/glm45_provider.py | 0 | provider for glm 4.5 air 106b-a12b: https://huggingface.co/zai-org/glm-4.5-air |
| HIGH | examples/experiments/paddlefleet/glm45_provider.py | 0 | provider for glm 4.5 air 106b-a12b: https://huggingface.co/zai-org/glm-4.5-air |
| HIGH | examples/experiments/deepseek_v3_pretrain/moe_layer.py | 0 | moe layer forward function 1. gate forward. 2. dispatch export. 3. experts forward. args: hidden_state: moe layer input |
| HIGH | …dleformers/cli/train/deepseek_v3_pretrain/moe_layer.py | 0 | moe layer forward function 1. gate forward. 2. dispatch export. 3. experts forward. args: hidden_state: moe layer input |
| HIGH | paddleformers/transformers/moe_layer.py | 0 | moe layer forward function 1. gate forward. 2. dispatch export. 3. experts forward. args: hidden_state: moe layer input |
| HIGH | examples/experiments/deepseek_v3_pretrain/moe_layer.py | 0 | moe expert dispatch from: https://huggingface.co/deepseek-ai/deepseek-v3/blob/main/modeling_deepseek.py |
| HIGH | …dleformers/cli/train/deepseek_v3_pretrain/moe_layer.py | 0 | moe expert dispatch from: https://huggingface.co/deepseek-ai/deepseek-v3/blob/main/modeling_deepseek.py |
| HIGH | paddleformers/transformers/moe_layer.py | 0 | moe expert dispatch from: https://huggingface.co/deepseek-ai/deepseek-v3/blob/main/modeling_deepseek.py |
| HIGH | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ the priority is the cumulative sum of the expert indices. this method is used in hunyuan model args: topk_idx |
| HIGH | paddleformers/nn/moe_deepep/moe_gate.py | 0 | _summary_ the priority is the cumulative sum of the expert indices. this method is used in hunyuan model args: topk_idx |
| HIGH | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ the priority is the cumulative sum of the expert indices. this method is used in hunyuan model args: topk_idx |
| HIGH | paddleformers/transformers/moe_gate.py | 0 | _summary_ the priority is the cumulative sum of the expert indices. this method is used in hunyuan model args: topk_idx |
| HIGH | paddleformers/transformers/moe_gate_auto.py | 0 | _summary_ the priority is the cumulative sum of the expert indices. this method is used in hunyuan model args: topk_idx |
| HIGH | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts returns: tuple[paddle |
| HIGH | paddleformers/nn/moe_deepep/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts returns: tuple[paddle |
| HIGH | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts returns: tuple[paddle |
| HIGH | paddleformers/transformers/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts returns: tuple[paddle |
| HIGH | paddleformers/transformers/moe_gate_auto.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts returns: tuple[paddle |
| HIGH | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | paddleformers/nn/moe_deepep/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | paddleformers/nn/moe_deepep/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | paddleformers/transformers/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | paddleformers/transformers/moe_gate.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | paddleformers/transformers/moe_gate_auto.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | paddleformers/transformers/moe_gate_auto.py | 0 | _summary_ args: scores (paddle.tensor): [bsz*seq_len, n_experts] k (int): select the top k experts in each group n_group |
| HIGH | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 0 | calculate sequence auxiliary loss. args: logits (paddle.tensor): model output. returns: paddle.tensor: the value of sequ |
| HIGH | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 0 | calculate sequence auxiliary loss. args: logits (paddle.tensor): model output. returns: paddle.tensor: the value of sequ |
| HIGH | paddleformers/transformers/moe_gate_auto.py | 0 | calculate sequence auxiliary loss. args: logits (paddle.tensor): model output. returns: paddle.tensor: the value of sequ |
| HIGH | …mples/experiments/deepseek_v3_pretrain/load_hf_ckpt.py | 0 | convert paddle model parameter names to hugging face format name lists args: paddle_name: parameter name in paddle forma |
| HIGH | …xperiments/deepseek_v3_pretrain/convert_ckpt_to_sft.py | 0 | convert paddle model parameter names to hugging face format name lists args: paddle_name: parameter name in paddle forma |
| 194 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 150 | x_fp8, x_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 157 | _, _, x_t_fp8, x_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 165 | x_fp8, x_scale, x_t_fp8, x_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 172 | _, _, w1_fp8, w1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 182 | o2_fp8, o2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 186 | _, _, w2_t_fp8, w2_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 227 | do3_fp8, do3_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 234 | _, _, do3_t_fp8, do3_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 241 | do3_fp8, do3_scale, do3_t_fp8, do3_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 247 | w2_fp8, w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 257 | _, _, o2_t_fp8, o2_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 277 | do1_fp8, do1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 284 | _, _, do1_t_fp8, do1_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 291 | do1_fp8, do1_scale, do1_t_fp8, do1_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 297 | w1_fp8, w1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 354 | x_fp8, x_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 358 | _, _, w1_fp8, w1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 368 | o2_fp8, o2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 372 | _, _, w2_t_fp8, w2_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 412 | _, _, x_t_fp8, x_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 422 | do3_fp8, do3_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 429 | _, _, do3_t_fp8, do3_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 436 | do3_fp8, do3_scale, do3_t_fp8, do3_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 442 | w2_fp8, w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 452 | _, _, o2_t_fp8, o2_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 472 | do1_fp8, do1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 479 | _, _, do1_t_fp8, do1_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 486 | do1_fp8, do1_scale, do1_t_fp8, do1_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 492 | w1_fp8, w1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …amples/experiments/ernie_pretrain/models/fp8_linear.py | 400 | _, _, w1_fp8, w1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …xperiments/ernie_pretrain/models/ernie/modeling_moe.py | 2003 | layer.self_attn.o_proj.dense_experts.down_proj.weight.scale_(factor) |
| CRITICAL | …xperiments/ernie_pretrain/models/ernie/modeling_moe.py | 2015 | layer.mlp.dense_experts.down_proj.weight.scale_(factor) |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 191 | w1_t_quant, w1_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 201 | x_fp8, x_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 267 | w2_quant, w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 279 | o2_quant, o2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 325 | w2_quant, w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 336 | o2_quant, o2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 384 | bw_w2_quant, bw_w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 393 | unzipped_grad_fp8, unzipped_grad_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 438 | bw_w2_quant, bw_w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 447 | unzipped_grad_fp8, unzipped_grad_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 508 | bw_w1_quant, bw_w1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 518 | do1_fp8, do1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 568 | o2_t_fp8, o2_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 587 | out_grad_fp8, out_grad_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 651 | input_x_fp8, input_x_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 667 | do1_fp8, do1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 891 | w1_t_quant, w1_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 909 | x_fp8, x_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 966 | w2_quant, w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 986 | o2_fp8, o2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1031 | bw_w2_quant, bw_w2_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1040 | unzipped_grad_fp8, unzipped_grad_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1106 | bw_w1_quant, bw_w1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1115 | do1_fp8, do1_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1187 | o2_t_fp8, o2_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1203 | do3_t_fp8, do3_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1250 | input_x_t_fp8, input_x_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| CRITICAL | …rnie_pretrain/models/moe/token_dispatcher/fp8_utils.py | 1266 | do1_t_fp8, do1_t_scale = paddle.incubate.nn.functional.fp8.fp8_quant_blockwise( |
| 60 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | setup.py | 1 | # Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved. |
| LOW | ci/check_pr_approval.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | ci/check_approval.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/conftest.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/parallel_launch.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/testing_utils.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/common_test.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/__init__.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/check_log_for_exitcode.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_pt_fp8.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/qwen3vl_sft.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_a100.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_dpo_lora.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/update_precision.sh | 1 | # Copyright (c) 2026 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/qwen.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/check_pr_approval.py | 1 | # Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/qwen3_single_card.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/qwen3vl_sft_single_card.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_pt_ep4.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/qwen3vl_lora.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_dpo.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/qwen3_a100.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_pt_single_card.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_sft_cp.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_pt.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/preprocess.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_sft.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/check_precision_approval.sh | 1 | # Copyright (c) 2026 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/check_loss.py | 1 | # Copyright (c) 2026 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_lora.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/integration_test/glm45_pt_grouped_gemm.sh | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/mergekit/test_merge_model.py | 1 | # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/mergekit/test_sparsify_method.py | 1 | # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/mergekit/__init__.py | 1 | # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/mergekit/test_merge_config.py | 1 | # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/mergekit/test_merge_method.py | 1 | # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/nn/test_mlp.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/nn/test_activation.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/nn/test_criterion.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/nn/test_norm.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/nn/__init__.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/nn/test_lm_head.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/nn/test_attention.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_dpo_loss.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_all_gather.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_allgather_layer.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_deepep_gate.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_kto_loss.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_deepep_factory.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_block.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_alltoall_layer.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_sink_impl.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_all_to_all.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_topk_gate.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_pp_model.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_deepep_layer.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_deepep_comm.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_utils.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/nn/test_ai_moe_abstract.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| LOW | tests/ai_edited_test/datasets/test_ai_augment_utils.py | 1 | # Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved. |
| 956 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | setup.py | 149 | |
| LOW | tests/testing_utils.py | 260 | |
| LOW | tests/testing_utils.py | 512 | |
| LOW | tests/testing_utils.py | 578 | |
| LOW | tests/testing_utils.py | 517 | |
| LOW | tests/testing_utils.py | 587 | |
| LOW | tests/testing_utils.py | 518 | |
| LOW | tests/testing_utils.py | 589 | |
| LOW | tests/integration_test/check_loss.py | 41 | |
| LOW | tests/integration_test/check_loss.py | 65 | |
| LOW | tests/nn/test_attention.py | 27 | |
| LOW | tests/ai_edited_test/utils/test_ai_env.py | 27 | |
| LOW | tests/ai_edited_test/utils/test_ai_tools.py | 118 | |
| LOW | tests/ai_edited_test/cli/test_ai_finetuning_args.py | 132 | |
| LOW | tests/ai_edited_test/cli/test_ai_launcher.py | 87 | |
| LOW | tests/ai_edited_test/cli/test_ai_launcher.py | 98 | |
| LOW | tests/ai_edited_test/trainer/test_ai_async_handler.py | 32 | |
| LOW | tests/ai_edited_test/trainer/test_ai_async_handler.py | 163 | |
| LOW | tests/peft/test_lora.py | 94 | |
| LOW | tests/transformers/test_modeling_common.py | 486 | |
| LOW | tests/transformers/test_modeling_common.py | 677 | |
| LOW | tests/transformers/test_modeling_common.py | 735 | |
| LOW | tests/transformers/test_processing_common.py | 160 | |
| LOW | tests/transformers/test_segment_parallel_utils.py | 107 | |
| LOW | tests/transformers/test_conversion_common.py | 118 | |
| LOW | tests/transformers/test_conversion_common.py | 153 | |
| LOW | tests/transformers/test_video_processing_common.py | 382 | |
| LOW | tests/transformers/test_safetensors.py | 56 | |
| LOW | tests/transformers/test_safetensors.py | 90 | |
| LOW | tests/transformers/phi3/test_modeling.py | 349 | |
| LOW | tests/transformers/auto/test_modeling.py | 110 | |
| LOW | tests/transformers/glm4_moe/test_modeling.py | 380 | |
| LOW | tests/transformers/llama/test_modeling.py | 319 | |
| LOW | tests/trainer/test_trainer_callback.py | 108 | |
| LOW | examples/tools/trans_paddlenlp2hf.py | 44 | |
| LOW | examples/tools/merge.py | 30 | |
| LOW | examples/tools/create_pretraining_data.py | 134 | |
| LOW | examples/tools/create_pretraining_data.py | 306 | |
| LOW | examples/tools/create_pretraining_data.py | 213 | |
| LOW | examples/tools/create_pretraining_data.py | 248 | |
| LOW | examples/experiments/paddlefleet/run_pretrain.py | 474 | |
| LOW | examples/experiments/deepseek_v3_pretrain/fp8_linear.py | 54 | |
| LOW | examples/experiments/deepseek_v3_pretrain/moe_utils.py | 420 | |
| LOW | …mples/experiments/deepseek_v3_pretrain/load_hf_ckpt.py | 274 | |
| LOW | …xperiments/deepseek_v3_pretrain/convert_ckpt_to_sft.py | 218 | |
| LOW | examples/experiments/deepseek_v3_pretrain/modeling.py | 163 | |
| LOW | examples/experiments/deepseek_v3_pretrain/modeling.py | 635 | |
| LOW | examples/experiments/deepseek_v3_pretrain/modeling.py | 1398 | |
| LOW | examples/experiments/deepseek_v3_pretrain/modeling.py | 2515 | |
| LOW | …amples/experiments/deepseek_v3_pretrain/modeling_pp.py | 97 | |
| LOW | …amples/experiments/deepseek_v3_pretrain/modeling_pp.py | 1834 | |
| LOW | …amples/experiments/deepseek_v3_pretrain/modeling_pp.py | 2309 | |
| LOW | …_pretrain/tools/uc_to_sharded/convert_uc_to_sharded.py | 40 | |
| LOW | …_pretrain/tools/uc_to_sharded/convert_uc_to_sharded.py | 138 | |
| LOW | …rnie_pretrain/tools/sharded_to_uc/merge_sharding_ep.py | 404 | |
| LOW | …rnie_pretrain/tools/sharded_to_uc/merge_sharding_ep.py | 549 | |
| LOW | …rnie_pretrain/tools/sharded_to_uc/merge_sharding_ep.py | 664 | |
| LOW | …amples/experiments/ernie_pretrain/models/comm_utils.py | 148 | |
| LOW | …amples/experiments/ernie_pretrain/models/comm_utils.py | 193 | |
| LOW | …amples/experiments/ernie_pretrain/models/comm_utils.py | 150 | |
| 558 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/testing_utils.py | 14 | |
| LOW | tests/ai_edited_test/quantization/test_ai_qlora.py | 10 | |
| LOW | tests/utils/test_downloader.py | 15 | |
| LOW | tests/transformers/test_modeling_common.py | 15 | |
| LOW | tests/transformers/test_processing_common.py | 16 | |
| LOW | tests/transformers/test_generation_utils.py | 15 | |
| LOW | tests/transformers/test_video_processing_common.py | 16 | |
| LOW | tests/transformers/gpt_oss/test_modeling.py | 15 | |
| LOW | tests/transformers/kimi_k2/test_modeling.py | 15 | |
| LOW | tests/transformers/phi3/test_modeling.py | 15 | |
| LOW | tests/transformers/auto/test_configuration.py | 15 | |
| LOW | tests/transformers/qwen2/test_modeling.py | 15 | |
| LOW | tests/transformers/kimi_k25/test_processor.py | 16 | |
| LOW | tests/transformers/qwen3moe/test_modeling.py | 15 | |
| LOW | tests/transformers/qwen3/test_modeling.py | 15 | |
| LOW | tests/transformers/gemma3_text/test_modeling.py | 15 | |
| LOW | tests/transformers/qwen2moe/test_modeling.py | 15 | |
| LOW | tests/transformers/qwen2_5_vl/test_modeling.py | 15 | |
| LOW | tests/transformers/qwen2_5_vl/test_processor.py | 16 | |
| LOW | …ts/transformers/ernie4_5_moe_vl/test_vision_process.py | 14 | |
| LOW | tests/transformers/ernie4_5_moe_vl/test_modeling.py | 15 | |
| LOW | tests/transformers/ernie4_5_moe_vl/test_processor.py | 14 | |
| LOW | tests/transformers/glm_ocr/test_modeling.py | 15 | |
| LOW | tests/transformers/glm_ocr/test_processor.py | 14 | |
| LOW | tests/transformers/deepseek_v3/test_modeling.py | 15 | |
| LOW | tests/transformers/glm_moe_dsa/test_modeling.py | 15 | |
| LOW | tests/transformers/glm4v_moe/test_modeling.py | 15 | |
| LOW | tests/transformers/glm4v_moe/test_processor.py | 16 | |
| LOW | tests/transformers/qwen3_vl_moe/test_modeling.py | 15 | |
| LOW | tests/transformers/glm4_moe/test_modeling.py | 15 | |
| LOW | tests/transformers/qwen2_vl/test_vision_process.py | 16 | |
| LOW | tests/transformers/qwen2_vl/test_processor.py | 16 | |
| LOW | tests/transformers/qwen2_vl/test_video_processor.py | 16 | |
| LOW | tests/transformers/qwen3next/test_modeling.py | 15 | |
| LOW | tests/transformers/ernie4_5/test_modeling.py | 15 | |
| LOW | tests/transformers/paddleocr_vl/test_modeling.py | 15 | |
| LOW | tests/transformers/paddleocr_vl/test_processor.py | 15 | |
| LOW | tests/transformers/llama/test_modeling.py | 15 | |
| LOW | tests/transformers/qwen3_vl/test_modeling.py | 15 | |
| LOW | tests/transformers/qwen3_vl/test_processor.py | 16 | |
| LOW | tests/transformers/qwen3_vl/test_modeling_fleet.py | 14 | |
| LOW | tests/transformers/qwen3_vl/test_video_processor.py | 16 | |
| LOW | examples/experiments/deepseek_v3_pretrain/moe_layer.py | 17 | |
| LOW | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 17 | |
| LOW | examples/experiments/deepseek_v3_pretrain/modeling.py | 22 | |
| LOW | …es/experiments/deepseek_v3_pretrain/config/__init__.py | 86 | |
| LOW | …es/experiments/deepseek_v3_pretrain/config/__init__.py | 87 | |
| LOW | …es/experiments/deepseek_v3_pretrain/config/__init__.py | 88 | |
| LOW | …es/experiments/deepseek_v3_pretrain/config/__init__.py | 89 | |
| LOW | …es/experiments/deepseek_v3_pretrain/config/__init__.py | 90 | |
| LOW | …es/experiments/ernie_pretrain/models/ernie/__init__.py | 16 | |
| LOW | …es/experiments/ernie_pretrain/models/ernie/__init__.py | 17 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 15 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 16 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 17 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 18 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 19 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 19 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 20 | |
| LOW | …riments/ernie_pretrain/ernie/src/callbacks/__init__.py | 21 | |
| 543 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | tests/nn/test_mlp.py | 25 | # Create a mock config with default values |
| MEDIUM | tests/nn/test_attention.py | 267 | # Create the ground truth dense causal mask for the naive implementation |
| MEDIUM | tests/nn/test_attention.py | 297 | # Create the ground truth dense mask from the FlashMask sparse format |
| MEDIUM | tests/ai_edited_test/nn/test_ai_pp_model.py | 401 | # Create a config where head_dim attribute doesn't exist at all, |
| MEDIUM | tests/ai_edited_test/nn/test_ai_pp_model.py | 691 | # Create a mock layer that has a weight attribute |
| MEDIUM | tests/ai_edited_test/datasets/test_ai_mm_plugin.py | 188 | # Create a new plugin class |
| MEDIUM | tests/ai_edited_test/utils/test_ai_doc_parser.py | 46 | # Create a temp file with content < 1024 chars |
| MEDIUM | tests/ai_edited_test/utils/test_ai_aistudio_download.py | 237 | # Create the expected cache structure |
| MEDIUM | tests/ai_edited_test/utils/test_ai_optimizer.py | 28 | # Create a simple model and optimizer so we can call the method |
| MEDIUM | tests/ai_edited_test/utils/test_ai_image_utils.py | 63 | # Create a simple test image and its base64 encoding |
| MEDIUM | tests/ai_edited_test/cli/test_ai_ernie_top2_gate.py | 128 | # Create a near-orthogonal weight matrix |
| MEDIUM | tests/ai_edited_test/cli/test_ai_dataset_formatting.py | 180 | # Create a dataset with unsupported features |
| MEDIUM | tests/ai_edited_test/cli/test_ai_cli.py | 54 | # Create the partial after mocking print |
| MEDIUM | tests/ai_edited_test/peft/test_ai_loraga_utils.py | 105 | # Create a mock LoRA module |
| MEDIUM | …s/ai_edited_test/transformers/test_ai_moe_gate_auto.py | 140 | # Create a weight parameter for the gate |
| MEDIUM | …_edited_test/transformers/test_ai_kimi_k2_tokenizer.py | 27 | # Create a minimal tiktoken model file for testing |
| MEDIUM | tests/ai_edited_test/trainer/test_ai_timer.py | 172 | # Create a _Timer first |
| MEDIUM | tests/ai_edited_test/trainer/test_ai_timer.py | 184 | # Create a distinct class to force type mismatch |
| MEDIUM | tests/transformers/test_processing_common.py | 379 | # Define the kwargs for each modality |
| MEDIUM | tests/transformers/test_processing_common.py | 400 | # Define the kwargs for each modality |
| MEDIUM | tests/transformers/test_processing_common.py | 570 | # Define the kwargs for each modality |
| MEDIUM | tests/transformers/test_processing_common.py | 591 | # Define the kwargs for each modality |
| MEDIUM | tests/transformers/ernie4_5_moe_vl/test_processor.py | 461 | # Define the kwargs for each modality |
| MEDIUM | tests/transformers/ernie4_5_moe_vl/test_processor.py | 477 | # Define the kwargs for each modality |
| MEDIUM | tests/trainer/test_trainer_callback.py | 16 | # This file is modified from |
| MEDIUM | examples/experiments/paddlefleet/run_pretrain.py | 614 | # Create the learning_rate sheduler and optimizer |
| MEDIUM | …mples/experiments/deepseek_v3_pretrain/run_pretrain.py | 577 | # Create the learning_rate sheduler and optimizer |
| MEDIUM | examples/experiments/deepseek_v3_pretrain/moe_utils.py | 118 | # Create an output tensor filled with zeros |
| MEDIUM | examples/experiments/deepseek_v3_pretrain/moe_utils.py | 335 | # Create an output tensor filled with zeros |
| MEDIUM | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 186 | # Create a mask for 1st's expert per token |
| MEDIUM | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 252 | # Create a mask for 1st's expert per token. |
| MEDIUM | examples/experiments/deepseek_v3_pretrain/moe_gate.py | 257 | # Create a mask for 2nd's expert per token using Gumbel-max trick. |
| MEDIUM | scripts/iluvatar_ci/test_ernie_21b_sft.py | 27 | # Define the exact shell command to execute |
| MEDIUM | scripts/xpu_ci/test_ernie_21b_sft.py | 27 | # Define the exact shell command to execute |
| MEDIUM | scripts/xpu_ci/test_ernie_28b_thinking_sft.py | 27 | # Define the exact shell command to execute |
| MEDIUM | scripts/codestyle/check_dead_links.py | 118 | # Create the symlink |
| MEDIUM | .github/workflows/cherry-pick.yml | 97 | # Create a new branch for the cherry-pick |
| MEDIUM | paddleformers/datasets/template/mm_plugin.py | 561 | # Create an image with a white background and the same size as the original image |
| MEDIUM | paddleformers/utils/download/common.py | 310 | # Create a factory function that returns a Session with configured proxies |
| MEDIUM | paddleformers/cli/cli.py | 94 | # Create a default GPU list string (e.g., "0,1,2" for 3 GPUs) |
| MEDIUM | …dleformers/cli/train/deepseek_v3_pretrain/moe_utils.py | 118 | # Create an output tensor filled with zeros |
| MEDIUM | …dleformers/cli/train/deepseek_v3_pretrain/moe_utils.py | 335 | # Create an output tensor filled with zeros |
| MEDIUM | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 186 | # Create a mask for 1st's expert per token |
| MEDIUM | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 252 | # Create a mask for 1st's expert per token. |
| MEDIUM | …ddleformers/cli/train/deepseek_v3_pretrain/moe_gate.py | 257 | # Create a mask for 2nd's expert per token using Gumbel-max trick. |
| MEDIUM | …ddleformers/cli/train/deepseek_v3_pretrain/workflow.py | 507 | # Create the learning_rate sheduler and optimizer |
| MEDIUM | paddleformers/cli/train/auto_parallel/workflow.py | 320 | # Create the learning_rate scheduler and optimizer |
| MEDIUM | paddleformers/cli/train/sft/workflow.py | 692 | # Create the learning_rate sheduler and optimizer |
| MEDIUM | paddleformers/transformers/video_utils.py | 220 | # Create a batched list from single object |
| MEDIUM | paddleformers/transformers/image_transforms.py | 722 | # Create the outer list |
| MEDIUM | paddleformers/transformers/moe_utils.py | 66 | # Create a dense expert-to-token mapping from the sparse token-to-expert mapping |
| MEDIUM | paddleformers/transformers/moe_utils.py | 109 | # Create an output tensor filled with zeros |
| MEDIUM | paddleformers/transformers/processing_utils.py | 471 | # Create a unified `preprocessor_config.json` and save all attributes as a composite config, except for toke |
| MEDIUM | paddleformers/transformers/image_processing_utils.py | 53 | # Define the key methods that should support Paddle tensor return types. |
| MEDIUM | paddleformers/transformers/moe_gate.py | 345 | # Create a mask for 1st's expert per token |
| MEDIUM | paddleformers/transformers/moe_gate.py | 413 | # Create a mask for 1st's expert per token. |
| MEDIUM | paddleformers/transformers/moe_gate.py | 418 | # Create a mask for 2nd's expert per token using Gumbel-max trick. |
| MEDIUM | paddleformers/transformers/moe_gate_auto.py | 348 | # Create a mask for 1st's expert per token |
| MEDIUM | paddleformers/transformers/moe_gate_auto.py | 414 | # Create a mask for 1st's expert per token. |
| MEDIUM | paddleformers/transformers/moe_gate_auto.py | 419 | # Create a mask for 2nd's expert per token using Gumbel-max trick. |
| 26 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| HIGH | examples/experiments/deepseek_v3_pretrain/fp8_linear.py | 57 | Applies a linear transformation to the incoming data: y = xA^T + b. This function supports specialized implemen |
| HIGH | examples/experiments/deepseek_v3_pretrain/kernel.py | 101 | Dequantizes the given weight tensor using the provided scale tensor. Args: x (paddle.Tensor): The quant |
| HIGH | …rnie_pretrain/models/moe/token_dispatcher/moe_utils.py | 110 | Permute tokens based on expert assignment indices. Args: tokens (paddle.Tensor): Input tokens to be permute |
| HIGH | …rnie_pretrain/models/moe/token_dispatcher/moe_utils.py | 136 | Restore original token order from permuted tokens. Args: permuted_tokens (paddle.Tensor): Permuted tokens t |
| HIGH | scripts/regression/test_models.py | 116 | Load model configuration from YAML file. Args: model_key: The model identifier to load configuratio |
| HIGH | paddleformers/nn/pp_model.py | 114 | Determines the layer partitioning scheme for Pipeline Parallelism (PP) and Virtual Pipeline Parallelism (VP) wi |
| HIGH | paddleformers/nn/attention/sink_impl.py | 561 | A unified, high-performance attention implementation with Sink mechanism support. This function automatically |
| HIGH | paddleformers/datasets/data_utils.py | 119 | Convert batch dialogue into input_ids. The API support multiple data format: `pt`, `sft. Args: dials ( |
| HIGH | paddleformers/datasets/DPODataset.py | 161 | Generate packed sequences using greedy strategy. Args: examples: List of examples to pack. |
| HIGH | paddleformers/datasets/DPODataset.py | 187 | Preprocess DPO training examples Args: example: Raw training example containing: - |
| HIGH | paddleformers/utils/downloader.py | 94 | Get weights path from WEIGHT_HOME, if not exists, download it from url. Args: url (str): download url |
| HIGH | paddleformers/utils/tools.py | 148 | Args: version (str): The first version string needed to be compared. The format of version stri |
| HIGH | paddleformers/utils/distributed.py | 167 | nested all gather function with offload Args: tensor (Any): the desired tensor, list of tensor, dict of ten |
| HIGH | paddleformers/utils/download/aistudio_hub_download.py | 628 | Checks if a file exists in a repository on the Aistudio Hub. Args: repo_id (`str`): A name |
| HIGH | paddleformers/cli/hparams/parser.py | 120 | _summary_ Args: parser (PdArgumentParser): _description_ args (Optional[Union[dict[str, Any], list[ |
| HIGH | …leformers/cli/train/deepseek_v3_pretrain/fp8_linear.py | 57 | Applies a linear transformation to the incoming data: y = xA^T + b. This function supports specialized implemen |
| HIGH | paddleformers/cli/train/deepseek_v3_pretrain/kernel.py | 101 | Dequantizes the given weight tensor using the provided scale tensor. Args: x (paddle.Tensor): The quant |
| HIGH | …rnie_pretrain/models/moe/token_dispatcher/moe_utils.py | 110 | Permute tokens based on expert assignment indices. Args: tokens (paddle.Tensor): Input tokens to be permute |
| HIGH | …rnie_pretrain/models/moe/token_dispatcher/moe_utils.py | 136 | Restore original token order from permuted tokens. Args: permuted_tokens (paddle.Tensor): Permuted tokens t |
| HIGH | paddleformers/transformers/configuration_utils.py | 1070 | Instantiate a [`PretrainedConfig`] (or a derived class) from a pretrained model configuration. Args: |
| HIGH | paddleformers/transformers/model_utils.py | 211 | This function chunks the `input_tensors` into smaller input tensor parts of size `chunk_size` over the dimension |
| HIGH | paddleformers/transformers/feature_extraction_utils.py | 231 | Instantiate a type of [`~feature_extraction_utils.FeatureExtractionMixin`] from a feature extractor, *e.g.* a |
| HIGH | paddleformers/transformers/fp8_utils.py | 211 | FP8 Linear computation function supporting multiple return modes and quantized/unquantized inputs. Arg |
| HIGH | paddleformers/transformers/conversion_utils.py | 1400 | get name mapping of PretrainedModel Args: config (PretrainedConfig): the configuration of name-mapp |
| HIGH | paddleformers/transformers/conversion_utils.py | 1526 | get fused parameter mapping of PretrainedModel Args: config (PretrainedConfig): the configuration o |
| HIGH | paddleformers/transformers/utils.py | 511 | Tries to locate a file in a local folder and repo, downloads and cache it if necessary. Args: path_or_r |
| HIGH | paddleformers/transformers/auto/video_processing.py | 87 | Loads the video processor configuration from a pretrained model video processor configuration. Args: p |
| HIGH | paddleformers/transformers/auto/feature_extraction.py | 91 | Loads the feature extractor configuration from a pretrained model feature extractor configuration. Args: |
| HIGH | paddleformers/transformers/auto/tokenizer.py | 65 | Loads the tokenizer configuration from a pretrained model tokenizer configuration. Args: pretrained_mo |
| HIGH | paddleformers/transformers/auto/image_processing.py | 107 | Loads the image processor configuration from a pretrained model image processor configuration. Args: p |
| HIGH | paddleformers/transformers/legacy/tokenizer_utils.py | 1093 | Add a list of new tokens to the tokenizer class. If the new tokens are not in the vocabulary, they are added to |
| HIGH | …dleformers/transformers/legacy/tokenizer_utils_base.py | 839 | Add a dictionary of special tokens (eos, pad, cls, etc.) to the encoder and link them to class attributes. If |
| HIGH | …dleformers/transformers/legacy/tokenizer_utils_base.py | 933 | Add a list of new tokens to the tokenizer class. If the new tokens are not in the vocabulary, they are added to |
| HIGH | paddleformers/transformers/qwen2_5_vl/modeling.py | 1245 | Calculate the 3D rope index based on image and video's temporal, height and width in LLM. Explanation: |
| HIGH | …/transformers/ernie4_5_moe_vl/model/modeling_moe_vl.py | 1080 | Calculate the 3D rope index based on image and video's temporal, height and width in LLM. Explanation: |
| HIGH | …/transformers/ernie4_5_moe_vl/model/modeling_moe_pp.py | 93 | Determines the layer partitioning scheme for Pipeline Parallelism (PP) and Virtual Pipeline Parallelism (VP) wi |
| HIGH | …ansformers/ernie4_5_moe_vl/model/modeling_moe_vl_pp.py | 830 | Convert input data into a format acceptable by the model, including image processing, text processing, etc. |
| HIGH | …ernie4_5_moe_vl/model/distributed/common_dist_utils.py | 83 | Performs parallel matrix multiplication with tensor model parallelism support. Args: x (paddle.Tensor) |
| HIGH | …rmers/transformers/ernie4_5_moe_vl/model/utils/misc.py | 89 | TrainingLogs Args: object (_type_): _description_ Raises: AttributeError: _description_ R |
| HIGH | …rmers/transformers/ernie4_5_moe_vl/model/utils/misc.py | 170 | gate attr Args: attr (_type_): _description_ Raises: AttributeError: _descript |
| HIGH | …/ernie4_5_moe_vl/model/fusion_ops/common_fusion_ops.py | 49 | Performs fused flash attention with multiple implementation variants. Args: q (paddle.Tensor): Query t |
| HIGH | paddleformers/transformers/glm4v_moe/modeling.py | 1340 | Calculate the 3D rope index based on image and video's temporal, height and width in LLM. Explanation: |
| HIGH | paddleformers/transformers/qwen2_vl/vision_process.py | 162 | calculate the number of frames for video used for model inputs. Args: ele (dict): a dict contains the confi |
| HIGH | paddleformers/transformers/qwen2_vl/vision_process.py | 202 | Calculate the start and end frame indices based on the given time range. Args: ele (dict): A dictionar |
| HIGH | paddleformers/transformers/paddleocr_vl/modeling.py | 1798 | Calculate the 3D rope index based on image and video's temporal, height and width in LLM. Explanation: |
| HIGH | paddleformers/data/causal_dataset.py | 36 | Retrieve logits with retry mechanism if no response is received within the specified time Parameters: |
| HIGH | paddleformers/generation/configuration_utils.py | 346 | Instantiate a [`GenerationConfig`] from a generation configuration file. Args: pretrained_ |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | setup.py | 220 | except Exception as e: |
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 125 | except Exception: |
| LOW | tests/ai_edited_test/datasets/test_ai_template.py | 291 | except Exception: |
| LOW | tests/ai_edited_test/cli/test_ai_ernie_moe_utils.py | 66 | except Exception: |
| LOW | …sts/ai_edited_test/cli/test_ai_tensorboard_callback.py | 109 | except Exception: |
| LOW | tests/ai_edited_test/cli/test_ai_deepseek_v3_kernel.py | 46 | except Exception: |
| LOW | tests/ai_edited_test/cli/test_ai_deepseek_v3_kernel.py | 85 | except Exception as e: |
| LOW | …_edited_test/transformers/test_ai_kimi_k2_tokenizer.py | 162 | except Exception: |
| LOW | …_edited_test/transformers/test_ai_kimi_k2_tokenizer.py | 170 | except Exception: |
| LOW | tests/peft/test_lora.py | 213 | except Exception as e: |
| LOW | tests/peft/test_lora.py | 283 | except Exception as e: |
| LOW | tests/transformers/qwen3_vl/test_modeling_fleet.py | 33 | except Exception as error: |
| LOW | docs/zh/custom_datasets_format_zh.md | 14 | except Exception: |
| MEDIUM | docs/zh/custom_datasets_format_zh.md | 9 | def load_parquet(file_path): |
| LOW | …mples/experiments/deepseek_v3_pretrain/load_hf_ckpt.py | 369 | except Exception as e: |
| LOW | …rnie_pretrain/tools/sharded_to_uc/merge_sharding_ep.py | 612 | except Exception: |
| MEDIUM | …rnie_pretrain/tools/sharded_to_uc/merge_sharding_ep.py | 614 | print("Error !!!!") |
| LOW | examples/experiments/ernie_pretrain/ernie/pretrain.py | 539 | except Exception: |
| LOW | …e_pretrain/ernie/src/callbacks/tensorboard_callback.py | 25 | except Exception: |
| LOW | examples/best_practices/PaddleOCR-VL/README.md | 565 | except Exception: |
| LOW | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 153 | except Exception: |
| LOW | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 231 | except Exception: |
| LOW | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 950 | except Exception: |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 146 | def download_image_cv2(url): |
| LOW | …ces/tutorials/how_to_train_a_visual_grounding_model.md | 151 | except Exception as e: |
| LOW | …ces/tutorials/how_to_train_a_visual_grounding_model.md | 178 | except Exception as e: |
| LOW | …ces/tutorials/how_to_train_a_visual_grounding_model.md | 195 | except Exception as e: |
| LOW | …ces/tutorials/how_to_train_a_visual_grounding_model.md | 296 | except Exception as e: |
| MEDIUM | …ces/tutorials/how_to_train_a_visual_grounding_model.md | 678 | print(f"Error: Image not found at: {full_image_path}") |
| LOW | …ces/tutorials/how_to_train_a_visual_grounding_model.md | 688 | except Exception as e: |
| LOW | scripts/ci_utils/training_utils.py | 92 | except Exception as e: |
| LOW | scripts/codestyle/check_dead_links.py | 68 | except Exception as e: |
| MEDIUM | scripts/codestyle/check_dead_links.py | 69 | print(f"Error reading {file_path}: {e}") |
| MEDIUM | scripts/regression/merge_configs.py | 210 | print(f"Error: {origin_config_path} does not exist") |
| MEDIUM | scripts/regression/merge_configs.py | 214 | print(f"Error: {update_config_path} does not exist") |
| LOW | scripts/regression/test_models.py | 212 | except Exception as e: |
| LOW | scripts/regression/test_models.py | 235 | except Exception as e: |
| LOW | scripts/regression/test_models.py | 634 | except Exception as e: |
| MEDIUM | .github/workflows/cleanup_ci_gists.yml | 55 | print(f"Error: API returned {resp.status_code}: {resp.text}") |
| LOW | .github/workflows/cleanup_ci_gists.yml | 60 | except Exception as e: |
| MEDIUM | .github/workflows/cleanup_ci_gists.yml | 61 | print(f"Error parsing JSON: {e}") |
| LOW | paddleformers/nn/pp_model.py | 651 | except Exception: |
| LOW | paddleformers/nn/moe_deepep/modular_moe_layer.py | 86 | except Exception: |
| MEDIUM | paddleformers/datasets/SFTDataset.py | 239 | def _rss_mb(): |
| LOW | paddleformers/datasets/SFTDataset.py | 217 | except Exception as e: |
| LOW | paddleformers/datasets/SFTDataset.py | 221 | except Exception: |
| LOW | paddleformers/datasets/SFTDataset.py | 245 | except Exception: |
| LOW | paddleformers/datasets/SFTDataset.py | 320 | except Exception as e: |
| LOW | paddleformers/datasets/SFTDataset.py | 773 | except Exception: |
| LOW | paddleformers/datasets/SFTDataset.py | 1063 | except Exception as e: |
| LOW | paddleformers/datasets/SFTDataset.py | 1085 | except Exception as e: |
| LOW | paddleformers/datasets/SFTDataset.py | 1118 | except Exception: |
| LOW | paddleformers/datasets/SFTDataset.py | 1157 | except Exception: |
| LOW | paddleformers/datasets/DPODataset.py | 104 | except Exception as e: |
| LOW | paddleformers/datasets/DPODataset.py | 122 | except Exception as e: |
| LOW | paddleformers/datasets/DPODataset.py | 143 | except Exception as e: |
| LOW | paddleformers/datasets/reader/file_reader.py | 119 | except Exception as e: |
| LOW | paddleformers/datasets/reader/io.py | 74 | except Exception as e: |
| MEDIUM | paddleformers/datasets/reader/io.py | 47 | def load_txt(file_path): |
| MEDIUM | paddleformers/datasets/reader/mix_datasets.py | 271 | print(f"Error: cannot find class named '{class_name}'.") |
| 99 more matches not shown… | |||
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | tests/dataset/test_collate.py | 44 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 46 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 64 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 66 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 80 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 82 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 99 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 101 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 122 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 132 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 141 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 143 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 179 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 181 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 224 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 226 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 231 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 29 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_collate.py | 31 | # --------------------------------------------------------------------------- |
| MEDIUM | tests/dataset/test_mix_datasets.py | 35 | # =========================================================================== |
| MEDIUM | tests/dataset/test_mix_datasets.py | 37 | # =========================================================================== |
| MEDIUM | tests/dataset/test_mix_datasets.py | 211 | # =========================================================================== |
| MEDIUM | tests/dataset/test_mix_datasets.py | 213 | # =========================================================================== |
| MEDIUM | tests/transformers/glm_ocr/test_modeling.py | 635 | # ------------------------- |
| MEDIUM | tests/transformers/glm_ocr/test_modeling.py | 637 | # ------------------------- |
| MEDIUM | tests/transformers/glm_ocr/test_modeling.py | 665 | # ------------------------- |
| MEDIUM | tests/transformers/glm_ocr/test_modeling.py | 668 | # ------------------------- |
| MEDIUM | tests/transformers/glm_ocr/test_modeling.py | 709 | # ------------------------- |
| MEDIUM | tests/transformers/glm_ocr/test_modeling.py | 711 | # ------------------------- |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/table_ocr.md | 135 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/table_ocr.md | 137 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/table_ocr.md | 285 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/table_ocr.md | 287 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 140 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 334 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 336 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 484 | # ========================================== |
| MEDIUM | examples/best_practices/PaddleOCR-VL-1.5/region_ocr.md | 486 | # ========================================== |
| MEDIUM | .github/workflows/formers_bot_analysis.yml | 86 | # ── 定时触发路径 ────────────────────────────────────────────────── |
| MEDIUM | .github/workflows/formers_bot_analysis.yml | 114 | # ── PR 触发路径 ─────────────────────────────────────────────────── |
| MEDIUM | .github/workflows/formers_bot_analysis.yml | 297 | # ── 写入 GITHUB_OUTPUT,供 report-to-monitor 步骤读取 ────────── |
| MEDIUM | paddleformers/utils/upcast_downcast_triton.py | 352 | # ----------------------------------------------------------------------------- |
| MEDIUM | paddleformers/utils/upcast_downcast_triton.py | 354 | # ----------------------------------------------------------------------------- |
| MEDIUM | paddleformers/utils/upcast_downcast_triton.py | 476 | # ------------ |
| MEDIUM | paddleformers/transformers/aoa_config_base.py | 525 | # ================================================================== |
| MEDIUM | paddleformers/transformers/aoa_config_base.py | 527 | # ================================================================== |
| MEDIUM | paddleformers/transformers/paddleocr_vl/modeling.py | 870 | # ========================================== |
| MEDIUM | paddleformers/transformers/paddleocr_vl/modeling.py | 872 | # ========================================== |
| MEDIUM | paddleformers/transformers/paddleocr_vl/modeling.py | 905 | # ========================================== |
| MEDIUM | paddleformers/transformers/paddleocr_vl/modeling.py | 907 | # ========================================== |

| Severity | File | Line | Snippet |
|---|---|---|---|
| HIGH | …ai_edited_test/transformers/test_ai_longcontext_ops.py | 33 | heap.push((0, 5)) |
| HIGH | …ai_edited_test/transformers/test_ai_longcontext_ops.py | 34 | heap.push((1, 3)) |
| HIGH | …ai_edited_test/transformers/test_ai_longcontext_ops.py | 35 | heap.push((2, 8)) |
| HIGH | scripts/regression/test_models.py | 673 | subprocess.run("pkill -9 -f 'paddleformers/cli/launcher.py' 2>/dev/null || true", shell=True) |
| HIGH | paddleformers/quantization/quantization_linear.py | 332 | "2) cd PaddleSlim && pip install -e .\n" |
| HIGH | paddleformers/quantization/quantization_linear.py | 333 | "3) cd csrc && python ./setup_cuda.py install" |
| HIGH | paddleformers/quantization/quantization_linear.py | 522 | "2) cd PaddleSlim && pip install -e .\n" |
| HIGH | paddleformers/quantization/quantization_linear.py | 523 | "3) cd csrc && python ./setup_cuda.py install" |
| HIGH | paddleformers/quantization/quantization_linear.py | 761 | "2) cd PaddleSlim && pip install -e .\n" |
| HIGH | paddleformers/quantization/quantization_linear.py | 762 | "3) cd csrc && python ./setup_cuda.py install" |
| HIGH | paddleformers/transformers/video_utils.py | 323 | f" 1. Install dependencies: `conda install ffmpeg -c conda-forge` or `apt-get update && apt-get install f |
| HIGH | paddleformers/transformers/audio_processing_utils.py | 23 | print("need to install audioread and librosa. Please try: pip install audioread && pip install librosa") |
| HIGH | paddleformers/transformers/kimi_k25/media_utils.py | 103 | f" 1. Install dependencies: `conda install ffmpeg -c conda-forge` or `apt-get update && apt-get install f |
| HIGH | …/transformers/ernie4_5_moe_vl/model/longcontext_ops.py | 134 | surplus_piles.push([src_rank, surplus - move_amount]) |
| HIGH | …/transformers/ernie4_5_moe_vl/model/longcontext_ops.py | 136 | deficit_piles.push([dst_rank, deficit - move_amount]) |
| HIGH | paddleformers/transformers/qwen2_vl/vision_process.py | 286 | f" 1. Install dependencies: `conda install ffmpeg -c conda-forge` or `apt-get update && apt-get install f |

| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/transformers/test_video_processing_common.py | 277 | # Set sampling to True. Video frames should be sampled with `num_frames` in the output |
| LOW | tests/transformers/test_cache_utils.py | 424 | # Check if they are on the same device as the model parameters |
| LOW | tests/transformers/qwen2_vl/test_video_processor.py | 302 | # Set sampling to True. Video frames should be sampled with `num_frames` in the output |
| LOW | scripts/regression/prepare_datasets.py | 95 | # Check if already exists |
| LOW | scripts/regression/ci_model_unittest.sh | 134 | # Check if file is in transformer directories (don't check file existence, rely on git diff) |
| LOW | .github/workflows/cherry-pick.yml | 90 | # Check if target branch exists on remote |
| LOW | .github/workflows/cherry-pick.yml | 154 | # Check if PR already exists |
| LOW | .github/workflows/_xpu_ci_test.yml | 60 | # Check if anything matching ${REPO_NAME}* still exists |
| LOW | paddleformers/datasets/dataset.py | 206 | # Check if selected name and split is valid in this DatasetBuilder |
| LOW | paddleformers/datasets/SFTDataset.py | 399 | # Set flag to False and yield empty list to signal the end of estimation |
| LOW | paddleformers/datasets/SFTDataset.py | 436 | # Set flag to False and yield empty list to signal the end of estimation |
| LOW | paddleformers/datasets/SFTDataset.py | 468 | # Set flag to False and yield empty list to signal the end of estimation |
| LOW | paddleformers/datasets/SFTDataset.py | 499 | # Set flag to False and yield empty list to signal the end of estimation |
| LOW | paddleformers/datasets/SFTDataset.py | 540 | # Set flag to False and yield empty list to signal the end of estimation |
| LOW | paddleformers/datasets/DPODataset.py | 218 | # Check if multimedia tags are included in "messages"+"chosen_response", and "messages"+"rejected_response" |
| LOW | paddleformers/utils/upcast_downcast_triton.py | 726 | # # Check if blocks and scales are on CPU, and move to GPU if so |
| LOW | paddleformers/utils/import_utils.py | 118 | # Check if the package spec exists and grab its version to avoid importing a local directory |
| LOW | paddleformers/utils/import_utils.py | 131 | # Check if the version contains "dev" |
| LOW | paddleformers/utils/import_utils.py | 161 | # Check if the package spec exists and grab its version to avoid importing a local directory |
| LOW | paddleformers/utils/import_utils.py | 174 | # Check if the version contains "dev" |
| LOW | paddleformers/utils/download/aistudio_hub_download.py | 714 | # Check if file is cached as "no_exist" |
| LOW | paddleformers/utils/download/aistudio_hub_download.py | 718 | # Check if revision folder exists |
| LOW | paddleformers/utils/download/aistudio_hub_download.py | 726 | # Check if file exists in cache |
| LOW | paddleformers/cli/export/export.py | 97 | # Check if the output directory is a valid model directory (contains .safetensors or .pdparams files) |
| LOW | paddleformers/transformers/model_utils.py | 1741 | # Check if README file already exist in repo |
| LOW | paddleformers/transformers/model_utils.py | 3009 | # Check if `_keep_in_fp32_modules` is not None |
| LOW | …dleformers/transformers/image_processing_utils_fast.py | 605 | # Check if we have nested structure, assuming the nesting is consistent |
| LOW | paddleformers/transformers/image_utils.py | 752 | # Check if image is in (n_channels, height, width) or (height, width, n_channels) format |
| LOW | paddleformers/transformers/image_utils.py | 762 | # Check if cropped area is within image boundaries |
| LOW | paddleformers/transformers/image_transforms.py | 438 | # Check if cropped area is within image boundaries |
| LOW | paddleformers/transformers/feature_extraction_utils.py | 174 | # Check if the args are a device or a dtype |
| LOW | paddleformers/transformers/processing_utils.py | 913 | # Check if tokenizer is fast - use backend attribute if available, otherwise fall back to class name |
| LOW | paddleformers/transformers/utils.py | 690 | # Check if the model is already cached or not. We only try the last checkpoint, this should cover most cases of |
| LOW | paddleformers/transformers/gpt_provider.py | 210 | # Check if mtp_block_spec parameter is supported |
| LOW | paddleformers/transformers/masking_utils.py | 247 | # Check if the mask can be safely skipped |
| LOW | paddleformers/transformers/kimi_k2/modeling.py | 186 | # Check if mtp_block_spec parameter is supported |
| LOW | paddleformers/transformers/kimi_k2/modeling.py | 228 | # Check if mtp_block_spec parameter is supported |
| LOW | …dleformers/transformers/legacy/tokenizer_utils_base.py | 1981 | # Check if README file already exist in repo |
| LOW | paddleformers/transformers/ernie4_5_moe_vl/tokenizer.py | 240 | # Check if padding is needed |
| LOW | …ddleformers/transformers/qwen3_vl_moe/configuration.py | 320 | # Check if the attribute exists in sub-configs |
| LOW | …ddleformers/transformers/qwen3_vl_moe/configuration.py | 356 | # Check if user has set a top-level override |
| LOW | paddleformers/transformers/qwen3_vl/configuration.py | 309 | # Check if the attribute exists in sub-configs |
| LOW | paddleformers/transformers/qwen3_vl/configuration.py | 345 | # Check if user has set a top-level override |
| LOW | paddleformers/data/data_collator.py | 571 | # Check if padding is necessary. |
| LOW | paddleformers/data/data_collator.py | 607 | # Check if padding is necessary. |
| LOW | paddleformers/trainer/trainer.py | 1950 | # Check if continuing training from a checkpoint |
| LOW | paddleformers/trainer/trainer.py | 4301 | # Check if we should delete older checkpoint(s) |
| LOW | paddleformers/trainer/trainer.py | 4327 | # Check if we should delete older hf checkpoint(s) |
| LOW | paddleformers/trainer/trainer.py | 4914 | # Set back to None to begin a new accumulation |
| LOW | paddleformers/trainer/integrations.py | 287 | # Check if a Weights & Biases (wandb) API key is provided in the training arguments |
| LOW | paddleformers/generation/utils.py | 282 | # Check if we are done so that we can save a pad step if all(done) |

| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/nn/test_attention.py | 163 | # Step 1: Reshape tensors from [B, S, H, D] to [B, H, S, D] for matrix multiplication |
| LOW | tests/nn/test_attention.py | 168 | # Step 2: Transpose key for matmul: [B, H, S, D] -> [B, H, D, S] |
| LOW | tests/nn/test_attention.py | 171 | # Step 3: Calculate attention scores (Query @ Key^T) and apply scaling |
| LOW | tests/nn/test_attention.py | 174 | # Step 4: Apply the attention mask if provided |
| LOW | tests/nn/test_attention.py | 179 | # Step 5: Prepare and concatenate the sink logits. The sink is a special token |
| LOW | tests/nn/test_attention.py | 184 | # Step 6: Apply softmax over the combined logits (scores + sink) |
| LOW | tests/nn/test_attention.py | 188 | # Step 7: Separate the attention probabilities from the sink probabilities |
| LOW | tests/nn/test_attention.py | 191 | # Step 8: Apply dropout to the scores |
| LOW | tests/nn/test_attention.py | 194 | # Step 9: Compute the weighted sum of values (Scores @ Value) |
| LOW | tests/nn/test_attention.py | 197 | # Step 10: Reshape the output back to [B, S, H, D] and flatten the head dimension |
| LOW | paddleformers/datasets/dataset.py | 669 | # We need to check if the example contains label column and confirm its name. |
| LOW | paddleformers/datasets/dataset.py | 705 | # We need to check if the example contains label column and confirm its name. |
| LOW | paddleformers/transformers/minimax_m2/modeling.py | 953 | # Step 1: Transpose fleet weight |
| LOW | paddleformers/transformers/minimax_m2/modeling.py | 956 | # Step 2: Split into per-group chunks along axis=0 |
| LOW | paddleformers/transformers/minimax_m2/modeling.py | 978 | # Step 3: Reassemble q_proj (interleaved Q+Gate) |
| LOW | paddleformers/transformers/auto/feature_extraction.py | 176 | # not all of these are nested. We need to check if it was saved recently as nested or if it is legacy style |
| LOW | paddleformers/transformers/deepseek_v4/modeling.py | 943 | # Step 1: split up_gate_proj back to w1/w3 (intermediate, no transpose yet) |
| LOW | paddleformers/transformers/deepseek_v4/modeling.py | 949 | # Step 2: transpose each piece to HF shape |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 254 | # Step 1: Split q_proj into 2*num_heads equal chunks (each = head_dim) |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 259 | # Step 2: Split k_proj and v_proj into num_kv_heads chunks |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 264 | # Step 3: Assemble per-group in fleet order and concat |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 279 | # Step 4: Transpose the fused weight |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 319 | # Step 1: Split in_proj_qkv [qk_dim+qk_dim+v_dim, hidden] into q, k, v along axis=0 |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 335 | # Step 2: 6 sources (q, k, v, z, b, a) → fused_in_proj with TP interleaving |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 339 | # Step 3: Transpose to Fleet layout [hidden, in_proj_dim] |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 624 | # Step 1: Transpose fleet weight [in, out] -> [out, in] |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 627 | # Step 2: Split into per-group chunks along axis=0 |
| LOW | paddleformers/transformers/qwen3_5/modeling.py | 644 | # Step 3: Reassemble into HF format |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 46 | # Step 1: mock _add_accumulator |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 56 | # Step 2: mock _C_ops.adamw_ and _C_ops.adamw |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 77 | # Step 3: mock _insert_sync |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 95 | # Step 4: mock Muon._muon_update and Muon._apply_optimize |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 177 | # Step 1: mock _add_accumulator |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 187 | # Step 2: mock _C_ops.adamw_ and _C_ops.adamw |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 207 | # Step 3: mock _insert_sync |
| LOW | paddleformers/trainer/utils/offload_optimizer.py | 225 | # Step 4: mock Muon._muon_update and Muon._apply_optimize |
| LOW | paddleformers/generation/utils.py | 389 | # Step 1: Process input mask to generate basic expanded mask |
| LOW | paddleformers/generation/utils.py | 447 | # Step 2: Convert boolean mask to numerical mask (adapt to different devices) |

| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 77 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 79 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 80 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 85 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 90 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 91 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 99 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 111 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 112 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 116 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 117 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 118 | |
| MEDIUM | …e_pretrain/ernie/src/callbacks/moe_logging_callback.py | 120 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 78 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 80 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 81 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 86 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 91 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 92 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 100 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 112 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 113 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 117 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 118 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 119 | |
| MEDIUM | …n/ernie_pretrain/src/callbacks/moe_logging_callback.py | 121 | |

| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | tests/generation/test_logits_process.py | 330 | # scores = 0 to facilitate checks |
| LOW | paddleformers/datasets/DPODataset.py | 386 | # The sequnece is too long, just return None |
| LOW | paddleformers/peft/lora/lora_model.py | 101 | # If paddle_xpu is not installed, just use PaddleFormers's native lora layers |
| LOW | paddleformers/transformers/linear_utils.py | 82 | # If paddle_xpu is not installed, just use Paddle's native Linear implementations |
| MEDIUM | paddleformers/transformers/auto/tokenizer.py | 234 | # First, let's see whether the tokenizer_type is passed so that we can leverage it |

| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | paddleformers/nn/moe_deepep/modular_moe_layer.py | 314 | # the current expert. We need to make sure to multiply the output hidden |
| LOW | paddleformers/transformers/qwen2_moe/modeling.py | 370 | # the current expert. We need to make sure to multiply the output hidden |
| LOW | paddleformers/transformers/qwen3_moe/modeling.py | 368 | # the current expert. We need to make sure to multiply the output hidden |
| LOW | paddleformers/trainer/training_args.py | 353 | If you set this value, `greater_is_better` will default to `True`. Don't forget to set it to `False` if |

| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/ai_edited_test/nn/test_ai_loss_utils.py | 78 | def my_function(x): |
| LOW | tests/ai_edited_test/trainer/test_ai_zero_cost_ckpt.py | 109 | def my_function(state_dict): |
| LOW | paddleformers/data/data_collator.py | 507 | def process_data(self, data, pad_idx, max_len): |

| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | …ctices/tutorials/how_to_train_a_function_call_model.md | 96 | {"messages": [{"role": "user", "content": "I need to generate an invoice for a customer named John Doe. He bought 2 appl |