marioiseli committed on
Commit
c4c83dd
·
verified ·
1 Parent(s): 77cc23d

Upload gemma4_patched.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. gemma4_patched.py +0 -5
gemma4_patched.py CHANGED
@@ -1027,9 +1027,6 @@ class Gemma4Model(nn.Module):
1027
  if is_pp_missing_parameter(moe_name, self):
1028
  continue
1029
  param = params_dict[moe_name]
1030
- # Debug: log first expert of first layer
1031
- if expert_id == 0 and "layers.0." in name:
1032
- print(f"[PATCH LOAD] {name} -> {moe_name} | wl={wl_name} shard={shard_id} eid={expert_id} | weight:{list(loaded_weight.shape)} param:{list(param.shape)}")
1033
  weight_loader = param.weight_loader
1034
  weight_loader(
1035
  param,
@@ -1049,7 +1046,6 @@ class Gemma4Model(nn.Module):
1049
  if is_pp_missing_parameter(name, self):
1050
  continue
1051
  if name not in params_dict:
1052
- print(f"[PATCH DEBUG] Skipping unknown key: {name}")
1053
  continue
1054
  param = params_dict[name]
1055
  weight_loader = getattr(
@@ -1060,7 +1056,6 @@ class Gemma4Model(nn.Module):
1060
  import inspect
1061
  sig = inspect.signature(weight_loader)
1062
  if len(sig.parameters) > 3 and "expert_id" in sig.parameters:
1063
- print(f"[PATCH DEBUG] Skipping FusedMoE param that fell through mapping: {name}")
1064
  continue
1065
  weight_loader(param, loaded_weight)
1066
  loaded_params.add(name)
 
1027
  if is_pp_missing_parameter(moe_name, self):
1028
  continue
1029
  param = params_dict[moe_name]
 
 
 
1030
  weight_loader = param.weight_loader
1031
  weight_loader(
1032
  param,
 
1046
  if is_pp_missing_parameter(name, self):
1047
  continue
1048
  if name not in params_dict:
 
1049
  continue
1050
  param = params_dict[name]
1051
  weight_loader = getattr(
 
1056
  import inspect
1057
  sig = inspect.signature(weight_loader)
1058
  if len(sig.parameters) > 3 and "expert_id" in sig.parameters:
 
1059
  continue
1060
  weight_loader(param, loaded_weight)
1061
  loaded_params.add(name)