Update bid to match each layer's MTP source (#23237)
* update bid to match each layer's MTP source * Update conversion/qwen.py Co-authored-by: Sigbjørn Skjæret <sigbjorn.skjaeret@scala.com> --------- Co-authored-by: Sigbjørn Skjæret <sigbjorn.skjaeret@scala.com>
This commit is contained in:
@@ -600,6 +600,7 @@ class _Qwen35MtpMixin:
|
|||||||
if name.find("layers.") != -1:
|
if name.find("layers.") != -1:
|
||||||
assert bid is not None
|
assert bid is not None
|
||||||
name = name.replace(f"mtp.layers.{bid}", f"model.layers.{bid + n_layer}")
|
name = name.replace(f"mtp.layers.{bid}", f"model.layers.{bid + n_layer}")
|
||||||
|
bid = bid + n_layer
|
||||||
else:
|
else:
|
||||||
remapper = {
|
remapper = {
|
||||||
"mtp.fc": "model.layers.{bid}.eh_proj",
|
"mtp.fc": "model.layers.{bid}.eh_proj",
|
||||||
|
|||||||
Reference in New Issue
Block a user