mirror of
https://github.com/exo-explore/exo.git
synced 2025-10-23 02:57:14 +03:00
undo diff
This commit is contained in:
@@ -51,6 +51,7 @@ def build_transformer(model_path: Path, shard: Shard, model_size="8B", device=No
|
|||||||
weights = load(str(model_path), shard)
|
weights = load(str(model_path), shard)
|
||||||
weights = convert_from_huggingface(weights, model, MODEL_PARAMS[model_size]["args"]["n_heads"], MODEL_PARAMS[model_size]["args"]["n_kv_heads"])
|
weights = convert_from_huggingface(weights, model, MODEL_PARAMS[model_size]["args"]["n_heads"], MODEL_PARAMS[model_size]["args"]["n_kv_heads"])
|
||||||
weights = fix_bf16(weights)
|
weights = fix_bf16(weights)
|
||||||
|
|
||||||
with Context(BEAM=0):
|
with Context(BEAM=0):
|
||||||
# replace weights in model
|
# replace weights in model
|
||||||
load_state_dict(model, weights, strict=False, consume=False) # consume=True
|
load_state_dict(model, weights, strict=False, consume=False) # consume=True
|
||||||
|
|||||||
Reference in New Issue
Block a user