[NPU] update convert script based on latest usage (#12617)
This commit is contained in:
parent
ef585d3360
commit
d841e1dc0d
1 changed file with 0 additions and 2 deletions
|
|
@@ -60,7 +60,6 @@ if __name__ == "__main__":
|
||||||
t0 = time.perf_counter()
|
t0 = time.perf_counter()
|
||||||
model = AutoModelForCausalLM.from_pretrained(model_path,
|
model = AutoModelForCausalLM.from_pretrained(model_path,
|
||||||
optimize_model=True,
|
optimize_model=True,
|
||||||
pipeline=True,
|
|
||||||
load_in_low_bit=args.low_bit,
|
load_in_low_bit=args.low_bit,
|
||||||
max_context_len=args.max_context_len,
|
max_context_len=args.max_context_len,
|
||||||
max_prompt_len=args.max_prompt_len,
|
max_prompt_len=args.max_prompt_len,
|
||||||
|
|
@@ -69,7 +68,6 @@ if __name__ == "__main__":
|
||||||
attn_implementation="eager",
|
attn_implementation="eager",
|
||||||
transpose_value_cache=not args.disable_transpose_value_cache,
|
transpose_value_cache=not args.disable_transpose_value_cache,
|
||||||
trust_remote_code=True,
|
trust_remote_code=True,
|
||||||
convert_model=True,
|
|
||||||
save_directory=save_dir)
|
save_directory=save_dir)
|
||||||
t1 = time.perf_counter()
|
t1 = time.perf_counter()
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue