Created: August 7, 2024 08:57
An example of how to convert a trained EAGLE checkpoint to a vLLM-compatible version.
import json

import torch
from safetensors.torch import load_file, save_file

# Load the trained EAGLE draft checkpoint and the last shard of the base model,
# which contains the lm_head weights that the EAGLE checkpoint does not ship.
ckpt = torch.load("EAGLE-LLaMA3-Instruct-8B/pytorch_model.bin")
ref_ckpt = load_file("Meta-Llama-3-8B-Instruct/model-00004-of-00004.safetensors")

# Copy the base model's lm_head into the draft checkpoint and re-save it as safetensors.
ckpt['lm_head.weight'] = ref_ckpt['lm_head.weight']
save_file(ckpt, "EAGLE-LLaMA3-Instruct-8B/model.safetensors")

# Wrap the original config under a "model" key and mark the model type as "eagle"
# so that vLLM recognizes the checkpoint.
with open("EAGLE-LLaMA3-Instruct-8B/config.json") as rf:
    cfg = json.load(rf)
cfg = {"model_type": "eagle", "model": cfg}
with open("EAGLE-LLaMA3-Instruct-8B/config.json", "w") as wf:
    json.dump(cfg, wf)

# Afterwards, delete EAGLE-LLaMA3-Instruct-8B/pytorch_model.bin; only model.safetensors is needed.
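Once converted, the checkpoint can be used as the draft model for speculative decoding in vLLM. The snippet below is only a rough sketch of such usage, not part of the original gist: it assumes a vLLM release whose LLM constructor accepts speculative_model and num_speculative_tokens keyword arguments, and the token count of 5 is an arbitrary example; check the documentation of your vLLM version.

from vllm import LLM, SamplingParams

# Sketch: serve the base model with the converted EAGLE checkpoint as the draft model.
# Keyword arguments assume a vLLM version exposing speculative decoding via
# `speculative_model` / `num_speculative_tokens`.
llm = LLM(
    model="Meta-Llama-3-8B-Instruct",
    speculative_model="EAGLE-LLaMA3-Instruct-8B",
    num_speculative_tokens=5,
)
outputs = llm.generate(["What is speculative decoding?"], SamplingParams(max_tokens=64))
print(outputs[0].outputs[0].text)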
@abhigoyal1997
Thank you for sharing your script. As discussed in vllm-project/vllm#11126, "eagle_fc_bias" also needs to be added to the configuration. This is particularly relevant for the EAGLE-llama2-chat-7B model, which includes fc_bias, whereas EAGLE-LLaMA3-Instruct-8B does not.
I suggest adding the following diff to your gist:
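The diff itself is not reproduced here. As a hedged sketch of what such a change might look like, based only on the description above, the config-rewrite step could set the flag from the checkpoint contents; the key name "fc.bias" and this detection logic are assumptions, not the commenter's actual diff.

# Sketch only: set eagle_fc_bias according to whether the draft checkpoint's fc layer has a bias.
# EAGLE-llama2-chat-7B ships an fc bias; EAGLE-LLaMA3-Instruct-8B does not.
has_fc_bias = 'fc.bias' in ckpt  # assumption: the bias tensor is stored under this key
cfg = {"model_type": "eagle", "model": cfg, "eagle_fc_bias": has_fc_bias}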