File size: 713 Bytes
5c89bcb |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 |
import sys
import torch
import model.configuration_deepseek as cds
import model.modeling_deepseek as mds
from safetensors.torch import load_file
@torch.no_grad()
def main() -> None:
    """Run one DeepseekV3Attention forward pass and print a slice of the output.

    Reads the configuration from the ``model`` directory, builds the
    attention module on the meta device, binds the tensors stored in
    ``model/weights.safetensors`` to it, then calls the module with the
    keyword arguments stored in ``model/nan_input.safetensors`` and prints
    ``result[0][0][163]``.

    Both safetensors files are loaded directly onto ``"cuda"``, so a CUDA
    device is required. Gradient tracking is disabled for the whole call.
    """
    config = cds.DeepseekV3Config.from_pretrained("model")

    # Construct on the meta device so no real parameter storage is allocated
    # here; the actual tensors are attached by load_state_dict below.
    with torch.device("meta"):
        model = mds.DeepseekV3Attention(config)

    # assign=True replaces the module's meta parameters with the loaded CUDA
    # tensors instead of copying into them; strict=True rejects missing or
    # unexpected keys.
    weights = load_file("model/weights.safetensors", device="cuda")
    model.load_state_dict(weights, assign=True, strict=True)

    inputs = load_file("model/nan_input.safetensors", device="cuda")
    # Call the module itself rather than .forward() so that any registered
    # hooks are run as well.
    result = model(**inputs)

    # NOTE(review): presumably result[0] is the attention output and
    # [0][163] picks batch 0, position 163 -- confirm against the model code.
    print(result[0][0][163])
if __name__ == "__main__":
    # Script entry point: run main() and turn Ctrl-C into a short message
    # plus exit status 1 instead of a traceback.
    try:
        main()
    except KeyboardInterrupt:
        print("\nScript interrupted by user, exiting...")
        raise SystemExit(1)
|