Sergei Skvortsov committed on
Commit
5f51568
·
1 Parent(s): ea3f247

Fixed vocab

Browse files
Files changed (2) hide show
  1. model.safetensors +2 -2
  2. test.ipynb +100 -0
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9523886352217ded3aeeef552b381af79d568c6d49a4b9e423288cea56b0a44
3
- size 988097824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:468681d96c9d987f5f923dda6c9918a10a5d711278a189b4e24975bf647ea326
3
+ size 988327168
test.ipynb ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 29,
6
+ "metadata": {},
7
+ "outputs": [],
8
+ "source": [
9
+ "from safetensors.torch import load_file, save_file\n",
10
+ "import torch"
11
+ ]
12
+ },
13
+ {
14
+ "cell_type": "code",
15
+ "execution_count": 34,
16
+ "metadata": {},
17
+ "outputs": [],
18
+ "source": [
19
+ "file_path = \"/Qwen2.5-1.5B-Instruct/model.safetensors\"\n",
20
+ "tensors = load_file(file_path)"
21
+ ]
22
+ },
23
+ {
24
+ "cell_type": "code",
25
+ "execution_count": 35,
26
+ "metadata": {},
27
+ "outputs": [
28
+ {
29
+ "name": "stdout",
30
+ "output_type": "stream",
31
+ "text": [
32
+ "model.embed_tokens.weight torch.Size([151936, 1536])\n"
33
+ ]
34
+ }
35
+ ],
36
+ "source": [
37
+ "# 152064\n",
38
+ "# 151642\n",
39
+ "for name in tensors.keys():\n",
40
+ " if 151936 in tensors[name].shape:\n",
41
+ " print(name, tensors[name].shape)"
42
+ ]
43
+ },
44
+ {
45
+ "cell_type": "code",
46
+ "execution_count": 36,
47
+ "metadata": {},
48
+ "outputs": [],
49
+ "source": [
50
+ "embed = \"model.embed_tokens.weight\"\n",
51
+ "new_vocab = 152064\n",
52
+ "source_shape = tensors[embed].shape\n",
53
+ "target_shape = torch.Size((new_vocab, source_shape[-1]))\n",
54
+ "\n",
55
+ "source = tensors[embed]\n",
56
+ "\n",
57
+ "target = torch.zeros(target_shape, dtype=source.dtype, device=source.device)\n",
58
+ "target[:source_shape[0], :] = source"
59
+ ]
60
+ },
61
+ {
62
+ "cell_type": "code",
63
+ "execution_count": 37,
64
+ "metadata": {},
65
+ "outputs": [],
66
+ "source": [
67
+ "updated_tensors = {**tensors, embed: target}\n",
68
+ "save_file(updated_tensors, file_path)"
69
+ ]
70
+ },
71
+ {
72
+ "cell_type": "code",
73
+ "execution_count": null,
74
+ "metadata": {},
75
+ "outputs": [],
76
+ "source": []
77
+ }
78
+ ],
79
+ "metadata": {
80
+ "kernelspec": {
81
+ "display_name": "base",
82
+ "language": "python",
83
+ "name": "python3"
84
+ },
85
+ "language_info": {
86
+ "codemirror_mode": {
87
+ "name": "ipython",
88
+ "version": 3
89
+ },
90
+ "file_extension": ".py",
91
+ "mimetype": "text/x-python",
92
+ "name": "python",
93
+ "nbconvert_exporter": "python",
94
+ "pygments_lexer": "ipython3",
95
+ "version": "3.11.10"
96
+ }
97
+ },
98
+ "nbformat": 4,
99
+ "nbformat_minor": 2
100
+ }