qqc1989 committed on
Commit
f8f79a4
·
verified ·
1 Parent(s): bede825

update the axmodel for ax630c

Browse files
Files changed (31) hide show
  1. .gitattributes +1 -0
  2. internvl2_5_1b_364_ax630c/model.embed_tokens.weight.bfloat16.bin +3 -0
  3. internvl2_5_1b_364_ax630c/qwen2_p256_l0_together.axmodel +3 -0
  4. internvl2_5_1b_364_ax630c/qwen2_p256_l10_together.axmodel +3 -0
  5. internvl2_5_1b_364_ax630c/qwen2_p256_l11_together.axmodel +3 -0
  6. internvl2_5_1b_364_ax630c/qwen2_p256_l12_together.axmodel +3 -0
  7. internvl2_5_1b_364_ax630c/qwen2_p256_l13_together.axmodel +3 -0
  8. internvl2_5_1b_364_ax630c/qwen2_p256_l14_together.axmodel +3 -0
  9. internvl2_5_1b_364_ax630c/qwen2_p256_l15_together.axmodel +3 -0
  10. internvl2_5_1b_364_ax630c/qwen2_p256_l16_together.axmodel +3 -0
  11. internvl2_5_1b_364_ax630c/qwen2_p256_l17_together.axmodel +3 -0
  12. internvl2_5_1b_364_ax630c/qwen2_p256_l18_together.axmodel +3 -0
  13. internvl2_5_1b_364_ax630c/qwen2_p256_l19_together.axmodel +3 -0
  14. internvl2_5_1b_364_ax630c/qwen2_p256_l1_together.axmodel +3 -0
  15. internvl2_5_1b_364_ax630c/qwen2_p256_l20_together.axmodel +3 -0
  16. internvl2_5_1b_364_ax630c/qwen2_p256_l21_together.axmodel +3 -0
  17. internvl2_5_1b_364_ax630c/qwen2_p256_l22_together.axmodel +3 -0
  18. internvl2_5_1b_364_ax630c/qwen2_p256_l23_together.axmodel +3 -0
  19. internvl2_5_1b_364_ax630c/qwen2_p256_l2_together.axmodel +3 -0
  20. internvl2_5_1b_364_ax630c/qwen2_p256_l3_together.axmodel +3 -0
  21. internvl2_5_1b_364_ax630c/qwen2_p256_l4_together.axmodel +3 -0
  22. internvl2_5_1b_364_ax630c/qwen2_p256_l5_together.axmodel +3 -0
  23. internvl2_5_1b_364_ax630c/qwen2_p256_l6_together.axmodel +3 -0
  24. internvl2_5_1b_364_ax630c/qwen2_p256_l7_together.axmodel +3 -0
  25. internvl2_5_1b_364_ax630c/qwen2_p256_l8_together.axmodel +3 -0
  26. internvl2_5_1b_364_ax630c/qwen2_p256_l9_together.axmodel +3 -0
  27. internvl2_5_1b_364_ax630c/qwen2_post.axmodel +3 -0
  28. internvl2_5_1b_364_ax630c/vit_intern_sim_space2depth.axmodel +3 -0
  29. internvl2_5_tokenizer_364.py +153 -0
  30. main +3 -0
  31. run_internvl2_5_364_ax630c.sh +20 -0
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  *.axmodel filter=lfs diff=lfs merge=lfs -text
  main_internvl2_5_448_prefill filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  *.axmodel filter=lfs diff=lfs merge=lfs -text
  main_internvl2_5_448_prefill filter=lfs diff=lfs merge=lfs -text
37
+ main filter=lfs diff=lfs merge=lfs -text
internvl2_5_1b_364_ax630c/model.embed_tokens.weight.bfloat16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c075733fbd78ce7da59e83318795095432ab287547e61ba21ad3fb05a4bb896b
3
+ size 271799808
internvl2_5_1b_364_ax630c/qwen2_p256_l0_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af330da9bcebf41e4aea08de49d074954486d08d0b56131097d1aedbec7accb8
3
+ size 16009622
internvl2_5_1b_364_ax630c/qwen2_p256_l10_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d672ce000c86706709e885e6aa586d299688a825fa9b2492743c068d0a3dcff
3
+ size 16009646
internvl2_5_1b_364_ax630c/qwen2_p256_l11_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:944652ed5157021334e990b9df3460a698853b2e4dbffd62255e701747467723
3
+ size 16009654
internvl2_5_1b_364_ax630c/qwen2_p256_l12_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc2318e042d12e21108c0a7fd23e35978131da04408337319fa651cbb0ce8197
3
+ size 16009622
internvl2_5_1b_364_ax630c/qwen2_p256_l13_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edaccef791b600fb84a94e1117b23b97b5ebd6f69a02875c3feef5f207740325
3
+ size 16009638
internvl2_5_1b_364_ax630c/qwen2_p256_l14_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aba074ab790ce3a9048732c0c8606ba1e3a9606754d37f38a481762faa170ea
3
+ size 16009670
internvl2_5_1b_364_ax630c/qwen2_p256_l15_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26d04515a1c97525d79e506865ddb527555bae3b4ce738519dff9693d63dd800
3
+ size 16009630
internvl2_5_1b_364_ax630c/qwen2_p256_l16_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7e9c61713e674f37f3e1eb570085bda050aa7739718e4cb11f33a43a13d4250
3
+ size 16009630
internvl2_5_1b_364_ax630c/qwen2_p256_l17_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:682e958761bab38381aa38667adc6715f0b83e18062c884105ee92e135f0d5d1
3
+ size 16009630
internvl2_5_1b_364_ax630c/qwen2_p256_l18_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29defdfafd3ab57cca9e3602e6c92e3547788cba1ee9c2a627fd04f8ad07d3c6
3
+ size 16009638
internvl2_5_1b_364_ax630c/qwen2_p256_l19_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6897a6b66af8d9ef98bf1ea2aa810b9a2ef612f0b64ee47c8faec8e2b635122d
3
+ size 16009614
internvl2_5_1b_364_ax630c/qwen2_p256_l1_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a920d53223aa0a4746802b1705fef467763f371d09e0e1918d8e3b5c54311cb3
3
+ size 16009638
internvl2_5_1b_364_ax630c/qwen2_p256_l20_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09f120a2b2f6619c90610c5027bf02f20ddadd12df5051e1c358f73c03cb2cf6
3
+ size 16009646
internvl2_5_1b_364_ax630c/qwen2_p256_l21_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1209e8c33c9765d19bed54410aa83573aea3eab04754ff5d14885e401a2d5a2
3
+ size 16009630
internvl2_5_1b_364_ax630c/qwen2_p256_l22_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d47a40712c2d33989bd2e4c6889b458399edf4f72de9149942f484ebde0e972b
3
+ size 16009646
internvl2_5_1b_364_ax630c/qwen2_p256_l23_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:924a41dcf1618069182896f4a2e5e3058a8d72d26f5e537f6d7cf7162c2cc319
3
+ size 16009630
internvl2_5_1b_364_ax630c/qwen2_p256_l2_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9df37aad5c393dd516157551018b5c7bd1440d94959d6ee30229074bbf68a916
3
+ size 16009646
internvl2_5_1b_364_ax630c/qwen2_p256_l3_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2d3efd9edcaf1eaeb613ddfd4f4d1568477e46426e20392d44e6b62190afa9e
3
+ size 16009622
internvl2_5_1b_364_ax630c/qwen2_p256_l4_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16bef5efe6ddf2609db42aca42c5beb3bce6ccbecb5d4465a091c75e2e6ddc0d
3
+ size 16009646
internvl2_5_1b_364_ax630c/qwen2_p256_l5_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df32fcff11d33fe96622734da6c9f11f05856c8494c1a853a8822efe6af9479e
3
+ size 16009614
internvl2_5_1b_364_ax630c/qwen2_p256_l6_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccaf9ab7a2fd7e412e4992f8da48b4473ad417bf725df3332f1229ed5a68e6c1
3
+ size 16009630
internvl2_5_1b_364_ax630c/qwen2_p256_l7_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cba84fcf8fd8cfe8f5b3bb2d097d2d423b80e9f8c2104b0eead26685a668a3d
3
+ size 16009638
internvl2_5_1b_364_ax630c/qwen2_p256_l8_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08765f4dfbe87fe193b619285c289464fd16e9ac17b5f803af188c03726a5c2f
3
+ size 16009638
internvl2_5_1b_364_ax630c/qwen2_p256_l9_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:017870640a743a73853a903d8b03ef0b5998767e911b8f19a336cab3c4160cc2
3
+ size 16009638
internvl2_5_1b_364_ax630c/qwen2_post.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb764b0fd3d62f22003eb3bc05c03a7250eb779d3cc1c440962c584c304b004c
3
+ size 139700408
internvl2_5_1b_364_ax630c/vit_intern_sim_space2depth.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c6a517a273eb945cb45922486db00cc884671dc38378f504c8d181de47fd024
3
+ size 402545119
internvl2_5_tokenizer_364.py ADDED
@@ -0,0 +1,153 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import AutoTokenizer, PreTrainedTokenizerFast
2
+ from http.server import HTTPServer, BaseHTTPRequestHandler
3
+ import json
4
+ import argparse
5
+
6
+
7
class Tokenizer_Http():
    """Wrap a Hugging Face tokenizer and build the chat prompts sent to it.

    Both ``encode`` and ``encode_vpm`` wrap the user text in the same
    ``<|im_start|>`` / ``<|im_end|>`` chat template with a fixed system
    message; ``encode_vpm`` additionally prepends an ``<img>...</img>`` span
    filled with ``<IMG_CONTEXT>`` placeholder tokens.
    """

    # System message inserted at the start of every prompt. This is runtime
    # text fed to the tokenizer, so it must stay byte-for-byte unchanged.
    SYSTEM_PROMPT = "你是由上海人工智能实验室联合商汤科技开发的书生多模态大模型,英文名叫InternVL, 是一个有用无害的人工智能助手。"

    # Number of "<IMG_CONTEXT>" placeholders emitted per image by default.
    # NOTE(review): presumably tied to the 364x364 vision model shipped with
    # this commit -- confirm before changing.
    DEFAULT_NUM_IMG_TOKENS = 169

    def __init__(self, path='internvl2_5_tokenizer'):
        """Load the tokenizer from ``path`` (a local directory or model id).

        Args:
            path: Location passed to ``AutoTokenizer.from_pretrained``.
                Defaults to the directory name the original code hard-coded.
        """
        self.tokenizer = AutoTokenizer.from_pretrained(path,
                                                       trust_remote_code=True,
                                                       use_fast=False)

    def _build_prompt(self, user_content):
        """Return the full chat prompt for one user turn."""
        return (f"<|im_start|>system\n{self.SYSTEM_PROMPT}<|im_end|>"
                f"<|im_start|>user\n{user_content}<|im_end|>"
                f"<|im_start|>assistant\n")

    def encode(self, content):
        """Tokenize a text-only user message wrapped in the chat template.

        Args:
            content: The user's message text.

        Returns:
            Whatever ``self.tokenizer.encode`` returns for the built prompt.
        """
        return self.tokenizer.encode(self._build_prompt(content))

    def encode_vpm(self, content="Please describe the image shortly.",
                   num_img_tokens=DEFAULT_NUM_IMG_TOKENS):
        """Tokenize a user message that is preceded by one image.

        Args:
            content: The user's message text placed after the image span.
            num_img_tokens: How many ``<IMG_CONTEXT>`` placeholders to put
                between ``<img>`` and ``</img>`` (default 169, the value the
                original code hard-coded).

        Returns:
            Whatever ``self.tokenizer.encode`` returns for the built prompt.
        """
        image_span = "<img>" + "<IMG_CONTEXT>" * num_img_tokens + "</img>\n"
        return self.tokenizer.encode(self._build_prompt(image_span + content))

    def decode(self, token_ids):
        """Convert token ids back to text without tokenization-space cleanup."""
        return self.tokenizer.decode(token_ids,
                                     clean_up_tokenization_spaces=False)

    @property
    def bos_id(self):
        """Beginning-of-sequence token id as reported by the tokenizer."""
        return self.tokenizer.bos_token_id

    @property
    def eos_id(self):
        """End-of-sequence token id as reported by the tokenizer."""
        return self.tokenizer.eos_token_id

    @property
    def bos_token(self):
        """Beginning-of-sequence token string as reported by the tokenizer."""
        return self.tokenizer.bos_token

    @property
    def eos_token(self):
        """End-of-sequence token string as reported by the tokenizer."""
        return self.tokenizer.eos_token
45
+
46
+
47
# Single shared tokenizer instance; the HTTP request handler below reads this
# module-level name.
tokenizer = Tokenizer_Http()

# Start-up self-check: show the special tokens, then one image prompt and one
# text-only prompt together with their token counts.
print(tokenizer.bos_id, tokenizer.bos_token,
      tokenizer.eos_id, tokenizer.eos_token)

# Sample output recorded by the original author for the image prompt:
#   41 system/user-header ids, 151646, 151648 repeated 64 times, 151647,
#   then 198, 5501, 7512, 279, 2168, 19620, 13, 151645, 151644, 77091, 198
#   -> 118 ids in total.
# NOTE(review): that sample does not match the current code, which emits 169
# "<IMG_CONTEXT>" placeholders; it looks like it was recorded with a different
# configuration. Regenerate it before relying on the numbers.
token_ids = tokenizer.encode_vpm()
print(token_ids, len(token_ids), sep="\n")

# Sample output recorded by the original author for "hello world" (47 ids):
# [151644, 8948, 198, 56568, 104625, 100633, 104455, 104800, 101101, 32022, 102022, 99602, 100013, 9370, 90286, 21287, 42140, 53772, 35243, 26288, 104949, 3837, 105205, 109641, 67916, 30698, 11, 54851, 46944, 115404, 42192, 99441, 100623, 48692, 100168, 110498, 1773, 151645, 151644, 872, 198, 14990, 1879, 151645, 151644, 77091, 198]
token_ids = tokenizer.encode("hello world")
print(token_ids, len(token_ids), sep="\n")
65
+
66
+
67
class Request(BaseHTTPRequestHandler):
    """HTTP handler that exposes the module-level ``tokenizer`` to a client.

    Routes:
        GET  /bos_id  -> ``{"bos_id": <id or -1>}``
        GET  /eos_id  -> ``{"eos_id": <id or -1>}``
        POST /encode  -> ``{"token_ids": [...]}``; the JSON request body must
                         contain ``"text"`` and may contain ``"img_prompt"``.
        POST /decode  -> ``{"text": "..."}``; the JSON request body must
                         contain ``"token_ids"``.

    Unknown paths answer 404 and malformed requests answer 400, both with the
    body ``error``. The response is built before any header is written so the
    status code always reflects the outcome, and every response carries a
    ``Content-Length`` header.
    """

    timeout = 5
    server_version = 'Apache'

    def _reply(self, status, kind, msg):
        """Log ``msg`` and send it as the complete response.

        Args:
            status: HTTP status code to send.
            kind: Value of the custom ``type`` response header
                (``"get"`` or ``"post"``).
            msg: Response payload; converted to ``str`` and then to bytes.
        """
        print(msg)
        body = str(msg).encode()  # str -> bytes
        self.send_response(status)
        self.send_header("type", kind)
        self.send_header("Content-Length", str(len(body)))
        self.end_headers()
        self.wfile.write(body)  # hand the bytes back to the client

    def do_GET(self):
        """Serve the special-token id queries."""
        print(self.path)

        if self.path == '/bos_id':
            bos_id = tokenizer.bos_id
            # -1 tells the client that the tokenizer defines no such token.
            msg = json.dumps({'bos_id': -1 if bos_id is None else bos_id})
        elif self.path == '/eos_id':
            eos_id = tokenizer.eos_id
            msg = json.dumps({'eos_id': -1 if eos_id is None else eos_id})
        else:
            self._reply(404, "get", 'error')
            return

        self._reply(200, "get", msg)

    def do_POST(self):
        """Serve the encode / decode requests."""
        # Read the request body; a missing, non-numeric or negative
        # Content-Length, or a body that is not valid UTF-8, is a client error.
        try:
            length = int(self.headers['content-length'])
            if length < 0:
                raise ValueError("negative content-length")
            data = self.rfile.read(length).decode()  # bytes -> str
        except (TypeError, ValueError):
            self._reply(400, "post", 'error')
            return

        if self.path not in ('/encode', '/decode'):
            self._reply(404, "post", 'error')
            return

        try:
            req = json.loads(data)
        except ValueError:
            self._reply(400, "post", 'error')
            return

        if self.path == '/encode':
            print(req)
            if not isinstance(req, dict) or 'text' not in req:
                self._reply(400, "post", 'error')
                return
            prompt = req['text']
            # Optional flag: build the image prompt instead of the text one.
            if req.get('img_prompt', False):
                token_ids = tokenizer.encode_vpm(prompt)
            else:
                token_ids = tokenizer.encode(prompt)
            if token_ids is None:
                msg = json.dumps({'token_ids': -1})
            else:
                msg = json.dumps({'token_ids': token_ids})
        else:  # '/decode'
            if not isinstance(req, dict) or 'token_ids' not in req:
                self._reply(400, "post", 'error')
                return
            text = tokenizer.decode(req['token_ids'])
            msg = json.dumps({'text': "" if text is None else text})

        self._reply(200, "post", msg)
141
+
142
+
143
if __name__ == "__main__":
    # Command-line options: the address and port the tokenizer service
    # listens on. NOTE: run_internvl2_5_364_ax630c.sh points the runtime at
    # http://127.0.0.1:12345, so pass --port 12345 when pairing with it.
    parser = argparse.ArgumentParser()
    parser.add_argument('--host', type=str, default='localhost')
    parser.add_argument('--port', type=int, default=8080)
    options = parser.parse_args()

    # (host, port) pair for the listening socket.
    address = (options.host, options.port)
    print('http://%s:%s' % address)

    # Create the server with the Request handler and serve until interrupted.
    HTTPServer(address, Request).serve_forever()
main ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f5f93a06d217f9eb57a7438e0cbb43f9a8d47f0bf8e61b6c6c9c0059a6abaee
3
+ size 6534536
run_internvl2_5_364_ax630c.sh ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ./main \
2
+ --template_filename_axmodel "internvl2_5_1b_364_ax630c/qwen2_p256_l%d_together.axmodel" \
3
+ --axmodel_num 24 \
4
+ --filename_vpm_resampler_axmodedl "internvl2_5_1b_364_ax630c/vit_intern_sim_space2depth.axmodel" \
5
+ --tokenizer_type 2 \
6
+ --bos 0 --eos 0 \
7
+ --dynamic_load_axmodel_layer 0 \
8
+ --use_mmap_load_embed 1 \
9
+ --filename_tokenizer_model "http://127.0.0.1:12345" \
10
+ --filename_post_axmodel "internvl2_5_1b_364_ax630c/qwen2_post.axmodel" \
11
+ --use_topk 0 \
12
+ --filename_tokens_embed "internvl2_5_1b_364_ax630c/model.embed_tokens.weight.bfloat16.bin" \
13
+ --tokens_embed_num 151674 \
14
+ --tokens_embed_size 896 \
15
+ --live_print 1 \
16
+ --continue 1 \
17
+ --img_height 364 \
18
+ --img_width 364 \
19
+ --img_token_id 151667 \
20
+ --prompt "$1" --image "$2"