Refine modeling and demo.
This commit is contained in:
parent
332d27cc05
commit
90fbc2642e
|
@ -0,0 +1,42 @@
|
|||
# q matmul k: per-layer attention score maps (query @ key^T)
|
||||
|
||||
## model
|
||||
|
||||
qwen/Qwen-1_8B-Chat
|
||||
|
||||
## input
|
||||
|
||||
```text
|
||||
<|im_start|>system
|
||||
You are a helpful assistant.<|im_end|>
|
||||
<|im_start|>user
|
||||
你好<|im_end|>
|
||||
<|im_start|>assistant
|
||||
莎是现代汉语的男性的名字,出自《诗经》中的“采采卷耳
|
||||
```
|
||||
|
||||
|
||||
data:image/s3,"s3://crabby-images/864f8/864f81ef8ccadd43bff53558da725934a7bcbbfe" alt=""
|
||||
data:image/s3,"s3://crabby-images/07731/0773172cb6ab976e1fd10433a9b0d80d216b3f9e" alt=""
|
||||
data:image/s3,"s3://crabby-images/36e7c/36e7c303a65ef94f6e6d2bff824760f8b18f13c4" alt=""
|
||||
data:image/s3,"s3://crabby-images/d359d/d359d701e96488389275dd027eed65cb6d63c5aa" alt=""
|
||||
data:image/s3,"s3://crabby-images/fee87/fee875de00c3511734f778aecd2b62e2ba56ab80" alt=""
|
||||
data:image/s3,"s3://crabby-images/2968b/2968bdaaa6a339a0110257a13c048e41d672494d" alt=""
|
||||
data:image/s3,"s3://crabby-images/2fbc4/2fbc46d3c193a63101dda6da34c54087be624f7f" alt=""
|
||||
data:image/s3,"s3://crabby-images/3f4ae/3f4ae455b63badc5c10819aaa67db7c4eed6c823" alt=""
|
||||
data:image/s3,"s3://crabby-images/8a2cf/8a2cf3000212c2408aca0cafed28ee1a577c07ee" alt=""
|
||||
data:image/s3,"s3://crabby-images/6dfef/6dfef4220b74f1c010134120770b569745449dc3" alt=""
|
||||
data:image/s3,"s3://crabby-images/bb44b/bb44ba4f04566615852af5820400395986579b12" alt=""
|
||||
data:image/s3,"s3://crabby-images/1ffe3/1ffe3c056c6e1d62b21a2751fa8f843d814ac128" alt=""
|
||||
data:image/s3,"s3://crabby-images/05280/05280a870326e119383029a7544e8e1b9779eeb7" alt=""
|
||||
data:image/s3,"s3://crabby-images/0d3eb/0d3ebf77253ac02e20d462369c520f474f839815" alt=""
|
||||
data:image/s3,"s3://crabby-images/869f5/869f536f5ff64ccd0dad67ebda4a5d54b460f0de" alt=""
|
||||
data:image/s3,"s3://crabby-images/44fe0/44fe0ec8bda37ff03504aeb698ceb5560cda2c0e" alt=""
|
||||
data:image/s3,"s3://crabby-images/e00fd/e00fdc0e31eda45fa4c07de567ec88c3d052a80c" alt=""
|
||||
data:image/s3,"s3://crabby-images/9a8a3/9a8a347f731746d84417808b5cc02d51c8dc6c9e" alt=""
|
||||
data:image/s3,"s3://crabby-images/8dc58/8dc585ad30be79425e395516efed908004e83bbd" alt=""
|
||||
data:image/s3,"s3://crabby-images/2a5e2/2a5e2408546f92c35758fa5fd7c6f82f20ae8e3f" alt=""
|
||||
data:image/s3,"s3://crabby-images/1183f/1183ff4718fb3c1bcdb64f9fe847ac7e3226de65" alt=""
|
||||
data:image/s3,"s3://crabby-images/60322/6032276515ce594e28b23c7186e5463693ffb266" alt=""
|
||||
data:image/s3,"s3://crabby-images/9779f/9779fe3b3e542ee5ab454ab7b0cc30a7f0c0bbc5" alt=""
|
||||
data:image/s3,"s3://crabby-images/8abec/8abec15468ac268571e4852b480c05189264fb7a" alt=""
|
28
qwen/demo.py
28
qwen/demo.py
|
@ -64,26 +64,28 @@ model = model.from_pretrained(
|
|||
# )
|
||||
|
||||
# 第一轮对话
|
||||
response, history, decode_tokens = model.chat(tokenizer, "你好", "莎是现代汉语的男性的名字,出自《诗经》中的“采采卷", history=None)
|
||||
response, history, decode_tokens = model.chat(tokenizer, "东南亚国家日本的首都是什么市", "", history=None)
|
||||
print(decode_tokens)
|
||||
# 你好!很高兴为你提供帮助。
|
||||
# <|im_start|>system
|
||||
# You are a helpful assistant.<|im_end|>
|
||||
# <|im_start|>user
|
||||
# 东南亚国家日本的首都是什么市<|im_end|>
|
||||
# <|im_start|>assistant
|
||||
# 日本的首都东京。<|im_end|><|endoftext|>
|
||||
|
||||
|
||||
|
||||
|
||||
# # 第一轮对话
|
||||
# response, history, decode_tokens = model.chat(tokenizer, "你好", "", history=None)
|
||||
# print(decode_tokens)
|
||||
# # 你好!很高兴为你提供帮助。
|
||||
|
||||
# 第二轮对话
|
||||
# response, history = model.chat(tokenizer, "给我讲一个年轻人奋斗创业最终取得成功的故事。", history=None)
|
||||
# print(response)
|
||||
|
||||
|
||||
|
||||
# <|im_start|>system
|
||||
# You are a helpful assistant.<|im_end|>
|
||||
# <|im_start|>user
|
||||
# 你好<|im_end|>
|
||||
# <|im_start|>assistant
|
||||
# 莎是现代汉语的男性的名字,出自《诗经》中的“采采卷耳
|
||||
|
||||
|
||||
|
||||
|
||||
# <|im_start|>system
|
||||
# You are a helpful assistant.<|im_end|>
|
||||
# <|im_start|>user
|
||||
|
|
|
@ -148,6 +148,10 @@ class QWenAttention(nn.Module):
|
|||
# qk = query @ key.transpose(-2, -1)
|
||||
# qk = qk[0]
|
||||
# show.DumpTensorToImage(qk,"q_matmul_k_layer_"+str(self.index)+".png")
|
||||
# print("layer:" + str(self.index) + " query.shape:"+ str(query.shape))
|
||||
# print("layer:" + str(self.index) + " key.shape:"+ str(key.shape))
|
||||
# print("layer:" + str(self.index) + " value.shape:"+ str(value.shape))
|
||||
# print("\n")
|
||||
|
||||
attn_output = F.scaled_dot_product_attention(query, key, value, attn_mask=attention_mask).transpose(1, 2)
|
||||
context_layer = self._merge_heads(attn_output, self.num_heads, self.head_dim)
|
||||
|
|
Loading…
Reference in New Issue