|
|
@@ -25,32 +25,32 @@ import torch
|
|
|
|
|
|
IGNORE_ID = -1

# Instruction prompts. Every entry starts with the same system sentence and
# ends with the literal "<endofprompt>" marker.
instruct_list = [
    # Dialect instructions.
    "You are a helpful assistant. 请用广东话表达。<endofprompt>",
    "You are a helpful assistant. 请用东北话表达。<endofprompt>",
    "You are a helpful assistant. 请用甘肃话表达。<endofprompt>",
    "You are a helpful assistant. 请用贵州话表达。<endofprompt>",
    "You are a helpful assistant. 请用河南话表达。<endofprompt>",
    "You are a helpful assistant. 请用湖北话表达。<endofprompt>",
    "You are a helpful assistant. 请用湖南话表达。<endofprompt>",
    "You are a helpful assistant. 请用江西话表达。<endofprompt>",
    "You are a helpful assistant. 请用闽南话表达。<endofprompt>",
    "You are a helpful assistant. 请用宁夏话表达。<endofprompt>",
    "You are a helpful assistant. 请用山西话表达。<endofprompt>",
    "You are a helpful assistant. 请用陕西话表达。<endofprompt>",
    "You are a helpful assistant. 请用山东话表达。<endofprompt>",
    "You are a helpful assistant. 请用上海话表达。<endofprompt>",
    "You are a helpful assistant. 请用四川话表达。<endofprompt>",
    "You are a helpful assistant. 请用天津话表达。<endofprompt>",
    "You are a helpful assistant. 请用云南话表达。<endofprompt>",
    # Loudness instructions.
    "You are a helpful assistant. Please say a sentence as loudly as possible.<endofprompt>",
    "You are a helpful assistant. Please say a sentence in a very soft voice.<endofprompt>",
    # Speaking-rate instructions.
    "You are a helpful assistant. 请用尽可能慢地语速说一句话。<endofprompt>",
    "You are a helpful assistant. 请用尽可能快地语速说一句话。<endofprompt>",
    # Emotion instructions.
    "You are a helpful assistant. 请非常开心地说一句话。<endofprompt>",
    "You are a helpful assistant. 请非常伤心地说一句话。<endofprompt>",
    "You are a helpful assistant. 请非常生气地说一句话。<endofprompt>",
    # Character / style instructions.
    "You are a helpful assistant. 我想体验一下小猪佩奇风格,可以吗?<endofprompt>",
    "You are a helpful assistant. 你可以尝试用机器人的方式解答吗?<endofprompt>",
]
|
|
|
|
|
|
def pad_list(xs: List[torch.Tensor], pad_value: int):
|
|
|
"""Perform padding for the list of tensors.
|
|
|
@@ -156,12 +156,12 @@ def nucleus_sampling(weighted_scores, top_p=0.8, top_k=25):
|
|
|
break
|
|
|
prob = torch.tensor(prob).to(weighted_scores)
|
|
|
indices = torch.tensor(indices, dtype=torch.long).to(weighted_scores.device)
|
|
|
- top_ids = indices[prob.multinomial(1, replacement=True)]
|
|
|
+ top_ids = indices[prob.multinomial(1, replacement=True)].item()
|
|
|
return top_ids
|
|
|
|
|
|
|
|
|
def random_sampling(weighted_scores, decoded_tokens, sampling):
    """Draw one index at random from the softmax of ``weighted_scores``.

    Args:
        weighted_scores: Tensor of unnormalised scores; softmax is taken
            along dimension 0.
        decoded_tokens: Not used by this function.
        sampling: Not used by this function.

    Returns:
        The sampled index as a plain Python number (via ``Tensor.item()``),
        not a tensor.
    """
    probs = weighted_scores.softmax(dim=0)
    # multinomial(1) yields a one-element tensor for 1-D input; .item()
    # unwraps it so the caller receives a scalar instead of a tensor.
    top_ids = probs.multinomial(1, replacement=True).item()
    return top_ids
|
|
|
|
|
|
|