Checklist
Describe the bug
# Generation settings used for the report: temperature 0.0 with top_k 1
# (presumably to make decoding deterministic -- confirm), and both logits and
# last hidden states requested with the 'generation' option.
gen_config = GenerationConfig(
    temperature=0.0,
    top_k=1,
    output_logits='generation',
    output_last_hidden_state='generation',
    max_new_tokens=2048,
)

# Disabled variant kept for reference:
#   pipe = pipeline(args.model_path, backend_config=backend_config)
pipe = pipeline(args.model_path)

# Run both prompts in a single batched call with the settings above.
response = pipe(
    ['Hi, pls intro yourself', 'Shanghai is'],
    gen_config=gen_config,
)

# Collect the per-prompt outputs; `response` is walked once per attribute.
hidden_states = [item.last_hidden_state for item in response]
logits = [item.logits for item in response]

# Disabled debugging hook kept for reference: pdb.set_trace()
print(hidden_states)
print(logits)
Reproduction
# Reproduction script. Generation settings: temperature 0.0 with top_k 1
# (presumably to make decoding deterministic -- confirm), and both logits and
# last hidden states requested with the 'generation' option.
gen_config = GenerationConfig(
    temperature=0.0,
    top_k=1,
    output_logits='generation',
    output_last_hidden_state='generation',
    max_new_tokens=2048,
)

# Disabled variant kept for reference:
#   pipe = pipeline(args.model_path, backend_config=backend_config)
pipe = pipeline(args.model_path)

# Run both prompts in a single batched call with the settings above.
response = pipe(
    ['Hi, pls intro yourself', 'Shanghai is'],
    gen_config=gen_config,
)

# Collect the per-prompt outputs; `response` is walked once per attribute.
hidden_states = [item.last_hidden_state for item in response]
logits = [item.logits for item in response]

# Disabled debugging hook kept for reference: pdb.set_trace()
print(hidden_states)
print(logits)
Environment
Error traceback
Checklist
Describe the bug
# Generation settings used for the report: temperature 0.0 with top_k 1
# (presumably to make decoding deterministic -- confirm), and both logits and
# last hidden states requested with the 'generation' option.
gen_config = GenerationConfig(
    temperature=0.0,
    top_k=1,
    output_logits='generation',
    output_last_hidden_state='generation',
    max_new_tokens=2048,
)
Reproduction
# Reproduction settings: temperature 0.0 with top_k 1 (presumably to make
# decoding deterministic -- confirm), and both logits and last hidden states
# requested with the 'generation' option.
gen_config = GenerationConfig(
    temperature=0.0,
    top_k=1,
    output_logits='generation',
    output_last_hidden_state='generation',
    max_new_tokens=2048,
)
Environment
Error traceback