Fix api extension
This commit is contained in:
@@ -40,24 +40,27 @@ class Handler(BaseHTTPRequestHandler):
|
|||||||
prompt_lines.pop(0)
|
prompt_lines.pop(0)
|
||||||
|
|
||||||
prompt = '\n'.join(prompt_lines)
|
prompt = '\n'.join(prompt_lines)
|
||||||
|
generate_params = {
|
||||||
|
'max_new_tokens': int(body.get('max_length', 200)),
|
||||||
|
'do_sample': bool(body.get('do_sample', True)),
|
||||||
|
'temperature': float(body.get('temperature', 0.5)),
|
||||||
|
'top_p': float(body.get('top_p', 1)),
|
||||||
|
'typical_p': float(body.get('typical', 1)),
|
||||||
|
'repetition_penalty': float(body.get('rep_pen', 1.1)),
|
||||||
|
'encoder_repetition_penalty': 1,
|
||||||
|
'top_k': int(body.get('top_k', 0)),
|
||||||
|
'min_length': int(body.get('min_length', 0)),
|
||||||
|
'no_repeat_ngram_size': int(body.get('no_repeat_ngram_size',0)),
|
||||||
|
'num_beams': int(body.get('num_beams',1)),
|
||||||
|
'penalty_alpha': float(body.get('penalty_alpha', 0)),
|
||||||
|
'length_penalty': float(body.get('length_penalty', 1)),
|
||||||
|
'early_stopping': bool(body.get('early_stopping', False)),
|
||||||
|
'seed': int(body.get('seed', -1)),
|
||||||
|
}
|
||||||
|
|
||||||
generator = generate_reply(
|
generator = generate_reply(
|
||||||
question = prompt,
|
prompt,
|
||||||
max_new_tokens = int(body.get('max_length', 200)),
|
generate_params,
|
||||||
do_sample=bool(body.get('do_sample', True)),
|
|
||||||
temperature=float(body.get('temperature', 0.5)),
|
|
||||||
top_p=float(body.get('top_p', 1)),
|
|
||||||
typical_p=float(body.get('typical', 1)),
|
|
||||||
repetition_penalty=float(body.get('rep_pen', 1.1)),
|
|
||||||
encoder_repetition_penalty=1,
|
|
||||||
top_k=int(body.get('top_k', 0)),
|
|
||||||
min_length=int(body.get('min_length', 0)),
|
|
||||||
no_repeat_ngram_size=int(body.get('no_repeat_ngram_size',0)),
|
|
||||||
num_beams=int(body.get('num_beams',1)),
|
|
||||||
penalty_alpha=float(body.get('penalty_alpha', 0)),
|
|
||||||
length_penalty=float(body.get('length_penalty', 1)),
|
|
||||||
early_stopping=bool(body.get('early_stopping', False)),
|
|
||||||
seed=int(body.get('seed', -1)),
|
|
||||||
stopping_strings=body.get('stopping_strings', []),
|
stopping_strings=body.get('stopping_strings', []),
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user