iAkashPaul committed on
Commit
3ea94cd
·
verified ·
1 Parent(s): 52af7e5

Update server.py

Browse files
Files changed (1) hide show
  1. server.py +5 -2
server.py CHANGED
@@ -24,14 +24,17 @@ def base():
24
 
25
  prefix_prompt="""<s>[INST]Summarize the following transcript[/INST]\n"""
26
  suffix_prompt="""\n"""
 
 
 
27
  @app.post("/llm")
28
  async def main(request: Request):
29
  input_json = await request.json()
30
  print(input_json)
31
  final_prompt = prefix_prompt + str(input_json["prompt"]) + suffix_prompt
32
  resp = requests.post(
33
- "https://YOUR_MODEL_ID.api.baseten.co/production/predict",
34
- headers={"Authorization": "Api-Key YOUR_API_KEY"},
35
  json={'prompt': final_prompt ,'temperature': 0.001, 'max_new_tokens': 100, 'repetition_penalty':1.2},
36
  )
37
  llm_response = resp.json()
 
24
 
25
  prefix_prompt="""<s>[INST]Summarize the following transcript[/INST]\n"""
26
  suffix_prompt="""\n"""
27
+ import os
28
+ baseten_url = os.getenv("BASETEN_URL")
29
+ baseten_key = os.getenv("BASETEN_KEY")
30
  @app.post("/llm")
31
  async def main(request: Request):
32
  input_json = await request.json()
33
  print(input_json)
34
  final_prompt = prefix_prompt + str(input_json["prompt"]) + suffix_prompt
35
  resp = requests.post(
36
+ baseten_url,
37
+ headers={"Authorization": f"Api-Key {baseten_key}"},
38
  json={'prompt': final_prompt ,'temperature': 0.001, 'max_new_tokens': 100, 'repetition_penalty':1.2},
39
  )
40
  llm_response = resp.json()