Spaces:

oflakne26
/

New-Place

Sleeping

App Files Community

oflakne26 committed on May 25, 2024

Commit

c81e2b1

verified ·

1 Parent(s): 407b03e

Update main.py

Browse files

Files changed (1) hide show

main.py +2 -45

main.py CHANGED Viewed

@@ -87,48 +87,5 @@ async def generate_response(data: InputData) -> Any:
             return cleaned_response
     except Exception as e:
-        print(f"Primary model {data.model} failed with error: {e}")
-    # If the primary model fails, try fallback models
-    for model in FALLBACK_MODELS:
-        try:
-            client = InferenceClient(model=model, token=HF_TOKEN)
-            response = client.text_generation(inputs,
-                                              temperature=1.0,
-                                              max_new_tokens=1000,
-                                              seed=seed)
-            strict_response = str(response)
-            repaired_response = repair_json(strict_response,
-                                            return_objects=True)
-            if isinstance(repaired_response, str):
-                raise HTTPException(status_code=500, detail="Invalid response from model")
-            else:
-                cleaned_response = {}
-                for key, value in repaired_response.items():
-                    cleaned_key = key.replace("###", "")
-                    cleaned_response[cleaned_key] = value
-                for i, text in enumerate(cleaned_response["New response"]):
-                    if i <= 2:
-                        sentences = tokenizer.tokenize(text)
-                        if sentences:
-                            cleaned_response["New response"][i] = sentences[0]
-                    else:
-                        del cleaned_response["New response"][i]
-                if cleaned_response.get("Sentence count"):
-                    if cleaned_response["Sentence count"] > 3:
-                        cleaned_response["Sentence count"] = 3
-                else:
-                    cleaned_response["Sentence count"] = len(cleaned_response["New response"])
-                data.history += str(cleaned_response)
-                return cleaned_response
-        except Exception as e:
-            print(f"Model {model} failed with error: {e}")
-    raise HTTPException(status_code=500, detail="All models failed to generate response")

             return cleaned_response
     except Exception as e:
+        print(f"Model {data.model} failed with error: {e}")
+        raise HTTPException(status_code=500, detail=f"Model {data.model} failed to generate response")