Spaces:
Runtime error
Runtime error
Create app.py
Browse files
app.py
ADDED
@@ -0,0 +1,742 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import datetime
|
2 |
+
import hmac
|
3 |
+
import os
|
4 |
+
import uuid
|
5 |
+
|
6 |
+
import openai
|
7 |
+
import requests
|
8 |
+
import streamlit as st
|
9 |
+
from azure.cosmos import ContainerProxy, CosmosClient
|
10 |
+
from bs4 import BeautifulSoup, NavigableString
|
11 |
+
from dotenv import load_dotenv
|
12 |
+
from st_copy_to_clipboard import st_copy_to_clipboard
|
13 |
+
|
14 |
+
# Load settings from a local .env file (if present) so the os.environ / os.getenv
# lookups used throughout this script can find API keys, endpoints and prompts.
load_dotenv()
|
15 |
+
|
16 |
+
|
17 |
+
def get_related_studies(article: str):
    """Search Google Scholar (via SerpAPI) for studies related to *article*.

    A short search query is derived from the article with
    ``extract_scholar_query``; the matching results are stored as a list of
    ``{"title": ..., "link": ...}`` dicts in ``st.session_state["studie_links"]``.
    The list is left empty when no query could be derived, the request fails,
    or nothing usable is returned.

    Args:
        article: Text of the generated article.
    """
    with st.spinner("Extrahiere Studien..."):
        # Start from a clean slate so results of an earlier article never
        # survive a failed lookup.
        st.session_state["studie_links"] = []

        query = (extract_scholar_query(article) or "").replace('"', "").strip()
        if not query:
            # extract_scholar_query already reported its own error.
            return

        api_key = os.getenv("SERP_API_KEY")
        try:
            # Passing the query through ``params`` lets requests URL-encode it;
            # concatenating it into the URL breaks on characters such as & or #.
            response = requests.get(
                "https://serpapi.com/search.json",
                params={
                    "engine": "google_scholar",
                    "api_key": api_key,
                    "as_ylo": 2018,
                    "q": query,
                },
                timeout=30,
            )
            if response.status_code != 200:
                return

            organic_results = response.json().get("organic_results") or []
            # Only keep entries that can be rendered as a titled link.
            st.session_state["studie_links"] = [
                {"title": entry["title"], "link": entry["link"]}
                for entry in organic_results
                if entry.get("title") and entry.get("link")
            ]
        except Exception as e:
            # requests includes the full URL (and therefore the API key) in
            # many of its error messages - mask it before showing anything.
            message = str(e)
            if api_key:
                message = message.replace(api_key, "***")
            print(f"Fehler beim extrahieren der Studien: {message}")
            st.error(f"Something went wrong: {message}", icon="🚨")
|
47 |
+
|
48 |
+
|
49 |
+
def get_takeaways(article: str):
    """Generate key takeaways for *article* and store them in the session.

    The instruction text is read from the ``takeaway`` environment variable
    and sent together with the article. The model's reply is stored in
    ``st.session_state["takeaways"]``; on failure the error is shown and the
    entry is set to ``None``.

    Args:
        article: Text of the generated article.
    """
    openai.api_key = os.environ.get("OPEN_API_KEY")
    openai.api_base = os.environ.get("OPEN_API_BASE")
    openai.api_type = os.environ.get("OPEN_API_TYPE")
    openai.api_version = os.environ.get("OPEN_API_VERSION")
    # The instruction was previously read but never sent, so the model only
    # received the article without any task. An unset variable keeps the
    # prompt exactly as it was before.
    takeaway_query = os.environ.get("takeaway") or ""
    with st.spinner("Creating Takeaways"):
        try:
            res = openai.ChatCompletion.create(
                engine="gpt-4-1106",
                temperature=0.2,
                messages=[
                    {
                        "role": "system",
                        "content": f"{takeaway_query} The article you have written is as follows: {article}.",
                    }
                ],
            )
            st.session_state["takeaways"] = res["choices"][0]["message"]["content"]
        except Exception as e:
            print(f"Fehler beim extrahieren der Query: {str(e)}")
            st.error(f"Something went wrong: {str(e)}", icon="🚨")
            st.session_state["takeaways"] = None
|
72 |
+
|
73 |
+
|
74 |
+
|
75 |
+
def get_faq(article: str):
    """Generate an FAQ section for *article* and store it in the session.

    The instruction text is read from the ``faq`` environment variable and
    sent together with the article. The model's reply is stored in
    ``st.session_state["faq"]``; on failure the error is shown and the entry
    is set to ``None``.

    Args:
        article: Text of the generated article.
    """
    openai.api_key = os.environ.get("OPEN_API_KEY")
    openai.api_base = os.environ.get("OPEN_API_BASE")
    openai.api_type = os.environ.get("OPEN_API_TYPE")
    openai.api_version = os.environ.get("OPEN_API_VERSION")
    # The instruction was previously read but never sent, so the model only
    # received the article without any task. An unset variable keeps the
    # prompt exactly as it was before.
    faq_query = os.environ.get("faq") or ""

    with st.spinner("Creating FAQ"):
        try:
            res = openai.ChatCompletion.create(
                engine="gpt-4-1106",
                temperature=0.2,
                messages=[
                    {
                        "role": "system",
                        "content": f"{faq_query} The article you have written is as follows: {article}.",
                    }
                ],
            )
            st.session_state["faq"] = res["choices"][0]["message"]["content"]
        except Exception as e:
            print(f"Fehler beim extrahieren der Query: {str(e)}")
            st.error(f"Something went wrong: {str(e)}", icon="🚨")
            st.session_state["faq"] = None
|
99 |
+
|
100 |
+
def extract_scholar_query(article: str):
    """Ask the chat model for a short Google Scholar query matching *article*.

    Returns:
        The model's reply text, or ``""`` when the request fails (the error
        is printed and shown in the UI).
    """
    env = os.environ
    openai.api_key = env.get("OPEN_API_KEY")
    openai.api_base = env.get("OPEN_API_BASE")
    openai.api_type = env.get("OPEN_API_TYPE")
    openai.api_version = env.get("OPEN_API_VERSION")

    try:
        instruction = {
            "role": "system",
            "content": f"You are a professional journalist whose task is to find related studies based on an article you have written. Please write a query that you would use to search for related studies on Google Scholar. Please make sure that the query is specific enough and cotains a maximum of 4 words. Only include one query in your output. Do not write multiple querys with an AND or OR. The article you have written is as follows: {article}.",
        }
        completion = openai.ChatCompletion.create(
            engine="gpt-4-1106",
            temperature=0.2,
            messages=[instruction],
        )
        first_choice = completion["choices"][0]
        return first_choice["message"]["content"]
    except Exception as e:
        reason = str(e)
        print(f"Fehler beim extrahieren der Query: {reason}")
        st.error(f"Something went wrong: {reason}", icon="🚨")
        return ""
|
121 |
+
|
122 |
+
|
123 |
+
# UI length option -> environment variable holding the target word count.
_LENGTH_ENV_VARS = {
    "Kurz": "SHORT_LENGTH",
    "Mittel": "MEDIUM_LENGTH",
    "Lang": "LONG_LENGTH",
    "SEO": "SEO_LENGTH",
    "SEO Plus": "SEO_PLUS_LENGTH",
}

# UI writing-style option -> environment variable holding the style description.
_WRITING_STYLE_ENV_VARS = {
    "Boulevard": "WRITING_STYLE_HEUTE",
    "Health Blog": "WRITING_STYLE_GESUND",
    "Newspaper": "WRITING_STYLE_NEWSPAPER",
    "Tech/Lifestyle Blog": "WRITING_STYLE_TECH_BLOG",
    "Public Relations": "WRITING_STYLE_PR",
    "Sales": "WRITING_STYLE_SALES",
    "Lifestyle Blog": "WRITING_STYLE_LIFESTYLE",
}


def create_article(length_option, articles, params, web_page_option):
    """Generate a German article from source articles or from user notes.

    Args:
        length_option: One of the keys of ``_LENGTH_ENV_VARS``.
        articles: Source article texts (list of strings). When empty - or an
            empty string - the article is written from ``params`` alone.
        params: Extra user instructions (with sources) or the notes the
            article is based on (without sources).
        web_page_option: One of the keys of ``_WRITING_STYLE_ENV_VARS``.

    Returns:
        The generated article text, or ``None`` when generation failed; the
        error is printed and shown in the UI in that case.
    """
    openai.api_key = os.environ.get("OPEN_API_KEY")
    openai.api_base = os.environ.get("OPEN_API_BASE")
    openai.api_type = os.environ.get("OPEN_API_TYPE")
    openai.api_version = os.environ.get("OPEN_API_VERSION")

    try:
        # An unknown option used to surface as a cryptic "referenced before
        # assignment" message; fail with a readable one instead.
        if length_option not in _LENGTH_ENV_VARS:
            raise ValueError(f"Unknown article length option: {length_option!r}")
        if web_page_option not in _WRITING_STYLE_ENV_VARS:
            raise ValueError(f"Unknown writing style option: {web_page_option!r}")
        length = os.environ.get(_LENGTH_ENV_VARS[length_option])
        writing_style = os.environ.get(_WRITING_STYLE_ENV_VARS[web_page_option])

        # A bare string would otherwise be enumerated character by character.
        if isinstance(articles, str):
            articles = [articles]
        # Sources that could not be extracted are empty/None; they carry no
        # information for the model, so leave them out.
        source_articles = [text for text in (articles or []) if text]

        if source_articles:
            article_string = "; ".join(
                f"Artikel {index + 1}: {artikel}"
                for index, artikel in enumerate(source_articles)
            )
            messages = [
                {
                    "role": "system",
                    "content": f"You are a professional journalist whose task is to write your own article based on one or more articles. This article should combine the content of the original articles, but have its own writing style, which is as follows: {writing_style} Do not use unusual phrases or neologisms from the original articles. It is important that the length of your article should be {length} words long.",
                },
                {"role": "system", "content": f"Source articles: {article_string}"},
                {
                    "role": "system",
                    "content": f"Please also note the following instructions defined by the user: {params}",
                },
                {
                    "role": "system",
                    "content": "Schreibe den Artikel immer in deutscher Sprache.",
                },
            ]
        else:
            messages = [
                {
                    "role": "system",
                    "content": f"You are a professional journalist whose task is to write an article based on your own notes. This article should be written in the following writing style: {writing_style} .It is important that the length of your article should be {length} words long.",
                },
                {
                    "role": "system",
                    "content": f"Please write the article based on the following user input: {params}",
                },
                {
                    "role": "system",
                    "content": "Schreibe den Artikel immer in deutscher Sprache.",
                },
            ]
        res = openai.ChatCompletion.create(
            engine="gpt-35-16k",
            temperature=0.4,
            max_tokens=8000,
            messages=messages,
        )
        return res["choices"][0]["message"]["content"]
    except Exception as e:
        print(f"Fehler beim erstellen des artikels: {str(e)}")
        st.error(f"Something went wrong: {str(e)}", icon="🚨")
        return None
|
202 |
+
|
203 |
+
|
204 |
+
# UI writing-style option -> environment variable holding the style description.
# Mirrors the options offered by the style selector of the app.
_HEADLINE_STYLE_ENV_VARS = {
    "Boulevard": "WRITING_STYLE_HEUTE",
    "Health Blog": "WRITING_STYLE_GESUND",
    "Newspaper": "WRITING_STYLE_NEWSPAPER",
    "Tech/Lifestyle Blog": "WRITING_STYLE_TECH_BLOG",
    "Public Relations": "WRITING_STYLE_PR",
    "Sales": "WRITING_STYLE_SALES",
    "Lifestyle Blog": "WRITING_STYLE_LIFESTYLE",
}


def create_headline(article, web_page_option):
    """Generate a short German headline for *article*.

    Args:
        article: Text of the article the headline is for.
        web_page_option: Writing-style option the article was created with.
            Unknown options fall back to the health-blog style, as before.

    Returns:
        The headline text, or ``None`` when there is no article or the
        request failed (failures are printed and shown in the UI).
    """
    # Nothing to summarise - e.g. the article generation itself failed.
    if not article:
        return None

    openai.api_key = os.environ.get("OPEN_API_KEY")
    openai.api_base = os.environ.get("OPEN_API_BASE")
    openai.api_type = os.environ.get("OPEN_API_TYPE")
    openai.api_version = os.environ.get("OPEN_API_VERSION")

    # Use the same style the article was written in; previously every
    # non-"Boulevard" option silently used the health-blog style.
    writing_style = os.environ.get(
        _HEADLINE_STYLE_ENV_VARS.get(web_page_option, "WRITING_STYLE_GESUND")
    )

    try:
        res = openai.ChatCompletion.create(
            engine="gpt-4-1106",
            temperature=0.4,
            messages=[
                {
                    "role": "system",
                    "content": f"You are a professional journalist and have the task of generating a headline for an article you have written. I will give you the writing style that was used to create the article as info. Writing style: {writing_style} The headline should be as short as possible, but still capture the essence of the article. It should be a maximum of 10 words long",
                },
                {"role": "system", "content": f"Source article: {article}"},
                {
                    "role": "system",
                    "content": "Schreibe die Headline immer in deutscher Sprache.",
                },
            ],
        )
        return res["choices"][0]["message"]["content"]
    except Exception as e:
        print(f"Fehler beim erstellen der headline: {str(e)}")
        st.error(f"Something went wrong: {str(e)}", icon="🚨")
        return None
|
235 |
+
|
236 |
+
|
237 |
+
def extract_text_from_element(element):
    """Collect the text of all paragraphs and lists below *element*.

    The tree is walked depth-first. The text of every ``<p>``, ``<ul>`` and
    ``<ol>`` tag is appended, followed by a newline.

    Args:
        element: A BeautifulSoup node (tag or text node).

    Returns:
        The concatenated text; ``""`` when nothing matched.
    """
    # Bare text nodes have no children and are only captured through their
    # enclosing paragraph/list tag.
    if isinstance(element, NavigableString):
        return ""

    if element.name in ["p", "ul", "ol"]:
        # get_text() already includes the text of every descendant, so stop
        # here: descending further would add nested paragraphs/lists a
        # second time.
        return element.get_text() + "\n"

    return "".join(extract_text_from_element(child) for child in element.children)
|
253 |
+
|
254 |
+
|
255 |
+
def get_article_summary(article: str) -> str:
    """Request a summary of *article* from the summary endpoint.

    The endpoint URL and key are read from the ``SUMMARY_API`` and
    ``SUMMARY_API_KEY`` environment variables.

    Args:
        article: Text of the generated article.

    Returns:
        The ``summary`` field of the JSON response, or ``""`` when there is
        no article or the request fails (failures are printed).
    """
    if not article:
        return ""
    try:
        response = requests.post(
            os.environ.get("SUMMARY_API"),
            headers={
                "Content-Type": "application/json",
                "Authorization": os.environ.get("SUMMARY_API_KEY"),
                "azureml-model-deployment": "heute-summary-api",
            },
            # ``json=`` serialises the payload as JSON, matching the declared
            # content type; ``data=`` with a dict sends a form-encoded body.
            json={"article": article},
            timeout=60,
        )
        response.raise_for_status()
        return response.json()["summary"]
    except Exception as e:
        print(f"Fehler beim erstellen der Zusammenfassung: {str(e)}")
        return ""
|
271 |
+
|
272 |
+
|
273 |
+
def extract_article(url):
    """Download *url* and return the text inside its ``<article>`` tag.

    Args:
        url: Address of the web page to fetch.

    Returns:
        The paragraph/list text of the first ``<article>`` tag with empty
        lines removed, or ``None`` when the page cannot be fetched, does not
        answer with status 200, or contains no ``<article>`` tag.
    """
    # Send a browser-like user agent with the request.
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.3'
    }
    try:
        response = requests.get(url, headers=headers, timeout=30)
    except requests.RequestException as e:
        # Malformed links, DNS failures and timeouts are reported like any
        # other page that cannot be extracted instead of raising to the caller.
        print(f"Fehler: {str(e)}")
        return None

    if response.status_code != 200:
        print(f"Fehler: {response.status_code}")
        return None

    soup = BeautifulSoup(response.text, "html.parser")

    # Only the first <article> tag of the page is considered.
    article_tag = soup.find("article")
    if not article_tag:
        print("Kein <article>-Tag gefunden.")
        return None

    extracted_text = extract_text_from_element(article_tag)
    return filter_empty_lines(extracted_text)
|
300 |
+
|
301 |
+
|
302 |
+
def filter_empty_lines(text):
    """Return *text* without its blank (empty or whitespace-only) lines.

    Lines are separated on ``"\\n"``; kept lines are returned unchanged and
    re-joined with ``"\\n"``.
    """
    return "\n".join(row for row in text.split("\n") if row.strip())
|
313 |
+
|
314 |
+
|
315 |
+
def extract_article_links(**kwargs):
    """Button callback: extract every article in ``kwargs["links"]``.

    The extraction results (one entry per link, in order) are stored in
    ``st.session_state["extracted_articles"]``. The wizard progress is raised
    to at least step 1 and page 1 is selected.
    """
    state = st.session_state
    with st.spinner("Extrahiere..."):
        state["extracted_articles"] = [
            extract_article(url) for url in kwargs["links"]
        ]
        # Unlock the next page only the first time; never lower the progress.
        if state["process_step"] < 1:
            state["process_step"] += 1
        state["selected_page"] = 1
|
325 |
+
|
326 |
+
|
327 |
+
def extract_article_links_for_heading(**kwargs):
    """Extract the article found at ``kwargs["link"]``.

    Returns:
        Whatever ``extract_article`` returns for the link. The result used to
        be assigned to an unused local and dropped, which made the call
        pointless for any caller.
    """
    return extract_article(kwargs["link"])
|
329 |
+
|
330 |
+
|
331 |
+
def finalize_articles():
    """Button callback: freeze the (possibly edited) article texts.

    Reads the ``final_article_<n>`` session entries - one per extracted
    article, numbered from 1 - into ``st.session_state["final_articles"]``,
    raises the wizard progress to at least step 2 and moves one page forward.
    """
    state = st.session_state
    article_count = len(state["extracted_articles"])
    state["final_articles"] = [
        state[f"final_article_{number}"]
        for number in range(1, article_count + 1)
    ]
    if state["process_step"] < 2:
        state["process_step"] += 1
    state["selected_page"] += 1
|
339 |
+
|
340 |
+
|
341 |
+
def increase_page():
    """Button callback: move one wizard page forward, if already unlocked.

    A page is unlocked once ``process_step`` has reached its index, so the
    selected page may only advance while it is strictly below
    ``process_step``. The previous ``<=`` comparison allowed stepping one
    page past the unlocked range.
    """
    if st.session_state["selected_page"] < st.session_state["process_step"]:
        st.session_state["selected_page"] += 1
|
344 |
+
|
345 |
+
|
346 |
+
def decrease_page():
    """Button callback: move one wizard page back, stopping at page 0."""
    current_page = st.session_state["selected_page"]
    if current_page <= 0:
        return
    st.session_state["selected_page"] = current_page - 1
|
349 |
+
|
350 |
+
|
351 |
+
def on_click_handler_generate_article(**kwargs):
    """Button callback: generate article, headline and summary from sources.

    Expected keyword arguments: ``length_option``, ``final_articles``,
    ``add_info`` and ``webpage_option``.

    On success the results are stored in the session
    (``generated_article``, ``generated_headline``, ``article_summary``),
    the wizard progress is raised to at least step 3 and the next page is
    selected. An analytics record is written for every attempt.
    """
    with st.spinner("Generiere Artikel..."):
        created_article = create_article(
            kwargs["length_option"],
            kwargs["final_articles"],
            kwargs["add_info"],
            kwargs["webpage_option"],
        )
        # create_article yields None after it has reported an error; a
        # headline request for a missing article would only waste an API call.
        headline = (
            create_headline(created_article, kwargs["webpage_option"])
            if created_article
            else None
        )
        db_analytics_item = {
            "id": str(uuid.uuid4()),
            "oparation": "article_generation",
            "timestamp": str(datetime.datetime.now()),
        }
        client: ContainerProxy = st.session_state["db_container"]
        client.create_item(body=db_analytics_item)

        if not created_article:
            # Stay on the current page and keep any earlier result intact.
            return

        st.session_state["generated_article"] = created_article
        # The output page concatenates headline and article; keep it a string
        # even when the headline request failed.
        st.session_state["generated_headline"] = headline or ""
        st.session_state["article_summary"] = get_article_summary(created_article)
        if st.session_state["process_step"] < 3:
            st.session_state["process_step"] += 1
        st.session_state["selected_page"] += 1
|
373 |
+
|
374 |
+
|
375 |
+
def on_click_handler_generate_generate_article_keywords(**kwargs):
    """Button callback: generate article, headline and summary from notes.

    Expected keyword arguments: ``length_option``, ``artikel_input`` (the
    user's notes) and ``webpage_option``.

    On success the results are stored in the session
    (``generated_article``, ``generated_headline``, ``article_summary``).
    An analytics record is written for every attempt.
    """
    with st.spinner("Generiere Artikel..."):
        created_article = create_article(
            kwargs["length_option"],
            "",  # no source articles: the text is written from the notes only
            kwargs["artikel_input"],
            kwargs["webpage_option"],
        )
        # create_article yields None after it has reported an error; skip the
        # follow-up requests that need an article text.
        if created_article:
            headline = create_headline(created_article, kwargs["webpage_option"])
            summary = get_article_summary(created_article)
        else:
            headline = None
            summary = ""
        db_analytics_item = {
            "id": str(uuid.uuid4()),
            "oparation": "article_generation",
            "timestamp": str(datetime.datetime.now()),
        }
        client: ContainerProxy = st.session_state["db_container"]
        client.create_item(body=db_analytics_item)

        if not created_article:
            # Keep any earlier result intact instead of overwriting it with None.
            return

        st.session_state["generated_article"] = created_article
        # The output section concatenates headline and article; keep it a string.
        st.session_state["generated_headline"] = headline or ""
        st.session_state["article_summary"] = summary
|
395 |
+
|
396 |
+
|
397 |
+
def reset_session_state():
    """Button callback: discard the current article and restart the wizard.

    Clears the extracted/final articles, the links, every generated output
    (article, headline, summary, studies, takeaways, FAQ) and returns to the
    first page.
    """
    st.session_state["extracted_articles"] = []
    st.session_state["article_links"] = []
    st.session_state["final_articles"] = []
    st.session_state["process_step"] = 0
    st.session_state["selected_page"] = 0
    st.session_state["generated_article"] = ""
    st.session_state["generated_headline"] = ""
    st.session_state["studie_links"] = []
    st.session_state["article_summary"] = ""
    # Takeaways and FAQ belong to the discarded article; without removing
    # them they would be displayed below the next generated article.
    for stale_key in ("takeaways", "faq"):
        if stale_key in st.session_state:
            del st.session_state[stale_key]
|
406 |
+
|
407 |
+
|
408 |
+
# Seed every session entry the script relies on; values already present from
# an earlier run of the script are left untouched.
for _state_key, _initial_value in (
    ("extracted_articles", []),
    ("article_links", []),
    ("final_articles", []),
    ("process_step", 0),
    ("selected_page", 0),
    ("generated_article", ""),
    ("function_state", True),
    ("generated_headline", ""),
    ("webpage_option", "Boulevard"),
    ("studie_links", []),
):
    if _state_key not in st.session_state:
        st.session_state[_state_key] = _initial_value

# Open the analytics container once per session and record the page load.
if "db_container" not in st.session_state:
    cosmos_account = CosmosClient(os.environ["DB_ENDPOINT"], os.environ["DB_KEY"])
    database = cosmos_account.get_database_client(os.environ["DB_NAME"])
    client = database.get_container_client("tina-analytics")
    db_analytics_item = {
        "id": str(uuid.uuid4()),
        "oparation": "page_load",
        "timestamp": str(datetime.datetime.now()),
    }
    client.create_item(body=db_analytics_item)
    st.session_state["db_container"] = client

if "article_summary" not in st.session_state:
    st.session_state["article_summary"] = ""
|
443 |
+
|
444 |
+
# Titles of the wizard pages, indexed by st.session_state["selected_page"].
PROCESS_STEPS = ["Artikel Extraktion", "Artikel Finalisierung", "Artikel Generierung", "Artikel Ausgabe"]
|
450 |
+
|
451 |
+
|
452 |
+
# def check_password():
|
453 |
+
# """Returns `True` if the user had the correct password."""
|
454 |
+
|
455 |
+
# def password_entered():
|
456 |
+
# """Checks whether a password entered by the user is correct."""
|
457 |
+
# if hmac.compare_digest(
|
458 |
+
# st.session_state["password"], os.environ.get("PASSWORD")
|
459 |
+
# ):
|
460 |
+
# st.session_state["password_correct"] = True
|
461 |
+
# del st.session_state["password"] # Don't store the password.
|
462 |
+
# else:
|
463 |
+
# st.session_state["password_correct"] = False
|
464 |
+
|
465 |
+
# # Return True if the password is validated.
|
466 |
+
# if st.session_state.get("password_correct", False):
|
467 |
+
# return True
|
468 |
+
|
469 |
+
# # Show input for password.
|
470 |
+
# st.text_input(
|
471 |
+
# "Password", type="password", on_change=password_entered, key="password"
|
472 |
+
# )
|
473 |
+
# if "password_correct" in st.session_state:
|
474 |
+
# st.error("😕 Password incorrect")
|
475 |
+
# return False
|
476 |
+
|
477 |
+
|
478 |
+
# if not check_password():
|
479 |
+
# st.stop() # Do not continue if check_password is not True.
|
480 |
+
|
481 |
+
# Page header: title on the left, logo on the right.
title_column, logo_column = st.columns([2, 1])
title_column.title("TINA")
logo_column.image("tensora_logo.png")

# Writing style selector; the choice is stored under "webpage_option".
WRITING_STYLE_CHOICES = [
    "Boulevard",
    "Health Blog",
    "Newspaper",
    "Tech/Lifestyle Blog",
    "Public Relations",
    "Sales",
    "Lifestyle Blog",
]
st.radio(
    "Wähle den Schreibstil für Artikel aus",
    WRITING_STYLE_CHOICES,
    key="webpage_option",
)


def _select_generation_mode(use_links):
    """Store which workflow is shown: links (True) or notes (False)."""
    st.session_state.update({"function_state": use_links})


# Sidebar: switch between the link-based and the notes-based workflow.
with st.sidebar:
    st.title("Funktions Auswahl")
    st.write("Hier kannst Du zwischen der Art der Artikelgenerierung wählen.")
    for _mode_label, _mode_key, _use_links in (
        ("Artikel Generierung mit Links", "article_gen_btn", True),
        ("Artikel Generierung mit Stichpunkten", "headline_gen_btn", False),
    ):
        st.button(
            _mode_label,
            key=_mode_key,
            use_container_width=True,
            on_click=_select_generation_mode,
            args=(_use_links,),
        )
|
515 |
+
|
516 |
+
if st.session_state["function_state"]:
    # ------------------------------------------------------------------
    # Link-based workflow: a four-page wizard
    # (extraction -> finalisation -> generation -> output).
    # ------------------------------------------------------------------

    # One tab button per wizard page. A tab is disabled while its page is not
    # unlocked yet (process_step too low) or while it is the current page.
    for _page_index, (_tab_column, _tab_label) in enumerate(
        zip(st.columns([1, 1, 1, 1]), PROCESS_STEPS)
    ):
        _tab_column.button(
            _tab_label,
            key=f"tab{_page_index + 1}",
            use_container_width=True,
            # Bind the index as a default so each button selects its own page.
            on_click=lambda page=_page_index: st.session_state.update(
                {"selected_page": page}
            ),
            disabled=st.session_state["process_step"] < _page_index
            or st.session_state["selected_page"] == _page_index,
        )

    # Previous / title / next navigation row.
    nav_col1, nav_col2, nav_col3 = st.columns([1, 4, 1])

    nav_col1.button(
        "◀️",
        key="nav1",
        use_container_width=True,
        on_click=decrease_page,
        disabled=st.session_state["selected_page"] == 0,
    )
    nav_col2.markdown(
        f"<div style='text-align: center;'>{PROCESS_STEPS[st.session_state['selected_page']]}</div>",
        unsafe_allow_html=True,
    )
    nav_col3.button(
        "▶️",
        key="nav2",
        use_container_width=True,
        on_click=increase_page,
        disabled=st.session_state["selected_page"] == st.session_state["process_step"],
    )

    if st.session_state["selected_page"] == 0:
        # --- Page 0: collect the article links -------------------------
        st.write(
            "Bitte gebe die Links der Artikel ein, welche Du extrahiert haben möchtest."
        )
        # Every accepted link gets a fresh, numbered input below the list.
        _next_link_number = len(st.session_state["article_links"]) + 1
        _link_input_key = "link_input_" + str(_next_link_number)
        st.text_input(
            "Gebe den " + str(_next_link_number) + ". Link ein:",
            key=_link_input_key,
        )
        if st.session_state[_link_input_key]:
            st.session_state["article_links"].append(st.session_state[_link_input_key])
            # Rerun so the next (empty) input is rendered immediately.
            st.rerun()
        for i, link in enumerate(st.session_state["article_links"]):
            st.write(f"Link nr. {i+1}:\n\n{link}")

        if st.session_state["article_links"]:
            # NOTE(review): this guards the creation of the button only;
            # exceptions raised inside the extract_article_links callback do
            # not appear to pass through here - confirm before relying on it.
            try:
                st.button(
                    "Extrahiere Artikel",
                    on_click=extract_article_links,
                    kwargs={"links": st.session_state["article_links"]},
                )
            except Exception as e:
                print(f"Fehler beim extrahieren der artikel: {str(e)}")
                st.error(
                    f"Du hast einen oder mehrere Links nicht in dem korrekten Format angegeben. Bitte Lade die Seite neu und benutze korrekte Links: {str(e)}",
                    icon="🚨",
                )
    elif st.session_state["selected_page"] == 1:
        # --- Page 1: review / edit the extracted articles ---------------
        st.write(
            "Hier kannst Du die extrahierten Artikel ansehen und bei Bedarf anpassen."
        )
        for i, article in enumerate(st.session_state["extracted_articles"]):
            with st.expander(f"Artikel {i+1}"):
                if not article:
                    # Extraction failed: let the user paste the text instead.
                    st.info(
                        "Die Webseite des Artikels blockiert das automatische extrahieren von Artikeln. Wenn Du den Artikel dennoch benutzen möchtest, dann kannst Du diesen kopieren und einfügen.",
                        icon="ℹ️",
                    )
                st.text_area(
                    "Editiere die Artikel, falls nötig:"
                    if article
                    else "Füge den Artikel ein, falls nötig:",
                    value=article,
                    key="final_article_" + str(i + 1),
                    height=500,
                )
        st.button("Artikel finalisieren", on_click=finalize_articles)
    elif st.session_state["selected_page"] == 2:
        # --- Page 2: configure and start the generation -----------------
        for i, final_article in enumerate(st.session_state["final_articles"]):
            if final_article:
                with st.expander("Artikel " + str(i + 1)):
                    st.write(final_article)

        if st.session_state["final_articles"]:
            st.write("Benutzte Artikel:")
            for i, link in enumerate(st.session_state["article_links"]):
                st.write(f"Link {i+1}: {link}")
        st.text_area(
            "Füge weitere Informationen für den Prompt hinzu, falls nötig:",
            key="add_info",
        )
        st.write("Artikellänge")
        st.radio("Optionen", ["Kurz", "Mittel", "Lang", "SEO", "SEO Plus"], key="length_option")
        st.button(
            "Artikel generieren",
            key="article_btn",
            on_click=on_click_handler_generate_article,
            kwargs={
                "length_option": st.session_state["length_option"],
                "final_articles": st.session_state["final_articles"],
                "add_info": st.session_state["add_info"],
                "webpage_option": st.session_state["webpage_option"],
            },
        )
    elif st.session_state["selected_page"] == 3:
        # --- Page 3: show the generated article and extras --------------
        st.write(f"**{st.session_state['generated_headline']}**")
        st.write(st.session_state["generated_article"])
        st.write("**Zusammenfassung:**")
        st.write(st.session_state["article_summary"])
        st.write("Kopieren Sie den Artikel: ")
        st_copy_to_clipboard(
            st.session_state["generated_headline"]
            + "\n"
            + st.session_state["generated_article"]
        )
        if st.session_state["studie_links"]:
            st.write("Hier sind einige Studien, die relevant sein könnten:")
            for result in st.session_state["studie_links"]:
                st.write(f"- [{result['title']}]({result['link']})")
        else:
            st.write("Keine relevanten Studien gefunden.")

        # The entries are set to None when generation failed; only render
        # them when there is actual text to show.
        if st.session_state.get("takeaways"):
            st.write("Hier sind einige Takeaways die wichtig sein könnten:")
            st.write(st.session_state["takeaways"])

        if st.session_state.get("faq"):
            st.write("Hier sind FAQs zu dem Artikel:")
            st.write(st.session_state["faq"])

        st.button(
            "Relevante Studien finden",
            on_click=get_related_studies,
            args=(st.session_state["generated_article"],),
        )
        # The callbacks must be passed uncalled via ``on_click``. The former
        # ``onclick=get_takeaways(...)`` ran the model request on every
        # render and handed its result to a keyword st.button does not accept.
        st.button(
            "Key Takeaways generieren",
            on_click=get_takeaways,
            args=(st.session_state["generated_article"],),
        )
        st.button(
            "FAQ generieren",
            on_click=get_faq,
            args=(st.session_state["generated_article"],),
        )
        st.button(
            "Neuen Artikel generieren", key="reset_btn", on_click=reset_session_state
        )
else:
    # ------------------------------------------------------------------
    # Notes-based workflow: a single page.
    # ------------------------------------------------------------------
    st.write(
        "Bitte trage die Stichpunkte ein, die Du in den Artikel einbauen möchtest. Der Textinput ist essenziell für die Generierung des Artikels."
    )
    st.text_area(label="Artikel input:", key="keyword_article_input")
    st.write("Artikellänge")
    st.radio("Optionen", ["Kurz", "Mittel", "Lang", "SEO", "SEO Plus"], key="length_option")
    st.button(
        "Artikel generieren",
        key="article_btn",
        on_click=on_click_handler_generate_generate_article_keywords,
        kwargs={
            "length_option": st.session_state["length_option"],
            "artikel_input": st.session_state["keyword_article_input"],
            "webpage_option": st.session_state["webpage_option"],
        },
    )
    if st.session_state["generated_article"] and st.session_state["generated_headline"]:
        st.write(f"**{st.session_state['generated_headline']}**")
        st.write(st.session_state["generated_article"])
        st.write("**Zusammenfassung:**")
        st.write(st.session_state["article_summary"])
        st.write("Kopieren Sie den Artikel: ")
        st_copy_to_clipboard(
            st.session_state["generated_headline"]
            + "\n"
            + st.session_state["generated_article"]
        )
        if st.session_state["studie_links"]:
            st.write("Hier sind einige Studien, die relevant sein könnten:")
            for result in st.session_state["studie_links"]:
                st.write(f"- [{result['title']}]({result['link']})")
        st.button(
            "Relevante Studien finden",
            on_click=get_related_studies,
            args=(st.session_state["generated_article"],),
        )
        st.button(
            "Neuen Artikel generieren", key="reset_btn", on_click=reset_session_state
        )
|