podcastgen

Paused

Rausda6 committed on May 25

Commit

39f08bf

verified ·

1 Parent(s): 18be79e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -161,8 +161,8 @@ class PodcastGenerator:
 You are a podcast formatter.
 Take the following input conversation, and reformat it so that:
-- Every line begins with exactly `Speaker 1:` or `Speaker 2:` (with colon)
-- No timestamps, names, parentheses, or extra formatting
 - No blank lines
 - Do not invent or change the content
@@ -241,8 +241,18 @@ Now format the following:
         """Convert speaker-formatted text to podcast JSON structure"""
         # Allow leading whitespace and enforce full line match
-        lines = re.findall(r'^\s*Speaker\s*([12])\s*:\s*(.+)', text, flags=re.MULTILINE)
-        podcast = [{"speaker": int(s), "line": l.strip()} for s, l in lines]
         return {
             "topic": "Generated from Input",
             "podcast": podcast

 You are a podcast formatter.
 Take the following input conversation, and reformat it so that:
+- Every line begins with exactly and strictily with `Speaker 1:` or `Speaker 2:` (with colon)
+- No timestamps, names, parentheses, or extra formatting, no chapter names, no special characters beside ":"
 - No blank lines
 - Do not invent or change the content
         """Convert speaker-formatted text to podcast JSON structure"""
         # Allow leading whitespace and enforce full line match
+        cleaned_lines = []
+        for line in text.splitlines():
+            if re.match(r'^\s*Speaker\s*[12]\s*:', line.strip()):
+                cleaned_lines.append(line.strip())
+        podcast = []
+        for line in cleaned_lines:
+            match = re.match(r'^Speaker\s*([12])\s*:\s*(.+)', line)
+            if match:
+                speaker, content = match.groups()
+                podcast.append({"speaker": int(speaker), "line": content.strip()})
         return {
             "topic": "Generated from Input",
             "podcast": podcast