podcast

Running

App Files Files Community

orrinin committed on Jun 5, 2024

Commit

561aac5

verified ·

1 Parent(s): 71debf1

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -5

app.py CHANGED Viewed

@@ -3,7 +3,9 @@ import json
 import httpx
 import os
 import re
 import asyncio
 import edge_tts
 import tempfile
 import gradio as gr
@@ -13,18 +15,18 @@ from pydub import AudioSegment
 from moviepy.editor import AudioFileClip, concatenate_audioclips
 system_prompt = '''
-    You are an talk-show podcast generator. You have to create short conversations between Xiaoxiao and Yunjian that gives an overview of the News given by the user.
     Please provide the script and output strictly in the following JSON format:
     {
       "title": "[string]",
       "content": {
-        "Xiaoxiao_0: "[string]",
-        "Yunjian_0": "[string]",
         ...
       }
     }
     #Please note that the [string] you generate now must be in easy-and-understandable Chinese.
-    #Be concise. No less than three rounds of conversation.
 '''
 DESCRIPTION = '''
@@ -49,10 +51,39 @@ footer {
 }
 """
 apikey = os.environ.get("API_KEY")
 client = OpenAI(api_key=apikey, base_url="https://api.deepseek.com")
 def validate_url(url):
     try:
         response = httpx.get(url, timeout=60.0)
@@ -73,6 +104,7 @@ def fetch_text(url):
     print("Exited Webpage Extraction")
     return validate_url(full_url)
 async def text_to_speech(text, voice, filename):
     communicate = edge_tts.Communicate(text, voice)
     await communicate.save(filename)
@@ -88,7 +120,7 @@ async def gen_show(script):
     for key, text in content.items():
         speaker = key.split('_')[0]  # Extract the speaker name
         index = key.split('_')[1]    # Extract the dialogue index
-        voice = "zh-CN-XiaoxiaoNeural" if speaker == "Xiaoxiao" else "zh-CN-YunjianNeural"
         # Create temporary file for each speaker's dialogue
         temp_file = tempfile.NamedTemporaryFile(suffix='.mp3', delete=False)
@@ -178,11 +210,13 @@ with gr.Blocks(theme='soft', css=css, title="听说") as iface:
         input_box = gr.Textbox(label="网址", placeholder="请输入https开头的网址")
     with gr.Row():
         submit_btn = gr.Button("🚀 发送")  # Create a submit button
         clear_btn = gr.ClearButton(output_box, value="🗑️ 清除") # Create a clear button
     gr.Examples(examples=Examples, inputs=input_box, outputs=output_box, fn=main, label="示例", cache_examples="lazy")
     # Set up the event listeners
     submit_btn.click(main, inputs=input_box, outputs=output_box)
 #gr.close_all()

 import httpx
 import os
 import re
+import feedparser
 import asyncio
+import random
 import edge_tts
 import tempfile
 import gradio as gr
 from moviepy.editor import AudioFileClip, concatenate_audioclips
 system_prompt = '''
+    You are an news podcast generator. You have to create short conversations between Chen and Yun that gives an overview of the News given by the user.
     Please provide the script and output strictly in the following JSON format:
     {
       "title": "[string]",
       "content": {
+        "Chen_0: "[string]",
+        "Yun_0": "[string]",
         ...
       }
     }
     #Please note that the [string] you generate now must be in easy-and-understandable Chinese.
+    #Be concise. No less than five rounds of conversation.
 '''
 DESCRIPTION = '''
 }
 """
+rss_feed = 'https://www.yahoo.com/news/rss'
 apikey = os.environ.get("API_KEY")
 client = OpenAI(api_key=apikey, base_url="https://api.deepseek.com")
+# RSS feeds
# Compiled once at import time rather than on every call.
_URL_PATTERN = re.compile(
    r'^(?:http|ftp)s?://'  # scheme: http, https, ftp or ftps
    r'(?:(?:[A-Z0-9](?:[A-Z0-9-]{0,61}[A-Z0-9])?\.)+(?:[A-Z]{2,6}\.?|[A-Z0-9-]{2,}\.?)|'  # domain...
    r'localhost|'  # localhost...
    r'\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3})'  # ...or ip
    r'(?::\d+)?'  # optional port
    r'(?:/?|[/?]\S+)$', re.IGNORECASE)


def is_url(string):
    """Return True if *string* looks like an absolute URL.

    Accepted forms are an http/https/ftp/ftps scheme followed by a dotted
    domain name, ``localhost`` or a dotted-quad IPv4 address, with an
    optional port and an optional path or query. Matching is
    case-insensitive.

    Args:
        string: Candidate text to check.

    Returns:
        bool: True when the whole text matches the URL pattern; False
        otherwise, including when *string* is not a ``str`` (e.g. ``None``).
    """
    # Non-text input can never be a URL; answer False instead of letting the
    # regex engine raise TypeError.
    if not isinstance(string, str):
        return False
    return _URL_PATTERN.match(string) is not None
def random_news():
    """Pick a random headline from the configured RSS feed and run ``main`` on it.

    Reads the module-level ``rss_feed`` URL, parses it with ``feedparser``,
    collects the entry titles, prints them, and passes one randomly chosen
    title to ``main``.

    Returns:
        Whatever ``main`` returns. This function is registered as a Gradio
        click handler with an output component, so the result must be
        returned rather than discarded for anything to be displayed.

    Raises:
        ValueError: If ``rss_feed`` is not a valid URL, or the feed yields
            no entry with a title.
    """
    if not is_url(rss_feed):
        raise ValueError(f"{rss_feed} is not a valid RSS feed.")

    feed = feedparser.parse(rss_feed)
    # Entries are dict-like; skip any that carry no title instead of failing
    # with AttributeError on attribute access.
    news = [entry.get("title") for entry in feed.entries if entry.get("title")]
    print(news)

    # random.choice() on an empty list raises a bare IndexError; fail with a
    # message that names the feed instead.
    if not news:
        raise ValueError(f"No news entries found in RSS feed {rss_feed}.")

    # NOTE(review): main is also wired to the URL textbox; confirm that it
    # accepts a headline string as well as a URL.
    return main(random.choice(news))
 def validate_url(url):
     try:
         response = httpx.get(url, timeout=60.0)
     print("Exited Webpage Extraction")
     return validate_url(full_url)
 async def text_to_speech(text, voice, filename):
     communicate = edge_tts.Communicate(text, voice)
     await communicate.save(filename)
     for key, text in content.items():
         speaker = key.split('_')[0]  # Extract the speaker name
         index = key.split('_')[1]    # Extract the dialogue index
+        voice = "zh-TW-HsiaoYuNeural" if speaker == "Chen" else "zh-CN-YunyangNeural"
         # Create temporary file for each speaker's dialogue
         temp_file = tempfile.NamedTemporaryFile(suffix='.mp3', delete=False)
         input_box = gr.Textbox(label="网址", placeholder="请输入https开头的网址")
     with gr.Row():
         submit_btn = gr.Button("🚀 发送")  # Create a submit button
+        random_btn = gr.Button("🤙 随机")
         clear_btn = gr.ClearButton(output_box, value="🗑️ 清除") # Create a clear button
     gr.Examples(examples=Examples, inputs=input_box, outputs=output_box, fn=main, label="示例", cache_examples="lazy")
     # Set up the event listeners
     submit_btn.click(main, inputs=input_box, outputs=output_box)
+    random_btn.click(fn=random_news, outputs=output_box)
 #gr.close_all()