Spaces:

RanaZaeem12
/

file_type_convertor

Sleeping

App Files Community

RanaZaeem12 committed on May 6

Commit

82c991c

verified ·

1 Parent(s): 6392c48

Update app.py

Browse files

Files changed (1) hide show

app.py +148 -142

app.py CHANGED Viewed

@@ -7,146 +7,153 @@ from reportlab.pdfgen import canvas
 from docx import Document
 from pptx import Presentation
 import fitz  # PyMuPDF
-def convert_file(file_obj, output_format):
-    name = file_obj.name
-    ext = name.split(".")[-1].lower()
-    file_bytes = file_obj.read()
-    def to_pdf():
-        buf = BytesIO()
-        if ext in ["png", "jpg", "jpeg"]:
-            img = Image.open(BytesIO(file_bytes)).convert("RGB")
-            img.save(buf, format="PDF")
-        elif ext == "docx":
-            doc = Document(BytesIO(file_bytes))
-            c = canvas.Canvas(buf)
-            for i, para in enumerate(doc.paragraphs):
-                c.drawString(10, 800 - 15 * i, para.text)
-            c.save()
-        elif ext == "pptx":
-            ppt = Presentation(BytesIO(file_bytes))
-            c = canvas.Canvas(buf)
-            y = 800
-            for slide in ppt.slides:
-                for shape in slide.shapes:
-                    if hasattr(shape, "text"):
-                        c.drawString(10, y, shape.text)
-                        y -= 15
-            c.save()
-        elif ext == "xlsx":
-            df = pd.read_excel(BytesIO(file_bytes))
-            c = canvas.Canvas(buf)
-            for i, row in df.iterrows():
-                c.drawString(10, 800 - i * 15, str(row.to_list()))
-            c.save()
-        elif ext == "pdf":
-            return file_bytes, "converted.pdf"
-        return buf.getvalue(), "converted.pdf"
-    def to_word():
-        doc = Document()
-        if ext in ["png", "jpg", "jpeg"]:
-            image = Image.open(BytesIO(file_bytes))
-            image.save("temp_img.jpg")
-            doc.add_picture("temp_img.jpg")
-        elif ext == "pdf":
-            pdf = fitz.open(stream=file_bytes, filetype="pdf")
-            for page in pdf:
-                doc.add_paragraph(page.get_text())
-        elif ext == "pptx":
-            ppt = Presentation(BytesIO(file_bytes))
-            for slide in ppt.slides:
-                for shape in slide.shapes:
-                    if hasattr(shape, "text"):
-                        doc.add_paragraph(shape.text)
-        elif ext == "xlsx":
-            df = pd.read_excel(BytesIO(file_bytes))
-            for _, row in df.iterrows():
-                doc.add_paragraph(" | ".join(map(str, row)))
-        elif ext == "docx":
-            return file_bytes, name
-        buf = BytesIO()
-        doc.save(buf)
-        return buf.getvalue(), "converted.docx"
-    def to_excel():
-        if ext == "xlsx":
-            return file_bytes, name
-        df = pd.DataFrame()
-        if ext in ["png", "jpg", "jpeg"]:
-            df = pd.DataFrame([["Image file", name]])
-        elif ext == "pdf":
-            pdf = fitz.open(stream=file_bytes, filetype="pdf")
-            df = pd.DataFrame([page.get_text() for page in pdf], columns=["Text"])
-        elif ext == "docx":
-            doc = Document(BytesIO(file_bytes))
-            df = pd.DataFrame([[para.text] for para in doc.paragraphs], columns=["Text"])
-        elif ext == "pptx":
-            ppt = Presentation(BytesIO(file_bytes))
-            texts = []
-            for slide in ppt.slides:
-                text = "\n".join([shape.text for shape in slide.shapes if hasattr(shape, "text")])
-                texts.append([text])
-            df = pd.DataFrame(texts, columns=["Slide Text"])
-        buf = BytesIO()
-        df.to_excel(buf, index=False)
-        return buf.getvalue(), "converted.xlsx"
-    def to_ppt():
-        prs = Presentation()
-        slide_layout = prs.slide_layouts[1]
-        if ext == "pdf":
-            pdf = fitz.open(stream=file_bytes, filetype="pdf")
-            for page in pdf:
-                slide = prs.slides.add_slide(slide_layout)
-                slide.shapes.title.text = "Page"
-                slide.placeholders[1].text = page.get_text()
-        elif ext == "docx":
-            doc = Document(BytesIO(file_bytes))
-            for para in doc.paragraphs:
-                slide = prs.slides.add_slide(slide_layout)
-                slide.shapes.title.text = "Paragraph"
-                slide.placeholders[1].text = para.text
-        elif ext == "xlsx":
-            df = pd.read_excel(BytesIO(file_bytes))
-            for i, row in df.iterrows():
                 slide = prs.slides.add_slide(slide_layout)
-                slide.shapes.title.text = f"Row {i}"
-                slide.placeholders[1].text = " | ".join(map(str, row))
-        elif ext in ["png", "jpg", "jpeg"]:
-            slide = prs.slides.add_slide(slide_layout)
-            slide.shapes.title.text = "Image"
-            img_path = f"img_{name}"
-            Image.open(BytesIO(file_bytes)).save(img_path)
-            slide.shapes.add_picture(img_path, 100, 100, width=400, height=300)
-        buf = BytesIO()
-        prs.save(buf)
-        return buf.getvalue(), "converted.pptx"
-    def to_image():
-        if ext in ["png", "jpg", "jpeg"]:
-            return file_bytes, "converted.png"
-        elif ext == "pdf":
-            images = convert_from_bytes(file_bytes)
             buf = BytesIO()
-            images[0].save(buf, format="PNG")
-            return buf.getvalue(), "converted.png"
-        return None, None
-    converters = {
-        "PDF": to_pdf,
-        "Word": to_word,
-        "Excel": to_excel,
-        "PowerPoint": to_ppt,
-        "HD Image": to_image
-    }
-    try:
-        data, filename = converters[output_format]()
-        return filename, data
-    except Exception as e:
-        return "Error.txt", str(e).encode()
 with gr.Blocks(title="Universal File Converter", theme=gr.themes.Soft()) as demo:
     gr.Markdown(
@@ -155,7 +162,6 @@ with gr.Blocks(title="Universal File Converter", theme=gr.themes.Soft()) as demo
         Convert your **images**, **documents**, and **presentations** to 📄 PDF, 📝 Word, 📊 Excel, 📽️ PowerPoint, or 🖼️ HD Image!
         > Supported formats: `.jpg`, `.png`, `.pdf`, `.docx`, `.pptx`, `.xlsx`
         ---
         """
     )
@@ -163,9 +169,9 @@ with gr.Blocks(title="Universal File Converter", theme=gr.themes.Soft()) as demo
     with gr.Row():
         with gr.Column(scale=1):
             file_input = gr.File(
-                label="📤 Upload File",
                 file_types=[".png", ".jpg", ".jpeg", ".pdf", ".docx", ".pptx", ".xlsx"],
-                file_count="single"
             )
             output_format = gr.Radio(
                 ["PDF", "Word", "Excel", "PowerPoint", "HD Image"],
@@ -175,9 +181,9 @@ with gr.Blocks(title="Universal File Converter", theme=gr.themes.Soft()) as demo
             convert_btn = gr.Button("🚀 Convert Now")
         with gr.Column(scale=1):
-            output_file = gr.File(label="📥 Download Converted File")
-    convert_btn.click(fn=convert_file, inputs=[file_input, output_format], outputs=output_file)
     gr.Markdown("---")
     gr.Markdown("Made with ❤️ using [Gradio](https://gradio.app/)")

 from docx import Document
 from pptx import Presentation
 import fitz  # PyMuPDF
+import os
+def convert_file(files, output_format):
+    results = []
+    for file_obj in files:
+        name = file_obj.name
+        ext = name.split(".")[-1].lower()
+        file_bytes = file_obj.read()
+        def to_pdf():
+            buf = BytesIO()
+            if ext in ["png", "jpg", "jpeg"]:
+                img = Image.open(BytesIO(file_bytes)).convert("RGB")
+                img.save(buf, format="PDF")
+            elif ext == "docx":
+                doc = Document(BytesIO(file_bytes))
+                c = canvas.Canvas(buf)
+                for i, para in enumerate(doc.paragraphs):
+                    c.drawString(10, 800 - 15 * i, para.text)
+                c.save()
+            elif ext == "pptx":
+                ppt = Presentation(BytesIO(file_bytes))
+                c = canvas.Canvas(buf)
+                y = 800
+                for slide in ppt.slides:
+                    for shape in slide.shapes:
+                        if hasattr(shape, "text"):
+                            c.drawString(10, y, shape.text)
+                            y -= 15
+                c.save()
+            elif ext == "xlsx":
+                df = pd.read_excel(BytesIO(file_bytes))
+                c = canvas.Canvas(buf)
+                for i, row in df.iterrows():
+                    c.drawString(10, 800 - i * 15, str(row.to_list()))
+                c.save()
+            elif ext == "pdf":
+                return file_bytes, "converted.pdf"
+            return buf.getvalue(), "converted.pdf"
+        def to_word():
+            doc = Document()
+            if ext in ["png", "jpg", "jpeg"]:
+                image = Image.open(BytesIO(file_bytes))
+                image.save("temp_img.jpg")
+                doc.add_picture("temp_img.jpg")
+                os.remove("temp_img.jpg")
+            elif ext == "pdf":
+                pdf = fitz.open(stream=file_bytes, filetype="pdf")
+                for page in pdf:
+                    doc.add_paragraph(page.get_text())
+            elif ext == "pptx":
+                ppt = Presentation(BytesIO(file_bytes))
+                for slide in ppt.slides:
+                    for shape in slide.shapes:
+                        if hasattr(shape, "text"):
+                            doc.add_paragraph(shape.text)
+            elif ext == "xlsx":
+                df = pd.read_excel(BytesIO(file_bytes))
+                for _, row in df.iterrows():
+                    doc.add_paragraph(" | ".join(map(str, row)))
+            elif ext == "docx":
+                return file_bytes, name
+            buf = BytesIO()
+            doc.save(buf)
+            return buf.getvalue(), "converted.docx"
+        def to_excel():
+            if ext == "xlsx":
+                return file_bytes, name
+            df = pd.DataFrame()
+            if ext in ["png", "jpg", "jpeg"]:
+                df = pd.DataFrame([["Image file", name]])
+            elif ext == "pdf":
+                pdf = fitz.open(stream=file_bytes, filetype="pdf")
+                df = pd.DataFrame([page.get_text() for page in pdf], columns=["Text"])
+            elif ext == "docx":
+                doc = Document(BytesIO(file_bytes))
+                df = pd.DataFrame([[para.text] for para in doc.paragraphs], columns=["Text"])
+            elif ext == "pptx":
+                ppt = Presentation(BytesIO(file_bytes))
+                texts = []
+                for slide in ppt.slides:
+                    text = "\n".join([shape.text for shape in slide.shapes if hasattr(shape, "text")])
+                    texts.append([text])
+                df = pd.DataFrame(texts, columns=["Slide Text"])
+            buf = BytesIO()
+            df.to_excel(buf, index=False)
+            return buf.getvalue(), "converted.xlsx"
+        def to_ppt():
+            prs = Presentation()
+            slide_layout = prs.slide_layouts[1]
+            if ext == "pdf":
+                pdf = fitz.open(stream=file_bytes, filetype="pdf")
+                for page in pdf:
+                    slide = prs.slides.add_slide(slide_layout)
+                    slide.shapes.title.text = "Page"
+                    slide.placeholders[1].text = page.get_text()
+            elif ext == "docx":
+                doc = Document(BytesIO(file_bytes))
+                for para in doc.paragraphs:
+                    slide = prs.slides.add_slide(slide_layout)
+                    slide.shapes.title.text = "Paragraph"
+                    slide.placeholders[1].text = para.text
+            elif ext == "xlsx":
+                df = pd.read_excel(BytesIO(file_bytes))
+                for i, row in df.iterrows():
+                    slide = prs.slides.add_slide(slide_layout)
+                    slide.shapes.title.text = f"Row {i}"
+                    slide.placeholders[1].text = " | ".join(map(str, row))
+            elif ext in ["png", "jpg", "jpeg"]:
                 slide = prs.slides.add_slide(slide_layout)
+                slide.shapes.title.text = "Image"
+                img_path = f"img_{name}"
+                Image.open(BytesIO(file_bytes)).save(img_path)
+                slide.shapes.add_picture(img_path, 100, 100, width=400, height=300)
+                os.remove(img_path)
             buf = BytesIO()
+            prs.save(buf)
+            return buf.getvalue(), "converted.pptx"
+        def to_image():
+            if ext in ["png", "jpg", "jpeg"]:
+                return file_bytes, "converted.png"
+            elif ext == "pdf":
+                images = convert_from_bytes(file_bytes)
+                buf = BytesIO()
+                images[0].save(buf, format="PNG")
+                return buf.getvalue(), "converted.png"
+            return None, None
+        converters = {
+            "PDF": to_pdf,
+            "Word": to_word,
+            "Excel": to_excel,
+            "PowerPoint": to_ppt,
+            "HD Image": to_image
+        }
+        try:
+            data, filename = converters[output_format]()
+            results.append((filename, data))
+        except Exception as e:
+            results.append(("Error.txt", str(e).encode()))
+    return [(fname, BytesIO(content)) for fname, content in results]
 with gr.Blocks(title="Universal File Converter", theme=gr.themes.Soft()) as demo:
     gr.Markdown(
         Convert your **images**, **documents**, and **presentations** to 📄 PDF, 📝 Word, 📊 Excel, 📽️ PowerPoint, or 🖼️ HD Image!
         > Supported formats: `.jpg`, `.png`, `.pdf`, `.docx`, `.pptx`, `.xlsx`
         ---
         """
     )
     with gr.Row():
         with gr.Column(scale=1):
             file_input = gr.File(
+                label="📤 Upload Files",
                 file_types=[".png", ".jpg", ".jpeg", ".pdf", ".docx", ".pptx", ".xlsx"],
+                file_count="multiple"
             )
             output_format = gr.Radio(
                 ["PDF", "Word", "Excel", "PowerPoint", "HD Image"],
             convert_btn = gr.Button("🚀 Convert Now")
         with gr.Column(scale=1):
+            output_files = gr.Files(label="📥 Download Converted Files")
+    convert_btn.click(fn=convert_file, inputs=[file_input, output_format], outputs=output_files)
     gr.Markdown("---")
     gr.Markdown("Made with ❤️ using [Gradio](https://gradio.app/)")