|
import os
import shutil
import tempfile
from io import BytesIO

import gradio as gr
import pandas as pd
|
|
|
def convert_file(input_file, conversion_type):
    """Convert an uploaded CSV file to Parquet, or a Parquet file to CSV.

    Args:
        input_file: The uploaded file. Either a filesystem path (``str`` or
            ``os.PathLike``) or an object exposing the path as ``.name``
            (optionally with a ``read()`` method returning the raw bytes when
            no file exists at that path).
        conversion_type: ``"CSV to Parquet"`` or ``"Parquet to CSV"``.

    Returns:
        A ``(output_path, info_message)`` tuple. ``output_path`` points to the
        converted file inside a freshly created temporary directory;
        ``info_message`` names the input file, the target format and shows a
        preview of the first 10 rows.

    Raises:
        ValueError: If no file was supplied, the conversion type is unknown,
            or the file extension does not match the selected conversion.
    """
    if input_file is None:
        raise ValueError("Please upload a file.")

    # Maps each conversion to:
    # (required extension, label used in the error message,
    #  output extension, output format label).
    conversions = {
        "CSV to Parquet": ("csv", "CSV", "parquet", "Parquet"),
        "Parquet to CSV": ("parquet", "Parquet", "csv", "CSV"),
    }
    try:
        source_ext, source_label, target_ext, converted_format = conversions[
            conversion_type
        ]
    except (KeyError, TypeError):
        # TypeError covers unhashable values; both mean "not a valid choice".
        raise ValueError("Invalid conversion type selected.") from None

    # The upload may arrive as a plain path or as a file wrapper with `.name`.
    if isinstance(input_file, (str, os.PathLike)):
        source_path = os.fspath(input_file)
    else:
        source_path = input_file.name

    # Report only the file name, not the server-side directory it lives in.
    file_name = os.path.basename(source_path)
    # splitext (unlike split('.')[-1]) does not mistake an extension-less
    # file called "csv" for a CSV file.
    file_extension = os.path.splitext(file_name)[1].lower().lstrip(".")
    if file_extension != source_ext:
        raise ValueError(
            f"For {conversion_type} conversion, please upload a {source_label} file."
        )

    # Validation is done; only now touch the file contents. Prefer reading
    # from disk and fall back to the object's bytes when no file backs it.
    source = source_path
    if not os.path.isfile(source_path) and hasattr(input_file, "read"):
        source = BytesIO(input_file.read())

    df = pd.read_csv(source) if source_ext == "csv" else pd.read_parquet(source)

    # A private directory per call keeps concurrent conversions from
    # overwriting each other's "output.*" file.
    output_dir = tempfile.mkdtemp(prefix="convert_")
    output_file = os.path.join(output_dir, f"output.{target_ext}")
    try:
        if target_ext == "parquet":
            df.to_parquet(output_file, index=False)
        else:
            df.to_csv(output_file, index=False)
    except Exception:
        # Do not leave a half-written result behind when the write fails.
        shutil.rmtree(output_dir, ignore_errors=True)
        raise

    preview = df.head(10).to_string(index=False)
    info_message = (
        f"Input file: {file_name}\n"
        f"Converted file format: {converted_format}\n\n"
        f"Preview (Top 10 Rows):\n{preview}"
    )
    return output_file, info_message
|
|
|
# Gradio UI: one file upload plus a conversion-direction selector in, the
# converted file plus a text preview out.
demo = gr.Interface(
    fn=convert_file,
    inputs=[
        # Limit the picker to the two formats convert_file accepts.
        gr.File(
            label="Upload CSV or Parquet File",
            file_types=[".csv", ".parquet"],
        ),
        # Preselect a direction: with nothing selected the callback receives
        # None and fails with "Invalid conversion type selected."
        gr.Radio(
            choices=["CSV to Parquet", "Parquet to CSV"],
            value="CSV to Parquet",
            label="Conversion Type",
        ),
    ],
    outputs=[
        gr.File(label="Converted File"),
        gr.Textbox(label="Preview (Top 10 Rows)", lines=15),
    ],
    title="CSV <-> Parquet Converter",
    description=(
        "Upload a CSV or Parquet file and select the conversion type. "
        "The app converts the file to the opposite format and displays a preview of the top 10 rows."
    ),
)


if __name__ == "__main__":
    # Launch the app only when executed as a script, not when imported.
    demo.launch()
|
|