openfree commited on
Commit
1fd0c30
Β·
verified Β·
1 Parent(s): 2bf1e25

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +27 -20
app.py CHANGED
@@ -4,26 +4,33 @@ import requests
4
  from io import BytesIO
5
 
6
  def convert_file(input_file, file_url, conversion_type):
7
- # Use the file provided by upload; if not, use the URL input.
8
  if input_file is None and (file_url is None or file_url.strip() == ""):
9
- raise ValueError("Please provide a file or a URL.")
10
 
11
- # Read the file into a DataFrame based on conversion type.
12
- if input_file is not None:
13
- file_path = input_file.name
14
- if conversion_type == "CSV to Parquet":
15
- df = pd.read_csv(file_path)
16
- else: # Parquet to CSV
17
- df = pd.read_parquet(file_path)
18
- else:
19
  response = requests.get(file_url)
20
  response.raise_for_status()
21
  if conversion_type == "CSV to Parquet":
22
  df = pd.read_csv(BytesIO(response.content))
23
- else:
24
  df = pd.read_parquet(BytesIO(response.content))
 
 
 
 
 
 
 
25
 
26
- # Save the converted file.
27
  if conversion_type == "CSV to Parquet":
28
  output_file = "output.parquet"
29
  df.to_parquet(output_file, index=False)
@@ -31,7 +38,7 @@ def convert_file(input_file, file_url, conversion_type):
31
  output_file = "output.csv"
32
  df.to_csv(output_file, index=False)
33
 
34
- # Generate a preview of the top 10 rows.
35
  preview = df.head(10).to_string(index=False)
36
 
37
  return output_file, preview
@@ -39,16 +46,16 @@ def convert_file(input_file, file_url, conversion_type):
39
  demo = gr.Interface(
40
  fn=convert_file,
41
  inputs=[
42
- gr.File(label="Input File (CSV or Parquet)"),
43
- gr.Textbox(label="Input File URL (optional)", placeholder="Enter a URL to a CSV or Parquet file"),
44
- gr.Radio(choices=["CSV to Parquet", "Parquet to CSV"], label="Conversion Type")
45
  ],
46
  outputs=[
47
- gr.File(label="Converted File"),
48
- gr.Textbox(label="Preview (Top 10 Rows)")
49
  ],
50
- title="CSV <-> Parquet Converter",
51
- description="Choose a conversion type, upload a file or enter a URL, and convert between CSV and Parquet formats. A preview of the top 10 rows will be shown."
52
  )
53
 
54
  if __name__ == "__main__":
 
4
  from io import BytesIO
5
 
6
  def convert_file(input_file, file_url, conversion_type):
7
+ # 파일 μ—…λ‘œλ“œμ™€ URL μž…λ ₯ λ‘˜ λ‹€ μ—†μœΌλ©΄ μ—λŸ¬ λ°œμƒ
8
  if input_file is None and (file_url is None or file_url.strip() == ""):
9
+ raise ValueError("파일 μ—…λ‘œλ“œ λ˜λŠ” URL을 μ œκ³΅ν•˜μ„Έμš”.")
10
 
11
+ df = None
12
+
13
+ # μ—…λ‘œλ“œλœ 파일이 μ—†μœΌλ©΄ URLμ—μ„œ 읽기
14
+ if input_file is None:
15
+ file_url = file_url.strip()
16
+ # URL μŠ€ν‚΄μ΄ μ—†μœΌλ©΄ 기본적으둜 "https://"λ₯Ό μΆ”κ°€
17
+ if not file_url.lower().startswith(("http://", "https://")):
18
+ file_url = "https://" + file_url
19
  response = requests.get(file_url)
20
  response.raise_for_status()
21
  if conversion_type == "CSV to Parquet":
22
  df = pd.read_csv(BytesIO(response.content))
23
+ else: # Parquet to CSV
24
  df = pd.read_parquet(BytesIO(response.content))
25
+ else:
26
+ # 파일 μ—…λ‘œλ“œκ°€ μžˆλŠ” 경우
27
+ file_path = input_file.name
28
+ if conversion_type == "CSV to Parquet":
29
+ df = pd.read_csv(file_path)
30
+ else:
31
+ df = pd.read_parquet(file_path)
32
 
33
+ # λ³€ν™˜ μ‹€ν–‰: CSV to Parquet ν˜Ήμ€ Parquet to CSV
34
  if conversion_type == "CSV to Parquet":
35
  output_file = "output.parquet"
36
  df.to_parquet(output_file, index=False)
 
38
  output_file = "output.csv"
39
  df.to_csv(output_file, index=False)
40
 
41
+ # μƒμœ„ 10쀄 미리보기 생성
42
  preview = df.head(10).to_string(index=False)
43
 
44
  return output_file, preview
 
46
  demo = gr.Interface(
47
  fn=convert_file,
48
  inputs=[
49
+ gr.File(label="μž…λ ₯ 파일 (CSV λ˜λŠ” Parquet)"),
50
+ gr.Textbox(label="μž…λ ₯ 파일 URL (선택)", placeholder="CSV λ˜λŠ” Parquet 파일의 URL을 μž…λ ₯ν•˜μ„Έμš”."),
51
+ gr.Radio(choices=["CSV to Parquet", "Parquet to CSV"], label="λ³€ν™˜ μœ ν˜•")
52
  ],
53
  outputs=[
54
+ gr.File(label="λ³€ν™˜λœ 파일"),
55
+ gr.Textbox(label="미리보기 (μƒμœ„ 10쀄)")
56
  ],
57
+ title="CSV <-> Parquet λ³€ν™˜κΈ°",
58
+ description="λ³€ν™˜ μœ ν˜•μ„ μ„ νƒν•˜κ³ , νŒŒμΌμ„ μ—…λ‘œλ“œν•˜κ±°λ‚˜ URL을 μž…λ ₯ν•˜μ—¬ CSV와 Parquet νŒŒμΌμ„ μƒν˜Έ λ³€ν™˜ν•©λ‹ˆλ‹€. μƒμœ„ 10쀄 미리보기도 μ œκ³΅ν•©λ‹ˆλ‹€."
59
  )
60
 
61
  if __name__ == "__main__":