Datasets-Convertor

Sleeping

App Files Community

openfree committed on Feb 17

Commit

1fd0c30

verified ·

1 Parent(s): 2bf1e25

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -20

app.py CHANGED Viewed

@@ -4,26 +4,33 @@ import requests
 from io import BytesIO
 def convert_file(input_file, file_url, conversion_type):
-    # Use the file provided by upload; if not, use the URL input.
     if input_file is None and (file_url is None or file_url.strip() == ""):
-        raise ValueError("Please provide a file or a URL.")
-    # Read the file into a DataFrame based on conversion type.
-    if input_file is not None:
-        file_path = input_file.name
-        if conversion_type == "CSV to Parquet":
-            df = pd.read_csv(file_path)
-        else:  # Parquet to CSV
-            df = pd.read_parquet(file_path)
-    else:
         response = requests.get(file_url)
         response.raise_for_status()
         if conversion_type == "CSV to Parquet":
             df = pd.read_csv(BytesIO(response.content))
-        else:
             df = pd.read_parquet(BytesIO(response.content))
-    # Save the converted file.
     if conversion_type == "CSV to Parquet":
         output_file = "output.parquet"
         df.to_parquet(output_file, index=False)
@@ -31,7 +38,7 @@ def convert_file(input_file, file_url, conversion_type):
         output_file = "output.csv"
         df.to_csv(output_file, index=False)
-    # Generate a preview of the top 10 rows.
     preview = df.head(10).to_string(index=False)
     return output_file, preview
@@ -39,16 +46,16 @@ def convert_file(input_file, file_url, conversion_type):
 demo = gr.Interface(
     fn=convert_file,
     inputs=[
-        gr.File(label="Input File (CSV or Parquet)"),
-        gr.Textbox(label="Input File URL (optional)", placeholder="Enter a URL to a CSV or Parquet file"),
-        gr.Radio(choices=["CSV to Parquet", "Parquet to CSV"], label="Conversion Type")
     ],
     outputs=[
-        gr.File(label="Converted File"),
-        gr.Textbox(label="Preview (Top 10 Rows)")
     ],
-    title="CSV <-> Parquet Converter",
-    description="Choose a conversion type, upload a file or enter a URL, and convert between CSV and Parquet formats. A preview of the top 10 rows will be shown."
 )
 if __name__ == "__main__":

 from io import BytesIO
 def convert_file(input_file, file_url, conversion_type):
+    # 파일 업로드와 URL 입력 둘 다 없으면 에러 발생
     if input_file is None and (file_url is None or file_url.strip() == ""):
+        raise ValueError("파일 업로드 또는 URL을 제공하세요.")
+    df = None
+    # 업로드된 파일이 없으면 URL에서 읽기
+    if input_file is None:
+        file_url = file_url.strip()
+        # URL 스킴이 없으면 기본적으로 "https://"를 추가
+        if not file_url.lower().startswith(("http://", "https://")):
+            file_url = "https://" + file_url
         response = requests.get(file_url)
         response.raise_for_status()
         if conversion_type == "CSV to Parquet":
             df = pd.read_csv(BytesIO(response.content))
+        else:  # Parquet to CSV
             df = pd.read_parquet(BytesIO(response.content))
+    else:
+        # 파일 업로드가 있는 경우
+        file_path = input_file.name
+        if conversion_type == "CSV to Parquet":
+            df = pd.read_csv(file_path)
+        else:
+            df = pd.read_parquet(file_path)
+    # 변환 실행: CSV to Parquet 혹은 Parquet to CSV
     if conversion_type == "CSV to Parquet":
         output_file = "output.parquet"
         df.to_parquet(output_file, index=False)
         output_file = "output.csv"
         df.to_csv(output_file, index=False)
+    # 상위 10줄 미리보기 생성
     preview = df.head(10).to_string(index=False)
     return output_file, preview
 demo = gr.Interface(
     fn=convert_file,
     inputs=[
+        gr.File(label="입력 파일 (CSV 또는 Parquet)"),
+        gr.Textbox(label="입력 파일 URL (선택)", placeholder="CSV 또는 Parquet 파일의 URL을 입력하세요."),
+        gr.Radio(choices=["CSV to Parquet", "Parquet to CSV"], label="변환 유형")
     ],
     outputs=[
+        gr.File(label="변환된 파일"),
+        gr.Textbox(label="미리보기 (상위 10줄)")
     ],
+    title="CSV <-> Parquet 변환기",
+    description="변환 유형을 선택하고, 파일을 업로드하거나 URL을 입력하여 CSV와 Parquet 파일을 상호 변환합니다. 상위 10줄 미리보기도 제공합니다."
 )
 if __name__ == "__main__":