admin committed · Commit 0a5fc93 · 1 Parent(s): af319cd · 2 en
app.py CHANGED
@@ -11,7 +11,7 @@ def infer(input_file: str):
             return output_file, pd.DataFrame(data_list)
 
     except Exception as e:
-        return None, pd.DataFrame([{"
+        return None, pd.DataFrame([{"Please upload a standard data file": f"{e}"}])
 
 
 if __name__ == "__main__":
@@ -26,21 +26,21 @@ if __name__ == "__main__":
                     f"{types[0]} → {types[1]}",
                     f"{types[0]} ← {types[1]}",
                 ],
-                label="
+                label="Mode",
                 value=f"{types[0]} → {types[1]}",
             )
             input_file = gr.components.File(
                 type="filepath",
-                label="
+                label="Upload input file",
                 file_types=[f".{types[0]}", f".{types[1]}"],
             )
-            convert_btn = gr.Button("
+            convert_btn = gr.Button("Convert")
 
         with gr.Column():
             output_file = gr.components.File(
-                type="filepath", label="
+                type="filepath", label="Download output file"
             )
-            data_viewer = gr.Dataframe(label="
+            data_viewer = gr.Dataframe(label="Data viewer")
 
     option.change(change_mode, inputs=option)
     tab.select(change_mode, inputs=option)
@@ -50,7 +50,7 @@ if __name__ == "__main__":
 
     gr.Markdown(
         """
-        ## 
+        ## Supported JSON format
         ```
         [
             {
@@ -66,13 +66,13 @@ if __name__ == "__main__":
             ...
         ]
         ```
-        ## 
+        ## Supported jsonl format
        ```
        {"key1": "val11", "key2": "val12", ...}
        {"key1": "val21", "key2": "val22", ...}
        ...
        ```
-        ## 
+        ## Supported CSV format
        ```
        key1, key2, ...
        val11, val12, ...
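The new `except` branch in `infer` settles on a small convention for the error path: return no output file and a one-row pandas DataFrame whose single column header carries the user-facing message, so the same `Dataframe` viewer that normally shows the converted data displays the error instead. Below is a minimal sketch of that pattern using only pandas; `error_result` is a hypothetical helper for illustration, not part of app.py.

```python
import pandas as pd

# User-facing label added in this commit (column header of the error table).
ERROR_LABEL = "Please upload a standard data file"

def error_result(e: Exception):
    # Mirror the convention from infer's except branch:
    # no output file, plus a one-row DataFrame keyed by the message.
    return None, pd.DataFrame([{ERROR_LABEL: f"{e}"}])

output_file, table = error_result(ValueError("not a .jsonl/.csv file"))
print(output_file)  # None -> the file output component stays empty
print(table)        # the data viewer shows the message as the column name,
                    # with the exception text as the single cell
```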
utils.py CHANGED
@@ -4,9 +4,7 @@ import json
 import shutil
 
 TMP_DIR = "./__pycache__"
-
 TAB_CONFIG = ["jsonl ⇆ csv", "json ⇆ csv", "json ⇆ jsonl"]
-
 MODE = {"from": "jsonl", "to": "csv"}
 
 
@@ -29,7 +27,6 @@ def encoder_jsonl(file_path: str):
     data_list = []
     with open(file_path, "r", encoding="utf-8") as file:
         for line in file:
-            # 加载每一行的 JSON 数据 (load each line's JSON data)
             json_data = json.loads(line.strip())
             data_list.append(json_data)
 
@@ -49,7 +46,6 @@ def encoder_csv(file_path: str):
 def decoder_json(data_list: list, file_path=f"{TMP_DIR}/output.json"):
     if data_list:
         with open(file_path, "w", encoding="utf-8") as file:
-            # 将整个列表转换成 JSON 格式并写入文件 (convert the whole list to JSON and write it to the file)
             json.dump(data_list, file, ensure_ascii=False, indent=4)
 
     return file_path
@@ -57,13 +53,10 @@ def decoder_json(data_list: list, file_path=f"{TMP_DIR}/output.json"):
 
 def decoder_csv(data_list: list, file_path=f"{TMP_DIR}/output.csv"):
     if data_list:
-        # 提取第一个字典的键作为表头 (use the first dict's keys as the header row)
         header = list(data_list[0].keys())
         with open(file_path, "w", newline="", encoding="utf-8") as file:
             csv_writer = csv.writer(file)
-            # 写入表头 (write the header row)
             csv_writer.writerow(header)
-            # 逐项写入字典的值 (write each dict's values, row by row)
             for item in data_list:
                 csv_writer.writerow([item[key] for key in header])
 
@@ -74,7 +67,6 @@ def decoder_jsonl(data_list: list, file_path=f"{TMP_DIR}/output.jsonl"):
     if data_list:
         with open(file_path, "w", encoding="utf-8") as file:
             for data in data_list:
-                # 将每个 JSON 对象转换成字符串并写入文件，每行一个对象 (convert each JSON object to a string and write one per line)
                 json_line = json.dumps(data, ensure_ascii=False)
                 file.write(json_line + "\n")
 
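Taken together, the helpers touched above form a simple pipeline: an `encoder_*` function reads an uploaded file into a list of dicts, and a `decoder_*` function writes that list back out in the target format under `TMP_DIR`. The sketch below shows the jsonl → csv direction; the sample file name is made up, and it assumes `encoder_jsonl` returns the parsed list and `decoder_csv` returns its output path (both returns fall outside the hunks shown, so they are assumptions).

```python
import os
from utils import TMP_DIR, encoder_jsonl, decoder_csv

# Default output paths live under TMP_DIR ("./__pycache__"),
# so make sure it exists before writing anything there.
os.makedirs(TMP_DIR, exist_ok=True)

# Hypothetical sample input in the jsonl layout documented in app.py.
sample_path = os.path.join(TMP_DIR, "sample.jsonl")
with open(sample_path, "w", encoding="utf-8") as f:
    f.write('{"key1": "val11", "key2": "val12"}\n')
    f.write('{"key1": "val21", "key2": "val22"}\n')

data_list = encoder_jsonl(sample_path)  # assumed to return [{"key1": ...}, ...]
csv_path = decoder_csv(data_list)       # assumed to return f"{TMP_DIR}/output.csv"

with open(csv_path, encoding="utf-8") as f:
    print(f.read())
# Expected:
# key1,key2
# val11,val12
# val21,val22
```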
|