Spaces:

phate334
/

gguf-parser-web

Running

App Files Community

phate334 committed on Nov 2, 2024

Commit

a793e12

1 Parent(s): 7c11711

[modify] update main.py

Browse files

Files changed (4) hide show

README.md +1 -1
app/__init__.py +0 -0
app.py → app/main.py +20 -29
app/utils.py +15 -0

README.md CHANGED Viewed

@@ -5,7 +5,7 @@ colorFrom: green
 colorTo: indigo
 sdk: gradio
 sdk_version: 5.3.0
-app_file: app.py
 pinned: false
 license: mit
 short_description: This project is a GUI for the gpustack/gguf-parser-go

 colorTo: indigo
 sdk: gradio
 sdk_version: 5.3.0
+app_file: app/main.py
 pinned: false
 license: mit
 short_description: This project is a GUI for the gpustack/gguf-parser-go

app/__init__.py ADDED Viewed

File without changes

app.py → app/main.py RENAMED Viewed

@@ -8,15 +8,22 @@ import pandas as pd
 GGUF_PARSER_VERSION = os.getenv("GGUF_PARSER_VERSION", "v0.12.0")
 gguf_parser = Path("gguf-parser-linux-amd64")
 gguf_parser_url = f"https://github.com/gpustack/gguf-parser-go/releases/download/{GGUF_PARSER_VERSION}/{gguf_parser}"
-def process_url(url):
     try:
-        res = os.popen(f"./{gguf_parser} -url {url} --json").read()
         data = json.loads(res)
         architecture_df = pd.DataFrame([data["architecture"]])
         estimate_df = pd.DataFrame(
             [
                 {
@@ -32,47 +39,31 @@ def process_url(url):
             ]
         )
-        metadata_df = pd.DataFrame([data["metadata"]])
-        tokenizer_df = pd.DataFrame([data["tokenizer"]])
-        return architecture_df, estimate_df, metadata_df, tokenizer_df
     except Exception as e:
         return e
 if __name__ == "__main__":
     if not gguf_parser.exists():
-        os.system(f"wget {gguf_parser_url}")
-        os.system(f"chmod +x {gguf_parser}")
     with open("devices.json", "r", encoding="utf-8") as f:
         device_list = json.load(f)
-    with gr.Blocks(title="GGUF 分析器") as iface:
-        url_input = gr.Textbox(label="輸入 GGUF URL")
-        submit_btn = gr.Button("送出")
-        gr.Markdown("### 模型架構")
-        architecture_table = gr.DataFrame()
-        gr.Markdown("### 效能評估")
-        estimate_table = gr.DataFrame()
-        gr.Markdown("### 中繼資料")
-        metadata_table = gr.DataFrame()
-        gr.Markdown("### 分詞器")
-        tokenizer_table = gr.DataFrame()
         submit_btn.click(
             fn=process_url,
-            inputs=url_input,
             outputs=[
-                architecture_table,
-                estimate_table,
-                metadata_table,
-                tokenizer_table,
             ],
         )
     iface.launch()

 GGUF_PARSER_VERSION = os.getenv("GGUF_PARSER_VERSION", "v0.12.0")
 gguf_parser = Path("gguf-parser-linux-amd64")
 gguf_parser_url = f"https://github.com/gpustack/gguf-parser-go/releases/download/{GGUF_PARSER_VERSION}/{gguf_parser}"
+DEFAULT_URL = "https://huggingface.co/phate334/Llama-3.1-8B-Instruct-Q4_K_M-GGUF/resolve/main/llama-3.1-8b-instruct-q4_k_m.gguf"
+def process_url(url, context_length):
     try:
+        res = os.popen(
+            f"./{gguf_parser} --ctx-size={context_length} -url {url} --json"
+        ).read()
         data = json.loads(res)
+        metadata_df = pd.DataFrame([data["metadata"]])
         architecture_df = pd.DataFrame([data["architecture"]])
+        tokenizer_df = pd.DataFrame([data["tokenizer"]])
         estimate_df = pd.DataFrame(
             [
                 {
             ]
         )
+        return metadata_df, architecture_df, tokenizer_df, estimate_df
     except Exception as e:
         return e
 if __name__ == "__main__":
     if not gguf_parser.exists():
+        os.system(f"wget {gguf_parser_url}&&chmod +x {gguf_parser}")
     with open("devices.json", "r", encoding="utf-8") as f:
         device_list = json.load(f)
+    with gr.Blocks(title="GGUF Parser") as iface:
+        url_input = gr.Textbox(placeholder="Enter GGUF URL", value=DEFAULT_URL)
+        context_length = gr.Number(label="Context Length", value=8192)
+        submit_btn = gr.Button("Send")
         submit_btn.click(
             fn=process_url,
+            inputs=[url_input, context_length],
             outputs=[
+                gr.DataFrame(label="METADATA"),
+                gr.DataFrame(label="ARCHITECTURE"),
+                gr.DataFrame(label="TOKENIZER"),
+                gr.DataFrame(label="ESTIMATE"),
             ],
         )
     iface.launch()

app/utils.py ADDED Viewed

	@@ -0,0 +1,15 @@

def human_readable_size(size_in_bytes: int) -> str:
    """Convert a byte count into a human-readable size string.

    The value is divided by 1024 until its magnitude drops below 1024 and
    is then rendered with two decimals followed by the matching unit
    (``B``, ``KB``, ``MB``, ``GB``, ``TB``, ``PB``). Anything still at or
    above 1024 PB is reported in ``EB``.

    Args:
        size_in_bytes: The size in bytes. Negative values are scaled by
            magnitude and keep their sign.

    Returns:
        The formatted size, e.g. ``"1.50KB"``.
    """
    # Work on a local copy so the int-annotated parameter is not rebound
    # to a float as the value is scaled down.
    size = size_in_bytes
    for unit in ("B", "KB", "MB", "GB", "TB", "PB"):
        # Compare on magnitude: a plain `size < 1024` is always true for
        # negative inputs, which would leave them unscaled in bytes.
        if abs(size) < 1024:
            return f"{size:.2f}{unit}"
        size /= 1024
    return f"{size:.2f}EB"
def abbreviate_number(number: int) -> str:
    """Abbreviate a large number with a K / M / B suffix.

    The largest threshold (1e9 -> ``B``, 1e6 -> ``M``, 1e3 -> ``K``) that
    the number's magnitude reaches is used as the divisor, and the result
    is rendered with two decimals. Numbers whose magnitude is below 1000
    are returned unchanged via ``str``.

    Args:
        number: The value to abbreviate. Negative values are abbreviated
            by magnitude and keep their sign.

    Returns:
        The abbreviated string, e.g. ``"8.03B"`` or ``"999"``.
    """
    # Compare on magnitude: `number >= threshold` is never true for
    # negative inputs, which would leave them unabbreviated.
    magnitude = abs(number)
    # Thresholds are ordered largest first so the first match wins.
    for unit, threshold in (("B", 1e9), ("M", 1e6), ("K", 1e3)):
        if magnitude >= threshold:
            return f"{number / threshold:.2f}{unit}"
    return str(number)