Spaces:

ggml-org
/

gguf-my-repo

Running on A10G

reach-vb HF staff committed on May 30, 2024

Commit

1504cda

verified ·

1 Parent(s): 3ad22ce

Remove references to convert.py (#73)

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,19 +15,8 @@ from apscheduler.schedulers.background import BackgroundScheduler
 from textwrap import dedent
-LLAMA_LIKE_ARCHS = ["MistralForCausalLM",]
 HF_TOKEN = os.environ.get("HF_TOKEN")
-def script_to_use(model_id, api):
-    info = api.model_info(model_id)
-    if info.config is None:
-        return None
-    arch = info.config.get("architectures", None)
-    if arch is None:
-        return None
-    arch = arch[0]
-    return "convert.py" if arch in LLAMA_LIKE_ARCHS else "convert-hf-to-gguf.py"
 def split_upload_model(model_path, repo_id, oauth_token: gr.OAuthToken | None, split_max_tensors=256, split_max_size=None):
     if oauth_token.token is None:
         raise ValueError("You have to be logged in.")
@@ -98,7 +87,7 @@ def process_model(model_id, q_method, private_repo, split_model, split_max_tenso
         print(f"Current working directory: {os.getcwd()}")
         print(f"Model directory contents: {os.listdir(model_name)}")
-        conversion_script = script_to_use(model_id, api)
         fp16_conversion = f"python llama.cpp/{conversion_script} {model_name} --outtype f16 --outfile {fp16}"
         result = subprocess.run(fp16_conversion, shell=True, capture_output=True)
         print(result)

 from textwrap import dedent
 HF_TOKEN = os.environ.get("HF_TOKEN")
 def split_upload_model(model_path, repo_id, oauth_token: gr.OAuthToken | None, split_max_tensors=256, split_max_size=None):
     if oauth_token.token is None:
         raise ValueError("You have to be logged in.")
         print(f"Current working directory: {os.getcwd()}")
         print(f"Model directory contents: {os.listdir(model_name)}")
+        conversion_script = "convert-hf-to-gguf.py"
         fp16_conversion = f"python llama.cpp/{conversion_script} {model_name} --outtype f16 --outfile {fp16}"
         result = subprocess.run(fp16_conversion, shell=True, capture_output=True)
         print(result)