mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 17:14:36 +00:00
* examples : add model conversion tool/example This commit adds an "example/tool" that is intended to help in the process of converting models to GGUF. Currently it supports normal causal models and embedding models. The readme contains instructions and command to guide through the process. The motivation for this to have a structured and repeatable process for model conversions and hopefully with time improve upon it to make the process easier and more reliable. We have started to use this for new model conversions internally and will continue doing so and improve it as we go along. Perhaps with time this should be placed in a different directory than the examples directory, but for now it seems like a good place to keep it while we are still developing it. * squash! examples : add model conversion tool/example Remove dependency on scikit-learn in model conversion example. * squash! examples : add model conversion tool/example Update transformer dep to use non-dev version. And also import `AutoModelForCausalLM` instead of `AutoModel` to ensure compatibility with the latest version. * squash! examples : add model conversion tool/example Remove the logits requirements file from the all requirements file.
63 lines
2 KiB
Python
Executable file
63 lines
2 KiB
Python
Executable file
#!/usr/bin/env python3
|
|
|
|
from huggingface_hub import HfApi
|
|
import argparse
|
|
|
|
# This script requires that the environment variable HF_TOKEN is set with your
|
|
# Hugging Face API token.
|
|
api = HfApi()
|
|
|
|
def load_template_and_substitute(template_path, **kwargs):
|
|
try:
|
|
with open(template_path, 'r', encoding='utf-8') as f:
|
|
template_content = f.read()
|
|
|
|
return template_content.format(**kwargs)
|
|
except FileNotFoundError:
|
|
print(f"Template file '{template_path}' not found!")
|
|
return None
|
|
except KeyError as e:
|
|
print(f"Missing template variable: {e}")
|
|
return None
|
|
|
|
parser = argparse.ArgumentParser(description='Create a new Hugging Face model repository')
|
|
parser.add_argument('--model-name', '-m', help='Name for the model', required=True)
|
|
parser.add_argument('--namespace', '-ns', help='Namespace to add the model to', required=True)
|
|
parser.add_argument('--org-base-model', '-b', help='Original Base model name', default="")
|
|
parser.add_argument('--no-card', action='store_true', help='Skip creating model card')
|
|
parser.add_argument('--private', '-p', action='store_true', help='Create private model')
|
|
|
|
args = parser.parse_args()
|
|
|
|
repo_id = f"{args.namespace}/{args.model_name}-GGUF"
|
|
print("Repository ID: ", repo_id)
|
|
|
|
repo_url = api.create_repo(
|
|
repo_id=repo_id,
|
|
repo_type="model",
|
|
private=args.private,
|
|
exist_ok=False
|
|
)
|
|
|
|
if not args.no_card:
|
|
template_path = "scripts/readme.md.template"
|
|
model_card_content = load_template_and_substitute(
|
|
template_path,
|
|
model_name=args.model_name,
|
|
namespace=args.namespace,
|
|
base_model=args.org_base_model,
|
|
)
|
|
|
|
if model_card_content:
|
|
api.upload_file(
|
|
path_or_fileobj=model_card_content.encode('utf-8'),
|
|
path_in_repo="README.md",
|
|
repo_id=repo_id
|
|
)
|
|
print("Model card created successfully.")
|
|
else:
|
|
print("Failed to create model card.")
|
|
|
|
print(f"Repository created: {repo_url}")
|
|
|
|
|