Commit f0c5d5e · Oleg Shulyakov
Parent: 6475b9d

Update _generate_readme
app.py CHANGED

````diff
@@ -337,51 +337,49 @@ class HuggingFaceModelProcessor:
 
         return new_repo_url
 
-    def _generate_readme(self,
-        new_repo_id: str, gguf_name: str) -> str:
+    def _generate_readme(self, processing_config :ModelProcessingConfig) -> str:
         """Generate README.md for the quantized model."""
-        creator = self._get_model_creator(model_id)
-
-        username = whoami(token)["name"]
+        creator = self._get_model_creator(processing_config.model_id)
+        username = whoami(processing_config.token)["name"]
 
         try:
-            card = ModelCard.load(model_id, token=token)
+            card = ModelCard.load(processing_config.model_id, token=processing_config.token)
         except:
             card = ModelCard("")
 
         if card.data.tags is None:
             card.data.tags = []
         card.data.tags.extend(["llama-cpp", "gguf-my-repo"])
-        card.data.base_model = model_id
+        card.data.base_model = processing_config.model_id
 
         card.text = dedent(
             f"""
-# {model_name}
+# {processing_config.model_name}
 **Model creator:** [{creator}](https://huggingface.co/{creator})<br/>
-**Original model**: [{model_id}](https://huggingface.co/{model_id})<br/>
+**Original model**: [{processing_config.model_id}](https://huggingface.co/{processing_config.model_id})<br/>
 **GGUF quantization:** provided by [{username}](https:/huggingface.co/{username}) using `llama.cpp`<br/>
 ## Special thanks
 🙏 Special thanks to [Georgi Gerganov](https://github.com/ggerganov) and the whole team working on [llama.cpp](https://github.com/ggerganov/llama.cpp/) for making all of this possible.
 ## Use with Ollama
 ```bash
-ollama run "hf.co/{new_repo_id}:<quantization>"
+ollama run "hf.co/{processing_config.new_repo_id}:<quantization>"
 ```
 ## Use with LM Studio
 ```bash
-lms load "{new_repo_id}"
+lms load "{processing_config.new_repo_id}"
 ```
 ## Use with llama.cpp CLI
 ```bash
-llama-cli --hf-repo "{new_repo_id}" --hf-file "{gguf_name}" -p "The meaning to life and the universe is"
+llama-cli --hf-repo "{processing_config.new_repo_id}" --hf-file "{processing_config.output_config.filename}" -p "The meaning to life and the universe is"
 ```
 ## Use with llama.cpp Server:
 ```bash
-llama-server --hf-repo "{new_repo_id}" --hf-file "{gguf_name}" -c 4096
+llama-server --hf-repo "{processing_config.new_repo_id}" --hf-file "{processing_config.output_config.filename}" -c 4096
 ```
 """
         )
 
-        readme_path = f"{outdir}/README.md"
+        readme_path = f"{processing_config.outdir}/README.md"
         card.save(readme_path)
         return readme_path
 
@@ -422,7 +420,7 @@ llama-server --hf-repo "{new_repo_id}" --hf-file "{gguf_name}" -c 4096
             raise GGUFConverterError(f"Error uploading imatrix.dat: {e}")
 
         # Upload README.md
-        readme_path = self._generate_readme(processing_config
+        readme_path = self._generate_readme(processing_config)
         self._upload_file(processing_config, readme_path, "README.md")
 
         print(f"Uploaded successfully with {quant_config.imatrix_method if quant_config.use_imatrix else quant_config.method} option!")
````
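Why the change: in the removed version, `_generate_readme` accepted only `new_repo_id` and `gguf_name`, yet its body read `model_id`, `token`, `model_name`, and `outdir`, none of which were parameters or visible in scope. The new version threads everything through a single `processing_config` object. That class is not part of this diff; the sketch below is a hypothetical reconstruction of its shape, inferred only from the attributes the new code accesses, so the field list and types are assumptions.

```python
from dataclasses import dataclass

# Hypothetical sketch of the config objects, inferred from the attribute
# accesses in the new _generate_readme; the real classes in app.py are
# not shown in this diff and likely carry more fields.
@dataclass
class OutputConfig:
    filename: str               # e.g. "mymodel-Q4_K_M.gguf"

@dataclass
class ModelProcessingConfig:
    model_id: str               # source repo, e.g. "creator/mymodel"
    model_name: str             # display name used as the README title
    token: str                  # HF token for whoami() and ModelCard.load()
    new_repo_id: str            # destination repo for the quantized GGUF
    outdir: str                 # local directory where README.md is written
    output_config: OutputConfig
```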
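For context on the card-handling calls the function relies on, here is a minimal, self-contained sketch of the `huggingface_hub.ModelCard` load-or-create, tag, and save flow used above. The repo id and output path are placeholders; no token is needed for a public repo.

```python
from textwrap import dedent
from huggingface_hub import ModelCard

REPO_ID = "creator/original-model"  # placeholder

# Load the source model's card if one exists; otherwise start from an
# empty card, mirroring the try/except in _generate_readme.
try:
    card = ModelCard.load(REPO_ID)
except Exception:
    card = ModelCard("")

# Tags and base_model live in the card's YAML front matter (card.data).
if card.data.tags is None:
    card.data.tags = []
card.data.tags.extend(["llama-cpp", "gguf-my-repo"])
card.data.base_model = REPO_ID

# The markdown body is card.text; dedent keeps the literal readable.
card.text = dedent(f"""
    # Quantized {REPO_ID}
    Original model: https://huggingface.co/{REPO_ID}
    """)

card.save("README.md")  # writes front matter plus body to disk
```

`save()` serializes the YAML front matter (tags, `base_model`) ahead of the markdown body, which is what makes the uploaded README render with the right metadata on the Hub.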