Spaces:

ggml-org
/

gguf-my-repo

Running on A10G

App Files Files Community

191

reach-vb HF Staff

Wauplin HF Staff committed on Apr 30, 2024

Commit

5c54a1e

1 Parent(s): 0f15629

Use OAuth ("Sign in with Hugging Face") (#49)

Browse files

- Use OAuth ("Sign in with Hugging Face") (92b82ef8b9645fb1abecba93cf26b8476069d3a0)
- Update README.md (c3f2bda0b880d6cdb01c7d293fa3325684835444)
- Update Dockerfile (e16a272e4c3dff28f358a7b8001d958985b8a954)

Co-authored-by: Lucain Pouget <[email protected]>

Files changed (3) hide show

Dockerfile +1 -1
README.md +5 -0
app.py +13 -15

Dockerfile CHANGED Viewed

@@ -37,7 +37,7 @@ RUN pyenv install ${PYTHON_VERSION} && \
     pyenv global ${PYTHON_VERSION} && \
     pyenv rehash && \
     pip install --no-cache-dir -U pip setuptools wheel && \
-    pip install "huggingface-hub" "hf-transfer" "gradio>=4.26.0" "gradio_huggingfacehub_search==0.0.7"
 COPY --chown=1000 . ${HOME}/app
 RUN git clone https://github.com/ggerganov/llama.cpp

     pyenv global ${PYTHON_VERSION} && \
     pyenv rehash && \
     pip install --no-cache-dir -U pip setuptools wheel && \
+    pip install "huggingface-hub" "hf-transfer" "gradio>=4.28.0" "gradio_huggingfacehub_search==0.0.7"
 COPY --chown=1000 . ${HOME}/app
 RUN git clone https://github.com/ggerganov/llama.cpp

README.md CHANGED Viewed

@@ -4,6 +4,11 @@ emoji: 🦙
 colorFrom: gray
 colorTo: pink
 sdk: docker
 pinned: false
 ---

 colorFrom: gray
 colorTo: pink
 sdk: docker
+hf_oauth: true
+hf_oauth_scopes:
+  - read-repos
+  - write-repos
+  - manage-repos
 pinned: false
 ---

app.py CHANGED Viewed

@@ -25,12 +25,14 @@ def script_to_use(model_id, api):
     arch = arch[0]
     return "convert.py" if arch in LLAMA_LIKE_ARCHS else "convert-hf-to-gguf.py"
-def process_model(model_id, q_method, hf_token, private_repo):
     model_name = model_id.split('/')[-1]
     fp16 = f"{model_name}/{model_name.lower()}.fp16.bin"
     try:
-        api = HfApi(token=hf_token)
         dl_pattern = ["*.md", "*.json", "*.model"]
@@ -48,7 +50,7 @@ def process_model(model_id, q_method, hf_token, private_repo):
         dl_pattern += pattern
-        snapshot_download(repo_id=model_id, local_dir=model_name, local_dir_use_symlinks=False, token=hf_token, allow_patterns=dl_pattern)
         print("Model downloaded successully!")
         conversion_script = script_to_use(model_id, api)
@@ -72,11 +74,13 @@ def process_model(model_id, q_method, hf_token, private_repo):
         print("Repo created successfully!", new_repo_url)
         try:
-            card = ModelCard.load(model_id,)
         except:
             card = ModelCard("")
-        card.data.tags = ["llama-cpp"] if card.data.tags is None else card.data.tags + ["llama-cpp"]
-        card.data.tags += ["gguf-my-repo"]
         card.text = dedent(
             f"""
             # {new_repo_id}
@@ -155,25 +159,19 @@ iface = gr.Interface(
             value="Q4_K_M",
             filterable=False
         ),
-        gr.Textbox(
-            lines=1,
-            label="HF Write Token",
-            info="https://hf.co/settings/token",
-            type="password",
-        ),
         gr.Checkbox(
             value=False,
             label="Private Repo",
             info="Create a private repo under your username."
-        )
     ],
     outputs=[
         gr.Markdown(label="output"),
         gr.Image(show_label=False),
     ],
     title="Create your own GGUF Quants, blazingly fast ⚡!",
-    description="The space takes an HF repo as an input, quantises it and creates a Public repo containing the selected quant under your HF user namespace. You need to specify a write token obtained in https://hf.co/settings/tokens.",
-    article="<p>Find your write token at <a href='https://huggingface.co/settings/tokens' target='_blank'>token settings</a></p>",
 )
 # Launch the interface

     arch = arch[0]
     return "convert.py" if arch in LLAMA_LIKE_ARCHS else "convert-hf-to-gguf.py"
+def process_model(model_id, q_method, private_repo, oauth_token: gr.OAuthToken | None):
+    if token is None:
+        raise ValueError("You must be logged in to use GGUF-my-repo")
     model_name = model_id.split('/')[-1]
     fp16 = f"{model_name}/{model_name.lower()}.fp16.bin"
     try:
+        api = HfApi(token=oauth_token.token)
         dl_pattern = ["*.md", "*.json", "*.model"]
         dl_pattern += pattern
+        api.snapshot_download(repo_id=model_id, local_dir=model_name, local_dir_use_symlinks=False, allow_patterns=dl_pattern)
         print("Model downloaded successully!")
         conversion_script = script_to_use(model_id, api)
         print("Repo created successfully!", new_repo_url)
         try:
+            card = ModelCard.load(model_id, token=oauth_token.token)
         except:
             card = ModelCard("")
+        if card.data.tags is None:
+            card.data.tags = []
+        card.data.tags.append("llama-cpp")
+        card.data.tags.append("gguf-my-repo")
         card.text = dedent(
             f"""
             # {new_repo_id}
             value="Q4_K_M",
             filterable=False
         ),
         gr.Checkbox(
             value=False,
             label="Private Repo",
             info="Create a private repo under your username."
+        ),
+        gr.LoginButton(min_width=250),
     ],
     outputs=[
         gr.Markdown(label="output"),
         gr.Image(show_label=False),
     ],
     title="Create your own GGUF Quants, blazingly fast ⚡!",
+    description="The space takes an HF repo as an input, quantises it and creates a Public repo containing the selected quant under your HF user namespace.",
 )
 # Launch the interface