Spaces:
Running
Running
alright, it's too expensive y'all, I gotta pull back a bit
Browse files
app.py
CHANGED
@@ -15,8 +15,9 @@ def respond(
|
|
15 |
top_p,
|
16 |
frequency_penalty,
|
17 |
seed,
|
18 |
-
provider,
|
19 |
-
|
|
|
20 |
model_search_term,
|
21 |
selected_model
|
22 |
):
|
@@ -25,14 +26,17 @@ def respond(
|
|
25 |
print(f"System message: {system_message}")
|
26 |
print(f"Max tokens: {max_tokens}, Temperature: {temperature}, Top-P: {top_p}")
|
27 |
print(f"Frequency Penalty: {frequency_penalty}, Seed: {seed}")
|
28 |
-
print(f"Selected provider: {provider}")
|
29 |
-
print(f"
|
|
|
30 |
print(f"Model search term: {model_search_term}")
|
31 |
print(f"Selected model from radio: {selected_model}")
|
32 |
|
33 |
-
#
|
34 |
-
|
35 |
-
|
|
|
|
|
36 |
print(f"Hugging Face Inference Client initialized with {provider} provider.")
|
37 |
|
38 |
# Convert seed to None if -1 (meaning random)
|
@@ -105,6 +109,13 @@ def respond(
|
|
105 |
|
106 |
print("Completed response generation.")
|
107 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
108 |
# GRADIO UI
|
109 |
|
110 |
chatbot = gr.Chatbot(height=600, show_copy_button=True, placeholder="Select a model and begin chatting", layout="panel")
|
@@ -169,6 +180,15 @@ provider_radio = gr.Radio(
|
|
169 |
info="[View all models here](https://huggingface.co/models?inference_provider=all&pipeline_tag=text-generation&sort=trending)"
|
170 |
)
|
171 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
172 |
# Custom model box
|
173 |
custom_model_box = gr.Textbox(
|
174 |
value="",
|
@@ -246,8 +266,9 @@ demo = gr.ChatInterface(
|
|
246 |
top_p_slider,
|
247 |
frequency_penalty_slider,
|
248 |
seed_slider,
|
249 |
-
provider_radio, # Provider selection
|
250 |
-
|
|
|
251 |
model_search_box, # Model search box
|
252 |
featured_model_radio # Featured model radio
|
253 |
],
|
@@ -273,9 +294,25 @@ with demo:
|
|
273 |
outputs=custom_model_box
|
274 |
)
|
275 |
print("Featured model radio button change event linked.")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
276 |
|
277 |
print("Gradio interface initialized.")
|
278 |
|
279 |
if __name__ == "__main__":
|
280 |
print("Launching the demo application.")
|
281 |
-
demo.launch(show_api=True)
|
|
|
15 |
top_p,
|
16 |
frequency_penalty,
|
17 |
seed,
|
18 |
+
provider,
|
19 |
+
custom_api_key, # New parameter for BYOK
|
20 |
+
custom_model,
|
21 |
model_search_term,
|
22 |
selected_model
|
23 |
):
|
|
|
26 |
print(f"System message: {system_message}")
|
27 |
print(f"Max tokens: {max_tokens}, Temperature: {temperature}, Top-P: {top_p}")
|
28 |
print(f"Frequency Penalty: {frequency_penalty}, Seed: {seed}")
|
29 |
+
print(f"Selected provider: {provider}")
|
30 |
+
print(f"Custom API Key provided: {bool(custom_api_key.strip())}") # Log whether a custom key was provided without printing the key
|
31 |
+
print(f"Selected model (custom_model): {custom_model}")
|
32 |
print(f"Model search term: {model_search_term}")
|
33 |
print(f"Selected model from radio: {selected_model}")
|
34 |
|
35 |
+
# Determine which token to use - custom API key if provided, otherwise the ACCESS_TOKEN
|
36 |
+
token_to_use = custom_api_key if custom_api_key.strip() != "" else ACCESS_TOKEN
|
37 |
+
|
38 |
+
# Initialize the Inference Client with the provider and appropriate token
|
39 |
+
client = InferenceClient(token=token_to_use, provider=provider)
|
40 |
print(f"Hugging Face Inference Client initialized with {provider} provider.")
|
41 |
|
42 |
# Convert seed to None if -1 (meaning random)
|
|
|
109 |
|
110 |
print("Completed response generation.")
|
111 |
|
112 |
+
# Function to validate provider selection based on BYOK
def validate_provider(api_key, provider):
    """Enforce the BYOK rule on the provider radio selection.

    When the user has not supplied a custom Hugging Face API key, only the
    default "hf-inference" provider may be used, so any other selection is
    reverted. When a key is present, the user's choice is kept as-is.

    Parameters:
        api_key: The user-supplied HF token from the BYOK textbox. May be an
            empty string, or None if the component value was cleared.
        provider: The provider name currently selected in the radio component.

    Returns:
        A gr.update(...) payload setting the radio to either the requested
        provider or the "hf-inference" fallback.
    """
    # Treat None the same as an empty string so a cleared/missing textbox
    # value cannot raise AttributeError on .strip().
    if not (api_key or "").strip() and provider != "hf-inference":
        # Without a custom key, only the default hf-inference provider works.
        return gr.update(value="hf-inference")
    return gr.update(value=provider)
|
118 |
+
|
119 |
# GRADIO UI
|
120 |
|
121 |
chatbot = gr.Chatbot(height=600, show_copy_button=True, placeholder="Select a model and begin chatting", layout="panel")
|
|
|
180 |
info="[View all models here](https://huggingface.co/models?inference_provider=all&pipeline_tag=text-generation&sort=trending)"
|
181 |
)
|
182 |
|
183 |
+
# New BYOK textbox - Added for the new feature
|
184 |
+
byok_textbox = gr.Textbox(
|
185 |
+
value="",
|
186 |
+
label="BYOK (Bring Your Own Key)",
|
187 |
+
info="Enter a custom Hugging Face API key here. When empty, only 'hf-inference' provider can be used.",
|
188 |
+
placeholder="Enter your Hugging Face API token",
|
189 |
+
type="password" # Hide the API key for security
|
190 |
+
)
|
191 |
+
|
192 |
# Custom model box
|
193 |
custom_model_box = gr.Textbox(
|
194 |
value="",
|
|
|
266 |
top_p_slider,
|
267 |
frequency_penalty_slider,
|
268 |
seed_slider,
|
269 |
+
provider_radio, # Provider selection
|
270 |
+
byok_textbox, # New BYOK textbox
|
271 |
+
custom_model_box, # Custom Model
|
272 |
model_search_box, # Model search box
|
273 |
featured_model_radio # Featured model radio
|
274 |
],
|
|
|
294 |
outputs=custom_model_box
|
295 |
)
|
296 |
print("Featured model radio button change event linked.")
|
297 |
+
|
298 |
+
# Connect the BYOK textbox to validate provider selection
|
299 |
+
byok_textbox.change(
|
300 |
+
fn=validate_provider,
|
301 |
+
inputs=[byok_textbox, provider_radio],
|
302 |
+
outputs=provider_radio
|
303 |
+
)
|
304 |
+
print("BYOK textbox change event linked.")
|
305 |
+
|
306 |
+
# Also validate provider when the radio changes to ensure consistency
|
307 |
+
provider_radio.change(
|
308 |
+
fn=validate_provider,
|
309 |
+
inputs=[byok_textbox, provider_radio],
|
310 |
+
outputs=provider_radio
|
311 |
+
)
|
312 |
+
print("Provider radio button change event linked.")
|
313 |
|
314 |
print("Gradio interface initialized.")
|
315 |
|
316 |
if __name__ == "__main__":
|
317 |
print("Launching the demo application.")
|
318 |
+
demo.launch(show_api=True)
|