"""Gradio entry point serving the ``Qwen/QwQ-32B-Preview`` model.

Running this file loads the model reference through ``gr.load`` and starts
the resulting Gradio app.
"""

import gradio as gr

# Keep a module-level handle on the loaded interface so it can be inspected
# or reused; the launch itself still happens at module level as before.
demo = gr.load("models/Qwen/QwQ-32B-Preview")
demo.launch()

# ---------------------------------------------------------------------------
# Disabled alternative: a Flask endpoint that forwards requests to the
# Hugging Face inference API. Kept commented out for reference only.
# ---------------------------------------------------------------------------
# from flask import Flask, request, jsonify
# import requests
# import os
# from dotenv import load_dotenv
#
# # Load environment variables
# load_dotenv()
#
# app = Flask(__name__)
#
# HUGGINGFACE_API_URL = "https://api-inference.huggingface.co/models/Qwen/QwQ-32B-Preview"
# API_KEY = os.getenv("HUGGINGFACE_API_KEY")
#
# @app.route('/predict', methods=['POST'])
# def predict():
#     user_input = request.json.get('input')
#     headers = {"Authorization": f"Bearer {API_KEY}"}
#     payload = {"inputs": user_input}
#     response = requests.post(HUGGINGFACE_API_URL, headers=headers, json=payload)
#     return jsonify(response.json())
#
# if __name__ == '__main__':
#     app.run(debug=True)