mrfakename committed
Commit b855287 · verified · 1 Parent(s): a543525

Update app.py

Files changed (1)
app.py +50 -108
app.py CHANGED
@@ -1,122 +1,64 @@
-import spaces
 import gradio as gr
 import torch
-from transformers import AutoModel, AutoTokenizer

-# Load model and tokenizer
-model_path = "apple/DiffuCoder-7B-cpGRPO"
-device = "cuda" if torch.cuda.is_available() else "cpu"

-model = AutoModel.from_pretrained(
-    model_path,
-    torch_dtype=torch.bfloat16,
-    trust_remote_code=True
-).to(device).eval()

-tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
-tokenizer.eos_token = "<|im_end|>"

 @spaces.GPU
-def generate_code(query, temperature=0.4, top_p=0.95, max_new_tokens=256):
-    # Format prompt using chat template
-    messages = [
-        {"role": "system", "content": "You are a helpful coding assistant."},
-        {"role": "user", "content": query.strip()}
-    ]
-
-    # Apply chat template - this creates the prompt but doesn't include assistant response
-    prompt = tokenizer.apply_chat_template(
-        messages,
-        tokenize=False,
-        add_generation_prompt=True
-    )
-
-    # Tokenize only the prompt (without any assistant response)
-    inputs = tokenizer(prompt, return_tensors="pt")
-    input_ids = inputs.input_ids.to(device)
-    attention_mask = inputs.attention_mask.to(device)
-
-    # Calculate initial prompt length - this is where the assistant response will start
-    initial_prompt_len = input_ids.shape[1]
-
-    # Track EOS status
-    eos_detected = False
-
-    # Generate with token streaming
-    TOKEN_PER_STEP = 1
-    steps = min(max_new_tokens // TOKEN_PER_STEP, 512)  # Limit to max 512 steps
-
-    # This will accumulate only the assistant's response
-    assistant_response = ""
-
-    for i in range(steps):
-        if eos_detected:
-            break
-
-        output = model.diffusion_generate(
-            input_ids,
-            attention_mask=attention_mask,
-            max_new_tokens=TOKEN_PER_STEP,
-            output_history=True,
-            return_dict_in_generate=True,
-            steps=1,
-            temperature=temperature,
-            top_p=top_p,
-            alg="entropy",
-            alg_temp=0.,
-        )
-
-        # Get only the new tokens generated in this step
-        new_token_ids = output.sequences[0, -TOKEN_PER_STEP:]
-
-        # Check for EOS token in the new tokens
-        if tokenizer.eos_token_id in new_token_ids:
-            # If EOS is found, stop after this token
-            eos_detected = True
-            # Remove EOS token from output
-            new_token_ids = new_token_ids[new_token_ids != tokenizer.eos_token_id]
-            if new_token_ids.numel() == 0:
-                # Only EOS was generated, nothing to add
-                break
-
-        # Decode only the new tokens
-        new_text = tokenizer.decode(
-            new_token_ids,
-            skip_special_tokens=True,
-            clean_up_tokenization_spaces=False
-        )
-
-        # Update input for next step
-        input_ids = output.sequences
-        attention_mask = torch.cat([
-            attention_mask,
-            torch.ones(1, 1, dtype=attention_mask.dtype, device=device)
-        ], dim=1)
-
-        # Append to assistant response and yield
-        assistant_response += new_text
-        # Remove any trailing special tokens
-        clean_response = assistant_response.replace('<|dlm_pad|>', '').strip()
-        yield clean_response
-
-        if eos_detected:
-            break

-# Create Gradio interface
 demo = gr.Interface(
-    fn=generate_code,
     inputs=[
-        gr.Textbox(label="Code Request", lines=3,
-                   placeholder="Describe the code you want..."),
-        gr.Slider(0.1, 1.0, value=0.4, label="Temperature"),
-        gr.Slider(0.5, 1.0, value=0.95, label="Top-p"),
-        gr.Slider(32, 512, value=256, step=32, label="Max Tokens")
     ],
-    outputs=gr.Textbox(label="Generated Code", lines=10),
-    title="🧠 DiffuCoder Code Generator",
-    description="Generate code with Apple's DiffuCoder-7B model"
 )

-# Run the demo
 if __name__ == "__main__":
-    demo.queue().launch()
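Editor's note: the removed app streamed partial output by making generate_code a generator; gr.Interface re-renders the output component on every yield, and demo.queue() enables that streaming path (it is on by default in newer Gradio releases). A minimal sketch of the same pattern, with a dummy loop standing in for the removed per-token diffusion_generate calls:

import time
import gradio as gr

def stream_text(prompt):
    # Stand-in for the removed loop that generated one token per step
    # and yielded the accumulated assistant response each time.
    out = ""
    for word in prompt.split():
        out += word + " "
        time.sleep(0.1)    # simulate one generation step
        yield out.strip()  # each yield refreshes the output textbox

demo = gr.Interface(fn=stream_text, inputs=gr.Textbox(), outputs=gr.Textbox())

if __name__ == "__main__":
    demo.queue().launch()  # queue() enables generator streaming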
 
 
 import gradio as gr
 import torch
+from transformers import AutoTokenizer, AutoModel
+from nextstep.models.gen_pipeline import NextStepPipeline
+import spaces  # used below as the @spaces.GPU decorator

+HF_HUB = "stepfun-ai/NextStep-1-Large"

+# Load model & tokenizer
+tokenizer = AutoTokenizer.from_pretrained(HF_HUB, local_files_only=True, trust_remote_code=True)
+model = AutoModel.from_pretrained(HF_HUB, local_files_only=True, trust_remote_code=True)
+pipeline = NextStepPipeline(tokenizer=tokenizer, model=model).to(device="cuda", dtype=torch.bfloat16)

+IMG_SIZE = 512

 @spaces.GPU
+def generate(main_prompt, positive_prompt, negative_prompt):
+    image = pipeline.generate_image(
+        main_prompt,
+        hw=(IMG_SIZE, IMG_SIZE),
+        num_images_per_caption=1,
+        positive_prompt=positive_prompt,
+        negative_prompt=negative_prompt,
+        cfg=7.5,
+        cfg_img=1.0,
+        cfg_schedule="constant",
+        use_norm=False,
+        num_sampling_steps=28,
+        timesteps_shift=1.0,
+        seed=3407,
+    )[0]
+    return image

 demo = gr.Interface(
+    fn=generate,
     inputs=[
+        gr.Textbox(label="Main Prompt", lines=2, placeholder="Describe your dream image..."),
+        gr.Textbox(label="Positive Prompt", lines=1, placeholder="Extra quality boosters..."),
+        gr.Textbox(label="Negative Prompt", lines=1, placeholder="Things to avoid..."),
     ],
+    outputs=gr.Image(label="Generated Image"),
+    title="NextStep Image Generator",
+    description="Simple Gradio demo for NextStep-1-Large with editable prompts.",
+    examples=[
+        [
+            'A realistic photograph of a wall with "NextStep-1.1 is coming" prominently displayed',
+            'masterpiece, film grained, best quality.',
+            'lowres, bad anatomy, bad hands, text, error, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality, normal quality, jpeg artifacts, signature, watermark, username, blurry.'
+        ],
+        [
+            'A cinematic shot of a futuristic city at sunset',
+            'ultra-detailed, 8k, volumetric lighting, masterpiece',
+            'blurry, lowres, noise, distortion'
+        ],
+        [
+            'A fantasy painting of a dragon flying over a castle',
+            'high detail, vibrant colors, epic composition',
+            'washed out colors, bad anatomy, low detail'
+        ],
+    ]
 )

 if __name__ == "__main__":
+    demo.launch()
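Editor's note: for a quick smoke test of the new pipeline outside the Space, the same calls can be run as a plain script. A minimal sketch, assuming the nextstep package and the NextStep-1-Large weights are already available locally (the Space itself passes local_files_only=True) and that generate_image returns a list of PIL images:

import torch
from transformers import AutoTokenizer, AutoModel
from nextstep.models.gen_pipeline import NextStepPipeline

HF_HUB = "stepfun-ai/NextStep-1-Large"

# Same setup as the new app.py, minus the Gradio layer
tokenizer = AutoTokenizer.from_pretrained(HF_HUB, trust_remote_code=True)
model = AutoModel.from_pretrained(HF_HUB, trust_remote_code=True)
pipeline = NextStepPipeline(tokenizer=tokenizer, model=model).to(device="cuda", dtype=torch.bfloat16)

# One generation with the same arguments the Space uses
image = pipeline.generate_image(
    "A cinematic shot of a futuristic city at sunset",
    hw=(512, 512),
    num_images_per_caption=1,
    positive_prompt="ultra-detailed, 8k, volumetric lighting, masterpiece",
    negative_prompt="blurry, lowres, noise, distortion",
    cfg=7.5,
    cfg_img=1.0,
    cfg_schedule="constant",
    use_norm=False,
    num_sampling_steps=28,
    timesteps_shift=1.0,
    seed=3407,
)[0]
image.save("nextstep_sample.png")  # assumes a PIL.Image return value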