|
import os |
|
import argparse |
|
from app.captioning import generate_caption |
|
from app.storytelling import generate_story |
|
from app.tts import speak_story |
|
|
|
def main(file_name: str):
    """Run the image -> caption -> story -> speech pipeline for one image.

    The image is looked up in the ``assets`` directory located next to this
    module. Progress messages and intermediate results are printed to stdout.

    Args:
        file_name: Name of the image file inside ``assets``. The path is
            built with ``os.path.join``, so an absolute path is used as-is.

    Returns:
        The value returned by ``speak_story`` for the generated story (the
        same value that is printed as the saved audio location).

    Raises:
        FileNotFoundError: If the resolved image path is not an existing file.
    """
    image_path = os.path.join(os.path.dirname(__file__), "assets", file_name)

    # Fail early with a clear message instead of letting the captioning step
    # fail on a path that does not exist.
    if not os.path.isfile(image_path):
        raise FileNotFoundError(f"Image not found: {image_path}")

    # NOTE(review): the leading glyphs in the messages below look like
    # mis-decoded emoji; they are kept verbatim - confirm the intended
    # characters.
    print("π Generating caption from image...")
    caption = generate_caption(image_path)
    print(f"\nπΌοΈ Caption: {caption}")

    print("\nβοΈ Generating story from caption...")
    story = generate_story(caption)
    print(f"\nπ Story:\n{story}")

    print("\nπ Converting story to speech...")
    audio_path = speak_story(story)
    # This literal was previously broken across two lines by a stray line
    # break, which left the string unterminated.
    print(f"\nβ Audio saved at: {audio_path}")

    return audio_path
|
|
|
if __name__ == "__main__":
    # Command-line entry point: read one image argument and run the pipeline.
    parser = argparse.ArgumentParser(
        description="Run image β caption β story β speech pipeline"
    )
    # main() joins this value onto the assets/ directory next to the script,
    # so the help text describes a file name rather than an arbitrary path.
    parser.add_argument(
        "image_path",
        type=str,
        help="Image file name inside the assets/ directory next to this script",
    )

    args = parser.parse_args()
    main(args.image_path)
|
|