Spaces:

teameight
/

fairytale_generator

Runtime error

App Files Files Community

je010112 committed on Jul 24

Commit

a2e0332

2 Parent(s): 57059f8 e8dd7e6

Merge branch 'main' of https://huggingface.co/spaces/teameight/fairytale_generator

Browse files

Files changed (2) hide show

blip-image-captioning-base01.py +104 -0
blip-image-captioning-base02.py +120 -0

blip-image-captioning-base01.py ADDED Viewed

	@@ -0,0 +1,104 @@

+# # 필요한 라이브러리 임포트
+# from transformers import BlipProcessor, BlipForConditionalGeneration        # 이미지 → 텍스트 설명 생성용
+# from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline    # 텍스트 생성 (동화 생성)용
+# from PIL import Image                                                       # 이미지 처리용
+# import gradio as gr                                                         # 웹 인터페이스용
+# import torch                                                                # PyTorch (모델 구동)
+# # 1. BLIP 모델: 이미지 설명 생성용 모델 및 전처리기 로딩
+# caption_processor = BlipProcessor.from_pretrained("Salesforce/blip-image-captioning-base")
+# caption_model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-base")
+# # 2. KoT5 모델: 설명 → 동화 생성용 한국어 텍스트 생성 모델 로딩
+# story_tokenizer = AutoTokenizer.from_pretrained("paust/pko-t5-base")
+# story_model = AutoModelForSeq2SeqLM.from_pretrained("paust/pko-t5-base")
+# # Hugging Face pipeline으로 간편한 생성 함수 구성
+# story_generator = pipeline("text2text-generation", model=story_model, tokenizer=story_tokenizer)
+# # 3. 핵심 함수: 이미지 입력 → 설명 생성 → 동화 생성
+# def generate_fairytale(image):
+#     # 이미지 → 설명 생성 (BLIP)
+#     inputs = caption_processor(images=image, return_tensors="pt")              # 이미지 전처리
+#     outputs = caption_model.generate(**inputs)                                 # 설명 생성
+#     caption = caption_processor.decode(outputs[0], skip_special_tokens=True)   # 설명 텍스트 디코딩
+#     # 프롬프트 구성: 설명을 바탕으로 동화를 써달라고 요청
+#     prompt = f"다음 설명을 바탕으로 어린이 동화를 써줘:\n\"{caption}\""
+#     # 설명 → 동화 생성 (KoT5)
+#     story = story_generator(prompt, max_length=300, do_sample=True)[0]['generated_text']
+#     # Gradio에 표시할 두 개 결과 반환: 설명, 동화
+#     return caption, story
+# # 4. Gradio 인터페이스 구성
+# interface = gr.Interface(
+#     fn=generate_fairytale,                                         # 호출할 함수
+#     inputs=gr.Image(type="pil", label="🖼️ 그림을 업로드하세요"),   # 이미지 업로드 창
+#     outputs=[
+#         gr.Textbox(label="📌 이미지 설명"),                         # 텍스트 설명 출력
+#         gr.Textbox(label="📖 생성된 동화")                          # 생성된 동화 출력
+#     ],
+#     title="🎨 AI 이미지 동화 생성기",                                # 앱 제목
+#     description="이미지를 업로드하면 설명과 동화를 자동으로 생성해주는 서비스입니다.",
+#     theme="soft"                                                   # 부드러운 Gradio 테마
+# )
+# # 5. 웹 앱 실행 (URL 콘솔 출력)
+# interface.launch(share=True, debug=True, inbrowser=True)
+from transformers import BlipProcessor, BlipForConditionalGeneration
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
+from PIL import Image
+import gradio as gr
+import torch
+# 1. BLIP image-captioning model: the processor (image preprocessing / token decoding) and the model itself.
+caption_processor = BlipProcessor.from_pretrained("Salesforce/blip-image-captioning-base")
+caption_model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-base")
+# 2. English fairytale generation model (Flan-T5), wrapped in a text2text-generation pipeline.
+story_tokenizer = AutoTokenizer.from_pretrained("google/flan-t5-base")
+story_model = AutoModelForSeq2SeqLM.from_pretrained("google/flan-t5-base")
+story_generator = pipeline("text2text-generation", model=story_model, tokenizer=story_tokenizer)
+# 3. Main function: image -> caption -> fairytale.
+def generate_fairytale(image):
+    # (1) 이미지 → 캡션 생성
+    inputs = caption_processor(images=image, return_tensors="pt").to(caption_model.device)
+    outputs = caption_model.generate(**inputs)
+    caption = caption_processor.decode(outputs[0], skip_special_tokens=True).strip()
+    # (2) 캡션이 너무 짧으면 보정
+    if len(caption.split()) < 5:
+        caption += ". They appear to be magical characters from a fantasy world."
+    # (3) 영어 프롬프트 구성
+    prompt = (
+        f"Write a short and magical fairytale for children based on the description below.\n"
+        f"Description: \"{caption}\"\n"
+        f"Story:"
+    )
+    # (4) 동화 생성
+    story = story_generator(prompt, max_length=300, do_sample=True)[0]['generated_text']
+    return caption, story
+# 4. Gradio UI: one image input, two text outputs matching the (caption, story) return order.
+interface = gr.Interface(
+    fn=generate_fairytale,
+    inputs=gr.Image(type="pil", label="🖼️ Upload an Image"),
+    outputs=[
+        gr.Textbox(label="📌 Image Description"),
+        gr.Textbox(label="📖 Generated Fairytale")
+    ],
+    title="🧚 AI Fairytale Generator from Image",
+    description="Upload an image, and this AI will create a magical story based on it!",
+    theme="soft"
+)
+# 5. Launch the app. NOTE(review): share=True / inbrowser=True look like local-run settings; confirm they are wanted on a hosted Space.
+interface.launch(share=True, debug=True, inbrowser=True)

blip-image-captioning-base02.py ADDED Viewed

	@@ -0,0 +1,120 @@

+from transformers import BlipProcessor, BlipForConditionalGeneration
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
+from PIL import Image
+import gradio as gr
+import torch
+# 1. Load the image-captioning model (BLIP): the processor and the model itself.
+caption_processor = BlipProcessor.from_pretrained("Salesforce/blip-image-captioning-base")
+caption_model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-base")
+# 2. Fairytale generation model (Flan-T5), wrapped in a text2text-generation pipeline.
+story_tokenizer = AutoTokenizer.from_pretrained("google/flan-t5-base")
+story_model = AutoModelForSeq2SeqLM.from_pretrained("google/flan-t5-base")
+story_generator = pipeline("text2text-generation", model=story_model, tokenizer=story_tokenizer)
+# 3. Fairytale generation function: image -> caption -> fairytale.
+def generate_fairytale(image):
+    # (1) 이미지 → 캡션
+    inputs = caption_processor(images=image, return_tensors="pt").to(caption_model.device)
+    outputs = caption_model.generate(**inputs)
+    caption = caption_processor.decode(outputs[0], skip_special_tokens=True).strip()
+    # (2) 캡션이 짧으면 보완
+    if len(caption.split()) < 5:
+        caption += ". They look like magical characters from a fantasy story."
+    # (3) 프롬프트 설정
+    prompt = f"""
+Write a magical and imaginative fairytale for children based on the following image description.
+Description: "{caption}"
+Your story should:
+- Be at least 3 paragraphs long
+- Start with "Once upon a time"
+- Include fantasy, adventure, or mystery elements
+- Be creative and heartwarming
+Story:
+"""
+    # (4) 동화 생성 (길이 충분히 늘리기)
+    story = story_generator(prompt, max_length=500, do_sample=True)[0]['generated_text']
+    return caption, story
+# 4. Gradio interface: one image input, two text outputs matching the (caption, story) return order.
+interface = gr.Interface(
+    fn=generate_fairytale,
+    inputs=gr.Image(type="pil", label="🖼️ Upload an Image"),
+    outputs=[
+        gr.Textbox(label="📌 Image Description"),
+        gr.Textbox(label="📖 Generated Fairytale")
+    ],
+    title="🌟 AI Fairytale Generator from Image",
+    description="Upload an image and get a rich fairytale story created from it!",
+    theme="soft"
+)
+# 5. Run the app. NOTE(review): share=True / inbrowser=True look like local-run settings; confirm they are wanted on a hosted Space.
+interface.launch(share=True, debug=True, inbrowser=True)
+# from transformers import BlipProcessor, BlipForConditionalGeneration
+# from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
+# from PIL import Image
+# import gradio as gr
+# import torch
+# # 1. 이미지 설명 생성 모델 (BLIP)
+# caption_processor = BlipProcessor.from_pretrained("Salesforce/blip-image-captioning-base")
+# caption_model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-base")
+# # 2. 영어 동화 생성 모델 (FLAN-T5)
+# story_tokenizer = AutoTokenizer.from_pretrained("google/flan-t5-base")
+# story_model = AutoModelForSeq2SeqLM.from_pretrained("google/flan-t5-base")
+# # 3. 동화 생성 함수
+# def generate_fairytale(image):
+#     # 1. 이미지 → 텍스트 설명 생성
+#     inputs = caption_processor(images=image, return_tensors="pt").to(caption_model.device)
+#     outputs = caption_model.generate(**inputs)
+#     caption = caption_processor.decode(outputs[0], skip_special_tokens=True).strip()
+#     # 2. 프롬프트 구성 (중복 방지 조건 추가)
+#     prompt = f"""Write a magical and imaginative children's story based on the following image description.
+# Description: "{caption}"
+# The story should be at least 3 paragraphs and must not repeat any sentences.
+# Story:"""
+#     # 3. 텍스트 생성
+#     input_ids = story_tokenizer(prompt, return_tensors="pt").input_ids.to(story_model.device)
+#     output_ids = story_model.generate(
+#         input_ids,
+#         max_length=600,             # 더 길고 풍부한 텍스트
+#         num_beams=4,                # 빔 탐색
+#         no_repeat_ngram_size=3,     # 반복 방지
+#         repetition_penalty=1.3,     # 반복 패널티
+#         early_stopping=True,
+#         do_sample=False             # 확정적 결과
+#     )
+#     story = story_tokenizer.decode(output_ids[0], skip_special_tokens=True)
+#     return caption, story
+# # 4. Gradio UI 인터페이스
+# interface = gr.Interface(
+#     fn=generate_fairytale,
+#     inputs=gr.Image(type="pil", label="📷 Upload an Image"),
+#     outputs=[
+#         gr.Textbox(label="📌 Image Description"),
+#         gr.Textbox(label="📖 Generated Fairytale")
+#     ],
+#     title="🌟 AI Fairytale Generator from Image",
+#     description="Upload an image and get a rich fairytale story created from it!",
+#     theme="default"
+# )
+# # 5. 실행
+# interface.launch(share=True)