허깅페이스 실습 및 스페이스에 프로젝트 등록

2026-05-26 22:32:53 +09:00
parent ba88ef63f1
commit 4e33fb82af
16 changed files with 1180 additions and 0 deletions
@@ -0,0 +1,82 @@
+import gradio as gr
+from transformers import pipeline
+from PIL import Image
+
+captioner = pipeline("image-to-text")
+generator = pipeline("text-generation", model="Qwen/Qwen2.5-1.5B-Instruct")
+
+
+current_caption = ""
+
+def chat(message, history) : 
+    
+    global current_caption
+    
+    # message {'text': 'text', 'files': []}
+    # message {'text': '', 'files': ['/private/var/folders/_x/jfhn2s8d6t512jvv5lndzw2m0000gn/T/gradio/f299e1f235318c3c17f47efef61fabb3f52e14158f3c4e1a2f15b1cf0fb8329d/Gemini_Generated_Image_e9k4qje9k4qje9k4.png']}
+    
+    # History[]
+    # History[{'role': 'user', 'metadata': None, 'content': [{'text': 'text', 'type': 'text'}], 'options': None}, {'role': 'assistant', ']
+    print("message", message) 
+    print("history", history)
+    
+    # message에서 텍스트와 이미지 분리
+    text = message["text"]
+
+    if message.get("files") :
+        image = message["files"][0]
+        if image :         
+            result = captioner(image)
+            caption_result = result[0]["generated_text"]
+            
+            # 전역변수에 저장
+            current_caption = caption_result
+            
+            prompt = f"""
+            이미지 설명:
+            {caption_result}
+
+            사용자 질문:
+            {text}            
+            """
+            return prompt
+    elif text :
+        if not current_caption:
+            return f"""
+            사용자 질문
+            {text}
+        """
+        
+        prompt = f"""
+            당신은 이미지 분석 AI 입니다.
+            다음 이미지 설명을 참고하여 사용자의 질문에
+            한 문장으로 답하세요.
+            
+            이미지 설명 :
+            {current_caption}
+            
+            질문
+            {text}
+            
+            답변:
+            
+        """
+        
+        # caption_result 값이 있다면 적절한 문장 생성하도록 만들기
+        result = generator(prompt, max_new_tokens = 50, return_full_text = False, pad_token_id=generator.tokenizer.eos_token_id)
+        
+        print("text result", result)
+        
+        response = result[0]['generated_text']
+        answer = response.split("\n")[1].strip()
+        
+        return answer
+    
+
+demo = gr.ChatInterface(
+    fn=chat, 
+    multimodal=True,
+    title="멀티 모달 AI 챗봇", 
+    description="이미지를 업로드하면 이미지에 대한 설명을 생성하는 챗봇입니다. 테스트로 질문도 가능합니다.", 
+)
+demo.launch()