ALBERT SITE

[Python] GPT를 활용하여 이미지내용으로 문제만들기

Posted by Albert 88Day 15Hour 40Min 23Sec ago [2025-11-10]
수행내용
data 폴더에 있는 jpg 이미지기준으로 loop 돌면서
quiz 문제 생성
생성후 생성된 영문 문제만 한하여 json 파일로 저장
실행코드
from glob import glob
import json
from openai import OpenAI
from dotenv import load_dotenv
import os
import base64

load_dotenv()
api_key = os.getenv("OPENAI_API_KEY")  ' 환경 변수에서 API 키 가져오기
client = OpenAI(api_key=api_key)  ' OpenAI 클라이언트의 인스턴스 생성

def encode_image(image_path):
    with open(image_path, "rb") as image_file:
        return base64.b64encode(image_file.read()).decode("utf-8")
    

def image_quiz(image_path, n_trial=0, max_trial=3):
    if n_trial >= max_trial: ' 최대 시도 회수에 도달하면 포기
        raise Exception("Failed to generate a quiz.")
    
    base64_image = encode_image(image_path) ' 이미지를 base64로 인코딩

    quiz_prompt = """
    제공된 이미지를 바탕으로, 다음과 같은 양식으로 퀴즈를 만들어주세요. 
    정답은 1~4 중 하나만 해당하도록 출제하세요.
    토익 리스닝 문제 스타일로 문제를 만들어주세요.
    아래는 예시입니다. 
    ----- 예시 -----

    Q: 다음 이미지에 대한 설명 중 옳지 않은 것은 무엇인가요?
    - (1) 베이커리에서 사람들이 빵을 사고 있는 모습이 담겨 있습니다.
    - (2) 맨 앞에 서 있는 사람은 빨간색 셔츠를 입고 있습니다.
    - (3) 기차를 타기 위해 줄을 서 있는 사람들이 있습니다.
    - (4) 점원은 노란색 티셔츠를 입고 있습니다.

    Listening: Which of the following descriptions of the image is incorrect?
    - (1) It shows people buying bread at a bakery.
    - (2) The person standing at the front is wearing a red shirt.
    - (3) There are people lining up to take a train.
    - (4) The clerk is wearing a yellow T-shirt.
        
    정답: (4) 점원은 노란색 티셔츠가 아닌 파란색 티셔츠를 입고 있습니다.
    (주의: 정답은 1~4 중 하나만 선택되도록 출제하세요.)
    ======
    """

    messages = [
        {
            "role": "user",
            "content": [
                {"type": "text", "text": quiz_prompt},
                {
                    "type": "image_url",
                    "image_url": {
                        "url": f"data:image/jpeg;base64,{base64_image}",
                    },
                },
            ],
        }
    ]

    try: 
        response = client.chat.completions.create(
            model="gpt-4o",  ' 응답 생성에 사용할 모델 지정
            messages=messages ' 대화 기록을 입력으로 전달
        )
    except Exception as e:
        print("failed\n" + e)
        return image_quiz(image_path, n_trial+1)
    
    content = response.choices[0].message.content

    if "Listening:" in content:
        return content, True
    else:
        return image_quiz(image_path, n_trial+1)


' q = image_quiz("./chap06/data/images/busan_dive.jpg")
' print(q)



txt = '' ' 문제들을 계속 붙여 나가기 위해 빈 문자열 선언
eng_dict = []
no = 1 ' 문제 번호를 위해 선언
for g in glob('./chap06/data/images/*.jpg'):  ' ②
    q, is_suceed = image_quiz(g)

    if not is_suceed:
        continue


    divider = f''' 문제 {no}\n\n'
    print(divider)
    
    txt += divider
    ' 파일명 추출해 이미지 링크 만들기
    filename = os.path.basename(g) ' 마크다운에 표시할 이미지 파일 경로 설정   
    txt += f'![image]({filename})\n\n' 

    ' 문제 추가
    print(q)
    txt += q + '\n\n---------------------\n\n'
    ' 마크다운 파일로 저장
    with open('./chap06/data/images/image_quiz_eng.md', 'w', encoding='utf-8') as f:
        f.write(txt)

    ' 영어 문제만 추출
    eng = q.split('Listening: ')[1].split('정답:')[0].strip()

    eng_dict.append({
        'no': no,
        'eng': eng,
        'img': filename
    })

    ' json 파일로 저장
    with open('./chap06/data/images/image_quiz_eng.json', 'w', encoding='utf-8') as f:
        json.dump(eng_dict, f, ensure_ascii=False, indent=4)
    
    
    no += 1 ' 문제 번호 증가
LIST