model/app.py at main · v21c/model · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
from flask import Flask, render_template, request, session, redirect, url_for, send_file, jsonify
from openai import OpenAI
from openai_api_key import OPENAI_API_KEY, URI, CLIENT_ID, CLIENT_SECRET
import re
import pandas as pd
from pymongo.mongo_client import MongoClient
from pymongo.server_api import ServerApi
from bson import ObjectId
from pathlib import Path
import os
import uuid
import requests
import random

app = Flask(__name__)
app.secret_key = 'secretkey123'  # 세션을 위한 비밀 키 설정

uri = URI
client = MongoClient(uri, server_api=ServerApi('1'))
db = client['intheview']
userId = ObjectId('66a3324a1cc4ca962e4c9afe')

client = OpenAI(api_key=OPENAI_API_KEY)
df = pd.read_csv('/Users/kbsoo/coding/codes/python/model_test2/all_temp.csv')

voices = ['alloy', 'echo', 'fable', 'nova', 'onyx', 'shimmer']

def get_score(question, answer):
    prompt = f"""
    Look at the following question and answer from the given interview and rate the answer on a scale from 0 to 100.

    Question: {question}
    Answer: {answer}

    Score:
    """
    completion = client.chat.completions.create(
        model='gpt-4o',
        messages=[
            {"role": "system", "content": "You are an interview rating assistant."},
            {"role": "user", "content": prompt}
        ]
    )
    content = completion.choices[0].message.content
    score = re.search(r'Score:\s*(\d+)', content)

    return int(score.group(1)) if score else 0

def get_question(message, chat_history):
    occupation, gender, experience = message.split('/')

    filtered_df = df[(df['occupation'] == occupation) &
                     (df['gender'] == gender) &
                     (df['experience'] == experience.upper())]

    existing_qa = filtered_df[['question_text', 'answer_text']].values.tolist()

    chat_history_text = "\n".join([f"질문: {item['content']}" if item['type'] == 'question' else f"답변: {item['content']}" for item in chat_history])

    qa_prompt = f"""
    Based on the following questions and answers for {occupation} professionals who are {gender} and {experience}:

    {existing_qa}

    Additionally, consider the previous conversation:
    {chat_history_text}

    Generate a new, relevant question about career development, industry trends, or challenges faced by this group.
    The question should be inspired by the themes and insights present in the previous questions and answers, and should follow naturally from the previous answer.

    For example, if the previous question was about self-development and the answer was about reading books, the next question could be about what books they have recently read.

    Format the output as:
    질문: [Your generated question]

    The question should be in Korean.
    """

    completion = client.chat.completions.create(
        model='gpt-4o',
        messages=[
            {"role": "system", "content": "You are an interviewer who refers to the given files and asks questions according to job occupation/gender/experience"},
            {"role": "user", "content": qa_prompt}
        ]
    )
    content = completion.choices[0].message.content

    match = re.search(r'질문:\s*(.*)', content, re.DOTALL)

    if match:
        return match.group(1).strip()
    else:
        return "질문을 생성할 수 없습니다."

def calculate_average_score(session_id):
    session_data = db['sessions'].find_one({"_id": session_id})
    if not session_data:
        return 0  # Session data가 없을 경우 0을 반환

    scores = [item.get('score', 0) for item in session_data.get('chat_history', []) if item.get('score') is not None]
    if len(scores) == 1:
        return round(scores[0])  # 점수가 하나인 경우 그 점수를 반올림하여 반환
    elif len(scores) > 1:
        return round(sum(scores) / len(scores))  # 점수가 여러 개일 때 평균을 계산하고 반올림하여 반환
    return 0  # 점수가 없는 경우 0을 반환

def generate_speech(text):

    unique_filename = f"{uuid.uuid4()}.mp3"
    speech_file_path = Path(app.root_path) / "static" / unique_filename
    with client.audio.speech.with_streaming_response.create(
        model='tts-1',
        voice=random.choice(voices),
        input=text,
    ) as response:
        response.stream_to_file(str(speech_file_path))
        return f"static/{unique_filename}"

@app.route('/', methods=['GET', 'POST'])
def index():
    if 'chat_history' not in session:
        session['chat_history'] = []

    session_collection = db['sessions']
    user_collection = db['users']

    if request.method == 'POST':
        if 'start_chat' in request.form:
            input_text = request.form['input']
            session['initial_input'] = input_text  # 초기 입력값 저장

            # 새로운 세션 생성
            new_session = {"chat_history": []}
            result = session_collection.insert_one(new_session)
            session_id = result.inserted_id

            # 사용자 세션에 추가
            user_collection.update_one(
                {"_id": userId},
                {"$push": {"sessions": session_id}}
            )

            session['session_id'] = str(session_id)
            question = get_question(input_text, session['chat_history'])
            session['chat_history'] = [{'type': 'question', 'content': question}]

            # 새로 생성된 질문을 세션 데이터베이스에 추가
            session_collection.update_one(
                {"_id": session_id},
                {"$push": {"chat_history": {"question": question, "answer": "", "score": 0}}}
            )

            # TTS 생성
            speech_file = generate_speech(question)
            session['speech_file'] = speech_file
        elif 'user_answer' in request.form:
            user_answer = request.form['user_answer']

            if 'session_id' in session:
                session_id = ObjectId(session['session_id'])

                # 마지막 질문 가져오기
                last_question = session['chat_history'][-1]['content']
                score = get_score(last_question, user_answer)

                # 답변과 점수 업데이트
                session['chat_history'].append({'type': 'answer', 'content': user_answer, 'score': score})

                # 데이터베이스 업데이트
                session_collection.update_one(
                    {"_id": session_id, "chat_history.answer": ""},
                    {"$set": {"chat_history.$.answer": user_answer, "chat_history.$.score": score}}
                )

                if 'initial_input' in session:
                    question = get_question(session['initial_input'], session['chat_history'])
                else:
                    question = "죄송합니다. 새로운 질문을 생성할 수 없습니다. 채팅을 다시 시작해주세요."
                session['chat_history'].append({'type': 'question', 'content': question})

                # 새로운 질문 추가
                session_collection.update_one(
                    {"_id": session_id},
                    {"$push": {"chat_history": {"question": question, "answer": "", "score": 0}}}
                )

                # TTS 생성
                speech_file = generate_speech(question)
                session['speech_file'] = speech_file

        elif 'restart_chat' in request.form:
            session.clear()
            return redirect(url_for('index'))

        session.modified = True

    speech_file = session.get('speech_file', None)
    average_score = calculate_average_score(ObjectId(session['session_id'])) if 'session_id' in session else 0

    return render_template('index.html', chat_history=session.get('chat_history', []), average_score=average_score, speech_file=speech_file)

@app.route('/submit_voice_answer', methods=['POST'])
def submit_voice_answer():
    if 'audio' not in request.files:
        return jsonify({'error': 'No audio file provided'}), 400

    audio_file = request.files['audio']

    # 임시 파일로 저장
    temp_filename = f"temp_{uuid.uuid4()}.wav"
    temp_filepath = os.path.join(app.root_path, "static", temp_filename)
    audio_file.save(temp_filepath)

    # Naver STT API 호출
    lang = "Kor"
    url = "https://naveropenapi.apigw.ntruss.com/recog/v1/stt?lang=" + lang

    headers = {
        "X-NCP-APIGW-API-KEY-ID": CLIENT_ID,
        "X-NCP-APIGW-API-KEY": CLIENT_SECRET,
        "Content-Type": "application/octet-stream"
    }

    with open(temp_filepath, 'rb') as audio:
        response = requests.post(url, data=audio, headers=headers)

    # 임시 파일 삭제
    os.remove(temp_filepath)

    if response.status_code == 200:
        stt_result = response.json()
        transcribed_text = stt_result.get('text', '')
        print(f"Transcribed text: {transcribed_text}")

        return jsonify({
            'success': True,
            'transcribed_text': transcribed_text
        })

    return jsonify({'error': 'Failed to process audio'}), 500

@app.route('/get_audio')
def get_audio():
    file_path = request.args.get('file_path')
    if file_path:
        return send_file(file_path, mimetype="audio/mp3")
    else:
        return "파일 경로를 제공해야 합니다.", 400

if __name__ == '__main__':
    app.run(debug=True,port=5001, host='0.0.0.0')