moduwa-server/src/ai-prediction/services/ai.prediction.service.js at 77fa24c9f37611173f9c2150f66b3ac3a31cf055 · munwalk/moduwa-server · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
import { AiPredictionTimeoutError } from '../../errors/app.error.js';
import { countBySelectedSentence } from '../repositories/conversation.repository.js';

// FastAPI 서버 URL 설정
// Docker 환경에서는 서비스 이름(fastapi)으로 접근
const FASTAPI_URL = process.env.FASTAPI_URL || 'http://fastapi:8000';

/**
 * 학습 데이터를 활용한 추천 순위 재정렬 (순위 기반 점수 시스템)
 *
 * [최적화된 순위 기반 점수 시스템]
 * - GPT는 가장 적절한 문장을 먼저 출력하는 특성 활용
 * - GPT가 confidence 값을 생성하지 않아 응답 속도 향상 & JSON 에러 방지
 * - FastAPI에서 순위별 고정 점수 부여: 1위(0.6), 2위(0.5), 3위(0.4)
 * - 사용자 학습 데이터(빈도수)를 추가 점수로 합산 (최대 0.4)
 * - 최종 점수 = 순위 점수(0.6~0.4) + 빈도 점수(0~0.4) = 최대 1.0
 *
 * @param {Array} predictions - FastAPI에서 받은 추천 문장 배열 (confidence는 순위 점수)
 * @param {string} userId - 사용자 ID (빈도수 조회용)
 * @returns {Promise<Array>} 가중치가 적용되어 재정렬된 추천 문장 배열
 */
const rankByLearningData = async (predictions, userId) => {
  // userId가 없으면 빈도수 적용 불가 - 원본 순서 유지
  if (!userId || predictions.length === 0) {
    return predictions;
  }

  try {
    // 1. 각 문장의 사용 빈도 조회 (DB 호출)
    const dbStart = Date.now();
    const frequencies = await Promise.all(
      predictions.map(pred =>
        countBySelectedSentence(userId, pred.sentence)
      )
    );
    const dbEnd = Date.now();
    console.log(`⏱️ [Performance] DB 빈도수 조회 소요 시간: ${dbEnd - dbStart}ms (${predictions.length}개 문장)`);

    // 2. 최대 빈도수 계산
    const maxFrequency = Math.max(...frequencies, 0);

    // 3. 콜드 스타트 방어: 모든 빈도가 0인 경우 (처음 쓰는 단어 조합)
    if (maxFrequency === 0) {
      return predictions.map((pred, index) => ({
        ...pred,
        usageFrequency: 0,
        normalizedFrequency: 0,
        finalScore: parseFloat(pred.confidence).toFixed(2) // 순위 점수 그대로 유지
      }));
    }

    // 4. 가중치 계산: 순위 점수(FastAPI에서 설정) + 빈도 점수 (최대 0.4)
    const scoredPredictions = predictions.map((pred, index) => {
      const frequency = frequencies[index];
      const normalizedFreq = frequency / maxFrequency; // 0~1 범위

      // 가중치 공식: 순위 점수(0.6/0.5/0.4) + 빈도 점수(최대 0.4)
      const rankScore = pred.confidence; // FastAPI에서 이미 순위별로 설정됨
      const frequencyScore = normalizedFreq * 0.4;
      const finalScore = rankScore + frequencyScore;

      return {
        ...pred,
        usageFrequency: frequency,
        normalizedFrequency: normalizedFreq,
        finalScore: finalScore.toFixed(2)
      };
    });

    // 5. 점수 기준 내림차순 정렬
    scoredPredictions.sort((a, b) => b.finalScore - a.finalScore);

    console.log('📊 순위 기반 가중치 재정렬 완료:', scoredPredictions.map(p => ({
      sentence: p.sentence.substring(0, 15) + '...',
      rankScore: p.confidence.toFixed(2),
      frequency: p.usageFrequency,
      finalScore: p.finalScore
    })));

    return scoredPredictions;

  } catch (error) {
    console.error('⚠️ 빈도수 조회 실패, 원본 순서 유지:', error.message);
    return predictions;
  }
};

/**
 * AI-01: FastAPI 서버를 통해 낱말 조합으로부터 문장 3개를 생성
 *
 * FastAPI 서버:
 * - Endpoint: POST /api/ai/predictions
 * - OpenAI GPT-4o-mini 호출
 * - Redis 캐싱 (1시간 TTL)
 * - Temperature 0.3 (문법적 정확성 우선)
 *
 * @param {Array<string>} words - 선택된 낱말 카드 배열 (1~10개)
 * @param {string} typedText - 사용자가 직접 입력한 텍스트 (현재 미사용)
 * @param {Object} context - 문맥 정보
 * @param {boolean} refresh - 캐시 무시하고 새로 생성할지 여부
 * @param {string} userId - 사용자 ID (학습 데이터 가중치 적용용)
 * @returns {Promise<Array>} 추천 문장 3개 (빈도수 가중치 적용 후 정렬)
 */
const predictSentences = async (words = [], typedText = '', context = {}, refresh = false, userId = null, tone = null) => {
  const { currentTime, previousMessages = [] } = context;

  // FastAPI 요청 페이로드 생성
  const payload = {
    words,
    context: {
      currentTime: currentTime,
      previousMessages: previousMessages.slice(-3) // 최근 3개만 전달
    },
    refresh,
    ...(tone && { tone }) // tone이 있을 때만 포함
  };

  // AbortController로 타임아웃 처리 (10초)
  const controller = new AbortController();
  const timeoutId = setTimeout(() => controller.abort(), 10000);

  try {
    // FastAPI 서버 호출
    const response = await fetch(`${FASTAPI_URL}/api/ai/predictions`, {
      method: 'POST',
      headers: {
        'Content-Type': 'application/json'
      },
      body: JSON.stringify(payload),
      signal: controller.signal
    });

    clearTimeout(timeoutId);

    if (!response.ok) {
      const errorData = await response.json().catch(() => ({}));
      throw new Error(errorData.detail || `FastAPI 서버 오류: ${response.status}`);
    }

    const result = await response.json();

    // FastAPI 응답 검증
    if (!result.predictions || !Array.isArray(result.predictions)) {
      throw new Error('AI 응답 형식 오류: predictions 배열이 없습니다');
    }

    // 1단계: 응답 정규화 (FastAPI에서 문자열 배열로 반환됨)
    const rankScores = [0.6, 0.5, 0.4]; // 순위별 기본 점수
    const normalizedPredictions = result.predictions.slice(0, 3).map((pred, index) => ({
      sentence: typeof pred === 'string' ? pred : pred.sentence,
      confidence: rankScores[index] || 0.4
    }));

    // 2단계: 학습 데이터 가중치 적용 및 재정렬
    const rankedPredictions = await rankByLearningData(normalizedPredictions, userId);

    // 최종 반환: { predictions, rawPredictions }
    // rawPredictions는 캐싱용 (사용자별 가중치 미적용)
    return {
      predictions: rankedPredictions.map(pred => ({
        sentence: pred.sentence,
        confidence: pred.finalScore || pred.confidence
      })),
      rawPredictions: normalizedPredictions // 캐싱용 원본
    };
  } catch (error) {
    clearTimeout(timeoutId);

    // AbortError는 타임아웃
    if (error.name === 'AbortError') {
      throw new AiPredictionTimeoutError('AI 응답이 10초를 초과했습니다');
    }

    // 그 외 에러는 그대로 전달
    throw error;
  }
};

export { predictSentences, rankByLearningData };