imetting_backend/app/api/endpoints/meetings.py

930 lines
43 KiB
Python
Raw Normal View History

2025-11-24 15:10:06 +00:00
from fastapi import APIRouter, UploadFile, File, Form, Depends, BackgroundTasks, Request, Header
from fastapi.responses import StreamingResponse, Response
2025-09-30 04:14:19 +00:00
from app.models.models import Meeting, TranscriptSegment, TranscriptionTaskStatus, CreateMeetingRequest, UpdateMeetingRequest, SpeakerTagUpdateRequest, BatchSpeakerTagUpdateRequest, BatchTranscriptUpdateRequest, Tag
2025-08-05 01:46:40 +00:00
from app.core.database import get_db_connection
2025-09-25 03:48:02 +00:00
from app.core.config import BASE_DIR, AUDIO_DIR, MARKDOWN_DIR, ALLOWED_EXTENSIONS, ALLOWED_IMAGE_EXTENSIONS
import app.core.config as config_module
2025-08-26 13:57:16 +00:00
from app.services.llm_service import LLMService
2025-08-28 08:02:59 +00:00
from app.services.async_transcription_service import AsyncTranscriptionService
from app.services.async_meeting_service import async_meeting_service
2025-12-11 08:48:12 +00:00
from app.services.audio_service import handle_audio_upload
2025-09-25 03:48:02 +00:00
from app.core.auth import get_current_user
2025-09-26 07:47:37 +00:00
from app.core.response import create_api_response
2025-09-19 08:51:07 +00:00
from typing import List, Optional
2025-09-09 03:35:56 +00:00
from datetime import datetime
2025-08-26 13:57:16 +00:00
from pydantic import BaseModel
2025-11-24 15:10:06 +00:00
from urllib.parse import quote
2025-08-05 01:46:40 +00:00
import os
import uuid
import shutil
2025-11-24 15:10:06 +00:00
import mimetypes
2025-08-05 01:46:40 +00:00
router = APIRouter()
2025-08-26 13:57:16 +00:00
llm_service = LLMService()
2025-08-28 08:02:59 +00:00
transcription_service = AsyncTranscriptionService()
2025-08-26 13:57:16 +00:00
class GenerateSummaryRequest(BaseModel):
user_prompt: Optional[str] = ""
2025-12-11 08:48:12 +00:00
prompt_id: Optional[int] = None # 提示词模版ID如果不指定则使用默认模版
2025-08-26 13:57:16 +00:00
2025-11-24 15:10:06 +00:00
2025-10-31 06:54:54 +00:00
def _process_tags(cursor, tag_string: Optional[str], creator_id: Optional[int] = None) -> List[Tag]:
"""
处理标签查询已存在的标签如果提供了 creator_id 则创建不存在的标签
"""
2025-09-19 08:51:07 +00:00
if not tag_string:
return []
tag_names = [name.strip() for name in tag_string.split(',') if name.strip()]
if not tag_names:
return []
2025-10-31 06:54:54 +00:00
# 如果提供了 creator_id则创建不存在的标签
if creator_id:
insert_ignore_query = "INSERT IGNORE INTO tags (name, creator_id) VALUES (%s, %s)"
cursor.executemany(insert_ignore_query, [(name, creator_id) for name in tag_names])
# 查询所有标签信息
2025-09-19 08:51:07 +00:00
format_strings = ', '.join(['%s'] * len(tag_names))
cursor.execute(f"SELECT id, name, color FROM tags WHERE name IN ({format_strings})", tuple(tag_names))
tags_data = cursor.fetchall()
return [Tag(**tag) for tag in tags_data]
2025-09-26 07:47:37 +00:00
@router.get("/meetings")
2025-11-07 09:12:29 +00:00
def get_meetings(
current_user: dict = Depends(get_current_user),
user_id: Optional[int] = None,
page: int = 1,
page_size: Optional[int] = None,
search: Optional[str] = None,
tags: Optional[str] = None,
filter_type: str = "all"
):
from app.core.config import TIMELINE_PAGESIZE
# 使用配置的默认页面大小
if page_size is None:
page_size = TIMELINE_PAGESIZE
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-11-07 09:12:29 +00:00
# 构建WHERE子句
where_conditions = []
params = []
# 用户过滤
if user_id:
# 需要联表查询参与者
has_attendees_join = True
else:
has_attendees_join = False
# 按类型过滤 (created/attended/all)
if user_id:
if filter_type == "created":
where_conditions.append("m.user_id = %s")
params.append(user_id)
elif filter_type == "attended":
where_conditions.append("m.user_id != %s AND a.user_id = %s")
params.extend([user_id, user_id])
has_attendees_join = True
else: # all
where_conditions.append("(m.user_id = %s OR a.user_id = %s)")
params.extend([user_id, user_id])
has_attendees_join = True
# 搜索关键词过滤
if search and search.strip():
search_pattern = f"%{search.strip()}%"
where_conditions.append("(m.title LIKE %s OR u.caption LIKE %s)")
params.extend([search_pattern, search_pattern])
# 标签过滤
if tags and tags.strip():
tag_list = [t.strip() for t in tags.split(',') if t.strip()]
if tag_list:
# 使用JSON_CONTAINS或LIKE查询
tag_conditions = []
for tag in tag_list:
tag_conditions.append("m.tags LIKE %s")
params.append(f"%{tag}%")
where_conditions.append(f"({' OR '.join(tag_conditions)})")
# 构建基础查询
2025-08-05 01:46:40 +00:00
base_query = '''
2025-09-26 07:47:37 +00:00
SELECT m.meeting_id, m.title, m.meeting_time, m.summary, m.created_at, m.tags,
2025-10-15 06:31:25 +00:00
m.user_id as creator_id, u.caption as creator_username, af.file_path as audio_file_path
2025-11-07 09:12:29 +00:00
FROM meetings m
JOIN users u ON m.user_id = u.user_id
LEFT JOIN audio_files af ON m.meeting_id = af.meeting_id
2025-08-05 01:46:40 +00:00
'''
2025-11-07 09:12:29 +00:00
if has_attendees_join:
base_query += " LEFT JOIN attendees a ON m.meeting_id = a.meeting_id"
# 添加WHERE子句
if where_conditions:
base_query += f" WHERE {' AND '.join(where_conditions)}"
# 获取总数 - 需要在添加 GROUP BY 之前
count_base = base_query # 保存一份不含GROUP BY的查询
if has_attendees_join:
# 如果有联表,使用子查询计数
count_query = f"SELECT COUNT(DISTINCT m.meeting_id) as total {count_base[count_base.find('FROM'):]}"
2025-08-05 01:46:40 +00:00
else:
2025-11-07 09:12:29 +00:00
# 没有联表,直接计数
count_query = f"SELECT COUNT(*) as total {count_base[count_base.find('FROM'):]}"
cursor.execute(count_query, params)
total = cursor.fetchone()['total']
# 添加GROUP BY如果联表了attendees
if has_attendees_join:
base_query += " GROUP BY m.meeting_id"
# 计算分页
total_pages = (total + page_size - 1) // page_size
has_more = page < total_pages
offset = (page - 1) * page_size
# 添加排序和分页
query = f"{base_query} ORDER BY m.meeting_time DESC, m.created_at DESC LIMIT %s OFFSET %s"
params.extend([page_size, offset])
cursor.execute(query, params)
2025-08-05 01:46:40 +00:00
meetings = cursor.fetchall()
2025-11-07 09:12:29 +00:00
2025-08-05 01:46:40 +00:00
meeting_list = []
for meeting in meetings:
2025-09-26 07:47:37 +00:00
attendees_query = 'SELECT u.user_id, u.caption FROM attendees a JOIN users u ON a.user_id = u.user_id WHERE a.meeting_id = %s'
2025-08-05 01:46:40 +00:00
cursor.execute(attendees_query, (meeting['meeting_id'],))
attendees_data = cursor.fetchall()
attendees = [{'user_id': row['user_id'], 'caption': row['caption']} for row in attendees_data]
2025-11-07 09:12:29 +00:00
tags_list = _process_tags(cursor, meeting.get('tags'))
2025-08-05 01:46:40 +00:00
meeting_list.append(Meeting(
2025-09-26 07:47:37 +00:00
meeting_id=meeting['meeting_id'], title=meeting['title'], meeting_time=meeting['meeting_time'],
2025-10-15 06:31:25 +00:00
summary=meeting['summary'], created_at=meeting['created_at'], audio_file_path=meeting['audio_file_path'],
2025-11-07 09:12:29 +00:00
attendees=attendees, creator_id=meeting['creator_id'], creator_username=meeting['creator_username'], tags=tags_list
2025-08-05 01:46:40 +00:00
))
2025-11-07 09:12:29 +00:00
return create_api_response(code="200", message="获取会议列表成功", data={
"meetings": meeting_list,
"total": total,
"page": page,
"page_size": page_size,
"total_pages": total_pages,
"has_more": has_more
})
@router.get("/meetings/stats")
def get_meetings_stats(
current_user: dict = Depends(get_current_user),
user_id: Optional[int] = None
):
"""
获取会议统计数据全部会议我创建的会议我参加的会议数量
"""
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
if not user_id:
return create_api_response(code="400", message="user_id is required")
# 获取全部会议数量(创建的 + 参加的)
all_query = '''
SELECT COUNT(DISTINCT m.meeting_id) as count
FROM meetings m
LEFT JOIN attendees a ON m.meeting_id = a.meeting_id
WHERE m.user_id = %s OR a.user_id = %s
'''
cursor.execute(all_query, (user_id, user_id))
all_count = cursor.fetchone()['count']
# 获取我创建的会议数量
created_query = '''
SELECT COUNT(*) as count
FROM meetings m
WHERE m.user_id = %s
'''
cursor.execute(created_query, (user_id,))
created_count = cursor.fetchone()['count']
# 获取我参加的会议数量(不包括我创建的)
attended_query = '''
SELECT COUNT(DISTINCT a.meeting_id) as count
FROM attendees a
JOIN meetings m ON a.meeting_id = m.meeting_id
WHERE a.user_id = %s AND m.user_id != %s
'''
cursor.execute(attended_query, (user_id, user_id))
attended_count = cursor.fetchone()['count']
return create_api_response(code="200", message="获取会议统计成功", data={
"all_meetings": all_count,
"created_meetings": created_count,
"attended_meetings": attended_count
})
2025-08-05 01:46:40 +00:00
2025-09-26 07:47:37 +00:00
@router.get("/meetings/{meeting_id}")
2025-08-29 08:37:29 +00:00
def get_meeting_details(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
query = '''
2025-09-26 07:47:37 +00:00
SELECT m.meeting_id, m.title, m.meeting_time, m.summary, m.created_at, m.tags,
m.user_id as creator_id, u.caption as creator_username, af.file_path as audio_file_path
FROM meetings m JOIN users u ON m.user_id = u.user_id LEFT JOIN audio_files af ON m.meeting_id = af.meeting_id
2025-08-05 01:46:40 +00:00
WHERE m.meeting_id = %s
'''
cursor.execute(query, (meeting_id,))
meeting = cursor.fetchone()
if not meeting:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
attendees_query = 'SELECT u.user_id, u.caption FROM attendees a JOIN users u ON a.user_id = u.user_id WHERE a.meeting_id = %s'
2025-08-05 01:46:40 +00:00
cursor.execute(attendees_query, (meeting['meeting_id'],))
attendees_data = cursor.fetchall()
attendees = [{'user_id': row['user_id'], 'caption': row['caption']} for row in attendees_data]
2025-09-19 08:51:07 +00:00
tags = _process_tags(cursor, meeting.get('tags'))
2025-08-28 08:02:59 +00:00
cursor.close()
2025-08-05 01:46:40 +00:00
meeting_data = Meeting(
2025-09-26 07:47:37 +00:00
meeting_id=meeting['meeting_id'], title=meeting['title'], meeting_time=meeting['meeting_time'],
summary=meeting['summary'], created_at=meeting['created_at'], attendees=attendees,
creator_id=meeting['creator_id'], creator_username=meeting['creator_username'], tags=tags
2025-08-05 01:46:40 +00:00
)
if meeting['audio_file_path']:
meeting_data.audio_file_path = meeting['audio_file_path']
2025-08-28 08:02:59 +00:00
try:
transcription_status_data = transcription_service.get_meeting_transcription_status(meeting_id)
if transcription_status_data:
meeting_data.transcription_status = TranscriptionTaskStatus(**transcription_status_data)
except Exception as e:
print(f"Warning: Failed to get transcription status for meeting {meeting_id}: {e}")
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="获取会议详情成功", data=meeting_data)
2025-08-05 01:46:40 +00:00
2025-09-26 07:47:37 +00:00
@router.get("/meetings/{meeting_id}/transcript")
2025-08-29 08:37:29 +00:00
def get_meeting_transcript(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-09-26 07:47:37 +00:00
cursor.execute("SELECT meeting_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
2025-08-05 01:46:40 +00:00
if not cursor.fetchone():
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
2025-08-05 01:46:40 +00:00
transcript_query = '''
2025-08-25 08:10:29 +00:00
SELECT segment_id, meeting_id, speaker_id, speaker_tag, start_time_ms, end_time_ms, text_content
2025-09-26 07:47:37 +00:00
FROM transcript_segments WHERE meeting_id = %s ORDER BY start_time_ms ASC
2025-08-05 01:46:40 +00:00
'''
cursor.execute(transcript_query, (meeting_id,))
segments = cursor.fetchall()
2025-09-26 07:47:37 +00:00
transcript_segments = [TranscriptSegment(
segment_id=s['segment_id'], meeting_id=s['meeting_id'], speaker_id=s['speaker_id'],
speaker_tag=s['speaker_tag'] if s['speaker_tag'] else f"发言人 {s['speaker_id']}",
start_time_ms=s['start_time_ms'], end_time_ms=s['end_time_ms'], text_content=s['text_content']
) for s in segments]
return create_api_response(code="200", message="获取转录内容成功", data=transcript_segments)
2025-08-05 01:46:40 +00:00
@router.post("/meetings")
2025-08-29 08:37:29 +00:00
def create_meeting(meeting_request: CreateMeetingRequest, current_user: dict = Depends(get_current_user)):
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-10-31 06:54:54 +00:00
# 使用 _process_tags 来处理标签创建
2025-09-19 08:51:07 +00:00
if meeting_request.tags:
2025-10-31 06:54:54 +00:00
_process_tags(cursor, meeting_request.tags, current_user['user_id'])
2025-09-26 07:47:37 +00:00
meeting_query = 'INSERT INTO meetings (user_id, title, meeting_time, summary, tags, created_at) VALUES (%s, %s, %s, %s, %s, %s)'
cursor.execute(meeting_query, (meeting_request.user_id, meeting_request.title, meeting_request.meeting_time, None, meeting_request.tags, datetime.now().isoformat()))
2025-08-05 01:46:40 +00:00
meeting_id = cursor.lastrowid
for attendee_id in meeting_request.attendee_ids:
2025-09-26 07:47:37 +00:00
cursor.execute('INSERT IGNORE INTO attendees (meeting_id, user_id) VALUES (%s, %s)', (meeting_id, attendee_id))
2025-08-05 01:46:40 +00:00
connection.commit()
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Meeting created successfully", data={"meeting_id": meeting_id})
2025-08-05 01:46:40 +00:00
@router.put("/meetings/{meeting_id}")
2025-08-29 08:37:29 +00:00
def update_meeting(meeting_id: int, meeting_request: UpdateMeetingRequest, current_user: dict = Depends(get_current_user)):
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-08-29 08:37:29 +00:00
cursor.execute("SELECT user_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
meeting = cursor.fetchone()
if not meeting:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
2025-08-29 08:37:29 +00:00
if meeting['user_id'] != current_user['user_id']:
2025-09-26 07:47:37 +00:00
return create_api_response(code="403", message="Permission denied")
2025-10-31 06:54:54 +00:00
# 使用 _process_tags 来处理标签创建
2025-09-19 08:51:07 +00:00
if meeting_request.tags:
2025-10-31 06:54:54 +00:00
_process_tags(cursor, meeting_request.tags, current_user['user_id'])
2025-09-26 07:47:37 +00:00
update_query = 'UPDATE meetings SET title = %s, meeting_time = %s, summary = %s, tags = %s WHERE meeting_id = %s'
cursor.execute(update_query, (meeting_request.title, meeting_request.meeting_time, meeting_request.summary, meeting_request.tags, meeting_id))
2025-08-05 01:46:40 +00:00
cursor.execute("DELETE FROM attendees WHERE meeting_id = %s", (meeting_id,))
for attendee_id in meeting_request.attendee_ids:
2025-09-26 07:47:37 +00:00
cursor.execute('INSERT INTO attendees (meeting_id, user_id) VALUES (%s, %s)', (meeting_id, attendee_id))
2025-08-05 01:46:40 +00:00
connection.commit()
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Meeting updated successfully")
2025-08-05 01:46:40 +00:00
@router.delete("/meetings/{meeting_id}")
2025-08-29 08:37:29 +00:00
def delete_meeting(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-08-29 08:37:29 +00:00
cursor.execute("SELECT user_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
meeting = cursor.fetchone()
if not meeting:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
2025-08-29 08:37:29 +00:00
if meeting['user_id'] != current_user['user_id']:
2025-09-26 07:47:37 +00:00
return create_api_response(code="403", message="Permission denied")
2025-08-05 01:46:40 +00:00
cursor.execute("DELETE FROM transcript_segments WHERE meeting_id = %s", (meeting_id,))
cursor.execute("DELETE FROM audio_files WHERE meeting_id = %s", (meeting_id,))
cursor.execute("DELETE FROM attachments WHERE meeting_id = %s", (meeting_id,))
cursor.execute("DELETE FROM attendees WHERE meeting_id = %s", (meeting_id,))
cursor.execute("DELETE FROM meetings WHERE meeting_id = %s", (meeting_id,))
connection.commit()
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Meeting deleted successfully")
2025-08-05 01:46:40 +00:00
2025-09-26 07:47:37 +00:00
@router.get("/meetings/{meeting_id}/edit")
2025-08-29 08:37:29 +00:00
def get_meeting_for_edit(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
query = '''
2025-09-26 07:47:37 +00:00
SELECT m.meeting_id, m.title, m.meeting_time, m.summary, m.created_at, m.tags,
m.user_id as creator_id, u.caption as creator_username, af.file_path as audio_file_path
FROM meetings m JOIN users u ON m.user_id = u.user_id LEFT JOIN audio_files af ON m.meeting_id = af.meeting_id
2025-08-05 01:46:40 +00:00
WHERE m.meeting_id = %s
'''
cursor.execute(query, (meeting_id,))
meeting = cursor.fetchone()
if not meeting:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
attendees_query = 'SELECT u.user_id, u.caption FROM attendees a JOIN users u ON a.user_id = u.user_id WHERE a.meeting_id = %s'
cursor.execute(attendees_query, (meeting['meeting_id'],))
2025-08-05 01:46:40 +00:00
attendees_data = cursor.fetchall()
attendees = [{'user_id': row['user_id'], 'caption': row['caption']} for row in attendees_data]
2025-09-19 08:51:07 +00:00
tags = _process_tags(cursor, meeting.get('tags'))
2025-08-28 08:02:59 +00:00
cursor.close()
2025-08-05 01:46:40 +00:00
meeting_data = Meeting(
2025-09-26 07:47:37 +00:00
meeting_id=meeting['meeting_id'], title=meeting['title'], meeting_time=meeting['meeting_time'],
summary=meeting['summary'], created_at=meeting['created_at'], attendees=attendees,
creator_id=meeting['creator_id'], creator_username=meeting['creator_username'], tags=tags
2025-08-05 01:46:40 +00:00
)
2025-08-26 13:57:16 +00:00
if meeting.get('audio_file_path'):
2025-08-05 01:46:40 +00:00
meeting_data.audio_file_path = meeting['audio_file_path']
2025-08-28 08:02:59 +00:00
try:
transcription_status_data = transcription_service.get_meeting_transcription_status(meeting_id)
if transcription_status_data:
meeting_data.transcription_status = TranscriptionTaskStatus(**transcription_status_data)
except Exception as e:
print(f"Warning: Failed to get transcription status for meeting {meeting_id}: {e}")
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="获取会议编辑信息成功", data=meeting_data)
2025-08-05 01:46:40 +00:00
@router.post("/meetings/upload-audio")
2025-11-24 15:10:06 +00:00
async def upload_audio(
audio_file: UploadFile = File(...),
meeting_id: int = Form(...),
auto_summarize: str = Form("true"),
2025-12-11 08:48:12 +00:00
prompt_id: Optional[int] = Form(None), # 可选的提示词模版ID
2025-11-24 15:10:06 +00:00
background_tasks: BackgroundTasks = None,
current_user: dict = Depends(get_current_user)
):
"""
音频文件上传接口
上传音频文件并启动转录任务可选择是否自动生成总结
Args:
audio_file: 音频文件
meeting_id: 会议ID
auto_summarize: 是否自动生成总结"true"/"false"默认"true"
2025-12-11 08:48:12 +00:00
prompt_id: 提示词模版ID可选如果不指定则使用默认模版
2025-11-24 15:10:06 +00:00
background_tasks: FastAPI后台任务
current_user: 当前登录用户
Returns:
HTTP 200: 处理成功返回任务ID
HTTP 400/403/404/500: 各种错误情况
"""
auto_summarize_bool = auto_summarize.lower() in ("true", "1", "yes")
2025-12-11 08:48:12 +00:00
# 打印接收到的 prompt_id
print(f"[Upload Audio] Meeting ID: {meeting_id}, Received prompt_id: {prompt_id}, Type: {type(prompt_id)}, Auto-summarize: {auto_summarize_bool}")
# 1. 文件类型验证
file_extension = os.path.splitext(audio_file.filename)[1].lower()
if file_extension not in ALLOWED_EXTENSIONS:
return create_api_response(
code="400",
message=f"不支持的文件类型。支持的类型: {', '.join(ALLOWED_EXTENSIONS)}"
)
2025-11-24 15:10:06 +00:00
2025-12-11 08:48:12 +00:00
# 2. 文件大小验证
max_file_size = getattr(config_module, 'MAX_FILE_SIZE', 100 * 1024 * 1024)
if audio_file.size > max_file_size:
return create_api_response(
code="400",
message=f"文件大小超过 {max_file_size // (1024 * 1024)}MB 限制"
)
# 3. 保存音频文件到磁盘
meeting_dir = AUDIO_DIR / str(meeting_id)
meeting_dir.mkdir(exist_ok=True)
unique_filename = f"{uuid.uuid4()}{file_extension}"
absolute_path = meeting_dir / unique_filename
relative_path = absolute_path.relative_to(BASE_DIR)
try:
with open(absolute_path, "wb") as buffer:
shutil.copyfileobj(audio_file.file, buffer)
except Exception as e:
return create_api_response(code="500", message=f"保存文件失败: {str(e)}")
file_path = '/' + str(relative_path)
file_name = audio_file.filename
file_size = audio_file.size
# 4. 调用 audio_service 处理文件(权限检查、数据库更新、启动转录)
result = handle_audio_upload(
file_path=file_path,
file_name=file_name,
file_size=file_size,
meeting_id=meeting_id,
current_user=current_user,
auto_summarize=auto_summarize_bool,
background_tasks=background_tasks,
prompt_id=prompt_id # 传递 prompt_id 参数
)
# 如果不成功,删除已保存的文件并返回错误
2025-11-24 15:10:06 +00:00
if not result["success"]:
2025-12-11 08:48:12 +00:00
if absolute_path.exists():
try:
os.remove(absolute_path)
print(f"Deleted file due to processing error: {absolute_path}")
except Exception as e:
print(f"Warning: Failed to delete file {absolute_path}: {e}")
2025-11-24 15:10:06 +00:00
return result["response"]
2025-12-11 08:48:12 +00:00
# 5. 返回成功响应
2025-11-24 15:10:06 +00:00
transcription_task_id = result["transcription_task_id"]
2025-12-11 08:48:12 +00:00
message_suffix = ""
if transcription_task_id:
if auto_summarize_bool:
message_suffix = ",正在进行转录和总结"
else:
message_suffix = ",正在进行转录"
2025-11-24 15:10:06 +00:00
return create_api_response(
code="200",
message="Audio file uploaded successfully" +
(" and replaced existing file" if result["replaced_existing"] else "") +
message_suffix,
data={
"file_name": result["file_info"]["file_name"],
"file_path": result["file_info"]["file_path"],
"task_id": transcription_task_id,
"transcription_started": transcription_task_id is not None,
"auto_summarize": auto_summarize_bool,
"replaced_existing": result["replaced_existing"],
"previous_transcription_cleared": result["replaced_existing"] and result["has_transcription"]
}
)
2025-08-05 01:46:40 +00:00
@router.get("/meetings/{meeting_id}/audio")
2025-08-29 08:37:29 +00:00
def get_audio_file(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-05 01:46:40 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-09-26 07:47:37 +00:00
cursor.execute("SELECT file_name, file_path, file_size, upload_time FROM audio_files WHERE meeting_id = %s", (meeting_id,))
2025-08-05 01:46:40 +00:00
audio_file = cursor.fetchone()
if not audio_file:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Audio file not found for this meeting")
return create_api_response(code="200", message="Audio file found", data=audio_file)
2025-08-06 07:07:02 +00:00
2025-11-24 15:10:06 +00:00
@router.get("/meetings/{meeting_id}/audio/stream")
async def stream_audio_file(
meeting_id: int,
range: Optional[str] = Header(None, alias="Range")
):
"""
音频文件流式传输端点支持HTTP Range请求Safari浏览器必需
无需登录认证用于前端audio标签直接访问
"""
# 获取音频文件信息
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
cursor.execute("SELECT file_name, file_path, file_size FROM audio_files WHERE meeting_id = %s", (meeting_id,))
audio_file = cursor.fetchone()
if not audio_file:
return Response(content="Audio file not found", status_code=404)
# 构建完整文件路径
file_path = BASE_DIR / audio_file['file_path'].lstrip('/')
if not file_path.exists():
return Response(content="Audio file not found on disk", status_code=404)
# 总是使用实际文件大小(不依赖数据库记录,防止文件被优化后大小不匹配)
file_size = os.path.getsize(file_path)
file_name = audio_file['file_name']
# 根据文件扩展名确定MIME类型
extension = os.path.splitext(file_name)[1].lower()
mime_types = {
'.mp3': 'audio/mpeg',
'.m4a': 'audio/mp4',
'.wav': 'audio/wav',
'.mpeg': 'audio/mpeg',
'.mp4': 'audio/mp4'
}
content_type = mime_types.get(extension, 'audio/mpeg')
# 处理Range请求
start = 0
end = file_size - 1
if range:
# 解析Range头: "bytes=start-end" 或 "bytes=start-"
try:
range_spec = range.replace("bytes=", "")
if "-" in range_spec:
parts = range_spec.split("-")
if parts[0]:
start = int(parts[0])
if parts[1]:
end = int(parts[1])
except (ValueError, IndexError):
pass
# 确保范围有效
if start >= file_size:
return Response(
content="Range Not Satisfiable",
status_code=416,
headers={"Content-Range": f"bytes */{file_size}"}
)
end = min(end, file_size - 1)
content_length = end - start + 1
# 对所有文件名统一使用RFC 5987标准的URL编码格式
# 这样可以正确处理中文、特殊字符等所有情况
encoded_filename = quote(file_name)
filename_header = f"inline; filename*=UTF-8''{encoded_filename}"
# 生成器函数用于流式读取文件
def iter_file():
with open(file_path, 'rb') as f:
f.seek(start)
remaining = content_length
chunk_size = 64 * 1024 # 64KB chunks
while remaining > 0:
read_size = min(chunk_size, remaining)
data = f.read(read_size)
if not data:
break
remaining -= len(data)
yield data
# 根据是否有Range请求返回不同的响应
if range:
return StreamingResponse(
iter_file(),
status_code=206, # Partial Content
media_type=content_type,
headers={
"Content-Range": f"bytes {start}-{end}/{file_size}",
"Accept-Ranges": "bytes",
"Content-Length": str(content_length),
"Content-Disposition": filename_header
}
)
else:
return StreamingResponse(
iter_file(),
status_code=200,
media_type=content_type,
headers={
"Accept-Ranges": "bytes",
"Content-Length": str(file_size),
"Content-Disposition": filename_header
}
)
2025-08-28 08:02:59 +00:00
@router.get("/meetings/{meeting_id}/transcription/status")
2025-08-29 08:37:29 +00:00
def get_meeting_transcription_status(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-28 08:02:59 +00:00
try:
status_info = transcription_service.get_meeting_transcription_status(meeting_id)
if not status_info:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="No transcription task found for this meeting")
return create_api_response(code="200", message="Transcription status retrieved", data=status_info)
2025-08-28 08:02:59 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to get meeting transcription status: {str(e)}")
2025-08-28 08:02:59 +00:00
@router.post("/meetings/{meeting_id}/transcription/start")
2025-08-29 08:37:29 +00:00
def start_meeting_transcription(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-28 08:02:59 +00:00
try:
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
cursor.execute("SELECT meeting_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
if not cursor.fetchone():
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
cursor.execute("SELECT file_path FROM audio_files WHERE meeting_id = %s LIMIT 1", (meeting_id,))
2025-08-28 08:02:59 +00:00
audio_file = cursor.fetchone()
if not audio_file:
2025-09-26 07:47:37 +00:00
return create_api_response(code="400", message="No audio file found for this meeting")
2025-08-28 08:02:59 +00:00
existing_status = transcription_service.get_meeting_transcription_status(meeting_id)
if existing_status and existing_status['status'] in ['pending', 'processing']:
2025-09-26 07:47:37 +00:00
return create_api_response(code="409", message="Transcription task already exists", data={
"task_id": existing_status['task_id'], "status": existing_status['status']
})
2025-08-28 08:02:59 +00:00
task_id = transcription_service.start_transcription(meeting_id, audio_file['file_path'])
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Transcription task started successfully", data={
"task_id": task_id, "meeting_id": meeting_id
})
2025-08-28 08:02:59 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to start transcription: {str(e)}")
2025-08-28 08:02:59 +00:00
2025-08-06 07:07:02 +00:00
@router.post("/meetings/{meeting_id}/upload-image")
2025-09-26 07:47:37 +00:00
async def upload_image(meeting_id: int, image_file: UploadFile = File(...), current_user: dict = Depends(get_current_user)):
2025-08-06 07:07:02 +00:00
file_extension = os.path.splitext(image_file.filename)[1].lower()
if file_extension not in ALLOWED_IMAGE_EXTENSIONS:
2025-09-26 07:47:37 +00:00
return create_api_response(code="400", message=f"Unsupported image type. Allowed types: {', '.join(ALLOWED_IMAGE_EXTENSIONS)}")
2025-09-25 03:48:02 +00:00
max_image_size = getattr(config_module, 'MAX_IMAGE_SIZE', 10 * 1024 * 1024)
if image_file.size > max_image_size:
2025-09-26 07:47:37 +00:00
return create_api_response(code="400", message=f"Image size exceeds {max_image_size // (1024 * 1024)}MB limit")
2025-08-06 07:07:02 +00:00
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-08-29 08:37:29 +00:00
cursor.execute("SELECT user_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
meeting = cursor.fetchone()
if not meeting:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
2025-08-29 08:37:29 +00:00
if meeting['user_id'] != current_user['user_id']:
2025-09-26 07:47:37 +00:00
return create_api_response(code="403", message="Permission denied")
2025-08-06 07:07:02 +00:00
meeting_dir = MARKDOWN_DIR / str(meeting_id)
meeting_dir.mkdir(exist_ok=True)
unique_filename = f"{uuid.uuid4()}{file_extension}"
absolute_path = meeting_dir / unique_filename
relative_path = absolute_path.relative_to(BASE_DIR)
2025-08-06 07:07:02 +00:00
try:
with open(absolute_path, "wb") as buffer:
2025-08-06 07:07:02 +00:00
shutil.copyfileobj(image_file.file, buffer)
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to save image: {str(e)}")
2025-09-30 04:14:19 +00:00
return create_api_response(code="200", message="Image uploaded successfully", data={
2025-09-26 07:47:37 +00:00
"file_name": image_file.filename, "file_path": '/'+ str(relative_path)
})
2025-08-25 08:10:29 +00:00
@router.put("/meetings/{meeting_id}/speaker-tags")
2025-08-29 08:37:29 +00:00
def update_speaker_tag(meeting_id: int, request: SpeakerTagUpdateRequest, current_user: dict = Depends(get_current_user)):
2025-08-25 08:10:29 +00:00
try:
with get_db_connection() as connection:
cursor = connection.cursor()
2025-09-26 07:47:37 +00:00
update_query = 'UPDATE transcript_segments SET speaker_tag = %s WHERE meeting_id = %s AND speaker_id = %s'
2025-08-25 08:10:29 +00:00
cursor.execute(update_query, (request.new_tag, meeting_id, request.speaker_id))
if cursor.rowcount == 0:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="No segments found for this speaker")
2025-08-25 08:10:29 +00:00
connection.commit()
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Speaker tag updated successfully", data={'updated_count': cursor.rowcount})
2025-08-25 08:10:29 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to update speaker tag: {str(e)}")
2025-08-25 08:10:29 +00:00
@router.put("/meetings/{meeting_id}/speaker-tags/batch")
2025-08-29 08:37:29 +00:00
def batch_update_speaker_tags(meeting_id: int, request: BatchSpeakerTagUpdateRequest, current_user: dict = Depends(get_current_user)):
2025-08-25 08:10:29 +00:00
try:
with get_db_connection() as connection:
cursor = connection.cursor()
total_updated = 0
for update_item in request.updates:
2025-09-26 07:47:37 +00:00
update_query = 'UPDATE transcript_segments SET speaker_tag = %s WHERE meeting_id = %s AND speaker_id = %s'
2025-08-25 08:10:29 +00:00
cursor.execute(update_query, (update_item.new_tag, meeting_id, update_item.speaker_id))
total_updated += cursor.rowcount
connection.commit()
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Speaker tags updated successfully", data={'total_updated': total_updated})
2025-08-25 08:10:29 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to batch update speaker tags: {str(e)}")
2025-08-26 13:57:16 +00:00
@router.put("/meetings/{meeting_id}/transcript/batch")
2025-08-29 08:37:29 +00:00
def batch_update_transcript(meeting_id: int, request: BatchTranscriptUpdateRequest, current_user: dict = Depends(get_current_user)):
2025-08-26 13:57:16 +00:00
try:
with get_db_connection() as connection:
cursor = connection.cursor()
total_updated = 0
for update_item in request.updates:
2025-09-26 07:47:37 +00:00
cursor.execute("SELECT segment_id FROM transcript_segments WHERE segment_id = %s AND meeting_id = %s", (update_item.segment_id, meeting_id))
2025-08-26 13:57:16 +00:00
if not cursor.fetchone():
2025-09-26 07:47:37 +00:00
continue
update_query = 'UPDATE transcript_segments SET text_content = %s WHERE segment_id = %s AND meeting_id = %s'
2025-08-26 13:57:16 +00:00
cursor.execute(update_query, (update_item.text_content, update_item.segment_id, meeting_id))
total_updated += cursor.rowcount
connection.commit()
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Transcript updated successfully", data={'total_updated': total_updated})
2025-08-26 13:57:16 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to update transcript: {str(e)}")
2025-08-26 13:57:16 +00:00
@router.get("/meetings/{meeting_id}/summaries")
2025-08-29 08:37:29 +00:00
def get_meeting_summaries(meeting_id: int, current_user: dict = Depends(get_current_user)):
2025-08-26 13:57:16 +00:00
try:
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
cursor.execute("SELECT meeting_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
if not cursor.fetchone():
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
2025-08-26 13:57:16 +00:00
summaries = llm_service.get_meeting_summaries(meeting_id)
2025-09-26 07:47:37 +00:00
return create_api_response(code="200", message="Summaries retrieved successfully", data={"summaries": summaries})
2025-08-26 13:57:16 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to get summaries: {str(e)}")
2025-08-26 13:57:16 +00:00
@router.get("/meetings/{meeting_id}/summaries/{summary_id}")
2025-08-29 08:37:29 +00:00
def get_summary_detail(meeting_id: int, summary_id: int, current_user: dict = Depends(get_current_user)):
2025-08-26 13:57:16 +00:00
try:
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-09-26 07:47:37 +00:00
query = "SELECT id, summary_content, user_prompt, created_at FROM meeting_summaries WHERE id = %s AND meeting_id = %s"
2025-08-26 13:57:16 +00:00
cursor.execute(query, (summary_id, meeting_id))
summary = cursor.fetchone()
if not summary:
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Summary not found")
return create_api_response(code="200", message="Summary detail retrieved", data=summary)
2025-08-26 13:57:16 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to get summary detail: {str(e)}")
2025-09-09 03:35:56 +00:00
@router.post("/meetings/{meeting_id}/generate-summary-async")
def generate_meeting_summary_async(meeting_id: int, request: GenerateSummaryRequest, background_tasks: BackgroundTasks, current_user: dict = Depends(get_current_user)):
try:
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
cursor.execute("SELECT meeting_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
if not cursor.fetchone():
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
2025-12-11 08:48:12 +00:00
# 传递 prompt_id 参数给服务层
task_id = async_meeting_service.start_summary_generation(meeting_id, request.user_prompt, request.prompt_id)
background_tasks.add_task(async_meeting_service._process_task, task_id)
2025-09-30 04:14:19 +00:00
return create_api_response(code="200", message="Summary generation task has been accepted.", data={
2025-09-26 07:47:37 +00:00
"task_id": task_id, "status": "pending", "meeting_id": meeting_id
})
2025-09-09 03:35:56 +00:00
except Exception as e:
2025-09-26 07:47:37 +00:00
return create_api_response(code="500", message=f"Failed to start summary generation: {str(e)}")
2025-09-09 03:35:56 +00:00
@router.get("/meetings/{meeting_id}/llm-tasks")
def get_meeting_llm_tasks(meeting_id: int, current_user: dict = Depends(get_current_user)):
try:
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
cursor.execute("SELECT meeting_id FROM meetings WHERE meeting_id = %s", (meeting_id,))
if not cursor.fetchone():
2025-09-26 07:47:37 +00:00
return create_api_response(code="404", message="Meeting not found")
tasks = async_meeting_service.get_meeting_llm_tasks(meeting_id)
2025-09-30 04:14:19 +00:00
return create_api_response(code="200", message="LLM tasks retrieved successfully", data={
2025-09-26 07:47:37 +00:00
"tasks": tasks, "total": len(tasks)
})
2025-09-09 03:35:56 +00:00
except Exception as e:
2025-09-30 04:14:19 +00:00
return create_api_response(code="500", message=f"Failed to get LLM tasks: {str(e)}")
2025-11-07 09:12:29 +00:00
2025-11-19 03:49:07 +00:00
@router.get("/meetings/{meeting_id}/navigation")
def get_meeting_navigation(
meeting_id: int,
current_user: dict = Depends(get_current_user),
user_id: Optional[int] = None,
filter_type: str = "all",
search: Optional[str] = None,
tags: Optional[str] = None
):
"""
获取当前会议在列表中的上一条和下一条
Query params:
- user_id: 当前用户ID
- filter_type: 筛选类型 ('all', 'created', 'attended')
- search: 搜索关键词 (可选)
- tags: 标签列表逗号分隔 (可选)
"""
try:
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
# 构建WHERE子句 - 与get_meetings保持一致
where_conditions = []
params = []
has_attendees_join = False
# 按类型过滤
if user_id:
if filter_type == "created":
where_conditions.append("m.user_id = %s")
params.append(user_id)
elif filter_type == "attended":
where_conditions.append("m.user_id != %s AND a.user_id = %s")
params.extend([user_id, user_id])
has_attendees_join = True
else: # all
where_conditions.append("(m.user_id = %s OR a.user_id = %s)")
params.extend([user_id, user_id])
has_attendees_join = True
# 搜索关键词过滤
if search and search.strip():
search_pattern = f"%{search.strip()}%"
where_conditions.append("(m.title LIKE %s OR u.caption LIKE %s)")
params.extend([search_pattern, search_pattern])
# 标签过滤
if tags and tags.strip():
tag_list = [t.strip() for t in tags.split(',') if t.strip()]
if tag_list:
tag_conditions = []
for tag in tag_list:
tag_conditions.append("m.tags LIKE %s")
params.append(f"%{tag}%")
where_conditions.append(f"({' OR '.join(tag_conditions)})")
# 构建查询 - 只获取meeting_id按meeting_time降序排序
query = '''
SELECT m.meeting_id
FROM meetings m
JOIN users u ON m.user_id = u.user_id
'''
if has_attendees_join:
query += " LEFT JOIN attendees a ON m.meeting_id = a.meeting_id"
if where_conditions:
query += f" WHERE {' AND '.join(where_conditions)}"
if has_attendees_join:
query += " GROUP BY m.meeting_id"
query += " ORDER BY m.meeting_time DESC, m.created_at DESC"
cursor.execute(query, params)
all_meetings = cursor.fetchall()
all_meeting_ids = [m['meeting_id'] for m in all_meetings]
# 找到当前会议在列表中的位置
try:
current_index = all_meeting_ids.index(meeting_id)
except ValueError:
return create_api_response(code="200", message="当前会议不在筛选结果中", data={
'prev_meeting_id': None,
'next_meeting_id': None,
'current_index': None,
'total_count': len(all_meeting_ids)
})
# 计算上一条和下一条
prev_meeting_id = all_meeting_ids[current_index - 1] if current_index > 0 else None
next_meeting_id = all_meeting_ids[current_index + 1] if current_index < len(all_meeting_ids) - 1 else None
return create_api_response(code="200", message="获取导航信息成功", data={
'prev_meeting_id': prev_meeting_id,
'next_meeting_id': next_meeting_id,
'current_index': current_index,
'total_count': len(all_meeting_ids)
})
except Exception as e:
return create_api_response(code="500", message=f"获取导航信息失败: {str(e)}")
2025-11-07 09:12:29 +00:00
@router.get("/meetings/{meeting_id}/preview-data")
def get_meeting_preview_data(meeting_id: int):
"""
获取会议预览数据无需登录认证
用于二维码扫描后的预览页面
"""
try:
with get_db_connection() as connection:
cursor = connection.cursor(dictionary=True)
2025-12-11 08:48:12 +00:00
# 检查会议是否存在,并获取模版信息
2025-11-07 09:12:29 +00:00
query = '''
2025-12-11 08:48:12 +00:00
SELECT m.meeting_id, m.title, m.meeting_time, m.summary, m.updated_at, m.prompt_id,
m.user_id as creator_id, u.caption as creator_username,
p.name as prompt_name
2025-11-07 09:12:29 +00:00
FROM meetings m
JOIN users u ON m.user_id = u.user_id
2025-12-11 08:48:12 +00:00
LEFT JOIN prompts p ON m.prompt_id = p.id
2025-11-07 09:12:29 +00:00
WHERE m.meeting_id = %s
'''
cursor.execute(query, (meeting_id,))
meeting = cursor.fetchone()
if not meeting:
return create_api_response(code="404", message="会议不存在")
# 检查是否已生成会议总结
if not meeting['summary'] or not meeting['updated_at']:
return create_api_response(code="400", message="该会议总结尚未生成")
# 获取参会人员信息
attendees_query = 'SELECT u.user_id, u.caption FROM attendees a JOIN users u ON a.user_id = u.user_id WHERE a.meeting_id = %s'
cursor.execute(attendees_query, (meeting_id,))
attendees_data = cursor.fetchall()
attendees = [{'user_id': row['user_id'], 'caption': row['caption']} for row in attendees_data]
# 组装返回数据
preview_data = {
"meeting_id": meeting['meeting_id'],
"title": meeting['title'],
"meeting_time": meeting['meeting_time'],
"summary": meeting['summary'],
"creator_username": meeting['creator_username'],
2025-12-11 08:48:12 +00:00
"prompt_id": meeting['prompt_id'],
"prompt_name": meeting['prompt_name'],
2025-11-07 09:12:29 +00:00
"attendees": attendees,
"attendees_count": len(attendees)
}
return create_api_response(code="200", message="获取会议预览数据成功", data=preview_data)
except Exception as e:
return create_api_response(code="500", message=f"Failed to get meeting preview data: {str(e)}")