添加API服务模块

2026-01-07 11:56:46 +08:00
parent 9ca3a3a89a
commit c634cb2daa
8 changed files with 241 additions and 0 deletions
--- a/api/services/init.py
+++ b/api/services/init.py
@@ -0,0 +1,11 @@
 """
 服务模块
 """
 from .asr_service import asr_service
 from .tts_service import tts_service
 __all__ = [
    "asr_service",
    "tts_service",
 ]
--- a/api/services/pycache/init.cpython-312.pyc
+++ b/api/services/pycache/init.cpython-312.pyc
--- a/api/services/pycache/asr_service.cpython-312.pyc
+++ b/api/services/pycache/asr_service.cpython-312.pyc
--- a/api/services/pycache/pdf_service.cpython-312.pyc
+++ b/api/services/pycache/pdf_service.cpython-312.pyc
--- a/api/services/pycache/tts_service.cpython-312.pyc
+++ b/api/services/pycache/tts_service.cpython-312.pyc
--- a/api/services/asr_service.py
+++ b/api/services/asr_service.py
@@ -0,0 +1,64 @@
 """
 ASR 服务：语音转文字
 """
 import os
 import base64
 from typing import Optional, Any, Coroutine
 from openai import OpenAI
 class ASRService:
    """ASR 服务（语音转文字）"""
    def __init__(self):
        api_key = os.getenv("OPENAI_API_KEY", "")
        if api_key:
            self.client = OpenAI(api_key=api_key)
        else:
            self.client = None
    async def transcribe(self, audio_base64: str) -> str | None:
        """
        转写音频为文字
        Args:
            audio_base64: Base64 编码的音频数据
        Returns:
            转写文本
        """
        if not self.client:
            # 如果没有配置 API Key，返回模拟数据
            return "这是模拟的转写文本（请配置 OPENAI_API_KEY 以使用实际 ASR 功能）"
        try:
            # 解码 Base64 音频
            audio_bytes = base64.b64decode(audio_base64)
            # 保存临时文件
            import tempfile
            with tempfile.NamedTemporaryFile(suffix=".m4a", delete=False) as tmp_file:
                tmp_file.write(audio_bytes)
                tmp_file_path = tmp_file.name
            try:
                # 调用 OpenAI Whisper API
                with open(tmp_file_path, "rb") as audio_file:
                    transcript = self.client.audio.transcriptions.create(
                        model="whisper-1",
                        file=audio_file,
                        language="zh"  # 中文
                    )
                return transcript.text
            finally:
                # 清理临时文件
                import os
                if os.path.exists(tmp_file_path):
                    os.remove(tmp_file_path)
        except Exception as e:
            # 出错时返回错误信息
            return f"转写失败: {str(e)}"
 # 全局实例
 asr_service = ASRService()
--- a/api/services/pdf_service.py
+++ b/api/services/pdf_service.py
@@ -0,0 +1,107 @@
 """
 PDF 生成服务
 """
 from typing import List
 from reportlab.lib.pagesizes import letter, A4
 from reportlab.lib.styles import getSampleStyleSheet, ParagraphStyle
 from reportlab.lib.units import inch
 from reportlab.platypus import SimpleDocTemplate, Paragraph, Spacer, PageBreak
 from reportlab.pdfbase import pdfmetrics
 from reportlab.pdfbase.ttfonts import TTFont
 from reportlab.pdfbase.cidfonts import UnicodeCIDFont
 from io import BytesIO
 import os
 class PDFService:
    """PDF 生成服务"""
    def __init__(self):
        # 尝试注册中文字体
        try:
            # 使用系统字体或 ReportLab 内置的中文字体
            # 如果没有中文字体文件，使用 UnicodeCIDFont
            pdfmetrics.registerFont(UnicodeCIDFont('STSong-Light'))
            self.chinese_font = 'STSong-Light'
        except Exception:
            # 如果注册失败，使用默认字体（可能不支持中文）
            self.chinese_font = 'Helvetica'
    async def generate_pdf(self, book, chapters: List) -> bytes:
        """
        生成 PDF
        Args:
            book: 回忆录对象
            chapters: 章节列表
        Returns:
            PDF 字节数据
        """
        buffer = BytesIO()
        doc = SimpleDocTemplate(buffer, pagesize=A4)
        # 创建样式
        styles = getSampleStyleSheet()
        title_style = ParagraphStyle(
            'CustomTitle',
            parent=styles['Heading1'],
            fontSize=24,
            spaceAfter=30,
            alignment=1,  # 居中
            fontName=self.chinese_font
        )
        heading_style = ParagraphStyle(
            'CustomHeading',
            parent=styles['Heading1'],
            fontSize=18,
            spaceAfter=12,
            fontName=self.chinese_font
        )
        normal_style = ParagraphStyle(
            'CustomNormal',
            parent=styles['Normal'],
            fontSize=12,
            leading=18,
            fontName=self.chinese_font
        )
        # 构建内容
        story = []
        # 封面
        story.append(Paragraph(book.title, title_style))
        story.append(Spacer(1, 0.5*inch))
        story.append(PageBreak())
        # 目录
        story.append(Paragraph("目录", heading_style))
        story.append(Spacer(1, 0.2*inch))
        for i, chapter in enumerate(chapters, 1):
            story.append(Paragraph(f"{i}. {chapter.title}", normal_style))
        story.append(PageBreak())
        # 章节内容
        for chapter in chapters:
            story.append(Paragraph(chapter.title, heading_style))
            story.append(Spacer(1, 0.2*inch))
            # 分段处理内容
            paragraphs = chapter.content.split('\n\n')
            for para in paragraphs:
                if para.strip():
                    story.append(Paragraph(para.strip(), normal_style))
                    story.append(Spacer(1, 0.1*inch))
            story.append(PageBreak())
        # 生成 PDF
        doc.build(story)
        buffer.seek(0)
        return buffer.read()
 # 全局实例
 pdf_service = PDFService()
--- a/api/services/tts_service.py
+++ b/api/services/tts_service.py
@@ -0,0 +1,59 @@
 """
 TTS 服务：文字转语音
 """
 import base64
 import os
 from io import BytesIO
 from openai import OpenAI
 class TTSService:
    """TTS 服务（文字转语音）"""
    def __init__(self):
        api_key = os.getenv("OPENAI_API_KEY", "")
        if api_key:
            self.client = OpenAI(api_key=api_key)
        else:
            self.client = None
    async def synthesize(self, text: str) -> str:
        """
        将文字转换为语音
        Args:
            text: 要转换的文字
        Returns:
            Base64 编码的音频数据
        """
        if not self.client:
            # 如果没有配置 API Key，返回空字符串
            return ""
        try:
            # 调用 OpenAI TTS API
            response = self.client.audio.speech.create(
                model="tts-1",
                voice="alloy",  # 可选: alloy, echo, fable, onyx, nova, shimmer
                input=text
            )
            # 读取音频数据
            audio_bytes = BytesIO()
            for chunk in response.iter_bytes():
                audio_bytes.write(chunk)
            # 转换为 Base64
            audio_data = audio_bytes.getvalue()
            audio_base64 = base64.b64encode(audio_data).decode('utf-8')
            return audio_base64
        except Exception as e:
            # 出错时返回空字符串
            print(f"TTS 生成失败: {str(e)}")
            return ""
 # 全局实例
 tts_service = TTSService()