StructBERT 中文情感分类 WebUI 实现与多语言切换

StructBERT 中文情感分类 WebUI 实现与多语言切换 | 极客日志

# Create and activate a dedicated conda environment (Python 3.8)
conda create -n sentiment python=3.8
conda activate sentiment
# Install the core dependencies
pip install torch gradio flask transformers

import gradio as gr
from typing import Dict

# UI strings for the Chinese interface.
_ZH_TEXT: Dict[str, str] = {
    "title": "StructBERT 中文情感分析",
    "single_title": "单文本情感分析",
    "batch_title": "批量情感分析",
    "input_placeholder": "请输入中文文本...",
    "analyze_btn": "开始分析",
    "positive": "积极",
    "negative": "消极",
    "neutral": "中性",
}

# UI strings for the English interface; keys mirror the Chinese table.
_EN_TEXT: Dict[str, str] = {
    "title": "StructBERT Sentiment Analysis",
    "single_title": "Single Text Analysis",
    "batch_title": "Batch Analysis",
    "input_placeholder": "Enter Chinese text...",
    "analyze_btn": "Analyze",
    "positive": "Positive",
    "negative": "Negative",
    "neutral": "Neutral",
}

# Language code -> table of UI strings used when building the interface.
LANGUAGE_TEXT: Dict[str, Dict[str, str]] = {
    "zh": _ZH_TEXT,
    "en": _EN_TEXT,
}

def create_interface(lang: str = "zh"):
    """Build the sentiment-analysis WebUI with an in-place language switch.

    Args:
        lang: Key into ``LANGUAGE_TEXT`` ("zh" or "en") selecting the
            strings shown when the page first loads.

    Returns:
        The ``gr.Blocks`` app containing the language selector, the
        single-text tab and the batch tab.

    Raises:
        KeyError: If ``lang`` is not a key of ``LANGUAGE_TEXT``.
    """
    texts = LANGUAGE_TEXT[lang]
    with gr.Blocks(title=texts["title"]) as demo:
        heading = gr.Markdown(f"# {texts['title']}")
        # Language selector
        with gr.Row():
            lang_btn = gr.Radio(
                choices=["中文", "English"],
                value="中文" if lang == "zh" else "English",
                label="选择语言 / Language"
            )
        # Single-text analysis tab
        with gr.Tab(texts["single_title"]) as single_tab:
            with gr.Row():
                single_input = gr.Textbox(
                    label="输入文本",
                    placeholder=texts["input_placeholder"],
                    lines=3
                )
            with gr.Row():
                analyze_btn = gr.Button(texts["analyze_btn"])
            with gr.Row():
                output = gr.Label(label="情感分析结果")
        # Batch analysis tab
        with gr.Tab(texts["batch_title"]) as batch_tab:
            with gr.Row():
                batch_input = gr.Textbox(
                    label="批量输入（每行一条）",
                    placeholder=texts["input_placeholder"],
                    lines=10
                )
            with gr.Row():
                batch_btn = gr.Button("批量分析")
            with gr.Row():
                batch_output = gr.Dataframe(
                    headers=["文本", "情感", "置信度"],
                    label="批量分析结果"
                )

        # Language switch: update the existing components in place. A Blocks
        # app is not an output component, so building and returning a new
        # interface from the callback cannot replace the running page.
        def update_language(selected_lang):
            new_texts = LANGUAGE_TEXT["zh" if selected_lang == "中文" else "en"]
            # One update per entry in `outputs` below, in the same order.
            return (
                gr.update(value=f"# {new_texts['title']}"),
                gr.update(label=new_texts["single_title"]),
                gr.update(placeholder=new_texts["input_placeholder"]),
                gr.update(value=new_texts["analyze_btn"]),
                gr.update(label=new_texts["batch_title"]),
                gr.update(placeholder=new_texts["input_placeholder"]),
            )

        # NOTE(review): using gr.Tab as an event output (to relabel it) is
        # expected to need a Gradio release with updatable tabs (4.x) —
        # confirm against the installed version.
        lang_btn.change(
            update_language,
            inputs=lang_btn,
            outputs=[
                heading,
                single_tab,
                single_input,
                analyze_btn,
                batch_tab,
                batch_input,
            ],
        )
    return demo

# Build the interface with Chinese as the initial language and serve it
# on all network interfaces, port 7860, without a public share link.
demo = create_interface("zh")
demo.launch(share=False, server_port=7860, server_name="0.0.0.0")

from transformers import BertTokenizer, BertForSequenceClassification
import torch
from typing import List, Dict

class SentimentAnalyzer:
    """Sentiment classifier built on a BERT sequence-classification model.

    Loads the tokenizer and model from ``model_path`` once, then exposes
    single-text and batched prediction.
    """

    def __init__(self, model_path: str):
        """Load the tokenizer and model and switch the model to eval mode.

        Args:
            model_path: Location passed to ``from_pretrained`` for both the
                tokenizer and the model.
        """
        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
        self.tokenizer = BertTokenizer.from_pretrained(model_path)
        self.model = BertForSequenceClassification.from_pretrained(model_path)
        self.model.to(self.device)
        self.model.eval()
        # Class index -> sentiment name.
        # NOTE(review): assumes the checkpoint emits exactly these three
        # classes in this order — confirm against the model's config.
        self.label_map = {0: "negative", 1: "neutral", 2: "positive"}

    def _predict_probabilities(self, texts):
        """Tokenize ``texts`` (a string or a sequence of strings) and return
        the softmax class probabilities as a CPU tensor, one row per text."""
        inputs = self.tokenizer(
            texts, return_tensors="pt", truncation=True, max_length=512, padding=True
        )
        with torch.no_grad():
            inputs = {k: v.to(self.device) for k, v in inputs.items()}
            outputs = self.model(**inputs)
            # Move to CPU once so result parsing does not touch the device per row.
            return torch.softmax(outputs.logits, dim=-1).cpu()

    def analyze_single(self, text: str):
        """Classify one text.

        Args:
            text: The text to classify.

        Returns:
            A dict with ``text``, ``sentiment`` (a ``label_map`` value),
            ``confidence`` (probability of the predicted class, rounded to
            4 places) and ``probabilities`` (nested list, one row).
        """
        probabilities = self._predict_probabilities(text)
        pred_label = torch.argmax(probabilities, dim=-1).item()
        confidence = probabilities[0][pred_label].item()
        return {
            "text": text,
            "sentiment": self.label_map[pred_label],
            "confidence": round(confidence, 4),
            "probabilities": probabilities.tolist()
        }

    def analyze_batch(self, texts: List[str], batch_size: int = 32):
        """Classify many texts, processing ``batch_size`` texts per forward pass.

        Args:
            texts: Texts to classify; an empty list yields an empty result.
            batch_size: Number of texts per model call; must be >= 1.

        Returns:
            A list of dicts (``text``, ``sentiment``, ``confidence``) in the
            same order as ``texts``.

        Raises:
            ValueError: If ``batch_size`` is less than 1. Without this check
                a negative value would silently return no results.
        """
        if batch_size < 1:
            raise ValueError(
                f"batch_size must be a positive integer, got {batch_size}"
            )
        results = []
        # Process in slices to bound memory use per forward pass.
        for start in range(0, len(texts), batch_size):
            batch_texts = texts[start:start + batch_size]
            probabilities = self._predict_probabilities(batch_texts)
            pred_labels = torch.argmax(probabilities, dim=-1).tolist()
            rows = probabilities.tolist()
            results.extend(
                {
                    "text": text,
                    "sentiment": self.label_map[label],
                    "confidence": round(row[label], 4),
                }
                for text, label, row in zip(batch_texts, pred_labels, rows)
            )
        return results

#!/bin/bash
# start_sentiment.sh
# Start the WebUI and API services in the background.

# Load conda's shell integration first: `conda activate` is a shell function
# that is normally only set up for interactive shells, so a plain script
# needs the hook evaluated before it can activate an environment.
eval "$(conda shell.bash hook)"
conda activate sentiment || exit 1

# Stop here if the project directory is missing, instead of launching the
# services from whatever directory the script was called in.
cd /root/nlp_structbert_sentiment-classification_chinese-base || exit 1
# Start the WebUI service
python app/webui.py &
# Start the API service
python app/main.py &
echo "服务启动完成！"
echo "WebUI 地址：http://localhost:7860"
echo "API 地址：http://localhost:8080"

supervisorctl status

# Restart the WebUI
supervisorctl restart nlp_structbert_webui
# Restart the API
supervisorctl restart nlp_structbert_sentiment

# Follow the WebUI log in real time
supervisorctl tail -f nlp_structbert_webui
# Follow the API log
supervisorctl tail -f nlp_structbert_sentiment

# Sample product reviews
reviews = [
    "产品质量很好，物超所值！",
    "快递速度太慢了，等了好几天",
    "包装很精美，适合送礼",
    "功能没有描述的好，有点失望",
]
# Classify all reviews in one batched call, then print one report per review
analyzer = SentimentAnalyzer(MODEL_PATH)
results = analyzer.analyze_batch(reviews)
for result in results:
    print(
        f"评论：{result['text']}",
        f"情感：{result['sentiment']} (置信度：{result['confidence']})",
        "-" * 50,
        sep="\n",
    )

def monitor_social_media(keywords: List[str], platform: str = "weibo"):
    """Fetch posts for ``keywords`` and summarize their sentiment.

    Args:
        keywords: Search keywords passed to ``fetch_posts``.
        platform: Platform identifier passed to ``fetch_posts``.

    Returns:
        A dict with ``total_posts``, ``positive_rate``, ``negative_rate``
        (fractions of the fetched posts) and ``details`` (the per-post
        results from ``analyzer.analyze_batch``). Both rates are ``0.0``
        when no posts were fetched.
    """
    # Fetch the matching posts
    posts = fetch_posts(keywords, platform)
    # Run sentiment analysis on every post
    sentiments = analyzer.analyze_batch(posts)
    # Build the sentiment report
    total = len(posts)
    positive_count = sum(1 for s in sentiments if s['sentiment'] == 'positive')
    negative_count = sum(1 for s in sentiments if s['sentiment'] == 'negative')
    # Guard the division: an empty fetch would otherwise raise ZeroDivisionError.
    return {
        "total_posts": total,
        "positive_rate": positive_count / total if total else 0.0,
        "negative_rate": negative_count / total if total else 0.0,
        "details": sentiments
    }

StructBERT 中文情感分类 WebUI 实现与多语言切换

StructBERT 中文情感分类 WebUI 实现与多语言切换

1. 项目概述与环境准备

2. WebUI 界面功能详解

2.1 单文本情感分析

2.2 批量文本分析

3. 多语言界面实现详解

3.1 中英文切换核心代码

3.2 界面动态更新机制

4. 情感分析核心功能实现

4.1 模型加载与初始化

4.2 批量处理优化

5. 完整部署与使用指南

5.1 一键启动脚本

5.2 服务管理命令

6. 实际应用案例

6.1 电商评论分析

6.2 社交媒体情绪监控

7. 总结与建议

更多推荐文章

相关免费在线工具

StructBERT 中文情感分类 WebUI 实现与多语言切换

StructBERT 中文情感分类 WebUI 实现与多语言切换

1. 项目概述与环境准备

2. WebUI 界面功能详解

2.1 单文本情感分析

2.2 批量文本分析

3. 多语言界面实现详解

3.1 中英文切换核心代码

3.2 界面动态更新机制

4. 情感分析核心功能实现

4.1 模型加载与初始化

4.2 批量处理优化

5. 完整部署与使用指南

5.1 一键启动脚本

5.2 服务管理命令

6. 实际应用案例

6.1 电商评论分析

6.2 社交媒体情绪监控

7. 总结与建议

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具