Files
Extract_reqs/config.yaml

103 lines
2.8 KiB
YAML
Raw Normal View History

2026-02-03 22:48:22 +08:00
# 配置文件 - SRS 需求文档解析工具 (LLM增强版)
# Configuration file for SRS Requirement Document Parser (LLM Enhanced Version)
# LLM配置 - 阿里云千问
llm:
# 是否启用LLM设为false则使用纯规则提取
enabled: true
# LLM提供商qwen阿里云千问
provider: "qwen"
# 模型名称
model: "qwen3-max-2026-01-23"
2026-02-03 22:48:22 +08:00
# API密钥建议使用环境变量 DASHSCOPE_API_KEY
api_key: "sk-7097f7842f724f0c9e70c4bf3b16dacb"
# 可选参数
temperature: 0.3
max_tokens: 1024
# 文档解析配置
document:
supported_formats:
- ".pdf"
- ".docx"
# 标题识别的样式列表
heading_styles:
- "Heading 1"
- "Heading 2"
- "Heading 3"
- "Heading 4"
- "Heading 5"
# 需要过滤的非需求章节GJB438B标准
non_requirement_sections:
- "标识"
- "系统概述"
- "文档概述"
- "引用文档"
- "合格性规定"
- "需求可追踪性"
- "注释"
- "附录"
# 需求提取配置
extraction:
# 需求类型关键字(用于自动判断需求类型)
requirement_types:
功能需求:
prefix: "FR"
keywords: ["功能", "feature", "requirement", "CSCI组成", "控制", "处理", "监测", "显示"]
priority: 1
接口需求:
prefix: "IR"
keywords: ["接口", "interface", "api", "外部接口", "内部接口", "CAN", "以太网", "通信"]
priority: 2
性能需求:
prefix: "PR"
keywords: ["性能", "performance", "速度", "响应时间", "吞吐量"]
priority: 3
安全需求:
prefix: "SR"
keywords: ["安全", "security", "安全性", "报警"]
priority: 4
可靠性需求:
prefix: "RR"
keywords: ["可靠", "reliability", "容错", "恢复", "冗余"]
priority: 5
其他需求:
prefix: "OR"
keywords: ["约束", "资源", "适应性", "保密", "环境", "计算机", "质量", "设计", "人员", "培训", "保障", "验收", "交付"]
priority: 6
splitter:
enabled: true
max_sentence_len: 120
min_clause_len: 12
semantic_guard:
enabled: true
preserve_condition_action_chain: true
preserve_alarm_chain: true
table_strategy:
llm_semantic_enabled: true
sequence_table_merge: "single_requirement"
merge_time_series_rows_min: 3
rewrite_policy:
llm_light_rewrite_enabled: true
preserve_ratio_min: 0.65
max_length_growth_ratio: 1.25
renumber_policy:
enabled: true
mode: "section_continuous"
2026-02-03 22:48:22 +08:00
# 输出配置
output:
format: "json"
indent: 2
# 是否美化输出(格式化)
pretty_print: true
# 是否包含元数据
include_metadata: true
# 日志配置
logging:
level: "INFO" # DEBUG, INFO, WARNING, ERROR
format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
file: "srs_parser.log"