ALL-teach_sys/frontend_环保/convert_env_resume_data.py

import json
import re
import os

# 读取环保岗位简历数据
with open('网页未导入数据/环保产业/环保岗位简历.json', 'r', encoding='utf-8') as f:
    env_data = json.load(f)

# 读取面试题数据
with open('网页未导入数据/岗位群面试题（全产业）.json', 'r', encoding='utf-8') as f:
    interview_data = json.load(f)

# 读取修改版简历
modified_resumes = {}
modified_resume_dir = '网页未导入数据/环保产业/环保修改版简历'
if os.path.exists(modified_resume_dir):
    for filename in os.listdir(modified_resume_dir):
        if filename.endswith('.md'):
            # 获取文件名（不含扩展名）
            file_position_name = filename.replace('.md', '')
            # 处理特殊的岗位名称映射
            if file_position_name == '环评工程师（环境影响评价工程师）':
                # 同时存储两种形式，以确保能匹配
                with open(os.path.join(modified_resume_dir, filename), 'r', encoding='utf-8') as f:
                    content = f.read()
                    modified_resumes['环评工程师'] = content
                    modified_resumes['环评工程师（环境影响评价工程师）'] = content
            else:
                with open(os.path.join(modified_resume_dir, filename), 'r', encoding='utf-8') as f:
                    modified_resumes[file_position_name] = f.read()

print(f"已加载{len(modified_resumes)}个修改版简历：{list(modified_resumes.keys())}")

# 按岗位群组织数据
position_groups = {
    "环境规划": [],
    "节能与碳管理": [],
    "设备运维与支持": [],
    "生态修复": [],
    "污染治理": [],
    "资源回收与再生": [],
    "报告输出与管理": [],
    "环境监测": [],
    "环境体系咨询": [],
    "实验室检测": []
}

# 组织简历数据
for item in env_data:
    group = item.get("简历岗位群", "")
    if group in position_groups:
        position_groups[group].append(item)

# 获取环保产业的面试题
env_interview_questions = {}
for item in interview_data:
    if item.get("所属就业管家") == "环保":
        group = item.get("简历岗位群", "")
        if group not in env_interview_questions:
            env_interview_questions[group] = item.get("面试题内容", "")

# 生成JavaScript格式的数据结构
js_output = """// 岗位群列表
const industries = [
"""

# 生成所有岗位群的数据
industry_configs = [
    ("environment_planning", "环境规划"),
    ("energy_carbon", "节能与碳管理"),
    ("equipment_maintenance", "设备运维与支持"),
    ("ecological_restoration", "生态修复"),
    ("pollution_control", "污染治理"),
    ("resource_recycling", "资源回收与再生"),
    ("report_management", "报告输出与管理"),
    ("environment_monitoring", "环境监测"),
    ("environment_consulting", "环境体系咨询"),
    ("laboratory_testing", "实验室检测")
]

for idx, (industry_id, industry_name) in enumerate(industry_configs):
    js_output += f"""  {{
    id: "{industry_id}",
    name: "{industry_name}",
    positions: [
"""

    # 获取该岗位群的岗位列表
    positions = position_groups.get(industry_name, [])
    for pos_idx, pos in enumerate(positions):
        position_name = pos.get("岗位名称", "")
        level = pos.get("岗位等级标签", "普通岗")
        avatar = pos.get("简历头像url", "")

        js_output += f"""      {{
        id: "{industry_id}_{pos_idx + 1}",
        title: "{position_name}",
        level: "{level}",
        avatar: "{avatar}",
        department: "{industry_name}",
        type: "全职",
        experience: "1-3年",
        education: "大专",
        salary: "6-10K",
        location: "苏州",
        updateTime: "2024-01-20",
        description: "{position_name}职位描述",
        requirements: [
          "熟悉{industry_name}相关工作",
          "具有良好的沟通能力",
          "有相关工作经验优先"
        ]
      }}"""
        if pos_idx < len(positions) - 1:
            js_output += ","
        js_output += "\n"

    js_output += """    ],
    questions: [
      {
"""

    # 添加面试题内容
    interview_content = env_interview_questions.get(industry_name, "")
    if interview_content:
        # 解析面试题内容，提取问答对
        questions = []
        lines = interview_content.split('\n')
        current_q = ""
        current_a = ""

        in_answer = False
        for i, line in enumerate(lines):
            # 匹配题目行：数字开头，可能包含"问题："
            if line.strip() and line.strip()[0].isdigit() and '.' in line:
                if current_q and current_a:
                    questions.append((current_q, current_a))
                # 移除题号和"问题："前缀
                current_q = re.sub(r'^\d+\.\s*', '', line.strip())
                current_q = re.sub(r'^问题：\s*', '', current_q)
                current_a = ""
                in_answer = False
            # 匹配答案标记行
            elif '答案' in line or '参考' in line or '回答' in line or '回复' in line:
                in_answer = True
                # 如果答案在同一行（冒号后）
                if '：' in line or ':' in line:
                    parts = re.split('[：:]', line, 1)
                    if len(parts) > 1 and parts[1].strip():
                        current_a = parts[1].strip()
            # 收集答案内容
            elif in_answer and line.strip():
                if not current_a:
                    current_a = line.strip()
                else:
                    current_a += " " + line.strip()
            # 空行可能表示答案结束
            elif in_answer and not line.strip() and current_a:
                in_answer = False

        if current_q and current_a:
            questions.append((current_q, current_a))

        # 不限制问题数量，显示所有题目
        # questions = questions[:6]

        js_output += f"""        id: "{industry_id}_q1",
        question: "{industry_name}岗位群面试题",
        subQuestions: [
"""
        for q_idx, (question, answer) in enumerate(questions):
            # 清理问题和答案文本
            question = question.replace('"', '\\"').replace('\n', ' ')
            answer = answer.replace('"', '\\"').replace('\n', ' ')

            js_output += f"""          {{
            id: "q{q_idx + 1}",
            question: "{question}",
            answer: `{answer}`
          }}"""
            if q_idx < len(questions) - 1:
                js_output += ","
            js_output += "\n"

        js_output += """        ]
      }
    ]
"""

    js_output += "  }"
    if idx < len(industry_configs) - 1:
        js_output += ","
    js_output += "\n"

js_output += """];

// 简历模板数据
const resumeTemplates = {
"""

# 生成简历模板数据
for idx, (industry_id, industry_name) in enumerate(industry_configs):
    js_output += f'  "{industry_name}": [\n'

    positions = position_groups.get(industry_name, [])
    for pos_idx, pos in enumerate(positions):
        position_name = pos.get("岗位名称", "")
        level = pos.get("岗位等级标签", "普通岗")
        resume_content = pos.get("简历内容", "")
        project_name = pos.get("对应项目案例名称", "")
        avatar = pos.get("简历头像url", "")

        # 解析简历内容
        project_desc = ""
        core_skills = []
        compound_skills = []
        personal_summary = ""

        if resume_content:
            # 提取项目职责
            match = re.search(r'###\s*\(五\)\s*岗位职责[：:](.*?)(?=\n#|$)', resume_content, re.DOTALL)
            if match:
                project_desc = match.group(1).strip()

            # 提取垂直能力
            match = re.search(r'###\s*\(一\)\s*垂直能力(.*?)(?=###|\n#|$)', resume_content, re.DOTALL)
            if match:
                skills_text = match.group(1)
                core_skills = [s.strip() for s in re.findall(r'\d+\.\s*(.*?)(?=\n\d+\.|$)', skills_text, re.DOTALL)][:5]

            # 提取复合能力
            match = re.search(r'###\s*\(二\)\s*复合能力(.*?)(?=\n#|$)', resume_content, re.DOTALL)
            if match:
                skills_text = match.group(1)
                compound_skills = [s.strip() for s in re.findall(r'\d+\.\s*(.*?)(?=\n\d+\.|$)', skills_text, re.DOTALL)][:5]

            # 提取个人评价
            match = re.search(r'#\s*三、\s*个人评价(.*?)$', resume_content, re.DOTALL)
            if match:
                personal_summary = match.group(1).strip()

        # 清理文本
        def clean_text(text):
            return text.replace('\\n', '\\\\n').replace('"', '\\"').replace('\n', '\\n')

        # 获取修改版简历（如果存在）
        modified_content = modified_resumes.get(position_name)
        if not modified_content:
            # 尝试不同的岗位名称格式
            if '（' in position_name:
                # 尝试去掉括号部分
                short_name = position_name.split('（')[0]
                modified_content = modified_resumes.get(short_name)
            elif position_name == '环评工程师':
                # 特殊处理环评工程师
                modified_content = modified_resumes.get('环评工程师（环境影响评价工程师）')

        # 如果没有修改版，使用原始版本
        if not modified_content:
            modified_content = resume_content

        js_output += f"""    {{
      position: "{position_name}",
      level: "{level}",
      avatar: "{avatar}",
      content: {{
        original: `{clean_text(resume_content)}`,
        modified: `{clean_text(modified_content)}`
      }},
      studentInfo: {{
        project_experience: {{
          project_name: "{project_name}",
          position: "{position_name}",
          time_period: "XXXXXX",
          company: "XXXXXX",
          description: `{clean_text(project_desc)}`
        }},
        core_skills: [
"""

        for skill_idx, skill in enumerate(core_skills):
            js_output += f'          "{clean_text(skill)}"'
            if skill_idx < len(core_skills) - 1:
                js_output += ","
            js_output += "\n"

        js_output += """        ],
        compound_skills: [
"""

        for skill_idx, skill in enumerate(compound_skills):
            js_output += f'          "{clean_text(skill)}"'
            if skill_idx < len(compound_skills) - 1:
                js_output += ","
            js_output += "\n"

        js_output += f"""        ],
        personal_summary: "{clean_text(personal_summary)}"
      }}
    }}"""

        if pos_idx < len(positions) - 1:
            js_output += ","
        js_output += "\n"

    js_output += "  ]"
    if idx < len(industry_configs) - 1:
        js_output += ","
    js_output += "\n"

js_output += """};

// 我的简历数据
const myResume = {
    personalInfo: {
      name: "邓沐",
      phone: "138****8888",
      email: "dengmu@example.com",
      age: 22,
      education: "苏州农业职业技术学院 生态环境修复技术 2021.9-2024.6",
      experience: "1年",
      location: "苏州"
    },
    workExperience: [
      {
        company: "某环保科技公司",
        position: "环境监测实习生",
        duration: "2023.06-2024.01",
        description: "负责环境监测数据采集、分析和报告编制工作"
      }
    ],
    skills: ["环境监测", "数据分析", "报告编制", "AutoCAD", "GIS"],
    projects: [
      {
        name: "某工业园区环境影响评价项目",
        role: "环评助理",
        duration: "2023.09-2024.01",
        description: "协助完成环境影响评价报告的编制和现场踏勘工作"
      }
    ]
  };

// 获取页面mock数据的函数
export function getMockPageData() {
  return resumeInterviewMockData;
}

// 导出合并的数据
export const resumeInterviewMockData = {
  industries,
  resumeTemplates,
  myResume
};
"""

# 写入文件
with open('src/mocks/resumeInterviewMock_env.js', 'w', encoding='utf-8') as f:
    f.write(js_output)

print("转换完成！已生成 src/mocks/resumeInterviewMock_env.js")
-												初始化12个产业教务系统项目

主要内容：
- 包含12个产业的完整教务系统前端代码
- 智能启动脚本 (start-industry.sh)
- 可视化产业导航页面 (index.html)
- 项目文档 (README.md)

优化内容：
- 删除所有node_modules和.yoyo文件夹，从7.5GB减少到2.7GB
- 添加.gitignore文件避免上传不必要的文件
- 自动依赖管理和智能启动系统

产业列表：
1. 文旅产业 (5150)
2. 智能制造 (5151)
3. 智能开发 (5152)
4. 财经商贸 (5153)
5. 视觉设计 (5154)
6. 交通物流 (5155)
7. 大健康 (5156)
8. 土木水利 (5157)
9. 食品产业 (5158)
10. 化工产业 (5159)
11. 能源产业 (5160)
12. 环保产业 (5161)

🤖 Generated with Claude Code
Co-Authored-By: Claude <noreply@anthropic.com>

											
										
										
											2025-09-24 14:14:14 +08:00
+								import json
 								import re
 								import os
 								# 读取环保岗位简历数据
 								with open('网页未导入数据/环保产业/环保岗位简历.json', 'r', encoding='utf-8') as f:
 								    env_data = json.load(f)
 								# 读取面试题数据
 								with open('网页未导入数据/岗位群面试题（全产业）.json', 'r', encoding='utf-8') as f:
 								    interview_data = json.load(f)
 								# 读取修改版简历
 								modified_resumes = {}
 								modified_resume_dir = '网页未导入数据/环保产业/环保修改版简历'
 								if os.path.exists(modified_resume_dir):
 								    for filename in os.listdir(modified_resume_dir):
 								        if filename.endswith('.md'):
 								            # 获取文件名（不含扩展名）
 								            file_position_name = filename.replace('.md', '')
 								            # 处理特殊的岗位名称映射
 								            if file_position_name == '环评工程师（环境影响评价工程师）':
 								                # 同时存储两种形式，以确保能匹配
 								                with open(os.path.join(modified_resume_dir, filename), 'r', encoding='utf-8') as f:
 								                    content = f.read()
 								                    modified_resumes['环评工程师'] = content
 								                    modified_resumes['环评工程师（环境影响评价工程师）'] = content
 								            else:
 								                with open(os.path.join(modified_resume_dir, filename), 'r', encoding='utf-8') as f:
 								                    modified_resumes[file_position_name] = f.read()
 								print(f"已加载{len(modified_resumes)}个修改版简历：{list(modified_resumes.keys())}")
 								# 按岗位群组织数据
 								position_groups = {
 								    "环境规划": [],
 								    "节能与碳管理": [],
 								    "设备运维与支持": [],
 								    "生态修复": [],
 								    "污染治理": [],
 								    "资源回收与再生": [],
 								    "报告输出与管理": [],
 								    "环境监测": [],
 								    "环境体系咨询": [],
 								    "实验室检测": []
 								}
 								# 组织简历数据
 								for item in env_data:
 								    group = item.get("简历岗位群", "")
 								    if group in position_groups:
 								        position_groups[group].append(item)
 								# 获取环保产业的面试题
 								env_interview_questions = {}
 								for item in interview_data:
 								    if item.get("所属就业管家") == "环保":
 								        group = item.get("简历岗位群", "")
 								        if group not in env_interview_questions:
 								            env_interview_questions[group] = item.get("面试题内容", "")
 								# 生成JavaScript格式的数据结构
 								js_output = """// 岗位群列表
 								const industries = [
 								"""
 								# 生成所有岗位群的数据
 								industry_configs = [
 								    ("environment_planning", "环境规划"),
 								    ("energy_carbon", "节能与碳管理"),
 								    ("equipment_maintenance", "设备运维与支持"),
 								    ("ecological_restoration", "生态修复"),
 								    ("pollution_control", "污染治理"),
 								    ("resource_recycling", "资源回收与再生"),
 								    ("report_management", "报告输出与管理"),
 								    ("environment_monitoring", "环境监测"),
 								    ("environment_consulting", "环境体系咨询"),
 								    ("laboratory_testing", "实验室检测")
 								]
 								for idx, (industry_id, industry_name) in enumerate(industry_configs):
 								    js_output += f"""  {{
 								    id: "{industry_id}",
 								    name: "{industry_name}",
 								    positions: [
 								"""
 								    # 获取该岗位群的岗位列表
 								    positions = position_groups.get(industry_name, [])
 								    for pos_idx, pos in enumerate(positions):
 								        position_name = pos.get("岗位名称", "")
 								        level = pos.get("岗位等级标签", "普通岗")
 								        avatar = pos.get("简历头像url", "")
 								        js_output += f"""      {{
 								        id: "{industry_id}_{pos_idx + 1}",
 								        title: "{position_name}",
 								        level: "{level}",
 								        avatar: "{avatar}",
 								        department: "{industry_name}",
 								        type: "全职",
 								        experience: "1-3年",
 								        education: "大专",
 								        salary: "6-10K",
 								        location: "苏州",
 								        updateTime: "2024-01-20",
 								        description: "{position_name}职位描述",
 								        requirements: [
 								          "熟悉{industry_name}相关工作",
 								          "具有良好的沟通能力",
 								          "有相关工作经验优先"
 								        ]
 								      }}"""
 								        if pos_idx < len(positions) - 1:
 								            js_output += ","
 								        js_output += "\n"
 								    js_output += """    ],
 								    questions: [
 								      {
 								"""
 								    # 添加面试题内容
 								    interview_content = env_interview_questions.get(industry_name, "")
 								    if interview_content:
 								        # 解析面试题内容，提取问答对
 								        questions = []
 								        lines = interview_content.split('\n')
 								        current_q = ""
 								        current_a = ""
 								        in_answer = False
 								        for i, line in enumerate(lines):
 								            # 匹配题目行：数字开头，可能包含"问题："
 								            if line.strip() and line.strip()[0].isdigit() and '.' in line:
 								                if current_q and current_a:
 								                    questions.append((current_q, current_a))
 								                # 移除题号和"问题："前缀
 								                current_q = re.sub(r'^\d+\.\s*', '', line.strip())
 								                current_q = re.sub(r'^问题：\s*', '', current_q)
 								                current_a = ""
 								                in_answer = False
 								            # 匹配答案标记行
 								            elif '答案' in line or '参考' in line or '回答' in line or '回复' in line:
 								                in_answer = True
 								                # 如果答案在同一行（冒号后）
 								                if '：' in line or ':' in line:
 								                    parts = re.split('[：:]', line, 1)
 								                    if len(parts) > 1 and parts[1].strip():
 								                        current_a = parts[1].strip()
 								            # 收集答案内容
 								            elif in_answer and line.strip():
 								                if not current_a:
 								                    current_a = line.strip()
 								                else:
 								                    current_a += " " + line.strip()
 								            # 空行可能表示答案结束
 								            elif in_answer and not line.strip() and current_a:
 								                in_answer = False
 								        if current_q and current_a:
 								            questions.append((current_q, current_a))
 								        # 不限制问题数量，显示所有题目
 								        # questions = questions[:6]
 								        js_output += f"""        id: "{industry_id}_q1",
 								        question: "{industry_name}岗位群面试题",
 								        subQuestions: [
 								"""
 								        for q_idx, (question, answer) in enumerate(questions):
 								            # 清理问题和答案文本
 								            question = question.replace('"', '\\"').replace('\n', ' ')
 								            answer = answer.replace('"', '\\"').replace('\n', ' ')
 								            js_output += f"""          {{
 								            id: "q{q_idx + 1}",
 								            question: "{question}",
 								            answer: `{answer}`
 								          }}"""
 								            if q_idx < len(questions) - 1:
 								                js_output += ","
 								            js_output += "\n"
 								        js_output += """        ]
 								      }
 								    ]
 								"""
 								    js_output += "  }"
 								    if idx < len(industry_configs) - 1:
 								        js_output += ","
 								    js_output += "\n"
 								js_output += """];
 								// 简历模板数据
 								const resumeTemplates = {
 								"""
 								# 生成简历模板数据
 								for idx, (industry_id, industry_name) in enumerate(industry_configs):
 								    js_output += f'  "{industry_name}": [\n'
 								    positions = position_groups.get(industry_name, [])
 								    for pos_idx, pos in enumerate(positions):
 								        position_name = pos.get("岗位名称", "")
 								        level = pos.get("岗位等级标签", "普通岗")
 								        resume_content = pos.get("简历内容", "")
 								        project_name = pos.get("对应项目案例名称", "")
 								        avatar = pos.get("简历头像url", "")
 								        # 解析简历内容
 								        project_desc = ""
 								        core_skills = []
 								        compound_skills = []
 								        personal_summary = ""
 								        if resume_content:
 								            # 提取项目职责
 								            match = re.search(r'###\s*\(五\)\s*岗位职责[：:](.*?)(?=\n#|$)', resume_content, re.DOTALL)
 								            if match:
 								                project_desc = match.group(1).strip()
 								            # 提取垂直能力
 								            match = re.search(r'###\s*\(一\)\s*垂直能力(.*?)(?=###|\n#|$)', resume_content, re.DOTALL)
 								            if match:
 								                skills_text = match.group(1)
 								                core_skills = [s.strip() for s in re.findall(r'\d+\.\s*(.*?)(?=\n\d+\.|$)', skills_text, re.DOTALL)][:5]
 								            # 提取复合能力
 								            match = re.search(r'###\s*\(二\)\s*复合能力(.*?)(?=\n#|$)', resume_content, re.DOTALL)
 								            if match:
 								                skills_text = match.group(1)
 								                compound_skills = [s.strip() for s in re.findall(r'\d+\.\s*(.*?)(?=\n\d+\.|$)', skills_text, re.DOTALL)][:5]
 								            # 提取个人评价
 								            match = re.search(r'#\s*三、\s*个人评价(.*?)$', resume_content, re.DOTALL)
 								            if match:
 								                personal_summary = match.group(1).strip()
 								        # 清理文本
 								        def clean_text(text):
 								            return text.replace('\\n', '\\\\n').replace('"', '\\"').replace('\n', '\\n')
 								        # 获取修改版简历（如果存在）
 								        modified_content = modified_resumes.get(position_name)
 								        if not modified_content:
 								            # 尝试不同的岗位名称格式
 								            if '（' in position_name:
 								                # 尝试去掉括号部分
 								                short_name = position_name.split('（')[0]
 								                modified_content = modified_resumes.get(short_name)
 								            elif position_name == '环评工程师':
 								                # 特殊处理环评工程师
 								                modified_content = modified_resumes.get('环评工程师（环境影响评价工程师）')
 								        # 如果没有修改版，使用原始版本
 								        if not modified_content:
 								            modified_content = resume_content
 								        js_output += f"""    {{
 								      position: "{position_name}",
 								      level: "{level}",
 								      avatar: "{avatar}",
 								      content: {{
 								        original: `{clean_text(resume_content)}`,
 								        modified: `{clean_text(modified_content)}`
 								      }},
 								      studentInfo: {{
 								        project_experience: {{
 								          project_name: "{project_name}",
 								          position: "{position_name}",
 								          time_period: "XXXXXX",
 								          company: "XXXXXX",
 								          description: `{clean_text(project_desc)}`
 								        }},
 								        core_skills: [
 								"""
 								        for skill_idx, skill in enumerate(core_skills):
 								            js_output += f'          "{clean_text(skill)}"'
 								            if skill_idx < len(core_skills) - 1:
 								                js_output += ","
 								            js_output += "\n"
 								        js_output += """        ],
 								        compound_skills: [
 								"""
 								        for skill_idx, skill in enumerate(compound_skills):
 								            js_output += f'          "{clean_text(skill)}"'
 								            if skill_idx < len(compound_skills) - 1:
 								                js_output += ","
 								            js_output += "\n"
 								        js_output += f"""        ],
 								        personal_summary: "{clean_text(personal_summary)}"
 								      }}
 								    }}"""
 								        if pos_idx < len(positions) - 1:
 								            js_output += ","
 								        js_output += "\n"
 								    js_output += "  ]"
 								    if idx < len(industry_configs) - 1:
 								        js_output += ","
 								    js_output += "\n"
 								js_output += """};
 								// 我的简历数据
 								const myResume = {
 								    personalInfo: {
 								      name: "邓沐",
 								      phone: "138****8888",
 								      email: "dengmu@example.com",
 								      age: 22,
 								      education: "苏州农业职业技术学院 生态环境修复技术 2021.9-2024.6",
 								      experience: "1年",
 								      location: "苏州"
 								    },
 								    workExperience: [
 								      {
 								        company: "某环保科技公司",
 								        position: "环境监测实习生",
 								        duration: "2023.06-2024.01",
 								        description: "负责环境监测数据采集、分析和报告编制工作"
 								      }
 								    ],
 								    skills: ["环境监测", "数据分析", "报告编制", "AutoCAD", "GIS"],
 								    projects: [
 								      {
 								        name: "某工业园区环境影响评价项目",
 								        role: "环评助理",
 								        duration: "2023.09-2024.01",
 								        description: "协助完成环境影响评价报告的编制和现场踏勘工作"
 								      }
 								    ]
 								  };
 								// 获取页面mock数据的函数
 								export function getMockPageData() {
 								  return resumeInterviewMockData;
 								}
 								// 导出合并的数据
 								export const resumeInterviewMockData = {
 								  industries,
 								  resumeTemplates,
 								  myResume
 								};
 								"""
 								# 写入文件
 								with open('src/mocks/resumeInterviewMock_env.js', 'w', encoding='utf-8') as f:
 								    f.write(js_output)
 								print("转换完成！已生成 src/mocks/resumeInterviewMock_env.js")