12345678 |
from data.analyze_data.analyze_xls import (
    readXls,
    analyze_entity,
    set_become_dict_list,
)

# Script entry point: load one recruitment spreadsheet, derive its entity
# collections, and print the job-post collection after conversion.
if __name__ == "__main__":
    # Location of the source .xls file, relative to the working directory.
    xls_path = '../data/source/机械相关专业数据汇总/爬虫数据(山东省数据)/【最终】2024_11_03_临沂职业学院-智联招聘和前程无忧数据.xls'

    # NOTE(review): presumably returns the sheet's rows — confirm in readXls.
    records = readXls(xls_path)

    # analyze_entity is expected to yield exactly six collections; the
    # six-way unpack below raises if that arity ever changes.
    entity_sets = analyze_entity(records)
    (
        set_post,
        set_job_category,
        set_company_industry,
        set_company_name,
        set_company_nature,
        set_city,
    ) = entity_sets

    # Only the post collection is used here; the other five are unpacked
    # but not consumed by this script.
    job_dicts = set_become_dict_list(set_post)
    print(job_dicts)
|