-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathjobs2mongo.py
30 lines (23 loc) · 892 Bytes
/
jobs2mongo.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import pymongo
import json
import os
def insert_json_to_mongodb(filename, collection):
    """Load job records from a JSON file and insert them into a collection.

    The file is expected to hold a JSON object whose ``"data"`` key maps to
    a list of job documents; every element of that list is inserted into
    *collection* as its own document.

    Args:
        filename: Path to a UTF-8 encoded JSON file.
        collection: Target collection object providing ``insert_many``
            (for example a ``pymongo`` collection).

    Raises:
        OSError: If *filename* cannot be opened.
        json.JSONDecodeError: If the file does not contain valid JSON.
        KeyError: If the top-level JSON object has no ``"data"`` key.
    """
    # Parse the whole JSON file into Python objects first.
    with open(filename, 'r', encoding='utf-8') as f:
        payload = json.load(f)

    jobs = payload["data"]
    # insert_many refuses an empty document list, so keep the original
    # "nothing to insert, nothing happens" behavior for empty files.
    if not jobs:
        return
    # One bulk write instead of one server round trip per document.
    collection.insert_many(jobs)
# Names of the collections to populate; each one is read from the JSON file
# with the same base name under data/.
collections = [
    "cloud_developer",
    "data_scientist",
    "jobs_data",
    "product_manager",
    "researcher",
    "software_engineer",
    "technical_manager",
]

# Create the MongoDB client for the local server and pick the database.
client = pymongo.MongoClient("mongodb://localhost:27017/")
db = client["bigdata"]

# Walk the list and load every file into its same-named collection.
for collection_name in collections:
    filename = f"data/{collection_name}.json"
    collection = db[collection_name]
    insert_json_to_mongodb(filename, collection)