# github_mongoDB_dataprocess/check_repeat.py
#
# 25 lines
# 655 B
# Python

import ast
import os
from datetime import datetime

import pandas as pd
from github import Github
from pymongo import MongoClient
# Authenticate against GitHub with a token taken from the environment rather
# than a credential hard-coded in the source file.  An unset or empty
# GITHUB_TOKEN becomes None, which makes PyGithub issue unauthenticated
# (heavily rate-limited) requests instead of sending a broken auth header.
# NOTE(review): any token that was previously committed in this file should
# be revoked.
g = Github(os.environ.get("GITHUB_TOKEN") or None)

# Connect to MongoDB.
client = MongoClient('localhost', 27017)
db = client['reference_db']

# Walk every collection in the database and print those that hold noticeably
# more documents than the matching GitHub repository has issues.
for collection_name in db.list_collection_names():
    # The repository name is obtained by turning the first underscore of the
    # collection name into a slash.
    # NOTE(review): presumably collections are named "<owner>_<repo>" -- confirm.
    # Computed before the `try` so the error handler below always reports the
    # repository for the current iteration.
    repo = collection_name.replace('_', '/', 1)
    try:
        num1 = db[collection_name].count_documents({})
        num2 = g.get_repo(repo).get_issues(state='all').totalCount
        # `num2 and ...` skips repositories with zero issues, which would
        # otherwise divide by zero.
        if num2 and num1 / num2 > 1.5:
            print(num1, num2, repo)
    except Exception as e:
        # Best-effort scan: report the failure for this repository and move
        # on to the next collection.
        print(repo, e)