This repository has been archived on 2024-11-02. You can view files and clone it, but cannot push or open issues or pull requests.
db-manager/src/mongo.py

63 lines
2.4 KiB
Python
Raw Normal View History

2023-02-11 15:16:25 +00:00
import os
from pymongo import MongoClient
2023-02-11 22:05:30 +00:00
import time
2023-02-11 15:16:25 +00:00
import urllib.parse
import logger as log
log.out("mongo.py: Fetching configuration", "INFO")
2023-02-11 22:05:30 +00:00
db_host = os.getenv('OWL_DB_HOST', 'localhost')
db_port = os.getenv('OWL_DB_PORT', 27017)
db_user = urllib.parse.quote_plus(os.getenv('OWL_DB_USER', "owl"))
db_pass = urllib.parse.quote_plus(os.getenv('OWL_DB_PASS', "twittwoo"))
db_name = os.getenv('OWL_DB_NAME', "owlboard")
2023-02-12 20:03:20 +00:00
log.out(f"mongo.py: Connecting to database at {db_host}:{db_port}", "INFOm")
2023-02-11 22:05:30 +00:00
client = MongoClient(f"mongodb://{db_user}:{db_pass}@{db_host}:{db_port}")
db = client[db_name]
def metaCheckTime(target):
col = db["meta"]
2023-02-12 20:03:20 +00:00
res = col.find_one({"target": target, "type": "collection"})
2023-02-11 22:05:30 +00:00
log.out(f'mongo.metaUpdateTime: {target} last updated at {res["updated"]}', "INFO")
return res["updated"]
def metaUpdateTime(target):
col = db["meta"]
log.out(f'mongo.metaUpdateTime: Updating updated time for {target}', "INFO")
2023-02-12 20:03:20 +00:00
res = col.update_one({"target": target, "type":"collection"}, {"$set":{"updated": int(time.time()),"target":target, "type":"collection"}}, upsert=True)
2023-02-11 22:05:30 +00:00
def getLength(collection):
col = db[collection]
return col.count_documents({})
def putBulkCorpus(data):
startCount = getLength("corpus")
col = db["corpus"]
if startCount > 0:
log.out(f'mongo.putBulkCorpus: Dropping {startCount} CORPUS documents', "INFO")
col.drop()
col.insert_many(data)
endCount = getLength("corpus")
log.out(f'mongo.putBulkCorpus: {endCount} documents inserted', "INFO")
log.out(f'mongo.putBulkCorpus: {endCount - startCount} new documents', "INFO")
#log.out('mongo.putBulkCorpus: Building collection indexes',"INFO")
# ADD INDEXES HERE
log.out('mongo.putBulkCorpus: Updating meta time',"INFO")
metaUpdateTime("corpus")
return
def putBulkStations(data):
startCount = getLength("stations")
col = db["stations"]
if startCount > 0:
log.out(f'mongo.putBulkStations: Dropping {startCount} station documents', "INFO")
col.drop()
col.insert_many(data)
endCount = getLength("stations")
log.out(f'mongo.putBulkStations: {endCount} documents inserted', "INFO")
log.out(f'mongo.putBulkStations: {endCount - startCount} new documents', "INFO")
#log.out('mongo.putBulkStations: Building collection indexes',"INFO")
# ADD INDEXES HERE
log.out('mongo.putBulkStations: Updating meta time',"INFO")
metaUpdateTime("stations")
return