This repository has been archived on 2024-11-02. You can view files and clone it, but cannot push or open issues or pull requests.
db-manager/src/mongo.py

90 lines
3.4 KiB
Python
Raw Normal View History

2023-02-11 15:16:25 +00:00
import os
from pymongo import MongoClient
2023-02-11 22:05:30 +00:00
import time
2023-02-11 15:16:25 +00:00
import urllib.parse
import logger as log
# Connection settings are read from OWL_DB_* environment variables, each
# falling back to a built-in default when the variable is unset.
log.out("mongo.py: Fetching configuration", "INFO")
db_host = os.environ.get('OWL_DB_HOST', 'localhost')
db_port = os.environ.get('OWL_DB_PORT', 27017)
# User name and password are percent-escaped because they are embedded in
# the connection URI below.
db_user = urllib.parse.quote_plus(os.environ.get('OWL_DB_USER', "owl"))
db_pass = urllib.parse.quote_plus(os.environ.get('OWL_DB_PASS', "twittwoo"))
db_name = os.environ.get('OWL_DB_NAME', "owlboard")

# Only host and port are logged; credentials are kept out of the message.
log.out(f"mongo.py: Connecting to database at {db_host}:{db_port}", "INFO")
client = MongoClient(
    f"mongodb://{db_user}:{db_pass}@{db_host}:{db_port}"
)
db = client[db_name]
def metaCheckTime(target):
    """Return the last-updated timestamp recorded for *target*.

    Looks up the document in the ``meta`` collection whose ``target`` field
    equals *target* and whose ``type`` is ``"collection"``.

    Returns:
        The document's ``updated`` value, or ``0`` when no matching document
        exists or the document has no ``updated`` field.
    """
    col = db["meta"]
    res = col.find_one({"target": target, "type": "collection"})
    # find_one() yields None when nothing matches; a membership test on None
    # would raise TypeError instead of reaching the "does not exist" path.
    if res is not None and 'updated' in res:
        log.out(f'mongo.metaCheckTime: {target} last updated at {res["updated"]}', "INFO")
        return res["updated"]
    log.out(f'mongo.metaCheckTime: {target} does not exist', "INFO")
    return 0
2023-02-11 22:05:30 +00:00
def metaUpdateTime(target):
    """Record the current Unix time as the ``updated`` value for *target*.

    The matching document in the ``meta`` collection (``type`` of
    ``"collection"``) is updated, or created if it does not exist yet.
    """
    log.out(f'mongo.metaUpdateTime: Updating updated time for {target}', "INFO")
    selector = {"target": target, "type": "collection"}
    db["meta"].update_one(
        selector,
        # The identifying fields are written alongside the timestamp.
        {"$set": {"updated": int(time.time()), **selector}},
        upsert=True,
    )
2023-02-11 22:05:30 +00:00
def getLength(collection):
    """Return the number of documents stored in the named *collection*."""
    # An empty filter matches every document.
    return db[collection].count_documents({})
2023-02-12 20:53:59 +00:00
def createSingleIndex(collection, field):
    """Create an index on *field* in the named *collection* and log it."""
    db[collection].create_index(field)
    log.out(f'mongo.createSingleIndex: Created index of {field} in {collection}', "INFO")
2023-02-11 22:05:30 +00:00
def putBulkCorpus(data):
    """Replace the contents of the ``corpus`` collection with *data*.

    Any existing documents are dropped, *data* is bulk-inserted, indexes on
    ``NLC`` and ``3ALPHA`` are created, and the collection's meta timestamp
    is refreshed.

    Args:
        data: Documents to insert; must be non-empty.

    Raises:
        TypeError: If *data* is empty. Raised before anything is dropped so
            the existing documents are left untouched.
    """
    # insert_many() rejects empty input with TypeError; check up front so a
    # failed fetch cannot wipe the collection before the insert blows up.
    if not data:
        raise TypeError("mongo.putBulkCorpus: data must be a non-empty list")

    collection = "corpus"
    startCount = getLength(collection)
    col = db[collection]
    if startCount > 0:
        log.out(f'mongo.putBulkCorpus: Dropping {startCount} CORPUS documents', "INFO")
        col.drop()
    col.insert_many(data)
    endCount = getLength(collection)
    log.out(f'mongo.putBulkCorpus: {endCount} documents inserted', "INFO")
    log.out(f'mongo.putBulkCorpus: {endCount - startCount} new documents', "INFO")
    log.out('mongo.putBulkCorpus: Building collection indexes',"INFO")
    for field in ("NLC", "3ALPHA"):
        createSingleIndex(collection, field)
    log.out('mongo.putBulkCorpus: Updating meta time',"INFO")
    metaUpdateTime(collection)
def putBulkStations(data):
    """Replace the contents of the ``stations`` collection with *data*.

    Any existing documents are dropped, *data* is bulk-inserted, indexes on
    ``3ALPHA``, ``STANOX`` and ``TIPLOC`` are created, and the collection's
    meta timestamp is refreshed.

    Args:
        data: Documents to insert; must be non-empty.

    Raises:
        TypeError: If *data* is empty. Raised before anything is dropped so
            the existing documents are left untouched.
    """
    # insert_many() rejects empty input with TypeError; check up front so a
    # failed fetch cannot wipe the collection before the insert blows up.
    if not data:
        raise TypeError("mongo.putBulkStations: data must be a non-empty list")

    collection = "stations"
    startCount = getLength(collection)
    col = db[collection]
    if startCount > 0:
        log.out(f'mongo.putBulkStations: Dropping {startCount} station documents', "INFO")
        col.drop()
    col.insert_many(data)
    endCount = getLength(collection)
    log.out(f'mongo.putBulkStations: {endCount} documents inserted', "INFO")
    log.out(f'mongo.putBulkStations: {endCount - startCount} new documents', "INFO")
    log.out('mongo.putBulkStations: Building collection indexes',"INFO")
    for field in ("3ALPHA", "STANOX", "TIPLOC"):
        createSingleIndex(collection, field)
    log.out('mongo.putBulkStations: Updating meta time',"INFO")
    metaUpdateTime(collection)
def metaCounters():
    """Ensure the ``counters`` record exists in the ``meta`` collection.

    If no document with ``target`` ``"counters"`` and ``type`` ``"count"``
    exists, or it lacks a ``since`` field, the record is created/updated with
    ``since`` set to the current Unix time. Otherwise nothing is written.
    """
    col = db["meta"]
    selector = {"target": "counters", "type": "count"}
    res = col.find_one(selector)
    # find_one() yields None when nothing matches, so guard before the
    # membership test.
    if res is None or 'since' not in res:
        log.out('mongo.metaCounters: counters does not exist, creating', "INFO")
        # update_one() only accepts update-operator documents, and needs
        # upsert=True to create the record when it is missing.
        col.update_one(
            selector,
            {"$set": {**selector, "since": int(time.time())}},
            upsert=True,
        )
    else:
        log.out('mongo.metaCounters: counters already exists, skipping', "INFO")