2023-02-11 15:16:25 +00:00
|
|
|
import os
|
|
|
|
from pymongo import MongoClient
|
2023-02-11 22:05:30 +00:00
|
|
|
import time
|
2023-02-11 15:16:25 +00:00
|
|
|
import urllib.parse
|
|
|
|
import logger as log
|
|
|
|
|
|
|
|
log.out("mongo.py: Fetching configuration", "INFO")

# Connection settings are read from OWL_DB_* environment variables, each with
# a fallback default. The user name and password are passed through
# quote_plus because they are embedded directly in the connection URI below.
db_host = os.environ.get('OWL_DB_HOST', 'localhost')
db_port = os.environ.get('OWL_DB_PORT', 27017)
db_user = urllib.parse.quote_plus(os.environ.get('OWL_DB_USER', "owl"))
db_pass = urllib.parse.quote_plus(os.environ.get('OWL_DB_PASS', "twittwoo"))
db_name = os.environ.get('OWL_DB_NAME', "owlboard")

log.out(f"mongo.py: Connecting to database at {db_host}:{db_port}", "INFO")

# Module-level client and database handle shared by every helper in this file.
client = MongoClient(
    f"mongodb://{db_user}:{db_pass}@{db_host}:{db_port}"
)
db = client[db_name]
|
|
|
|
|
|
|
|
def metaCheckTime(target):
    """Return the stored last-update timestamp for *target*.

    Looks up the document in the ``meta`` collection whose ``target`` field
    equals *target* and whose ``type`` is ``"collection"``, then bumps the
    ``meta`` usage counter.

    Args:
        target: Value matched against the ``target`` field of the meta
            document.

    Returns:
        The document's ``updated`` value, or ``0`` when no matching document
        exists or the document has no ``updated`` field.
    """
    col = db["meta"]
    res = col.find_one({"target": target, "type": "collection"})
    incrementCounter("meta")

    # isinstance also accepts dict subclasses, which an exact type() check
    # would reject even though they hold a valid document.
    if isinstance(res, dict) and "updated" in res:
        log.out(f'mongo.metaCheckTime: {target} last updated at {res["updated"]}', "INFO")
        return res["updated"]

    log.out(f'mongo.metaCheckTime: {target} does not exist', "INFO")
    return 0
|
2023-02-11 22:05:30 +00:00
|
|
|
|
|
|
|
def metaUpdateTime(target):
    """Stamp the meta record for *target* with the current time.

    Upserts the ``meta`` document identified by ``target`` and
    ``type == "collection"``, setting ``updated`` to the current Unix time
    truncated to whole seconds, then bumps the ``meta`` usage counter.

    Args:
        target: Value stored in (and matched against) the ``target`` field.
    """
    meta = db["meta"]
    log.out(f'mongo.metaUpdateTime: Updating updated time for {target}', "INFO")

    selector = {"target": target, "type": "collection"}
    new_values = {
        "updated": int(time.time()),
        "target": target,
        "type": "collection",
    }
    meta.update_one(selector, {"$set": new_values}, upsert=True)

    incrementCounter("meta")
|
2023-02-11 22:05:30 +00:00
|
|
|
|
|
|
|
def getLength(collection):
    """Return the number of documents in the named collection.

    Also bumps the usage counter for that collection before counting.

    Args:
        collection: Name of the collection to count.

    Returns:
        The result of ``count_documents`` with an empty filter.
    """
    handle = db[collection]
    incrementCounter(collection)
    total = handle.count_documents({})
    return total
|
|
|
|
|
2023-02-12 20:53:59 +00:00
|
|
|
def createSingleIndex(collection, field):
    """Create an index on *field* in the named collection.

    After the index is requested, the collection's usage counter is bumped
    and the action is logged.

    Args:
        collection: Name of the collection to index.
        field: Index specification passed straight to ``create_index``.
    """
    db[collection].create_index(field)
    incrementCounter(collection)
    log.out(
        f'mongo.createSingleIndex: Created index of {field} in {collection}',
        "INFO",
    )
|
|
|
|
|
2023-02-11 22:05:30 +00:00
|
|
|
def putBulkCorpus(data):
    """Replace the contents of the ``corpus`` collection with *data*.

    Any existing documents are dropped, *data* is bulk-inserted, indexes on
    ``NLC`` and ``3ALPHA`` are created, and the collection's meta update time
    is refreshed.

    Args:
        data: Non-empty list of documents to insert.

    Raises:
        ValueError: If *data* is empty. The check runs before the existing
            collection is dropped, so a bad payload can no longer wipe the
            current data and then fail on insert.
    """
    # Validate first: the drop below is destructive and cannot be undone if
    # the subsequent insert is rejected.
    if not data:
        raise ValueError("mongo.putBulkCorpus: refusing to replace corpus with empty data")

    collection = "corpus"
    startCount = getLength(collection)
    col = db[collection]
    incrementCounter(collection)

    if startCount > 0:
        log.out(f'mongo.putBulkCorpus: Dropping {startCount} CORPUS documents', "INFO")
        col.drop()
    col.insert_many(data)

    endCount = getLength(collection)
    log.out(f'mongo.putBulkCorpus: {endCount} documents inserted', "INFO")
    # Net change in document count relative to before the replacement.
    log.out(f'mongo.putBulkCorpus: {endCount - startCount} new documents', "INFO")

    log.out('mongo.putBulkCorpus: Building collection indexes', "INFO")
    createSingleIndex(collection, "NLC")
    createSingleIndex(collection, "3ALPHA")

    log.out('mongo.putBulkCorpus: Updating meta time', "INFO")
    metaUpdateTime(collection)
|
|
|
|
|
|
|
|
def putBulkStations(data):
    """Replace the contents of the ``stations`` collection with *data*.

    Any existing documents are dropped, *data* is bulk-inserted, indexes on
    ``3ALPHA``, ``STANOX`` and ``TIPLOC`` are created, and the collection's
    meta update time is refreshed.

    Args:
        data: Non-empty list of documents to insert.

    Raises:
        ValueError: If *data* is empty. The check runs before the existing
            collection is dropped, so a bad payload can no longer wipe the
            current data and then fail on insert.
    """
    # Validate first: the drop below is destructive and cannot be undone if
    # the subsequent insert is rejected.
    if not data:
        raise ValueError("mongo.putBulkStations: refusing to replace stations with empty data")

    collection = "stations"
    startCount = getLength(collection)
    col = db[collection]
    # Use the local name rather than a repeated literal so the counter key
    # always matches the collection being written.
    incrementCounter(collection)

    if startCount > 0:
        log.out(f'mongo.putBulkStations: Dropping {startCount} station documents', "INFO")
        col.drop()
    col.insert_many(data)

    endCount = getLength(collection)
    log.out(f'mongo.putBulkStations: {endCount} documents inserted', "INFO")
    # Net change in document count relative to before the replacement.
    log.out(f'mongo.putBulkStations: {endCount - startCount} new documents', "INFO")

    log.out('mongo.putBulkStations: Building collection indexes', "INFO")
    createSingleIndex(collection, "3ALPHA")
    createSingleIndex(collection, "STANOX")
    createSingleIndex(collection, "TIPLOC")

    log.out('mongo.putBulkStations: Updating meta time', "INFO")
    metaUpdateTime(collection)
|
|
|
|
|
2023-02-16 21:34:31 +00:00
|
|
|
def incrementCounter(target):
    """Add one to the *target* field of the counters document in ``meta``.

    The counters document is the one with ``target == "counters"`` and
    ``type == "count"``. The update is issued without ``upsert``.
    NOTE(review): this presumably means nothing is written when that
    document does not exist yet; confirm against the pymongo documentation.

    Args:
        target: Name of the counter field to increment.
    """
    meta = db["meta"]
    log.out(f'mongo.incrementCounter: Incrementing counter for {target}', "INFO")

    counters_doc = {"target": "counters", "type": "count"}
    bump = {"$inc": {target: 1}}
    meta.update_one(counters_doc, bump)
|
|
|
|
|
2023-02-12 21:36:41 +00:00
|
|
|
def metaCounters():
    """Ensure the counters document exists in the ``meta`` collection.

    Fetches the document with ``target == "counters"`` and
    ``type == "count"``. If it is found and already has a ``since`` field it
    is left alone; otherwise it is upserted with ``since`` set to the current
    Unix time in whole seconds. In both cases the ``meta`` usage counter is
    bumped afterwards.
    """
    collection = "meta"
    meta = db[collection]
    counters_filter = {"target": "counters", "type": "count"}

    found = meta.find_one(counters_filter)
    log.out(f'mongo.metaCounters: Query returned `{found}`', "DEBG")

    already_present = type(found) is dict and 'since' in found
    if already_present:
        log.out('mongo.metaCounters: counters already exists, skipping', "INFO")
    else:
        log.out('mongo.metaCounters: counters does not exist, creating', "INFO")
        seed = {"target": "counters", "type": "count", "since": int(time.time())}
        meta.update_one({"target": "counters", "type": "count"}, {"$set": seed}, upsert=True)

    incrementCounter(collection)
|