use configured client

This commit is contained in:
James Turk 2011-08-05 19:08:01 -04:00
parent 67cc05078e
commit 47d094e919
5 changed files with 72 additions and 18 deletions

View File

@ -9,6 +9,23 @@ import gridfs
import scrapelib import scrapelib
def get_configured_client():
from oyster.conf import settings
return Client(mongo_host=settings.MONGO_HOST,
mongo_port=settings.MONGO_PORT,
mongo_db=settings.MONGO_DATABASE,
mongo_log_maxsize=settings.MONGO_LOG_MAXSIZE,
user_agent=settings.USER_AGENT,
rpm=settings.REQUESTS_PER_MINUTE,
timeout=settings.REQUEST_TIMEOUT,
retry_attempts=settings.RETRY_ATTEMPTS,
retry_wait_seconds=settings.RETRY_WAIT_SECONDS)
class Client(object): class Client(object):

21
oyster/conf/__init__.py Normal file
View File

@ -0,0 +1,21 @@
from oyster.conf import default_settings
class Settings(object):
def __init__(self):
pass
def update(self, module):
for setting in dir(module):
if setting.isupper():
val = getattr(module, setting)
if val is not None:
setattr(self, setting, val)
settings = Settings()
settings.update(default_settings)
try:
import oyster_settings
settings.update(oyster_settings)
except ImportError:
pass

View File

@ -0,0 +1,14 @@
# mongodb
MONGO_HOST = 'localhost'
MONGO_PORT = 27017
MONGO_DATABASE = 'oyster'
MONGO_LOG_MAXSIZE = 100000000
# scrapelib
USER_AGENT = 'oyster'
REQUESTS_PER_MINUTE = 300
REQUEST_TIMEOUT = 0
RETRY_ATTEMPTS = 0
RETRY_WAIT_SECONDS = 5

View File

@ -1,21 +1,25 @@
from celery.task import task from celery.task.base import Task, PeriodicTask
from celery.task.base import PeriodicTask
from celery.task.schedules import schedule
from celery.execute import send_task from celery.execute import send_task
from oyster.client import Client from oyster.client import get_configured_client
client = Client()
@task(ignore_result=True) class UpdateTask(Task):
def update_task(doc_id): # results go straight to database
# maybe fetch doc instead? ignore_result = True
doc = client.db.tracked.find_one({'_id': doc_id})
client.update(doc) def __init__(self):
for hook in doc.get('post_update_hooks', []): # one client per process
send_task(hook, (doc_id,)) client = get_configured_client()
client.db.status.update({}, {'$inc': {'update_queue': -1}})
def run(self, doc_id):
# maybe fetch doc instead?
doc = client.db.tracked.find_one({'_id': doc_id})
client.update(doc)
for hook in doc.get('post_update_hooks', []):
send_task(hook, (doc_id,))
client.db.status.update({}, {'$inc': {'update_queue': -1}})
class UpdateTaskScheduler(PeriodicTask): class UpdateTaskScheduler(PeriodicTask):

View File

@ -5,7 +5,7 @@ import functools
import flask import flask
import pymongo.objectid import pymongo.objectid
from oyster.client import Client from oyster.client import get_configured_client
class JSONEncoder(json.JSONEncoder): class JSONEncoder(json.JSONEncoder):
@ -33,14 +33,13 @@ def api_wrapper(template=None):
app = flask.Flask('oyster') app = flask.Flask('oyster')
client = Client() client = get_configured_client()
@app.route('/') @app.route('/')
@api_wrapper('index.html') @api_wrapper('index.html')
def index(): def index():
status = { status = {
'queue_size': app.work_queue.qsize(),
'tracking': client.db.tracked.count(), 'tracking': client.db.tracked.count(),
'need_update': client.get_update_queue_size(), 'need_update': client.get_update_queue_size(),
'logs': client.db.logs.find().sort('$natural', -1).limit(20) 'logs': client.db.logs.find().sort('$natural', -1).limit(20)
@ -52,7 +51,6 @@ def index():
@api_wrapper() @api_wrapper()
def doc_list(): def doc_list():
status = { status = {
'queue_size': app.work_queue.qsize(),
'tracking': client.db.tracked.count(), 'tracking': client.db.tracked.count(),
'need_update': client.get_update_queue_size(), 'need_update': client.get_update_queue_size(),
} }