1 /* Blue Sky: File Systems in the Cloud
3 * Copyright (C) 2009 The Regents of the University of California
4 * Written by Michael Vrable <mvrable@cs.ucsd.edu>
13 #include "bluesky-private.h"
15 /* Interaction with cloud storage. We expose a very simple GET/PUT-style
16 * interface, which different backends can implement. Available backends
17 * (will) include Amazon S3 and a simple local store for testing purposes.
18 * Operations may be performed asynchronously. */
/* State for one store instance.  Only part of the definition is visible in
 * this excerpt; other code in this file also accesses handle, lock and
 * cond_idle members of this structure. */
20 struct _BlueSkyStore {
/* Backend callbacks (create/destroy/submit/cleanup) servicing this store. */
21 const BlueSkyStoreImplementation *impl;
/* Updated under the store's lock wherever this file modifies it; waiters in
 * bluesky_store_sync() are woken when it drops to zero. */
26 int pending; /* Count of operations not yet complete. */
/* Table mapping a store type name to its registered
 * BlueSkyStoreImplementation.  Created in bluesky_store_init(), filled by
 * bluesky_store_register(), and queried by bluesky_store_new(). */
29 GHashTable *store_implementations;
31 /* Thread pool for calling notifier functions when an operation completes.
32 * These are called in a separate thread for locking reasons: we want to call
33 * the notifiers without the lock on the async object held, but completion
34 * occurs when the lock is held--so we need some way to defer the call. This
35 * isn't really optimal from a cache-locality standpoint. */
/* The pool is created in bluesky_store_init() with notifier_task() as its
 * worker function; each pushed item is a struct BlueSkyNotifierList node. */
36 static GThreadPool *notifier_thread_pool;
/* Register a store implementation under a name so that bluesky_store_new()
 * can look it up later.
 *
 * The name is duplicated with g_strdup() before being used as the table key.
 * impl is stored by pointer (not copied), so the table keeps referring to the
 * caller's object.
 *
 * NOTE(review): the rest of the parameter list is not visible in this
 * excerpt; `name` is presumably the second parameter -- confirm. */
38 void bluesky_store_register(const BlueSkyStoreImplementation *impl,
41 g_hash_table_insert(store_implementations, g_strdup(name), (gpointer)impl);
/* Create a store from a type string.
 *
 * The string is duplicated and searched for a ':'; the scheme is looked up
 * in store_implementations and the matching implementation's create()
 * callback is invoked with `path` to obtain the backend handle.  A new
 * BlueSkyStore is then allocated and given the handle, a mutex and a
 * condition variable.
 *
 * NOTE(review): several steps (how the string is split at ':', handling of
 * an unknown scheme or a failed create(), release of the duplicated string,
 * and the return statement) are not visible in this excerpt. */
44 BlueSkyStore *bluesky_store_new(const gchar *type)
46 const BlueSkyStoreImplementation *impl;
/* Work on a private copy of the type string. */
49 scheme = g_strdup(type);
/* strchr() yields NULL when the string contains no ':'. */
50 path = strchr(scheme, ':');
56 impl = g_hash_table_lookup(store_implementations, scheme);
62 gpointer handle = impl->create(path);
/* g_new() returns uninitialized memory, so fields are assigned one by one. */
68 BlueSkyStore *store = g_new(BlueSkyStore, 1);
70 store->handle = handle;
71 store->lock = g_mutex_new();
72 store->cond_idle = g_cond_new();
/* Tear down a store by handing its backend handle to the implementation's
 * destroy() callback.
 *
 * NOTE(review): release of the store's mutex, condition variable and the
 * structure itself is not visible in this excerpt -- confirm. */
78 void bluesky_store_free(BlueSkyStore *store)
80 store->impl->destroy(store->handle);
/* Allocate a fresh asynchronous-operation object.
 *
 * The object starts in state ASYNC_NEW with no operation selected
 * (STORE_OP_NONE), no notifiers, no barrier and no backend-private data, and
 * owns a newly created mutex and condition variable.
 *
 * NOTE(review): the lines that bind the object to `store`, set the reference
 * count, initialize key/data and return the object are not visible in this
 * excerpt. */
84 BlueSkyStoreAsync *bluesky_store_async_new(BlueSkyStore *store)
86 BlueSkyStoreAsync *async;
/* g_new() does not zero the allocation; every field needs an explicit value. */
88 async = g_new(BlueSkyStoreAsync, 1);
90 async->lock = g_mutex_new();
91 async->completion_cond = g_cond_new();
93 async->status = ASYNC_NEW;
94 async->op = STORE_OP_NONE;
98 async->notifiers = NULL;
99 async->notifier_count = 0;
100 async->barrier = NULL;
/* For barrier operations this field doubles as an integer counter (see
 * bluesky_store_add_barrier() and op_complete()). */
101 async->store_private = NULL;
/* Return the backend handle of the store that this operation belongs to. */
106 gpointer bluesky_store_async_get_handle(BlueSkyStoreAsync *async)
108 return async->store->handle;
/* Take an additional reference on an async object.
 *
 * The reference count is read and incremented atomically.  If the count is
 * not already positive the g_return_if_fail() check makes the function
 * return without incrementing. */
111 void bluesky_store_async_ref(BlueSkyStoreAsync *async)
116 g_return_if_fail(g_atomic_int_get(&async->refcount) > 0);
118 g_atomic_int_inc(&async->refcount);
/* Drop one reference on an async object.
 *
 * When the atomic decrement brings the count to zero, the backend's
 * cleanup() callback is invoked, the object's mutex and condition variable
 * are freed, and the reference held on its data string is released.
 *
 * NOTE(review): freeing of the key and of the structure itself is not
 * visible in this excerpt -- confirm. */
121 void bluesky_store_async_unref(BlueSkyStoreAsync *async)
126 if (g_atomic_int_dec_and_test(&async->refcount)) {
/* Let the backend release anything it attached to this operation. */
127 async->store->impl->cleanup(async->store->handle, async);
128 g_mutex_free(async->lock);
129 g_cond_free(async->completion_cond);
131 bluesky_string_unref(async->data);
136 /* Block until the given operation has completed. */
/* Returns at once (via g_return_if_fail) when async is NULL.  Otherwise,
 * with async->lock held, the caller sleeps on completion_cond until the
 * status is ASYNC_COMPLETE and notifier_count has dropped to zero, i.e. all
 * notifier callbacks have also finished. */
137 void bluesky_store_async_wait(BlueSkyStoreAsync *async)
139 g_return_if_fail(async != NULL);
140 g_mutex_lock(async->lock);
/* Waiting on an operation that was never submitted is reported as an error.
 * NOTE(review): GLib documents g_error() as fatal, so the unlock that
 * follows is presumably never reached -- confirm. */
142 if (async->status == ASYNC_NEW) {
143 g_error("bluesky_store_async_wait on a new async object!\n");
144 g_mutex_unlock(async->lock);
/* completion_cond is broadcast both when the operation is marked complete
 * and when the last notifier finishes, so the condition is re-tested after
 * each wakeup. */
148 while (async->status != ASYNC_COMPLETE
149 || g_atomic_int_get(&async->notifier_count) > 0) {
150 g_cond_wait(async->completion_cond, async->lock);
153 g_mutex_unlock(async->lock);
156 /* Add a notifier function to be called when the operation completes. */
/* A list node is allocated for the callback and filled in while holding
 * async->lock.  The node holds its own reference on async, and
 * notifier_count is bumped so that bluesky_store_async_wait() also waits for
 * the callback to finish.
 *
 * NOTE(review): the line storing `func` into the node, and the `else` that
 * presumably separates the two outcomes below, are not visible in this
 * excerpt. */
157 void bluesky_store_async_add_notifier(BlueSkyStoreAsync *async,
158 GFunc func, gpointer user_data)
160 struct BlueSkyNotifierList *nl = g_new(struct BlueSkyNotifierList, 1);
161 g_mutex_lock(async->lock);
162 nl->next = async->notifiers;
/* This reference is released by notifier_task() after the callback runs. */
164 nl->async = async; bluesky_store_async_ref(async);
165 nl->user_data = user_data;
166 g_atomic_int_inc(&async->notifier_count);
/* Operation already finished: schedule the callback right away instead of
 * queueing it on the async object. */
167 if (async->status == ASYNC_COMPLETE) {
168 g_thread_pool_push(notifier_thread_pool, nl, NULL);
/* Otherwise the node becomes the new head of the pending-notifier list. */
170 async->notifiers = nl;
172 g_mutex_unlock(async->lock);
/* Tell a barrier that one of the operations it is waiting on has finished.
 *
 * b is the barrier's BlueSkyStoreAsync; a is not used by the visible code.
 * The barrier keeps its outstanding-operation count as an integer packed
 * into store_private.  The count is decremented under the barrier's lock,
 * and once it reaches zero on a barrier that has left the ASYNC_NEW state
 * the barrier itself is marked complete. */
175 static void op_complete(gpointer a, gpointer b)
177 BlueSkyStoreAsync *barrier = (BlueSkyStoreAsync *)b;
/* Hold a temporary reference for the duration of this call. */
179 bluesky_store_async_ref(barrier);
180 g_mutex_lock(barrier->lock);
181 barrier->store_private
182 = GINT_TO_POINTER(GPOINTER_TO_INT(barrier->store_private) - 1);
/* A barrier still in ASYNC_NEW is left alone here; bluesky_store_async_submit()
 * checks the count itself when the barrier is submitted. */
183 if (GPOINTER_TO_INT(barrier->store_private) == 0
184 && barrier->status != ASYNC_NEW) {
185 bluesky_store_async_mark_complete(barrier);
187 g_mutex_unlock(barrier->lock);
188 bluesky_store_async_unref(barrier);
191 /* Mark an asynchronous operation as complete. This should only be called by
192 * the store implementations. The lock should be held when calling this
193 * function. Any notifier functions will be called, but in a separate thread
194 * and without the lock held. */
195 void bluesky_store_async_mark_complete(BlueSkyStoreAsync *async)
/* Marking an operation complete twice is rejected. */
197 g_return_if_fail(async->status != ASYNC_COMPLETE);
/* elapsed is measured from submission, latency from the time recorded as
 * the start of execution; the clock is sampled separately for each. */
199 bluesky_time_hires elapsed = bluesky_now_hires() - async->start_time;
200 bluesky_time_hires latency = bluesky_now_hires() - async->exec_time;
/* Barriers were never added to the store's pending count (see
 * bluesky_store_async_submit()), so only other operations decrement it.
 * Waiters in bluesky_store_sync() are woken when the count hits zero. */
202 if (async->op != STORE_OP_BARRIER) {
203 g_mutex_lock(async->store->lock);
204 async->store->pending--;
205 if (async->store->pending == 0)
206 g_cond_broadcast(async->store->cond_idle);
207 g_mutex_unlock(async->store->lock);
210 async->status = ASYNC_COMPLETE;
211 g_cond_broadcast(async->completion_cond);
/* With no notifiers queued, the barrier (if any) is informed directly;
 * otherwise notifier_task() informs it after the last notifier has run. */
213 if (async->barrier != NULL && async->notifiers == NULL)
214 op_complete(async, async->barrier);
/* Detach each queued notifier and hand it to the thread pool. */
216 while (async->notifiers != NULL) {
217 struct BlueSkyNotifierList *nl = async->notifiers;
218 async->notifiers = nl->next;
219 g_thread_pool_push(notifier_thread_pool, nl, NULL);
222 if (bluesky_verbose) {
223 g_log("bluesky/store", G_LOG_LEVEL_DEBUG,
224 "[%p] complete: elapsed = %"PRIi64" ns, latency = %"PRIi64" ns",
225 async, elapsed, latency);
/* Submit an asynchronous operation to its store.
 *
 * Records the submission timestamps, optionally logs the request, and then
 * either handles a barrier locally or counts the operation as pending and
 * passes it to the backend's submit() callback.  When the
 * synchronous_stores option is set, the call additionally blocks until the
 * operation has completed.
 *
 * NOTE(review): the end of the barrier branch (presumably an early return)
 * and the remaining log arguments are not visible in this excerpt. */
229 void bluesky_store_async_submit(BlueSkyStoreAsync *async)
231 BlueSkyStore *store = async->store;
233 async->start_time = bluesky_now_hires();
235 // Backends should fill this in with a better estimate of the actual time
236 // processing was started, if there could be a delay from submission time.
237 async->exec_time = bluesky_now_hires();
239 if (bluesky_verbose) {
240 g_log("bluesky/store", G_LOG_LEVEL_DEBUG, "[%p] submit: %s %s",
242 async->op == STORE_OP_GET ? "GET"
243 : async->op == STORE_OP_PUT ? "PUT"
244 : async->op == STORE_OP_DELETE ? "DELETE"
245 : async->op == STORE_OP_BARRIER ? "BARRIER" : "???",
249 /* Barriers are handled specially, and not handed down the storage
250 * implementation layer. */
251 if (async->op == STORE_OP_BARRIER) {
252 async->status = ASYNC_RUNNING;
/* A barrier with no outstanding operations completes immediately; otherwise
 * op_complete() finishes it when the count reaches zero. */
253 if (GPOINTER_TO_INT(async->store_private) == 0)
254 bluesky_store_async_mark_complete(async);
/* Count the operation as pending before the backend sees it; the matching
 * decrement is in bluesky_store_async_mark_complete(). */
258 g_mutex_lock(async->store->lock);
259 async->store->pending++;
260 g_mutex_unlock(async->store->lock);
262 store->impl->submit(store->handle, async);
264 if (bluesky_options.synchronous_stores)
265 bluesky_store_async_wait(async);
268 /* Add the given operation to the barrier. The barrier will not complete until
269 * all operations added to it have completed. */
/* barrier must be an operation whose op is STORE_OP_BARRIER; otherwise the
 * call returns without doing anything. */
270 void bluesky_store_add_barrier(BlueSkyStoreAsync *barrier,
271 BlueSkyStoreAsync *async)
273 g_return_if_fail(barrier->op == STORE_OP_BARRIER);
/* The barrier's outstanding-operation count lives in store_private as an
 * integer packed into the pointer; bump it under the barrier's lock. */
275 g_mutex_lock(barrier->lock);
276 barrier->store_private
277 = GINT_TO_POINTER(GPOINTER_TO_INT(barrier->store_private) + 1);
278 g_mutex_unlock(barrier->lock);
280 g_mutex_lock(async->lock);
/* The first barrier is recorded directly on the operation. */
281 if (async->barrier == NULL) {
282 async->barrier = barrier;
/* Any further barrier is attached as an ordinary notifier instead.
 * NOTE(review): bluesky_store_async_add_notifier() acquires async->lock,
 * which is already held at this point -- verify this path cannot
 * self-deadlock. */
284 g_warning("Adding async to more than one barrier!\n");
285 bluesky_store_async_add_notifier(async, op_complete, barrier);
287 g_mutex_unlock(async->lock);
/* Thread-pool worker that runs one queued notifier.
 *
 * n is the struct BlueSkyNotifierList node that was pushed onto
 * notifier_thread_pool; s is the pool's user data and is not used by the
 * visible code.  The callback is invoked first; afterwards the async
 * object's outstanding-notifier count is decremented and the reference the
 * node held on the async object is released.
 *
 * NOTE(review): release of the node itself is not visible in this excerpt. */
290 static void notifier_task(gpointer n, gpointer s)
292 struct BlueSkyNotifierList *notifier = (struct BlueSkyNotifierList *)n;
/* The callback runs without async->lock held. */
294 notifier->func(notifier->async, notifier->user_data);
/* g_atomic_int_dec_and_test() takes the address of the counter.  Whichever
 * thread retires the last outstanding notifier informs the barrier (if any)
 * and wakes callers blocked in bluesky_store_async_wait(). */
295 if (g_atomic_int_dec_and_test(&notifier->async->notifier_count)) {
296 g_mutex_lock(notifier->async->lock);
297 if (notifier->async->barrier != NULL)
298 op_complete(notifier->async, notifier->async->barrier);
299 g_cond_broadcast(notifier->async->completion_cond);
300 g_mutex_unlock(notifier->async->lock);
/* Drop the reference taken when the notifier was registered. */
302 bluesky_store_async_unref(notifier->async);
/* Block until the store has no pending operations.
 *
 * The caller sleeps on cond_idle, with the store lock held, until the
 * pending count is no longer positive.  Debug messages are logged before
 * and after the wait when bluesky_verbose is set. */
306 void bluesky_store_sync(BlueSkyStore *store)
308 g_mutex_lock(store->lock);
309 if (bluesky_verbose) {
310 g_log("bluesky/store", G_LOG_LEVEL_DEBUG,
311 "Waiting for pending store operations to complete...");
/* cond_idle is broadcast by bluesky_store_async_mark_complete() when the
 * count reaches zero; the count is re-checked after every wakeup. */
313 while (store->pending > 0) {
314 g_cond_wait(store->cond_idle, store->lock);
316 g_mutex_unlock(store->lock);
317 if (bluesky_verbose) {
318 g_log("bluesky/store", G_LOG_LEVEL_DEBUG, "Operations are complete.");
322 /* Convenience wrappers that perform a single operation synchronously. */
/* Fetch the value stored under key, blocking until the request finishes.
 *
 * A temporary async object is created for a STORE_OP_GET on a copy of the
 * key, submitted, and waited on.  A reference is taken on the resulting data
 * before the async object is released, so the data outlives it.
 *
 * NOTE(review): the return statement is not visible in this excerpt;
 * presumably `data` is returned and the caller owns that reference. */
323 BlueSkyRCStr *bluesky_store_get(BlueSkyStore *store, const gchar *key)
325 BlueSkyStoreAsync *async = bluesky_store_async_new(store);
326 async->op = STORE_OP_GET;
327 async->key = g_strdup(key);
328 bluesky_store_async_submit(async);
330 bluesky_store_async_wait(async);
332 BlueSkyRCStr *data = async->data;
/* Keep the result alive past the unref of the async object below. */
333 bluesky_string_ref(data);
334 bluesky_store_async_unref(async);
/* Store val under key, blocking until the request finishes.
 *
 * A temporary async object is created for a STORE_OP_PUT on a copy of the
 * key, submitted, waited on, and then released.
 *
 * NOTE(review): the line attaching val to the async object is not visible
 * in this excerpt; the reference taken on val below is presumably the one
 * that the async object then holds -- confirm. */
338 void bluesky_store_put(BlueSkyStore *store,
339 const gchar *key, BlueSkyRCStr *val)
341 BlueSkyStoreAsync *async = bluesky_store_async_new(store);
342 async->op = STORE_OP_PUT;
343 async->key = g_strdup(key);
344 bluesky_string_ref(val);
346 bluesky_store_async_submit(async);
348 bluesky_store_async_wait(async);
349 bluesky_store_async_unref(async);
352 /* Simple in-memory data store for test purposes. */
356 /* TODO: A hashtable isn't optimal for list queries... */
/* create() callback of the in-memory store.
 *
 * Allocates a MemStore with its own mutex and a hash table keyed by string
 * (g_str_hash/g_str_equal); values removed from the table are released with
 * bluesky_string_unref().  The MemStore is returned as the opaque handle.
 * path is not used by the visible code.
 *
 * NOTE(review): the key-destroy argument of g_hash_table_new_full() is not
 * visible in this excerpt. */
360 static gpointer memstore_create(const gchar *path)
362 MemStore *store = g_new(MemStore, 1);
363 store->lock = g_mutex_new();
364 store->store = g_hash_table_new_full(g_str_hash, g_str_equal,
366 (GDestroyNotify)bluesky_string_unref);
368 return (gpointer)store;
/* destroy() callback of the in-memory store; receives the handle returned
 * by memstore_create().  The body is not visible in this excerpt. */
371 static void memstore_destroy(gpointer store)
/* Look up key in the in-memory table and take a reference on the stored
 * string.
 *
 * NOTE(review): any NULL check around the ref call and the return statement
 * are not visible in this excerpt; presumably the referenced string (or
 * NULL when the key is absent) is returned. */
376 static BlueSkyRCStr *memstore_get(gpointer st, const gchar *key)
378 MemStore *store = (MemStore *)st;
379 BlueSkyRCStr *s = g_hash_table_lookup(store->store, key);
381 bluesky_string_ref(s);
/* Insert val into the in-memory table under a private copy of key.
 *
 * The table takes its own reference on val; that reference is dropped by the
 * table's value-destroy function (bluesky_string_unref, installed in
 * memstore_create()). */
385 static void memstore_put(gpointer s, const gchar *key, BlueSkyRCStr *val)
387 MemStore *store = (MemStore *)s;
388 bluesky_string_ref(val);
389 g_hash_table_insert(store->store, g_strdup(key), val);
/* submit() callback of the in-memory store.
 *
 * Accepts only operations that are still ASYNC_NEW and have an op selected.
 * The request is carried out immediately in the calling thread (a lookup
 * into async->data, or an insert of async->data), a warning is logged for an
 * operation type the store does not handle, and the operation is then marked
 * complete.
 *
 * NOTE(review): the dispatch construct selecting between these cases, and
 * any locking around the call to mark_complete, are not visible in this
 * excerpt. */
392 static void memstore_submit(gpointer s, BlueSkyStoreAsync *async)
394 g_return_if_fail(async->status == ASYNC_NEW);
395 g_return_if_fail(async->op != STORE_OP_NONE);
399 async->data = memstore_get(s, async->key);
403 memstore_put(s, async->key, async->data);
407 g_warning("Uknown operation type for MemStore: %d\n", async->op);
411 bluesky_store_async_mark_complete(async);
/* cleanup() callback of the in-memory store; invoked from
 * bluesky_store_async_unref() when an async object's last reference is
 * dropped.  The body is not visible in this excerpt. */
414 static void memstore_cleanup(gpointer store, BlueSkyStoreAsync *async)
/* Callback table for the in-memory store; registered under the name "mem"
 * by bluesky_store_init(). */
418 static BlueSkyStoreImplementation memstore_impl = {
419 .create = memstore_create,
420 .destroy = memstore_destroy,
421 .submit = memstore_submit,
422 .cleanup = memstore_cleanup,
425 /* Store implementation which writes data as files to disk. */
/* create() callback of the file store.  No per-store state is allocated:
 * the handle is simply the integer 1 packed into a pointer, and path is not
 * used by the visible code. */
426 static gpointer filestore_create(const gchar *path)
428 return GINT_TO_POINTER(1);
/* destroy() callback of the file store.  The body is not visible in this
 * excerpt.
 * NOTE(review): declared with an empty parameter list, whereas the destroy
 * callback is invoked with the store handle as its argument and
 * memstore_destroy() takes a gpointer -- consider matching that signature. */
431 static void filestore_destroy()
/* Read the whole file named by key and wrap its contents in a new
 * BlueSkyRCStr.
 *
 * NOTE(review): what is returned when the read fails (contents stays NULL)
 * is not visible in this excerpt, and the GError filled in on failure is not
 * visibly released -- confirm it is freed or pass NULL instead. */
435 static BlueSkyRCStr *filestore_get(const gchar *key)
437 gchar *contents = NULL;
439 GError *error = NULL;
/* The key is used directly as the file name. */
441 g_file_get_contents(key, &contents, &length, &error);
442 if (contents == NULL)
445 return bluesky_string_new(contents, length);
/* Write val's bytes to the file named by key, replacing its contents.
 *
 * NOTE(review): the return value is ignored and no GError is requested, so
 * a failed write goes unreported to the caller. */
448 static void filestore_put(const gchar *key, BlueSkyRCStr *val)
450 g_file_set_contents(key, val->data, val->len, NULL);
/* submit() callback of the file store.
 *
 * Accepts only operations that are still ASYNC_NEW and have an op selected.
 * The request is carried out immediately in the calling thread (a file read
 * into async->data, or a file write of async->data), a warning is logged for
 * an operation type the store does not handle, and the operation is then
 * marked complete.  The handle argument s is not used by the visible code.
 *
 * NOTE(review): the dispatch construct selecting between these cases, and
 * any locking around the call to mark_complete, are not visible in this
 * excerpt. */
453 static void filestore_submit(gpointer s, BlueSkyStoreAsync *async)
455 g_return_if_fail(async->status == ASYNC_NEW);
456 g_return_if_fail(async->op != STORE_OP_NONE);
460 async->data = filestore_get(async->key);
465 filestore_put(async->key, async->data);
470 g_warning("Uknown operation type for FileStore: %d\n", async->op);
474 bluesky_store_async_mark_complete(async);
/* cleanup() callback of the file store; invoked from
 * bluesky_store_async_unref() when an async object's last reference is
 * dropped.  The body is not visible in this excerpt. */
477 static void filestore_cleanup(gpointer store, BlueSkyStoreAsync *async)
/* Callback table for the file store; registered under the name "file" by
 * bluesky_store_init(). */
481 static BlueSkyStoreImplementation filestore_impl = {
482 .create = filestore_create,
483 .destroy = filestore_destroy,
484 .submit = filestore_submit,
485 .cleanup = filestore_cleanup,
/* One-time setup of the store layer.
 *
 * Creates the implementation registry and the notifier thread pool, then
 * registers the two built-in backends under the names "mem" and "file".
 * It has to run before bluesky_store_register() or bluesky_store_new(),
 * since both use the registry created here. */
488 void bluesky_store_init()
/* Keys are compared as strings. */
490 store_implementations = g_hash_table_new(g_str_hash, g_str_equal);
/* notifier_task() is the worker; bluesky_max_threads is passed as the
 * pool's thread limit, FALSE as its exclusive flag, and no GError is
 * requested. */
491 notifier_thread_pool = g_thread_pool_new(notifier_task, NULL,
492 bluesky_max_threads, FALSE, NULL);
493 bluesky_store_register(&memstore_impl, "mem");
494 bluesky_store_register(&filestore_impl, "file");