ocf/src/cleaning/acp.c
Michal Mielewczyk 2dfd6248c9 Configure all io classes at once.
Signed-off-by: Michal Mielewczyk <michal.mielewczyk@intel.com>
2019-01-28 08:51:26 -05:00

733 lines
19 KiB
C

/*
* Copyright(c) 2012-2018 Intel Corporation
* SPDX-License-Identifier: BSD-3-Clause-Clear
*/
#include "ocf/ocf.h"
#include "../ocf_cache_priv.h"
#include "cleaning.h"
#include "../metadata/metadata.h"
#include "../utils/utils_cleaner.h"
#include "../utils/utils_cache_line.h"
#include "../utils/utils_req.h"
#include "../cleaning/acp.h"
#include "../engine/engine_common.h"
#include "../concurrency/ocf_cache_concurrency.h"
#include "cleaning_priv.h"
#include "../utils/utils_core.h"
#define OCF_ACP_DEBUG 0
#if 1 == OCF_ACP_DEBUG
#define OCF_DEBUG_PREFIX "[Clean] %s():%d "
#define OCF_DEBUG_LOG(cache, format, ...) \
ocf_cache_log_prefix(cache, log_info, OCF_DEBUG_PREFIX, \
format"\n", __func__, __LINE__, ##__VA_ARGS__)
#define OCF_DEBUG_TRACE(cache) OCF_DEBUG_LOG(cache, "")
#define OCF_DEBUG_MSG(cache, msg) OCF_DEBUG_LOG(cache, "- %s", msg)
#define OCF_DEBUG_PARAM(cache, format, ...) OCF_DEBUG_LOG(cache, "- "format, \
##__VA_ARGS__)
#define ACP_DEBUG_INIT(acp) acp->checksum = 0
#define ACP_DEBUG_BEGIN(acp, cache_line) acp->checksum ^= cache_line
#define ACP_DEBUG_END(acp, cache_line) acp->checksum ^= cache_line
#define ACP_DEBUG_CHECK(acp) ENV_BUG_ON(acp->checksum)
#else
#define OCF_DEBUG_PREFIX
#define OCF_DEBUG_LOG(cache, format, ...)
#define OCF_DEBUG_TRACE(cache)
#define OCF_DEBUG_MSG(cache, msg)
#define OCF_DEBUG_PARAM(cache, format, ...)
#define ACP_DEBUG_INIT(acp)
#define ACP_DEBUG_BEGIN(acp, cache_line)
#define ACP_DEBUG_END(acp, cache_line)
#define ACP_DEBUG_CHECK(acp)
#endif
#define ACP_CHUNK_SIZE (100 * MiB)
/* minimal time to chunk cleaning after error */
#define ACP_CHUNK_CLEANING_BACKOFF_TIME 5
/* time to sleep when nothing to clean in ms */
#define ACP_BACKOFF_TIME_MS 1000
#define ACP_MAX_BUCKETS 11
/* Upper thresholds for buckets in percent dirty pages. First bucket should have
* threshold=0 - it isn't cleaned and we don't want dirty chunks staying dirty
* forever. Last bucket also should stay at 100 for obvious reasons */
static const uint16_t ACP_BUCKET_DEFAULTS[ACP_MAX_BUCKETS] = { 0, 10, 20, 30, 40,
50, 60, 70, 80, 90, 100 };
struct acp_flush_context {
/* number of cache lines in flush */
uint64_t size;
/* chunk_for error handling */
struct acp_chunk_info *chunk;
/* cache lines to flush */
struct flush_data data[OCF_ACP_MAX_FLUSH_MAX_BUFFERS];
/* flush error code */
int error;
};
struct acp_state {
/* currently cleaned chunk */
struct acp_chunk_info *chunk;
/* cache line iterator within current chunk */
unsigned iter;
/* true if there are cache lines to process
* current chunk */
bool in_progress;
};
struct acp_chunk_info {
struct list_head list;
uint64_t chunk_id;
uint64_t next_cleaning_timestamp;
ocf_core_id_t core_id;
uint16_t num_dirty;
uint8_t bucket_id;
};
struct acp_bucket {
struct list_head chunk_list;
uint16_t threshold; /* threshold in clines */
};
struct acp_context {
env_rwsem chunks_lock;
/* number of chunks per core */
uint64_t num_chunks[OCF_CORE_MAX];
/* per core array of all chunks */
struct acp_chunk_info *chunk_info[OCF_CORE_MAX];
struct acp_bucket bucket_info[ACP_MAX_BUCKETS];
/* total number of chunks in cache */
uint64_t chunks_total;
/* structure to keep track of I/O in progress */
struct acp_flush_context flush;
/* cleaning state persistent over subsequent calls to
perform_cleaning */
struct acp_state state;
#if 1 == OCF_ACP_DEBUG
/* debug only */
uint64_t checksum;
#endif
};
struct acp_core_line_info
{
ocf_cache_line_t cache_line;
ocf_core_id_t core_id;
uint64_t core_line;
};
#define ACP_LOCK_CHUNKS_RD() env_rwsem_down_read(&acp->chunks_lock)
#define ACP_UNLOCK_CHUNKS_RD() env_rwsem_up_read(&acp->chunks_lock)
#define ACP_LOCK_CHUNKS_WR() env_rwsem_down_write(&acp->chunks_lock)
#define ACP_UNLOCK_CHUNKS_WR() env_rwsem_up_write(&acp->chunks_lock)
static struct acp_context *_acp_get_ctx_from_cache(struct ocf_cache *cache)
{
return cache->cleaning_policy_context;
}
static struct acp_cleaning_policy_meta* _acp_meta_get(
struct ocf_cache *cache, uint32_t cache_line,
struct cleaning_policy_meta *policy_meta)
{
ocf_metadata_get_cleaning_policy(cache, cache_line, policy_meta);
return &policy_meta->meta.acp;
}
static void _acp_meta_set(struct ocf_cache *cache, uint32_t cache_line,
struct cleaning_policy_meta *policy_meta)
{
ocf_metadata_set_cleaning_policy(cache, cache_line, policy_meta);
}
static struct acp_core_line_info _acp_core_line_info(struct ocf_cache *cache,
ocf_cache_line_t cache_line)
{
struct acp_core_line_info acp_core_line_info = {.cache_line = cache_line, };
ocf_metadata_get_core_info(cache, cache_line, &acp_core_line_info.core_id,
&acp_core_line_info.core_line);
return acp_core_line_info;
}
static struct acp_chunk_info *_acp_get_chunk(struct ocf_cache *cache,
uint32_t cache_line)
{
struct acp_context *acp = _acp_get_ctx_from_cache(cache);
struct acp_core_line_info core_line =
_acp_core_line_info(cache, cache_line);
uint64_t chunk_id;
chunk_id = core_line.core_line * ocf_line_size(cache) / ACP_CHUNK_SIZE;
return &acp->chunk_info[core_line.core_id][chunk_id];
}
static void _acp_remove_cores(struct ocf_cache *cache)
{
int i;
for_each_core(cache, i)
cleaning_policy_acp_remove_core(cache, i);
}
static int _acp_load_cores(struct ocf_cache *cache)
{
int i;
int err = 0;
for_each_core(cache, i) {
OCF_DEBUG_PARAM(cache, "loading core %i\n", i);
err = cleaning_policy_acp_add_core(cache, i);
if (err)
break;
}
if (err)
_acp_remove_cores(cache);
return err;
}
void cleaning_policy_acp_init_cache_block(struct ocf_cache *cache,
uint32_t cache_line)
{
struct cleaning_policy_meta policy_meta;
struct acp_cleaning_policy_meta *acp_meta;
/* TODO: acp meta is going to be removed soon */
acp_meta = _acp_meta_get(cache, cache_line, &policy_meta);
acp_meta->dirty = 0;
_acp_meta_set(cache, cache_line, &policy_meta);
}
void cleaning_policy_acp_deinitialize(struct ocf_cache *cache)
{
_acp_remove_cores(cache);
env_vfree(cache->cleaning_policy_context);
cache->cleaning_policy_context = NULL;
}
static void _acp_rebuild(struct ocf_cache *cache)
{
ocf_cache_line_t cline;
ocf_core_id_t cline_core_id;
uint32_t step = 0;
for (cline = 0; cline < cache->device->collision_table_entries; cline++) {
ocf_metadata_get_core_and_part_id(cache, cline, &cline_core_id,
NULL);
OCF_COND_RESCHED_DEFAULT(step);
if (cline_core_id == OCF_CORE_MAX)
continue;
cleaning_policy_acp_init_cache_block(cache, cline);
if (!metadata_test_dirty(cache, cline))
continue;
cleaning_policy_acp_set_hot_cache_line(cache, cline);
}
ocf_cache_log(cache, log_info, "Finished rebuilding ACP metadata\n");
}
void cleaning_policy_acp_setup(struct ocf_cache *cache)
{
struct acp_cleaning_policy_config *config;
config = (void *)&cache->conf_meta->cleaning[ocf_cleaning_acp].data;
config->thread_wakeup_time = OCF_ACP_DEFAULT_WAKE_UP;
config->flush_max_buffers = OCF_ACP_DEFAULT_FLUSH_MAX_BUFFERS;
}
int cleaning_policy_acp_initialize(struct ocf_cache *cache,
int init_metadata)
{
struct acp_context *acp;
int err, i;
/* bug if max chunk number would overflow dirty_no array type */
#if defined (BUILD_BUG_ON)
BUILD_BUG_ON(ACP_CHUNK_SIZE / ocf_cache_line_size_min >=
1U << (sizeof(acp->chunk_info[0][0].num_dirty) * 8));
#else
ENV_BUG_ON(ACP_CHUNK_SIZE / ocf_cache_line_size_min >=
1U << (sizeof(acp->chunk_info[0][0].num_dirty) * 8));
#endif
ENV_BUG_ON(cache->cleaning_policy_context);
cache->cleaning_policy_context = env_vzalloc(sizeof(struct acp_context));
if (!cache->cleaning_policy_context) {
ocf_cache_log(cache, log_err, "acp context allocation error\n");
return -OCF_ERR_NO_MEM;
}
acp = cache->cleaning_policy_context;
env_rwsem_init(&acp->chunks_lock);
for (i = 0; i < ACP_MAX_BUCKETS; i++) {
INIT_LIST_HEAD(&acp->bucket_info[i].chunk_list);
acp->bucket_info[i].threshold =
((ACP_CHUNK_SIZE/ocf_line_size(cache)) *
ACP_BUCKET_DEFAULTS[i]) / 100;
}
if (cache->conf_meta->core_count > 0) {
err = _acp_load_cores(cache);
if (err) {
cleaning_policy_acp_deinitialize(cache);
return err;
}
}
_acp_rebuild(cache);
return 0;
}
int cleaning_policy_acp_set_cleaning_param(ocf_cache_t cache,
uint32_t param_id, uint32_t param_value)
{
struct acp_cleaning_policy_config *config;
config = (void *)&cache->conf_meta->cleaning[ocf_cleaning_acp].data;
switch (param_id) {
case ocf_acp_wake_up_time:
OCF_CLEANING_CHECK_PARAM(cache, param_value,
OCF_ACP_MIN_WAKE_UP,
OCF_ACP_MAX_WAKE_UP,
"thread_wakeup_time");
config->thread_wakeup_time = param_value;
ocf_cache_log(cache, log_info, "Write-back flush thread "
"wake-up time: %d\n", config->thread_wakeup_time);
break;
case ocf_acp_flush_max_buffers:
OCF_CLEANING_CHECK_PARAM(cache, param_value,
OCF_ACP_MIN_FLUSH_MAX_BUFFERS,
OCF_ACP_MAX_FLUSH_MAX_BUFFERS,
"flush_max_buffers");
config->flush_max_buffers = param_value;
ocf_cache_log(cache, log_info, "Write-back flush thread max "
"buffers flushed per iteration: %d\n",
config->flush_max_buffers);
break;
default:
return -OCF_ERR_INVAL;
}
return 0;
}
int cleaning_policy_acp_get_cleaning_param(ocf_cache_t cache,
uint32_t param_id, uint32_t *param_value)
{
struct acp_cleaning_policy_config *config;
config = (void *)&cache->conf_meta->cleaning[ocf_cleaning_acp].data;
switch (param_id) {
case ocf_acp_flush_max_buffers:
*param_value = config->flush_max_buffers;
break;
case ocf_acp_wake_up_time:
*param_value = config->thread_wakeup_time;
break;
default:
return -OCF_ERR_INVAL;
}
return 0;
}
/* attempt to lock cache line if it's dirty */
static ocf_cache_line_t _acp_trylock_dirty(struct ocf_cache *cache,
uint32_t core_id, uint64_t core_line)
{
struct ocf_map_info info;
bool locked = false;
OCF_METADATA_LOCK_RD();
ocf_engine_lookup_map_entry(cache, &info, core_id,
core_line);
if (info.status == LOOKUP_HIT &&
metadata_test_dirty(cache, info.coll_idx) &&
ocf_cache_line_try_lock_rd(cache, info.coll_idx)) {
locked = true;
}
OCF_METADATA_UNLOCK_RD();
return locked ? info.coll_idx : cache->device->collision_table_entries;
}
static void _acp_handle_flush_error(struct ocf_cache *cache,
struct acp_context *acp)
{
struct acp_flush_context *flush = &acp->flush;
flush->chunk->next_cleaning_timestamp = env_get_tick_count() +
env_secs_to_ticks(ACP_CHUNK_CLEANING_BACKOFF_TIME);
if (ocf_cache_log_rl(cache)) {
ocf_core_log(&cache->core[flush->chunk->core_id],
log_err, "Cleaning error (%d) in range"
" <%llu; %llu) backing off for %u seconds\n",
flush->error,
flush->chunk->chunk_id * ACP_CHUNK_SIZE,
(flush->chunk->chunk_id * ACP_CHUNK_SIZE) +
ACP_CHUNK_SIZE,
ACP_CHUNK_CLEANING_BACKOFF_TIME);
}
}
/* called after flush request completed */
static void _acp_flush_end(
struct ocf_cache *cache,
struct acp_context *acp)
{
struct acp_flush_context *flush = &acp->flush;
int i;
for (i = 0; i < flush->size; i++) {
ocf_cache_line_unlock_rd(cache, flush->data[i].cache_line);
ACP_DEBUG_END(acp, flush->data[i].cache_line);
}
if (flush->error)
_acp_handle_flush_error(cache, acp);
}
/* flush data */
static void _acp_flush(struct ocf_cache *cache, struct acp_context *acp,
uint32_t io_queue, struct acp_flush_context *flush)
{
struct ocf_cleaner_attribs attribs = {
.cache_line_lock = false,
.metadata_locked = false,
.do_sort = false,
.io_queue = io_queue,
};
flush->error = ocf_cleaner_do_flush_data(cache, flush->data,
flush->size, &attribs);
_acp_flush_end(cache, acp);
}
static inline bool _acp_can_clean_chunk(struct ocf_cache *cache,
struct acp_chunk_info *chunk)
{
/* Check if core device is opened and if timeout after cleaning error
* expired or wasn't set in the first place */
return (cache->core[chunk->core_id].opened &&
(chunk->next_cleaning_timestamp > env_get_tick_count() ||
!chunk->next_cleaning_timestamp));
}
static struct acp_chunk_info *_acp_get_cleaning_candidate(
struct ocf_cache *cache)
{
int i;
struct acp_chunk_info *cur;
struct acp_context *acp = cache->cleaning_policy_context;
ACP_LOCK_CHUNKS_RD();
/* go through all buckets in descending order, excluding bucket 0 which
* is supposed to contain all clean chunks */
for (i = ACP_MAX_BUCKETS - 1; i > 0; i--) {
list_for_each_entry(cur, &acp->bucket_info[i].chunk_list, list) {
if (_acp_can_clean_chunk(cache, cur)) {
ACP_UNLOCK_CHUNKS_RD();
return cur;
}
}
}
ACP_UNLOCK_CHUNKS_RD();
return NULL;
}
#define CHUNK_FINISHED -1
/* clean at most 'flush_max_buffers' cache lines from given chunk, starting
* at given cache line */
static int _acp_clean(struct ocf_cache *cache, uint32_t io_queue,
struct acp_chunk_info *chunk, unsigned start,
uint32_t flush_max_buffers)
{
struct acp_context *acp = _acp_get_ctx_from_cache(cache);
size_t lines_per_chunk = ACP_CHUNK_SIZE /
ocf_line_size(cache);
uint64_t first_core_line = chunk->chunk_id * lines_per_chunk;
unsigned i;
OCF_DEBUG_PARAM(cache, "lines per chunk %llu chunk %llu "
"first_core_line %llu\n",
(uint64_t)lines_per_chunk,
chunk->chunk_id,
first_core_line);
ACP_DEBUG_INIT(acp);
acp->flush.size = 0;
acp->flush.chunk = chunk;
for (i = start; i < lines_per_chunk && acp->flush.size < flush_max_buffers ; i++) {
uint64_t core_line = first_core_line + i;
ocf_cache_line_t cache_line;
cache_line = _acp_trylock_dirty(cache, chunk->core_id, core_line);
if (cache_line == cache->device->collision_table_entries)
continue;
acp->flush.data[acp->flush.size].core_id = chunk->core_id;
acp->flush.data[acp->flush.size].core_line = core_line;
acp->flush.data[acp->flush.size].cache_line = cache_line;
acp->flush.size++;
ACP_DEBUG_BEGIN(acp, cache_line);
}
if (acp->flush.size > 0) {
_acp_flush(cache, acp, io_queue, &acp->flush);
}
ACP_DEBUG_CHECK(acp);
return (i == lines_per_chunk) ? CHUNK_FINISHED : i;
}
#define NOTHING_TO_CLEAN 0
#define MORE_TO_CLEAN 1
/* Clean at most 'flush_max_buffers' cache lines from current or newly
* selected chunk */
static int _acp_clean_iteration(struct ocf_cache *cache, uint32_t io_queue,
uint32_t flush_max_buffers)
{
struct acp_context *acp = _acp_get_ctx_from_cache(cache);
struct acp_state *state = &acp->state;
if (!state->in_progress) {
/* get next chunk to clean */
state->chunk = _acp_get_cleaning_candidate(cache);
if (!state->chunk) {
/* nothing co clean */
return NOTHING_TO_CLEAN;
}
/* new cleaning cycle - reset state */
state->iter = 0;
state->in_progress = true;
}
state->iter = _acp_clean(cache, io_queue, state->chunk, state->iter,
flush_max_buffers);
if (state->iter == CHUNK_FINISHED) {
/* reached end of chunk - reset state */
state->in_progress = false;
}
return MORE_TO_CLEAN;
}
int cleaning_policy_acp_perform_cleaning(struct ocf_cache *cache,
uint32_t io_queue)
{
struct acp_cleaning_policy_config *config;
int ret;
config = (void *)&cache->conf_meta->cleaning[ocf_cleaning_acp].data;
if (NOTHING_TO_CLEAN == _acp_clean_iteration(cache, io_queue,
config->flush_max_buffers)) {
ret = ACP_BACKOFF_TIME_MS;
} else {
ret = config->thread_wakeup_time;
}
return ret;
}
static void _acp_update_bucket(struct acp_context *acp,
struct acp_chunk_info *chunk)
{
struct acp_bucket *bucket = &acp->bucket_info[chunk->bucket_id];
if (chunk->num_dirty > bucket->threshold) {
ENV_BUG_ON(chunk->bucket_id == ACP_MAX_BUCKETS - 1);
chunk->bucket_id++;
/* buckets are stored in array, move up one bucket.
* No overflow here. ENV_BUG_ON made sure of no incrementation on
* last bucket */
bucket++;
list_move_tail(&chunk->list, &bucket->chunk_list);
} else if (chunk->bucket_id &&
chunk->num_dirty <= (bucket - 1)->threshold) {
chunk->bucket_id--;
/* move down one bucket, we made sure we won't underflow */
bucket--;
list_move(&chunk->list, &bucket->chunk_list);
}
}
void cleaning_policy_acp_set_hot_cache_line(struct ocf_cache *cache,
uint32_t cache_line)
{
struct acp_context *acp = _acp_get_ctx_from_cache(cache);
struct cleaning_policy_meta policy_meta;
struct acp_cleaning_policy_meta *acp_meta;
struct acp_chunk_info *chunk;
ACP_LOCK_CHUNKS_WR();
acp_meta = _acp_meta_get(cache, cache_line, &policy_meta);
chunk = _acp_get_chunk(cache, cache_line);
if (!acp_meta->dirty) {
acp_meta->dirty = 1;
_acp_meta_set(cache, cache_line, &policy_meta);
chunk->num_dirty++;
}
_acp_update_bucket(acp, chunk);
ACP_UNLOCK_CHUNKS_WR();
}
void cleaning_policy_acp_purge_block(struct ocf_cache *cache,
uint32_t cache_line)
{
struct acp_context *acp = _acp_get_ctx_from_cache(cache);
struct cleaning_policy_meta policy_meta;
struct acp_cleaning_policy_meta *acp_meta;
struct acp_chunk_info *chunk;
acp_meta = _acp_meta_get(cache, cache_line, &policy_meta);
chunk = _acp_get_chunk(cache, cache_line);
if (acp_meta->dirty) {
acp_meta->dirty = 0;
_acp_meta_set(cache, cache_line, &policy_meta);
chunk->num_dirty--;
}
_acp_update_bucket(acp, chunk);
}
int cleaning_policy_acp_purge_range(struct ocf_cache *cache,
int core_id, uint64_t start_byte, uint64_t end_byte)
{
return ocf_metadata_actor(cache, PARTITION_INVALID,
core_id, start_byte, end_byte,
cleaning_policy_acp_purge_block);
}
void cleaning_policy_acp_remove_core(ocf_cache_t cache,
ocf_core_id_t core_id)
{
struct acp_context *acp = _acp_get_ctx_from_cache(cache);
uint64_t i;
ENV_BUG_ON(acp->chunks_total < acp->num_chunks[core_id]);
if (acp->state.in_progress && acp->state.chunk->core_id == core_id) {
acp->state.in_progress = false;
acp->state.iter = 0;
acp->state.chunk = NULL;
}
ACP_LOCK_CHUNKS_WR();
for (i = 0; i < acp->num_chunks[core_id]; i++)
list_del(&acp->chunk_info[core_id][i].list);
acp->chunks_total -= acp->num_chunks[core_id];
acp->num_chunks[core_id] = 0;
env_vfree(acp->chunk_info[core_id]);
acp->chunk_info[core_id] = NULL;
ACP_UNLOCK_CHUNKS_WR();
}
int cleaning_policy_acp_add_core(ocf_cache_t cache,
ocf_core_id_t core_id)
{
uint64_t core_size = cache->core_conf_meta[core_id].length;
uint64_t num_chunks = OCF_DIV_ROUND_UP(core_size, ACP_CHUNK_SIZE);
struct acp_context *acp = _acp_get_ctx_from_cache(cache);
int i;
OCF_DEBUG_PARAM(cache, "%s core_id %llu num_chunks %llu\n",
__func__, (uint64_t)core_id, (uint64_t) num_chunks);
ACP_LOCK_CHUNKS_WR();
ENV_BUG_ON(acp->chunk_info[core_id]);
acp->chunk_info[core_id] =
env_vzalloc(num_chunks * sizeof(acp->chunk_info[0][0]));
if (!acp->chunk_info[core_id]) {
ACP_UNLOCK_CHUNKS_WR();
OCF_DEBUG_PARAM(cache, "failed to allocate acp tables\n");
return -ENOMEM;
}
OCF_DEBUG_PARAM(cache, "successfully allocated acp tables\n");
/* increment counters */
acp->num_chunks[core_id] = num_chunks;
acp->chunks_total += num_chunks;
for (i = 0; i < acp->num_chunks[core_id]; i++) {
/* fill in chunk metadata and add to the clean bucket */
acp->chunk_info[core_id][i].core_id = core_id;
acp->chunk_info[core_id][i].chunk_id = i;
list_add(&acp->chunk_info[core_id][i].list,
&acp->bucket_info[0].chunk_list);
}
ACP_UNLOCK_CHUNKS_WR();
return 0;
}