首页
社区
课程
招聘
[原创]cache模拟器
发表于: 2012-12-19 11:34 12381

[原创]cache模拟器

2012-12-19 11:34
12381
Cache模拟器
  程序运行时,都会对内存进行相关操作,所访问的内存地址可以被记录下来,形成memory trace文件。在本实验中,你将使用benchmark程序产生的memory trace文件来测试Cache命中率,文件可以在http://cseweb.ucsd.edu/classes/fa07/cse240a/proj1-traces.tar.gz上获得。
  每次存储器访问都包含了三个信息:
访问类型,’l’表示Load操作,’s’表示Store操作;
地址。采用32位无符号的十六进制表示;
存储器访问指令之间的间隔指令数。例如第5条指令和第10条指令为存储器访问指令,且中间没有其他存储器访问指令,则间隔指令数为4。
#include <stdlib.h>
#include <stdio.h>
#include <string.h>

typedef unsigned char _u8;
typedef unsigned int  _u32;

//#ifdef _DEBUG
#define dbg_log                 printf
//#endif

#define CACHE_FLAG_VALID        0x1
#define CACHE_FLAG_WRITE_BACK   0x2
#define CACHE_FLAG_MASK         0xf

const char* swap_style_description[] = {
        "FIFO替换",
        "LRU替换",
        "随机替换"
};

const char* write_style_description[] = {
        "写直达",
        "写回"
};

enum cache_swap_style{
        CACHE_SWAP_FIFO,
        CACHE_SWAP_LRU,
        CACHE_SWAP_RAND,
        CACHE_SWAP_MAX
};

enum cache_write_style{
        CACHE_WRITE_THROUGH,
        CACHE_WRITE_BACK,
        CACHE_WRITE_MAX
};

struct cache_item {
        _u32 tag;                       /* cache标记缓存- 最低4bit为标志位 */
        union {
                _u32 count;
                _u32 lru_count;         /* 读写计数 */
                _u32 fifo_count;        /* 先入先出 = tickcount */
        };
        _u8* buf;                       /* 指向实际数据 */
};

struct cache_sim {
	_u32 cache_size;                 /* cache缓存容量 */
	_u32 cache_line_size;            /* cache块大小 */
        _u32 cache_item_num;             /* cache总入口数 */
	_u32 cache_mapping_ways;         /* cache总组数 */
        _u32 cache_group_size;           /* cache组大小 */

        _u32 cache_group_shifts;
        _u32 cache_block_shifts;
        _u32 cache_tag_mask;

        struct cache_item* caches;

        _u32* addr_list;                /* 地址列表-以便统计强制缺失 */
        _u32 addr_list_size;
        _u32 addr_num;

        _u32 tick_count;                /* 总指令计数器 */
        _u8* cache_buf;                 /* cache缓存区 */
        int swap_style;
        int write_style;

        _u32 cache_r_count;             /* cache读主存块数 */
        _u32 cache_w_count;             /* cache写主存块数 */
        _u32 cache_hit_count;
        _u32 cache_miss_count;

        _u32 cache_free_num;            /* 空闲cache条目 */
        _u32 force_miss_count;          /* 强制缺失 */
        _u32 capacity_miss_count;       /* 容量缺失 */
        _u32 conflict_miss_count;       /* 冲突缺失 */
};

/* 返回插入位置 */
int get_addr_index(struct cache_sim* cache, void* addr)
{
        int lo = 0;
        int hi = cache->addr_num - 1;
        int mid = (lo + hi) / 2;

        if (cache->addr_num < 1)
                return -1;
        if ((_u32)addr <= cache->addr_list[lo])
                return lo;
        if ((_u32)addr >= cache->addr_list[hi])
                return hi;

        while (hi > lo + 1) {
                mid = (lo + hi) / 2;
                if ((_u32)addr > cache->addr_list[mid])
                        lo = mid;
                else if ((_u32)addr < cache->addr_list[mid])
                        hi = mid;
                else
                        return mid;
        }

        return mid;
}

int add_addr_list(struct cache_sim* cache, void* addr)
{
        int index;

        if (!cache->addr_list || cache->addr_num < 1
                || cache->addr_num >= cache->addr_list_size) {
                cache->addr_list_size += 0x400;
                cache->addr_list = realloc(cache->addr_list, cache->addr_list_size * sizeof(_u32));
        }

        if (cache->addr_num < 1) {
                cache->addr_list[0] = (_u32)addr;
                cache->addr_num = 1;
                return 0;
        }

        index = get_addr_index(cache, addr);

        if ((_u32)addr == cache->addr_list[index])
                return -1;
        else if ((_u32)addr > cache->addr_list[index])
                index += 1;

        memmove(cache->addr_list + index + 1, 
                cache->addr_list + index, 
                sizeof(_u32)*(cache->addr_num - index));

        cache->addr_list[index] = (_u32)addr;
        cache->addr_num++;

        return 0;
}

int get_power_num(int num)
{
        int ret = -1;
        while (num > 0){
                ret++;
                num = num >> 1;
        }
        return ret;
}

void reset_cache_sim(struct cache_sim* cache, int cache_line_size, int mapping_ways)
{
        if (!cache || cache_line_size < 16 || mapping_ways < 1)
                return;

        cache->cache_line_size = cache_line_size;
        cache->cache_item_num = cache->cache_size / cache_line_size;
        cache->cache_block_shifts = get_power_num(cache_line_size);
        cache->cache_mapping_ways = mapping_ways;
        cache->cache_group_shifts = get_power_num(mapping_ways);
        cache->cache_group_size = cache->cache_item_num / mapping_ways;
        cache->cache_tag_mask = 0xffffffff << (cache->cache_group_shifts + cache->cache_block_shifts);
        cache->cache_free_num = cache->cache_item_num;

        cache->addr_num = 0;
        cache->cache_hit_count = 0;
        cache->cache_miss_count = 0;
        cache->cache_r_count = 0;
        cache->cache_w_count = 0;
        cache->capacity_miss_count = 0;
        cache->conflict_miss_count = 0;
        cache->force_miss_count = 0;
        cache->tick_count = 0;

        if (!cache->cache_buf){
                cache->cache_buf = malloc(cache->cache_size);
                memset(cache->cache_buf, 0, cache->cache_size);
        }

        if (cache->caches){
                free(cache->caches);
                cache->caches = NULL;
        }
        
        /* 这里直接设置cache-tags为32bits-简化 */
        cache->caches = malloc(sizeof(struct cache_item) * cache->cache_item_num);
        memset(cache->caches, 0, sizeof(struct cache_item) * cache->cache_item_num);
}

static int chk_cache_hit(struct cache_sim* cache, _u32 group_base, void* addr)
{
        _u32 i, tag;
        for (i=0; i<cache->cache_group_size; i++) {
                tag = cache->caches[group_base + i].tag;
                if ((tag & CACHE_FLAG_VALID)
                        && (tag & cache->cache_tag_mask) == ((_u32)addr & cache->cache_tag_mask)){
                        return group_base + i;
                }
        }

        return -1;
}

static int get_cache_free_item(struct cache_sim* cache,  _u32 group_base, void* addr)
{
        _u32 i, tag;
        _u32 min_count, free_index;
        for (i=0; i<cache->cache_group_size; i++) {
                tag = cache->caches[group_base + i].tag;
                if (!(tag & CACHE_FLAG_VALID)){
                        if (cache->cache_free_num > 0)
                                cache->cache_free_num--;
                        return group_base + i;
                }
        }

        /* 执行缓存切换算法 */
        free_index = 0;
        if (CACHE_SWAP_RAND == cache->swap_style){
                free_index = rand() % cache->cache_group_size;
        } else {
                min_count = cache->caches[group_base].count;
                for (i=0; i<cache->cache_group_size; i++) {
                        if (cache->caches[group_base + i].count < min_count){
                                min_count = cache->caches[group_base + i].count;
                                free_index = i;
                        }
                }
        }

        free_index += group_base;

        /* 检查cache回写标志 */
        if (cache->caches[free_index].tag & CACHE_FLAG_WRITE_BACK){
                cache->caches[free_index].tag &= ~CACHE_FLAG_WRITE_BACK;
                /*
                dbg_log("cache write back to block %p\n",
                        cache->caches[free_index].tag & (~(cache->cache_line_size - 1))
                        );
                 */
                cache->cache_w_count++;
        }

        /*
        dbg_log("cache swaped %d %p->%p\n",
                free_index,
                (_u32)addr & (~(cache->cache_line_size - 1)),
                cache->caches[free_index].tag & (~(cache->cache_line_size - 1))
                );
         */
        return free_index;
}

static void set_cache_item(struct cache_sim* cache, _u32 index, void* addr)
{
        struct cache_item* item = cache->caches + index;

        item->buf = cache->cache_buf + cache->cache_line_size * index;
        item->tag = (_u32)addr & ~CACHE_FLAG_MASK;
        item->tag |= CACHE_FLAG_VALID;
        item->count = cache->tick_count;
}

static int do_cache_op(struct cache_sim* cache, void* addr, int is_read)
{
        _u32 group;
        _u32 group_base;
        int index;
        
        group = ((_u32)addr >> cache->cache_block_shifts) % cache->cache_mapping_ways;
        group_base = group * cache->cache_group_size;
        
        index = chk_cache_hit(cache, group_base, addr);
        if (index >= 0){
                cache->cache_hit_count++;
                /* LRU更新时间戳 */
                if (CACHE_SWAP_LRU == cache->swap_style)
                        cache->caches[index].lru_count = cache->tick_count;
                if (!is_read && cache->write_style == CACHE_WRITE_THROUGH)
                        cache->cache_w_count++;
                if (!is_read && cache->write_style == CACHE_WRITE_BACK)
                        cache->caches[index].tag |= CACHE_FLAG_WRITE_BACK;
        } else {
                index = get_cache_free_item(cache, group_base, addr);
                /* 
                 * 统计缺失原因:强制缺失-第一次访问某块
                 */
                if (add_addr_list(cache, (void*)addr) == 0)
                        cache->force_miss_count++;
                else if (cache->cache_free_num > 0)
                        cache->conflict_miss_count++;
                else
                        cache->capacity_miss_count++;

                set_cache_item(cache, index, addr);
                /* 从主存读取到缓存 */
                if (is_read){
                        /*
                        dbg_log("read memory block %p -> cache:%d\n",
                                (_u32)addr & (~(cache->cache_line_size - 1)), index);
                         */
                        cache->cache_r_count++;
                } else {
                        /*
                        dbg_log("write memory block %p -> cache:%d\n",
                                (_u32)addr & (~(cache->cache_line_size - 1)), index);
                         */
                        cache->cache_w_count++;
                }
                
                cache->cache_miss_count++;
        }

	return 0;
}

struct cache_sim* init_cache_sim(int cache_size)
{
        struct cache_sim* cache_obj = (struct cache_sim*)malloc(sizeof(*cache_obj));
        
        memset(cache_obj, 0, sizeof(struct cache_sim));

        cache_obj->cache_size = cache_size;
        reset_cache_sim(cache_obj, 32, 2);
        
        return cache_obj;
}

void free_cache_sim(struct cache_sim* cache)
{
        if (cache) {
                if (cache->cache_buf)
                        free(cache->cache_buf);
                if (cache->caches)
                        free(cache->caches);
                free(cache);
        }
}

void load_trace(struct cache_sim* cache, char* filename)
{
        char buf[128];
        FILE* fp = fopen(filename, "r");
        _u32 rcount = 0, wcount = 0;

        if (!fp){
                dbg_log("load_trace %s failed...\n", filename);
                return;
        }

        while (fgets(buf, sizeof(buf), fp)){
                _u8 style = 0;
                _u32 addr = 0, instruct_deltha = 0;
                //printf("%d %s", cache->addr_num, buf);
                sscanf(buf, "%c %x %d", &style, &addr, &instruct_deltha);
                //add_addr_list(cache, (void*)addr);
                if (style == 'l'){
                        do_cache_op(cache, (void*)addr, 1);
                        rcount++;
                } else {
                        do_cache_op(cache, (void*)addr, 0);
                        wcount++;
                }

                cache->tick_count += instruct_deltha + 1;
        }

        dbg_log("%s\t%s/%s\t行大小:%d\t%d路相联\n", 
                filename, 
                swap_style_description[cache->swap_style],
                write_style_description[cache->write_style],
                cache->cache_line_size,
                cache->cache_mapping_ways
                );

        dbg_log("指令统计 读/写/合计:%d/%d/%d\n读指令比例:%f%%\t写指令比例:%f%%\n",
                rcount, wcount, cache->tick_count,
                100.0*rcount/cache->tick_count,
                100.0*wcount/cache->tick_count
                );

        dbg_log("miss/hit:%d/%d\t命中率:%f%%/%f%%\n",
                cache->cache_miss_count, 
                cache->cache_hit_count,
                100.0*cache->cache_hit_count/(cache->cache_miss_count + cache->cache_hit_count),
                100.0*cache->cache_miss_count/(cache->cache_miss_count + cache->cache_hit_count)
                );

        dbg_log("强制缺失:%d/%d/%f%%\n容量缺失:%d/%d/%f%%\n冲突缺失:%d/%d/%f%%\n",
                cache->force_miss_count, cache->cache_miss_count, 
                100.0*cache->force_miss_count/cache->cache_miss_count,
                cache->capacity_miss_count, cache->cache_miss_count, 
                100.0*cache->capacity_miss_count/cache->cache_miss_count,
                cache->conflict_miss_count, cache->cache_miss_count, 
                100.0*cache->conflict_miss_count/cache->cache_miss_count
                );

        dbg_log("读通信:%d bytes\t%dKB\n写通信:%d bytes\t%dKB\n\n", 
                cache->cache_r_count*cache->cache_line_size, 
                (cache->cache_r_count*cache->cache_line_size)>>10,
                cache->cache_w_count*cache->cache_line_size, 
                (cache->cache_w_count*cache->cache_line_size)>>10
                );

        fclose(fp);
}

static do_test(struct cache_sim* cache, char* filename)
{
        int line_size[] = {32, 64, 128};
        int ways[] = {1, 2, 4, 8};
        int i,j;
        
        for (i=0; i<sizeof(line_size)/sizeof(int); i++){
                for (j=0; j<sizeof(ways)/sizeof(int); j++){
                        reset_cache_sim(cache, line_size[i], ways[j]);
                        load_trace(cache, filename);
                }
        }

}

int main(int argc, char** argv)
{
        struct cache_sim* cache_obj;
        char* test_cases[] = {"gcc.trace","gzip.trace","mcf.trace","swim.trace","twolf.trace"};
        int i, j, k;

        cache_obj = init_cache_sim(0x8000);
        
        for (k=0; k<sizeof(test_cases)/sizeof(char*); k++){
                for(i=CACHE_SWAP_FIFO; i<CACHE_SWAP_MAX; i++){
                        for (j=CACHE_WRITE_THROUGH; j<CACHE_WRITE_MAX; j++) {
                                cache_obj->swap_style = i;
                                cache_obj->write_style = j;
                                do_test(cache_obj, test_cases[k]);
                                
                        }
                }
        }
        free_cache_sim(cache_obj);

        return 0;
}

老师让我过吧

[培训]《安卓高级研修班(网课)》月薪三万计划,掌握调试、分析还原ollvm、vmp的方法,定制art虚拟机自动化脱壳的方法

收藏
免费 6
支持
分享
最新回复 (4)
雪    币: 14
活跃值: (25)
能力值: ( LV3,RANK:20 )
在线值:
发帖
回帖
粉丝
2
杀个花. 这样的导师是想把每个少年都培养成科学家呀~ 可惜和谐社会貌似比较现实~
2012-12-20 22:08
0
雪    币: 1358
活跃值: (17)
能力值: ( LV2,RANK:10 )
在线值:
发帖
回帖
粉丝
3
不错,学习了!
2012-12-22 15:29
0
雪    币: 1233
活跃值: (907)
能力值: ( LV12,RANK:750 )
在线值:
发帖
回帖
粉丝
4
晕!你是校友嘛?你不要照抄我的代码啊,不然大家都不过呢
2012-12-22 17:51
0
雪    币: 1358
活跃值: (17)
能力值: ( LV2,RANK:10 )
在线值:
发帖
回帖
粉丝
5
我早过了要交作业的年代了!
2012-12-23 12:54
0
游客
登录 | 注册 方可回帖
返回
//