nudt csapp 2025 finished

weblab finished
threadlab finished
2025-06-18 10:30:41 +08:00 · 2025-06-08 21:34:30 +08:00 · 2025-06-08 11:25:52 +08:00 · 2025-06-08 00:58:01 +08:00 · 2025-06-04 17:06:19 +08:00 · 2025-06-04 00:49:13 +08:00
223 changed files with 1271623 additions and 225 deletions
--- a/Y86_as/as86.py
+++ b/Y86_as/as86.py
@@ -0,0 +1,252 @@
+import sys
+import re
+import struct
+
+# Y86-64 Constants
+# Register mapping from name to number
+REG = {
+    '%rax': 0x0, '%rcx': 0x1, '%rdx': 0x2, '%rbx': 0x3,
+    '%rsp': 0x4, '%rbp': 0x5, '%rsi': 0x6, '%rdi': 0x7,
+    '%r8':  0x8, '%r9':  0x9, '%r10': 0xa, '%r11': 0xb,
+    '%r12': 0xc, '%r13': 0xd, '%r14': 0xe, 'F': 0xF
+}
+
+# Instruction mapping from mnemonic to (icode, ifun)
+# icode is the instruction code, ifun is the function code
+INS = {
+    'halt':   (0x0, 0x0), 'nop':    (0x1, 0x0), 'rrmovq': (0x2, 0x0),
+    'cmovle': (0x2, 0x1), 'cmovl':  (0x2, 0x2), 'cmove':  (0x2, 0x3),
+    'cmovne': (0x2, 0x4), 'cmovge': (0x2, 0x5), 'cmovg':  (0x2, 0x6),
+    'irmovq': (0x3, 0x0), 'rmmovq': (0x4, 0x0), 'mrmovq': (0x5, 0x0),
+    'addq':   (0x6, 0x0), 'subq':   (0x6, 0x1), 'andq':   (0x6, 0x2),
+    'xorq':   (0x6, 0x3), 'jmp':    (0x7, 0x0), 'jle':    (0x7, 0x1),
+    'jl':     (0x7, 0x2), 'je':     (0x7, 0x3), 'jne':    (0x7, 0x4),
+    'jge':    (0x7, 0x5), 'jg':     (0x7, 0x6), 'call':   (0x8, 0x0),
+    'ret':    (0x9, 0x0), 'pushq':  (0xA, 0x0), 'popq':   (0xB, 0x0)
+}
+
+class Y86Assembler:
+    """
+    A two-pass assembler for the Y86-64 instruction set.
+    """
+    def __init__(self):
+        self.symbol_table = {}
+        self.pc = 0
+        self.byte_code = {} # Maps address to (size, hex_string, original_line)
+
+    def assemble(self, filepath):
+        """
+        Assembles a Y86-64 source file.
+        
+        Args:
+            filepath (str): The path to the input .txt or .ys file.
+
+        Returns:
+            str: The formatted machine code output.
+        """
+        try:
+            with open(filepath, 'r') as f:
+                lines = f.readlines()
+        except FileNotFoundError:
+            return f"Error: File not found at '{filepath}'"
+
+        print("🚀 Starting assembly process...")
+        self._first_pass(lines)
+        print("✅ First pass complete. Symbol table built.")
+        self._second_pass(lines)
+        print("✅ Second pass complete. Machine code generated.")
+        return self._format_output()
+
+    def _parse_line(self, line):
+        """Strips comments and splits a line into label, instruction, and operands."""
+        line = line.split('#')[0].split('|')[0].strip()
+        if not line:
+            return None, None, []
+
+        label, instruction, operands_str = None, None, ''
+        if ':' in line:
+            label, rest = line.split(':', 1)
+            line = rest.strip()
+        
+        parts = line.split(maxsplit=1)
+        if parts:
+            instruction = parts[0]
+            if len(parts) > 1:
+                operands_str = parts[1]
+        
+        # Split operands by comma, but not inside parentheses
+        operands = re.split(r',\s*(?![^()]*\))', operands_str) if operands_str else []
+        
+        return label, instruction, [op.strip() for op in operands]
+
+    def _get_instruction_size(self, instruction, operands):
+        """Calculates the size of an instruction in bytes."""
+        if not instruction: return 0
+        
+        if instruction in ['.quad']: return 8
+        if instruction in ['.pos', '.align']: return 0
+
+        # ********** MODIFICATION START **********
+        # Handle custom `addq $val, rB` which has size 10
+        if instruction == 'addq' and operands and operands[0].startswith('$'):
+            return 10  # 1 (icode) + 1 (reg) + 8 (val)
+        # ********** MODIFICATION END **********
+            
+        icode = INS[instruction][0]
+        if icode in [0x0, 0x1, 0x9]: return 1
+        if icode in [0x2, 0x6, 0xA, 0xB]: return 2
+        if icode in [0x7, 0x8]: return 9
+        if icode in [0x3, 0x4, 0x5]: return 10
+        return 0
+
+    def _first_pass(self, lines):
+        """
+        Builds the symbol table by mapping labels to addresses.
+        """
+        self.pc = 0
+        for line_num, line in enumerate(lines, 1):
+            label, instruction, operands = self._parse_line(line)
+
+            if label:
+                if label in self.symbol_table:
+                    print(f"Warning: Duplicate label '{label}' on line {line_num}. Using first definition.")
+                else:
+                    self.symbol_table[label] = self.pc
+
+            if not instruction: continue
+
+            if instruction == '.pos':
+                self.pc = int(operands[0], 0)
+            elif instruction == '.align':
+                align_val = int(operands[0])
+                self.pc = (self.pc + align_val - 1) & -align_val
+            else:
+                self.pc += self._get_instruction_size(instruction, operands)
+
+    def _second_pass(self, lines):
+        self.pc = 0
+        for line_num, line in enumerate(lines, 1):
+            original_line = line.strip()
+            label, instruction, operands = self._parse_line(line)
+            
+            if instruction == '.pos':
+                self.pc = int(operands[0], 0)
+                continue
+            elif instruction == '.align':
+                new_pc = (self.pc + int(operands[0]) - 1) & -int(operands[0])
+                if new_pc != self.pc: self.byte_code[self.pc] = (0, '', original_line)
+                self.pc = new_pc
+                continue
+
+            if not instruction:
+                if label: self.byte_code[self.pc] = (0, '', original_line)
+                continue
+
+            start_pc = self.pc
+            size = self._get_instruction_size(instruction, operands)
+            code = bytearray()
+
+            if instruction == '.quad':
+                val = self._parse_value(operands[0])
+                code.extend(struct.pack('<Q', val))
+            else:
+                # ********** MODIFICATION START **********
+                # Handle our custom `addq $imm, rB` instruction
+                if instruction == 'addq' and operands[0].startswith('$'):
+                    icode, ifun = 0xC, 0x0  # Use unused icode 0xC for our custom instruction
+                    code.append((icode << 4) | ifun)
+                    
+                    rB = REG[operands[1]]
+                    rA = REG['F'] # No source register, so rA is F
+                    code.append((rA << 4) | rB)
+                    
+                    val = self._parse_value(operands[0])
+                    code.extend(struct.pack('<q', val))
+                # ********** MODIFICATION END **********
+                else:
+                    # Original logic for all other instructions
+                    icode, ifun = INS[instruction]
+                    b0 = (icode << 4) | ifun
+                    code.append(b0)
+                    
+                    if instruction in ['rrmovq', 'cmovle', 'cmovl', 'cmove', 'cmovne', 'cmovge', 'cmovg', 'addq', 'subq', 'andq', 'xorq']:
+                        rA = REG[operands[0]]
+                        rB = REG[operands[1]]
+                        code.append((rA << 4) | rB)
+                    elif instruction in ['pushq', 'popq']:
+                        rA = REG[operands[0]]
+                        code.append((rA << 4) | 0xF)
+                    elif instruction in ['irmovq', 'rmmovq', 'mrmovq']:
+                        if instruction == 'irmovq':
+                            rA, rB = REG['F'], REG[operands[1]]
+                            val = self._parse_value(operands[0])
+                        elif instruction == 'rmmovq':
+                            rA = REG[operands[0]]
+                            disp, rB_name = self._parse_mem(operands[1])
+                            rB, val = REG[rB_name], disp
+                        elif instruction == 'mrmovq':
+                            rA = REG[operands[1]]
+                            disp, rB_name = self._parse_mem(operands[0])
+                            rB, val = REG[rB_name], disp
+                        code.append((rA << 4) | rB)
+                        code.extend(struct.pack('<q', val))
+                    elif instruction in ['jmp', 'jle', 'jl', 'je', 'jne', 'jge', 'jg', 'call']:
+                        dest = self._parse_value(operands[0])
+                        code.extend(struct.pack('<Q', dest))
+
+            if code:
+                self.byte_code[start_pc] = (size, code.hex(), original_line)
+                self.pc += size
+
+    def _parse_value(self, s):
+        """Converts a string operand to an integer, resolving labels."""
+        s = s.strip()
+        if s.startswith('$'):
+            s = s[1:]
+        
+        if s in self.symbol_table:
+            return self.symbol_table[s]
+        try:
+            return int(s, 0) # Handles decimal and '0x' hex
+        except ValueError:
+            raise ValueError(f"Invalid immediate value or unresolved label: {s}")
+
+    def _parse_mem(self, s):
+        """Parses memory operands like 'D(%rB)' or '(%rB)'."""
+        match = re.match(r'(-?\d+)?\((\%r\w+)\)', s)
+        if not match:
+            raise ValueError(f"Invalid memory operand: {s}")
+        
+        disp_str, reg = match.groups()
+        disp = int(disp_str) if disp_str else 0
+        return disp, reg
+
+    def _format_output(self):
+        """Formats the final output string."""
+        output = []
+        # Sort addresses to print in order
+        sorted_addrs = sorted(self.byte_code.keys())
+        
+        for addr in sorted_addrs:
+            size, hex_code, line = self.byte_code[addr]
+            addr_hex = f"0x{addr:03x}:"
+            
+            # Handle lines that generate no code (labels, .align)
+            if size == 0:
+                output.append(f"{addr_hex: <10}| {line}")
+            else:
+                formatted_code = f"{hex_code:<20}"
+                output.append(f"{addr_hex: <10}{formatted_code}| {line}")
+
+        return '\n'.join(output)
+
+
+if __name__ == '__main__':
+    if len(sys.argv) != 2:
+        print("Usage: python Y86_64_assembler.py <source_file.txt>")
+        sys.exit(1)
+    
+    assembler = Y86Assembler()
+    result = assembler.assemble(sys.argv[1])
+    print("\n--- Assembled Code ---")
+    print(result)
--- a/Y86_as/input.txt
+++ b/Y86_as/input.txt
@@ -0,0 +1,40 @@
+# Execution begins at address 0
+.pos 0
+    irmovq stack, %rsp  # Set up stack pointer
+    call main           # Execute main program
+    halt                # Terminate program
+
+# Array of 4 elements
+.pos 0x18
+array:
+    .quad 0xd000d000d000d
+    .quad 0xc000c000c000c0
+    .quad 0xb000b000b000b
+    .quad 0xa000a000a000a
+
+main:
+    irmovq array, %rdi
+    irmovq $4, %rsi
+    call sum
+    ret
+
+# long sum(long *start, long count)
+# start in %rdi, count in %rsi
+sum:
+    irmovq $8,%r8
+    irmovq $1,%r9
+    xorq %rax,%rax
+    andq %rsi,%rsi
+    jmp test
+loop:
+    mrmovq (%rdi),%r10
+    addq %r10,%rax
+    addq %r8,%rdi      # start++
+    subq %r9,%rsi      # count--
+                       # Set CC
+test:
+    jne loop           # Stop when 0
+    ret                # Return
+
+.pos 0x200
+stack:
--- a/Y86_as/sample2024.txt
+++ b/Y86_as/sample2024.txt
@@ -0,0 +1,10 @@
+.pos 0x200
+sum:
+	mrmovq 8(%rdx), %rcx
+	mrmovq 8(%rax),%rsi
+	rmmovq %rsi,8(%rdx)
+	rmmovq %rcx, 8(%rax)
+	addq $8, %rdx
+	addq $120, %rax
+	subq %rdi, %rax
+	jne sum
--- a/Y86_as/屏幕截图_20250613_013251.png
+++ b/Y86_as/屏幕截图_20250613_013251.png
--- a/branchPrediction.c
+++ b/branchPrediction.c
@@ -0,0 +1,653 @@
+#include "common.h"
+
+// 饱和计数器：加1
+static inline UINT32 SatIncrement(UINT32 x, UINT32 max)
+{
+	if (x<max) return x + 1;
+	return x;
+}
+
+// 饱和计数器：减1
+static inline UINT32 SatDecrement(UINT32 x)
+{
+	if (x>0) return x - 1;
+	return x;
+}
+
+#define BITS_OF_PC 13	// 选择13位的PC作为索引
+
+#define STATE_MAX  3
+#define STATE_INIT 2
+
+UINT32 *State;			// 状态数组，用于保存分支指令的状态机，实际只使用最低2位
+UINT64 StateArraySize;
+
+void PREDICTOR_init(void)
+{
+	StateArraySize = (1 << BITS_OF_PC);    // 状态数组项数
+
+	State = (UINT32 *)malloc(StateArraySize * sizeof(UINT32));
+
+	// *********** 你需要在下面书写代码 ***********
+    // 将状态数组，全部初始化为STATE_INIT
+    for(UINT32 i = 0; i < StateArraySize; i++)
+    {
+        State[i] = 2;
+    }
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// 2位状态的分支预测器（预测部分）
+char GetPrediction(UINT64 PC)
+{
+	// *********** 你需要在下面书写代码 ***********
+	// 将PC的低13位，去索引状态数组State，得到对应的饱和状态
+	// 如果该状态的值超过一半，则预测跳转
+	// 如果该状态的值低于一半，则预测不跳转
+    UINT32 index = PC>>2 & 0x1fff;
+    if(State[index] == 0 || State[index] == 1) return NOT_TAKEN;
+    return TAKEN;
+	//return TAKEN;
+	//return NOT_TAKEN;
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// 2位状态的分支预测器（更新部分）
+void  UpdatePredictor(UINT64 PC, OpType opType, char resolveDir, char predDir, UINT64 branchTarget)
+{
+
+	// *********** 你需要在下面书写代码 ***********
+	// 根据分支指令实际执行结果，来更新对应的饱和计数器
+	// 如果结果为跳转，则对应的饱和计数器+1
+	// 如果结果为不跳转，则对应的饱和计数器-1
+    UINT32 index = PC>>2 & 0x1fff;
+    if(resolveDir == 'T')
+    {
+        State[index] = SatIncrement(State[index], 3);
+    }
+    else
+    {
+        State[index] = SatDecrement(State[index]);
+    }
+
+	// *********** 你需要在上面书写代码 ***********
+}
+
+void PREDICTOR_free(void)
+{
+	free(State);
+}
+
+
+#include "common.h"
+
+// 饱和计数器：加1
+static inline UINT32 SatIncrement(UINT32 x, UINT32 max)
+{
+	if (x<max) return x + 1;
+	return x;
+}
+
+// 饱和计数器：减1
+static inline UINT32 SatDecrement(UINT32 x)
+{
+	if (x>0) return x - 1;
+	return x;
+}
+
+#define BITS_OF_PC 13	// 选择13位的PC作为索引
+
+#define STATE_MAX  7
+#define STATE_INIT 3
+
+UINT32 *State;			// 状态数组，用于保存分支指令的状态机，实际只使用最低3位
+UINT64 StateArraySize;
+
+void PREDICTOR_init(void)
+{
+	StateArraySize = (1 << BITS_OF_PC);    // 状态数组项数
+
+	State = (UINT32 *)malloc(StateArraySize * sizeof(UINT32));
+
+	// *********** 你需要在下面书写代码 ***********
+    // 将状态数组，全部初始化为STATE_INIT
+    for(UINT64 i = 0; i <= StateArraySize; i++)
+    {
+        State[i] = STATE_INIT;
+    }
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// 2位状态的分支预测器（预测部分）
+char GetPrediction(UINT64 PC)
+{
+	// *********** 你需要在下面书写代码 ***********
+	// 将PC的低13位，去索引状态数组State，得到对应的饱和状态
+	// 如果该状态的值超过一半，则预测跳转
+	// 如果该状态的值低于一半，则预测不跳转
+    UINT64 index = (PC>>2) & 0x1fff;
+    if(State[index] == 0 || State[index] == 1 || State[index] == 2 || State[index] == 3) return NOT_TAKEN;
+    return TAKEN;
+	//return TAKEN;
+	//return NOT_TAKEN;
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// 2位状态的分支预测器（更新部分）
+void  UpdatePredictor(UINT64 PC, OpType opType, char resolveDir, char predDir, UINT64 branchTarget)
+{
+
+	// *********** 你需要在下面书写代码 ***********
+	// 根据分支指令实际执行结果，来更新对应的饱和计数器
+	// 如果结果为跳转，则对应的饱和计数器+1
+	// 如果结果为不跳转，则对应的饱和计数器-1
+    UINT64 index = (PC>>2) & 0x1fff;
+    if(resolveDir == 'T')
+    {
+        State[index] = SatIncrement(State[index], 7);
+    }
+    else
+    {
+        State[index] = SatDecrement(State[index]);
+    }
+
+	// *********** 你需要在上面书写代码 ***********
+}
+
+void PREDICTOR_free(void)
+{
+	free(State);
+}
+
+
+#include "common.h"
+
+// 饱和计数器：加1
+static inline UINT32 SatIncrement(UINT32 x, UINT32 max)
+{
+	if (x < max) return x + 1;
+	return x;
+}
+
+// 饱和计数器：减1
+static inline UINT32 SatDecrement(UINT32 x)
+{
+	if (x > 0) return x - 1;
+	return x;
+}
+
+#define BITS_OF_PC 10		// 选择10位的PC作为索引
+#define LOCAL_HIST_LEN   3	// 局部历史长度，3位
+#define LOCAL_HIST_MASK  ~(~0  << LOCAL_HIST_LEN)
+
+#define STATE_MAX  3
+#define STATE_INIT 2
+
+UINT32* pht;            // pattern history table    模式历史表
+UINT32 phtArraySize;	// pht数组项数
+UINT32* State;			// 状态数组，用于保存分支指令的状态机，实际只使用最低2位
+UINT64 StateArraySize;
+
+void PREDICTOR_init(void)
+{
+	StateArraySize = (1 << (BITS_OF_PC + LOCAL_HIST_LEN));    // 状态数组项数
+
+	State = (UINT32*)malloc(StateArraySize * sizeof(UINT32));
+
+	phtArraySize = (1 << BITS_OF_PC);	// pht数组项数
+
+	pht = (UINT32*)malloc(phtArraySize * sizeof(UINT32));
+
+	// *********** 你需要在下面书写代码 ***********
+	// 将状态数组，全部初始化为STATE_INIT
+	// 将模式历史表（pht）全部初始化为0
+    for(UINT64 i = 0; i < StateArraySize; i++)
+    {
+        State[i] = STATE_INIT;
+    }
+    for(UINT32 i = 0; i < phtArraySize; i++)
+    {
+        pht[i] = 0;
+    }
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// 2位状态的分支预测器（预测部分）
+char GetPrediction(UINT64 PC)
+{
+	// *********** 你需要在下面书写代码 ***********
+	// 将PC的低10位，去索引模式历史表pht，得到对应的3位历史信息
+    UINT32 index1 = (PC>>2) & 0x3ff;
+	// 将PC的低10位，与3位历史信息进行拼接，形成一个13位的状态数组索引（拼接需要使用C语言的移位、与、或等运算）
+    //UINT64 index2 = (index1<<3) | (pht[index1]);
+    //UINT64 index2 = (index1) | (pht[index1]<<10);
+    UINT64 index2 = (index1 & 0x3ff) | (pht[index1]<<10 & 0x1c00);
+	// 用13位去索引状态数组，得到对应的饱和状态
+    if(State[index2] == 0 || State[index2] == 1) return NOT_TAKEN;
+    return TAKEN;
+	// 如果该状态的值超过一半，则预测跳转
+	// 如果该状态的值低于一半，则预测不跳转
+	
+	//return TAKEN;
+	// return NOT_TAKEN;
+
+	// *********** 你需要在上面书写代码 ***********
+
+}
+
+// 2位状态的分支预测器（更新部分）
+void  UpdatePredictor(UINT64 PC, OpType opType, char resolveDir, char predDir, UINT64 branchTarget)
+{
+
+	// *********** 你需要在下面书写代码 ***********
+	// 根据分支指令实际执行结果，来更新对应的饱和计数器
+	// 如果结果为跳转，则对应的饱和计数器+1
+	// 如果结果为不跳转，则对应的饱和计数器-1
+    // 更新pht中的最近3次分支历史信息，使用移位寄存器来更新
+	// 将其更新到pht中
+    UINT32 index1 = (PC>>2) & 0x3ff;
+    //UINT64 index2 = (index1<<3) | (pht[index1]);
+    //UINT64 index2 = (index1) | (pht[index1]<<10);
+    UINT64 index2 = (index1 & 0x3ff) | (pht[index1]<<10 & 0x1c00);
+    if(resolveDir == 'T')
+    {
+        State[index2] = SatIncrement(State[index2], 3);
+        pht[index1] = (pht[index1]<<1) | 0x1;
+    }
+    else
+    {
+        State[index2] = SatDecrement(State[index2]);
+        pht[index1] = (pht[index1]<<1);
+    }
+
+
+	// *********** 你需要在上面书写代码 ***********
+}
+
+void PREDICTOR_free(void)
+{
+	free(State);
+	free(pht);
+}
+
+
+#include "common.h"
+
+// 饱和计数器：加1
+static inline UINT32 SatIncrement(UINT32 x, UINT32 max)
+{
+	if (x < max) return x + 1;
+	return x;
+}
+
+// 饱和计数器：减1
+static inline UINT32 SatDecrement(UINT32 x)
+{
+	if (x > 0) return x - 1;
+	return x;
+}
+
+#define BITS_OF_PC 9		// 选择9位的PC作为索引
+#define LOCAL_HIST_LEN   4	// 局部历史长度，4位
+#define LOCAL_HIST_MASK  ~(~0  << LOCAL_HIST_LEN)
+
+#define STATE_MAX  3
+#define STATE_INIT 2
+
+UINT32* pht;            // pattern history table    模式历史表
+UINT32 phtArraySize;	// pht数组项数
+UINT32* State;			// 状态数组，用于保存分支指令的状态机，实际只使用最低2位
+UINT64 StateArraySize;
+
+void PREDICTOR_init(void)
+{
+	StateArraySize = (1 << (BITS_OF_PC + LOCAL_HIST_LEN));    // 状态数组项数
+
+	State = (UINT32*)malloc(StateArraySize * sizeof(UINT32));
+
+	phtArraySize = (1 << BITS_OF_PC);	// pht数组项数
+
+	pht = (UINT32*)malloc(phtArraySize * sizeof(UINT32));
+
+	// *********** 你需要在下面书写代码 ***********
+	// 将状态数组，全部初始化为STATE_INIT
+	// 将模式历史表（pht）全部初始化为0
+    for(UINT64 i = 0; i < StateArraySize; i++)
+    {
+        State[i] = STATE_INIT;
+    }
+    for(UINT32 i = 0; i < phtArraySize; i++)
+    {
+        pht[i] = 0;
+    }
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// 2位状态的分支预测器（预测部分）
+char GetPrediction(UINT64 PC)
+{
+	// *********** 你需要在下面书写代码 ***********
+	// 将PC的低10位，去索引模式历史表pht，得到对应的3位历史信息
+	// 将PC的低10位，与3位历史信息进行拼接，形成一个13位的状态数组索引（拼接需要使用C语言的移位、与、或等运算）
+	// 用13位去索引状态数组，得到对应的饱和状态
+	// 如果该状态的值超过一半，则预测跳转
+	// 如果该状态的值低于一半，则预测不跳转
+    UINT32 index1 = (PC>>2) & 0x1ff;
+    UINT64 index2 = (index1 & 0x1ff) | (pht[index1]<<9 & 0x1e00);
+	if(State[index2] == 0 || State[index2] == 1) return NOT_TAKEN;
+    return TAKEN;
+	//return TAKEN;
+	// return NOT_TAKEN;
+
+	// *********** 你需要在上面书写代码 ***********
+
+}
+
+// 2位状态的分支预测器（更新部分）
+void  UpdatePredictor(UINT64 PC, OpType opType, char resolveDir, char predDir, UINT64 branchTarget)
+{
+
+	// *********** 你需要在下面书写代码 ***********
+	// 根据分支指令实际执行结果，来更新对应的饱和计数器
+	// 如果结果为跳转，则对应的饱和计数器+1
+	// 如果结果为不跳转，则对应的饱和计数器-1
+	// 更新pht中的最近3次分支历史信息，使用移位寄存器来更新
+	// 将其更新到pht中
+    UINT32 index1 = (PC>>2) & 0x1ff;
+    UINT64 index2 = (index1 & 0x1ff) | (pht[index1]<<9 & 0x1e00);
+    if(resolveDir == 'T')
+    {
+        State[index2] = SatIncrement(State[index2], 3);
+        pht[index1] = (pht[index1]<<1) | 0x1;
+    }
+    else
+    {
+        State[index2] = SatDecrement(State[index2]);
+        pht[index1] = (pht[index1]<<1);
+    }
+	// *********** 你需要在上面书写代码 ***********
+}
+
+void PREDICTOR_free(void)
+{
+	free(State);
+	free(pht);
+}
+
+
+#include "common.h"
+
+// 饱和计数器：加1
+static inline UINT32 SatIncrement(UINT32 x, UINT32 max)
+{
+	if (x < max) return x + 1;
+	return x;
+}
+
+// 饱和计数器：减1
+static inline UINT32 SatDecrement(UINT32 x)
+{
+	if (x > 0) return x - 1;
+	return x;
+}
+
+#define GLOBAL_HIST_LEN   13	// 全局历史长度，13位
+#define GLOBAL_HIST_MASK  ~(~0  << GLOBAL_HIST_LEN)
+
+#define STATE_MAX  3
+#define STATE_INIT 2
+
+UINT32 GHR;				// Global History Register，全局历史寄存器
+UINT32* State;			// 状态数组，用于保存分支指令的状态机，实际只使用最低2位
+UINT64 StateArraySize;
+
+void PREDICTOR_init(void)
+{
+	StateArraySize = (1 << GLOBAL_HIST_LEN);    // 状态数组项数
+
+	State = (UINT32*)malloc(StateArraySize * sizeof(UINT32));
+
+	// *********** 你需要在下面书写代码 ***********
+	// 将状态数组，全部初始化为STATE_INIT
+	// 将全局历史寄存器（GHR）初始化为0
+    for(UINT64 i = 0; i < StateArraySize; i++)
+    {
+        State[i] = STATE_INIT;
+    }
+    GHR = 0;
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// Gshare分支预测器（预测部分）
+char GetPrediction(UINT64 PC)
+{
+	// *********** 你需要在下面书写代码 ***********
+	// 用13位的GHR去索引状态数组，得到对应的饱和状态
+	// 如果该状态的值超过一半，则预测跳转
+	// 如果该状态的值低于一半，则预测不跳转
+    UINT64 index = GHR & 0x1fff;
+    if(State[index] == 0 || State[index] == 1) return NOT_TAKEN;
+    return TAKEN;
+	// return TAKEN;
+	// return NOT_TAKEN;
+
+	// *********** 你需要在上面书写代码 ***********
+
+}
+
+// Gshare分支预测器（更新部分）
+void  UpdatePredictor(UINT64 PC, OpType opType, char resolveDir, char predDir, UINT64 branchTarget)
+{
+
+	// *********** 你需要在下面书写代码 ***********
+	// 根据分支指令实际执行结果，来更新对应的饱和计数器
+	// 如果结果为跳转，则对应的饱和计数器+1
+	// 如果结果为不跳转，则对应的饱和计数器-1
+	// 更新GHR中的最近1次分支历史信息，使用移位寄存器来更新
+    UINT64 index = GHR & 0x1fff;
+    if(resolveDir == 'T')
+    {
+        State[index] = SatIncrement(State[index], 3);
+        GHR = GHR << 1 | 0x1;
+    }
+    else
+    {
+        State[index] = SatDecrement(State[index]);
+        GHR = GHR << 1;
+    }
+    
+	// *********** 你需要在上面书写代码 ***********
+}
+
+void PREDICTOR_free(void)
+{
+	free(State);
+}
+
+
+
+#include "common.h"
+
+// 饱和计数器：加1
+static inline UINT32 SatIncrement(UINT32 x, UINT32 max)
+{
+	if (x < max) return x + 1;
+	return x;
+}
+
+// 饱和计数器：减1
+static inline UINT32 SatDecrement(UINT32 x)
+{
+	if (x > 0) return x - 1;
+	return x;
+}
+
+#define BITS_OF_PC 3		// 选择3位的PC作为索引
+#define GLOBAL_HIST_LEN   10	// 全局历史长度，10位
+#define STATE_INDEX_MASK  ~(~0  << (BITS_OF_PC + GLOBAL_HIST_LEN))
+
+#define STATE_MAX  3
+#define STATE_INIT 2
+
+UINT32 GHR;				// Global History Register，全局历史寄存器
+UINT32* State;			// 状态数组，用于保存分支指令的状态机，实际只使用最低2位
+UINT64 StateArraySize;
+
+void PREDICTOR_init(void)
+{
+	StateArraySize = (1 << (BITS_OF_PC +GLOBAL_HIST_LEN));    // 状态数组项数
+
+	State = (UINT32*)malloc(StateArraySize * sizeof(UINT32));
+
+	// *********** 你需要在下面书写代码 ***********
+	// 将状态数组，全部初始化为STATE_INIT
+	// 将全局历史寄存器（GHR）初始化为0
+    for(UINT64 i = 0; i < StateArraySize; i++)
+    {
+        State[i] = STATE_INIT;
+    }
+    GHR = 0;
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// Gshare分支预测器（预测部分）
+char GetPrediction(UINT64 PC)
+{
+	// *********** 你需要在下面书写代码 ***********
+	// 将PC的低3位，与10位GHR进行拼接，形成一个13位的状态数组索引
+	// 用13位去索引状态数组，得到对应的饱和状态
+	// 如果该状态的值超过一半，则预测跳转
+	// 如果该状态的值低于一半，则预测不跳转
+	UINT64 index = (((PC>>2 & 0x7) << 10) & 0x1c00) | (GHR & 0x3ff);
+    if(State[index] == 0 || State[index] == 1) return NOT_TAKEN;
+    return TAKEN;
+	// return TAKEN;
+	// return NOT_TAKEN;
+
+	// *********** 你需要在上面书写代码 ***********
+
+}
+
+// Gshare分支预测器（更新部分）
+void  UpdatePredictor(UINT64 PC, OpType opType, char resolveDir, char predDir, UINT64 branchTarget)
+{
+
+	// *********** 你需要在下面书写代码 ***********
+	// 根据分支指令实际执行结果，来更新对应的饱和计数器
+	// 如果结果为跳转，则对应的饱和计数器+1
+	// 如果结果为不跳转，则对应的饱和计数器-1
+	// 更新GHR中的最近1次分支历史信息，使用移位寄存器来更新
+    UINT64 index = (((PC>>2 & 0x7) << 10) & 0x1c00) | (GHR & 0x3ff);
+    if(resolveDir == 'T')
+    {
+        State[index] = SatIncrement(State[index], 3);
+        GHR = GHR << 1 | 0x1;
+    }
+    else
+    {
+        State[index] = SatDecrement(State[index]);
+        GHR = GHR << 1;
+    }
+	// *********** 你需要在上面书写代码 ***********
+}
+
+void PREDICTOR_free(void)
+{
+	free(State);
+}
+
+
+
+#include "common.h"
+
+// 饱和计数器：加1
+static inline UINT32 SatIncrement(UINT32 x, UINT32 max)
+{
+	if (x < max) return x + 1;
+	return x;
+}
+
+// 饱和计数器：减1
+static inline UINT32 SatDecrement(UINT32 x)
+{
+	if (x > 0) return x - 1;
+	return x;
+}
+
+#define GLOBAL_HIST_LEN   13	// 全局历史长度，13位
+#define GLOBAL_HIST_MASK  ~(~0  << GLOBAL_HIST_LEN)
+
+#define STATE_MAX  3
+#define STATE_INIT 2
+
+UINT32 GHR;				// Global History Register，全局历史寄存器
+UINT32* State;			// 状态数组，用于保存分支指令的状态机，实际只使用最低2位
+UINT64 StateArraySize;
+
+void PREDICTOR_init(void)
+{
+	StateArraySize = (1 << GLOBAL_HIST_LEN);    // 状态数组项数
+
+	State = (UINT32*)malloc(StateArraySize * sizeof(UINT32));
+
+	// *********** 你需要在下面书写代码 ***********
+	// 将状态数组，全部初始化为STATE_INIT
+	// 将全局历史寄存器（GHR）初始化为0
+    for(UINT64 i = 0; i < StateArraySize; i++)
+    {
+        State[i] = STATE_INIT;
+    }
+    GHR = 0;
+	// *********** 你需要在上面书写代码 ***********
+}
+
+// Gshare分支预测器（预测部分）
+char GetPrediction(UINT64 PC)
+{
+	// *********** 你需要在下面书写代码 ***********
+	// 将PC的低13位，与13位GHR进行异或，形成一个13位的状态数组索引
+	// 用13位去索引状态数组，得到对应的饱和状态
+	// 如果该状态的值超过一半，则预测跳转
+	// 如果该状态的值低于一半，则预测不跳转7]
+    UINT64 nPC = (PC) & 0x1fff;
+    UINT64 index = nPC ^ (GHR & 0x1fff);
+    if(State[index] == 0 || State[index] == 1) return NOT_TAKEN;
+    return TAKEN;
+	// return TAKEN;
+	// return NOT_TAKEN;
+
+	// *********** 你需要在上面书写代码 ***********
+
+}
+
+// Gshare分支预测器（更新部分）
+void  UpdatePredictor(UINT64 PC, OpType opType, char resolveDir, char predDir, UINT64 branchTarget)
+{
+
+	// *********** 你需要在下面书写代码 ***********
+	// 根据分支指令实际执行结果，来更新对应的饱和计数器
+	// 如果结果为跳转，则对应的饱和计数器+1
+	// 如果结果为不跳转，则对应的饱和计数器-1
+	// 更新GHR中的最近1次分支历史信息，使用移位寄存器来更新
+    UINT64 nPC = (PC) & 0x1fff;
+    UINT64 index = nPC ^ (GHR & 0x1fff);
+    if(resolveDir == 'T')
+    {
+        State[index] = SatIncrement(State[index], 3);
+        GHR = GHR << 1 | 0x1;
+    }
+    else
+    {
+        State[index] = SatDecrement(State[index]);
+        GHR = GHR << 1;
+    }
+
+	// *********** 你需要在上面书写代码 ***********
+}
+
+void PREDICTOR_free(void)
+{
+	free(State);
+}
+
+
--- a/cachelab/Cache
+++ b/cachelab/Cache
--- a/cachelab/Cache.c
+++ b/cachelab/Cache.c
@@ -0,0 +1,995 @@
+#include "common.h"
+#include <stdio.h>
+
+#define DEBUG 0
+
+#define GET_POWER_OF_2(X) __builtin_ctz(X)
+
+/*
+    组相联映射Data Cache，16KB大小
+    每行存放16个字节，共1024行
+*/
+#define DCACHE_LINE_PER_SET 256
+#define DCACHE_SIZE 16384
+#define DCACHE_DATA_PER_LINE 16 // 必须是8字节的倍数
+#define DCACHE_DATA_PER_LINE_ADDR_BITS                                         \
+  GET_POWER_OF_2(                                                              \
+      DCACHE_DATA_PER_LINE) // 必须与上面设置一致，即64字节，需要6位地址
+#define DCACHE_SET (DCACHE_SIZE / DCACHE_DATA_PER_LINE / DCACHE_LINE_PER_SET)
+#define DCACHE_SET_ADDR_BITS                                                   \
+  GET_POWER_OF_2(DCACHE_SET) // 必须与上面设置一致，即256行，需要8位地址
+
+/*
+    L2 Cache配置，1MB大小
+    每行存放128个字节，共4096行
+*/
+#define L2CACHE_LINE_PER_SET 4096
+#define L2CACHE_SIZE 1048576
+#define L2CACHE_DATA_PER_LINE 128 // 必须是8字节的倍数
+#define L2CACHE_DATA_PER_LINE_ADDR_BITS GET_POWER_OF_2(L2CACHE_DATA_PER_LINE)
+#define L2CACHE_SET                                                            \
+  (L2CACHE_SIZE / L2CACHE_DATA_PER_LINE / L2CACHE_LINE_PER_SET)
+#define L2CACHE_SET_ADDR_BITS GET_POWER_OF_2(L2CACHE_SET)
+
+/*
+    组相联映射Instruction Cache，16KB大小
+    每行存放16个字节，共1024行
+*/
+#define ICACHE_LINE_PER_SET 64
+#define ICACHE_SIZE 16384
+#define ICACHE_DATA_PER_LINE 16 // 必须是8字节的倍数
+#define ICACHE_DATA_PER_LINE_ADDR_BITS GET_POWER_OF_2(ICACHE_DATA_PER_LINE)
+#define ICACHE_SET (ICACHE_SIZE / ICACHE_DATA_PER_LINE / ICACHE_LINE_PER_SET)
+#define ICACHE_SET_ADDR_BITS GET_POWER_OF_2(ICACHE_SET)
+
+// DCache行的结构
+struct DCACHE_LineStruct {
+  UINT8 Valid;
+  UINT8 Age;
+  UINT8 Dirty;
+  UINT64 Tag;
+  UINT8 Data[DCACHE_DATA_PER_LINE];
+};
+
+struct DCACHE_Set {
+  struct DCACHE_LineStruct Line[DCACHE_LINE_PER_SET];
+} DCache[DCACHE_SET];
+
+// L2Cache行的结构
+struct L2CACHE_LineStruct {
+  UINT8 Valid;
+  UINT8 Age;
+  UINT8 Dirty;
+  UINT64 Tag;
+  UINT8 Data[L2CACHE_DATA_PER_LINE];
+};
+
+struct L2CACHE_Set {
+  struct L2CACHE_LineStruct Line[L2CACHE_LINE_PER_SET];
+} L2Cache[L2CACHE_SET];
+
+// ICache行的结构
+struct ICACHE_LineStruct {
+  UINT8 Valid;
+  UINT8 Age;
+  UINT64 Tag;
+  UINT8 Data[ICACHE_DATA_PER_LINE];
+};
+
+struct ICACHE_Set {
+  struct ICACHE_LineStruct Line[ICACHE_LINE_PER_SET];
+} ICache[ICACHE_SET];
+
+// 函数声明部分 - 防止隐式声明错误
+void LoadDataCacheLineFromMemory(UINT64 Address, UINT32 set, UINT8 line);
+void StoreDataCacheLineToMemory(UINT64 Address, UINT32 set, UINT8 line);
+void LoadInstCacheLineFromMemory(UINT64 Address, UINT32 set, UINT8 line);
+void InitL2Cache(void);
+
+/*
+    DCache初始化代码，一般需要把DCache的有效位Valid设置为0
+    模拟器启动时，会调用此InitDataCache函数
+*/
+void InitDataCache() {
+  UINT32 i, j;
+  printf("[%s] +-----------------------------------+\n", __func__);
+  printf("[%s] |   Cikki 的Data Cache初始化ing.... |\n", __func__);
+  printf("[%s] +-----------------------------------+\n", __func__);
+  for (i = 0; i < DCACHE_SET; i++) {
+    for (j = 0; j < DCACHE_LINE_PER_SET; j++) {
+      DCache[i].Line[j].Valid = 0;
+      DCache[i].Line[j].Dirty = 0;
+      DCache[i].Line[j].Tag = 0;
+      DCache[i].Line[j].Age = j;
+    }
+  }
+}
+
+/*
+    L2Cache初始化代码
+*/
+void InitL2Cache() {
+  UINT32 i, j;
+  printf("[%s] +-----------------------------------+\n", __func__);
+  printf("[%s] |   Cikki 的L2 Cache初始化ing....   |\n", __func__);
+  printf("[%s] +-----------------------------------+\n", __func__);
+  for (i = 0; i < L2CACHE_SET; i++) {
+    for (j = 0; j < L2CACHE_LINE_PER_SET; j++) {
+      L2Cache[i].Line[j].Valid = 0;
+      L2Cache[i].Line[j].Dirty = 0;
+      L2Cache[i].Line[j].Tag = 0;
+      L2Cache[i].Line[j].Age = j;
+    }
+  }
+}
+
+/*
+    ICache初始化代码
+*/
+void InitInstCache(void) {
+  UINT32 i, j;
+  printf("[%s] +-----------------------------------+\n", __func__);
+  printf("[%s] |   Cikki 的Inst Cache初始化ing.... |\n", __func__);
+  printf("[%s] +-----------------------------------+\n", __func__);
+  for (i = 0; i < ICACHE_SET; i++) {
+    for (j = 0; j < ICACHE_LINE_PER_SET; j++) {
+      ICache[i].Line[j].Valid = 0;
+      ICache[i].Line[j].Tag = 0;
+      ICache[i].Line[j].Age = j;
+    }
+  }
+
+  // 初始化L2缓存
+  InitL2Cache();
+}
+
+// 在第Set组中，从DCACHE_LINE_PER_SET路中，找到需要替换的Cache行
+// 如果DCACHE_LINE_PER_SET行中，有某行的Valid=0，则返回该行行号
+// 否则，返回Age最大的行的行号
+UINT8 GetReplaceLineData(UINT32 Set) {
+  int max_index = 0;
+  int max_age = -1;
+  for (int i = 0; i < DCACHE_LINE_PER_SET; i++) {
+    if (DCache[Set].Line[i].Valid == 0)
+      return i;
+    if (DCache[Set].Line[i].Age > max_age) {
+      max_index = i;
+      max_age = DCache[Set].Line[i].Age;
+    }
+  }
+
+  return max_index;
+}
+
+// 在L2 Cache的第Set组中找到需要替换的行
+UINT8 GetReplaceLineL2(UINT32 Set) {
+  int max_index = 0;
+  int max_age = -1;
+  for (int i = 0; i < L2CACHE_LINE_PER_SET; i++) {
+    if (L2Cache[Set].Line[i].Valid == 0)
+      return i;
+    if (L2Cache[Set].Line[i].Age > max_age) {
+      max_index = i;
+      max_age = L2Cache[Set].Line[i].Age;
+    }
+  }
+
+  return max_index;
+}
+
+// LRU替换策略 - ICache
+UINT8 GetReplaceLineInst(UINT32 Set) {
+  int max_index = 0;
+  int max_age = -1;
+  for (int i = 0; i < ICACHE_LINE_PER_SET; i++) {
+    if (ICache[Set].Line[i].Valid == 0)
+      return i;
+    if (ICache[Set].Line[i].Age > max_age) {
+      max_index = i;
+      max_age = ICache[Set].Line[i].Age;
+    }
+  }
+
+  return max_index;
+}
+
+// 更新Age，在第Set组中，将HitLine指定的Cache行的Age设置为0，其他行的Age要相应调整
+// 确保DCACHE_LINE_PER_SET行的Age分别为0~DCACHE_LINE_PER_SET-1，且唯一
+void UpdateAgeData(UINT32 Set, UINT8 HitLine) {
+  UINT8 old_age = DCache[Set].Line[HitLine].Age;
+  for (int i = 0; i < DCACHE_LINE_PER_SET; ++i) {
+    if (DCache[Set].Line[i].Age < old_age)
+      DCache[Set].Line[i].Age++;
+  }
+  DCache[Set].Line[HitLine].Age = 0;
+}
+
+// 更新L2 Cache的Age
+void UpdateAgeL2(UINT32 Set, UINT8 HitLine) {
+  UINT8 old_age = L2Cache[Set].Line[HitLine].Age;
+  for (int i = 0; i < L2CACHE_LINE_PER_SET; ++i) {
+    if (L2Cache[Set].Line[i].Age < old_age)
+      L2Cache[Set].Line[i].Age++;
+  }
+  L2Cache[Set].Line[HitLine].Age = 0;
+}
+
+// 更新Age - ICache
+void UpdateAgeInst(UINT32 Set, UINT8 HitLine) {
+  int HitAge = ICache[Set].Line[HitLine].Age;
+  ICache[Set].Line[HitLine].Age = 0;
+  for (int i = 0; i < ICACHE_LINE_PER_SET; i++) {
+    if (i != HitLine && ICache[Set].Line[i].Age < HitAge)
+      ICache[Set].Line[i].Age++;
+  }
+}
+
+/*
+    从Memory中读入一行数据到Data Cache中
+*/
+void LoadDataCacheLineFromMemory(UINT64 Address, UINT32 set, UINT8 line) {
+  // 一次性从Memory中将DCACHE_DATA_PER_LINE数据读入某个Data Cache行
+  // 提供了一个函数，一次可以读入8个字节
+
+  // 地址对齐到缓存行边界
+  const UINT64 AlignAddress = Address & ~(DCACHE_DATA_PER_LINE - 1);
+  UINT64 *const cache_line_ptr = (UINT64 *)DCache[set].Line[line].Data;
+
+  if (DEBUG) {
+    printf("[%s] Loading cache line (set=%u, line=%u) from memory %016llX\n",
+           __func__, set, line, AlignAddress);
+  }
+
+  // 分8字节块读取
+  for (UINT32 i = 0; i < DCACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+    const UINT64 read_addr = AlignAddress + i * sizeof(UINT64);
+    const UINT64 data = ReadMemory(read_addr);
+
+    cache_line_ptr[i] = data;
+
+    if (DEBUG) {
+      printf("  [LOAD] Address=%016llX -> Data=%016llX\n", read_addr, data);
+    }
+  }
+}
+
+/*
+    从内存加载一行数据到指令缓存中
+*/
+void LoadInstCacheLineFromMemory(UINT64 Address, UINT32 set, UINT8 line) {
+  // 一次性从Memory中将ICACHE_DATA_PER_LINE数据读入某个Instruction Cache行
+  // 提供了一个函数，一次可以读入8个字节
+
+  // 地址对齐到缓存行边界
+  const UINT64 AlignAddress = Address & ~(ICACHE_DATA_PER_LINE - 1);
+  UINT64 *const cache_line_ptr = (UINT64 *)ICache[set].Line[line].Data;
+
+  if (DEBUG) {
+    printf("[%s] Loading cache line (set=%u, line=%u) from memory %016llX\n",
+           __func__, set, line, AlignAddress);
+  }
+
+  // 分8字节块读取
+  for (UINT32 i = 0; i < ICACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+    const UINT64 read_addr = AlignAddress + i * sizeof(UINT64);
+    const UINT64 data = ReadMemory(read_addr);
+
+    cache_line_ptr[i] = data;
+
+    if (DEBUG) {
+      printf("  [LOAD] Address=%016llX -> Data=%016llX\n", read_addr, data);
+    }
+  }
+}
+
+/*
+    将Data Cache中的一行数据，写入存储器
+*/
+void StoreDataCacheLineToMemory(UINT64 Address, UINT32 set, UINT8 line) {
+  // 一次性将DCACHE_DATA_PER_LINE数据从某个Data Cache行写入Memory中
+  // 提供了一个函数，一次可以写入8个字节
+
+  // 地址对齐到缓存行边界
+  const UINT64 AlignAddress = Address & ~(DCACHE_DATA_PER_LINE - 1);
+  UINT64 *const cache_line_ptr = (UINT64 *)DCache[set].Line[line].Data;
+
+  if (DEBUG) {
+    printf("[%s] Storing cache line (set=%u, line=%u) to memory %016llX\n",
+           __func__, set, line, AlignAddress);
+  }
+
+  // 分8字节块写入
+  for (UINT32 i = 0; i < DCACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+    const UINT64 write_addr = AlignAddress + i * sizeof(UINT64);
+    const UINT64 data = cache_line_ptr[i];
+
+    WriteMemory(write_addr, data);
+
+    if (DEBUG) {
+      printf("  [STORE] Address=%016llX <- Data=%016llX\n", write_addr, data);
+    }
+  }
+}
+
+/*
+    从L2 Cache中读取数据到L1 DCache中
+    如果L2命中，则从L2读取数据
+    如果L2未命中，则从内存读取数据并更新L2
+*/
+UINT8 LoadDataFromL2ToL1(UINT64 Address, UINT32 L1_set, UINT8 L1_line) {
+  UINT32 L2_set = (Address >> L2CACHE_DATA_PER_LINE_ADDR_BITS) % L2CACHE_SET;
+  UINT64 L2_tag =
+      Address >> (L2CACHE_DATA_PER_LINE_ADDR_BITS + L2CACHE_SET_ADDR_BITS);
+  UINT8 L2_hit = 0;
+  UINT8 L2_line = 0;
+
+  // 检查L2 Cache是否命中
+  for (int i = 0; i < L2CACHE_LINE_PER_SET; i++) {
+    if (L2Cache[L2_set].Line[i].Valid &&
+        L2Cache[L2_set].Line[i].Tag == L2_tag) {
+      L2_hit = 1;
+      L2_line = i;
+      break;
+    }
+  }
+
+  if (L2_hit) {
+    // L2命中，从L2读取数据到L1
+    if (DEBUG) {
+      printf("[%s] L2 Cache hit! Loading from L2 to L1 (Address=%016llX)\n",
+             __func__, Address);
+    }
+
+    // 由于L2缓存行可能比L1大，需要找到正确的偏移量
+    UINT64 L1_aligned_addr = Address & ~(DCACHE_DATA_PER_LINE - 1);
+    UINT64 L2_aligned_addr = Address & ~(L2CACHE_DATA_PER_LINE - 1);
+    UINT32 offset_in_L2 = (L1_aligned_addr - L2_aligned_addr);
+
+    // 从L2复制数据到L1
+    for (int i = 0; i < DCACHE_DATA_PER_LINE; i++) {
+      DCache[L1_set].Line[L1_line].Data[i] =
+          L2Cache[L2_set].Line[L2_line].Data[offset_in_L2 + i];
+    }
+
+    // 更新L2的LRU信息
+    UpdateAgeL2(L2_set, L2_line);
+    return 'H'; // L2命中
+  } else {
+    // L2未命中，从内存加载数据
+    if (DEBUG) {
+      printf("[%s] L2 Cache miss! Loading from memory (Address=%016llX)\n",
+             __func__, Address);
+    }
+
+    // 首先从内存加载到L1
+    LoadDataCacheLineFromMemory(Address, L1_set, L1_line);
+
+    // 然后更新L2
+    UINT8 L2_replace_line = GetReplaceLineL2(L2_set);
+
+    // 如果L2中要替换的行是脏的，需要先写回内存
+    if (L2Cache[L2_set].Line[L2_replace_line].Valid &&
+        L2Cache[L2_set].Line[L2_replace_line].Dirty) {
+      UINT64 victim_addr =
+          (L2Cache[L2_set].Line[L2_replace_line].Tag
+           << (L2CACHE_DATA_PER_LINE_ADDR_BITS + L2CACHE_SET_ADDR_BITS)) |
+          (L2_set << L2CACHE_DATA_PER_LINE_ADDR_BITS);
+
+      // 写回内存
+      for (UINT32 i = 0; i < L2CACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+        const UINT64 write_addr = victim_addr + i * sizeof(UINT64);
+        const UINT64 *data_ptr = (UINT64 *)&L2Cache[L2_set]
+                                     .Line[L2_replace_line]
+                                     .Data[i * sizeof(UINT64)];
+        WriteMemory(write_addr, *data_ptr);
+      }
+    }
+
+    // 从内存加载数据到L2
+    UINT64 L2_aligned_addr = Address & ~(L2CACHE_DATA_PER_LINE - 1);
+    for (UINT32 i = 0; i < L2CACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+      const UINT64 read_addr = L2_aligned_addr + i * sizeof(UINT64);
+      const UINT64 data = ReadMemory(read_addr);
+      UINT64 *data_ptr = (UINT64 *)&L2Cache[L2_set]
+                             .Line[L2_replace_line]
+                             .Data[i * sizeof(UINT64)];
+      *data_ptr = data;
+    }
+
+    // 更新L2缓存行信息
+    L2Cache[L2_set].Line[L2_replace_line].Valid = 1;
+    L2Cache[L2_set].Line[L2_replace_line].Dirty = 0;
+    L2Cache[L2_set].Line[L2_replace_line].Tag = L2_tag;
+    UpdateAgeL2(L2_set, L2_replace_line);
+
+    return 'M'; // L2未命中
+  }
+}
+
+/*
+    将L1 DCache中的一行数据写入L2 Cache
+*/
+void StoreDataFromL1ToL2(UINT64 Address, UINT32 L1_set, UINT8 L1_line) {
+  UINT32 L2_set = (Address >> L2CACHE_DATA_PER_LINE_ADDR_BITS) % L2CACHE_SET;
+  UINT64 L2_tag =
+      Address >> (L2CACHE_DATA_PER_LINE_ADDR_BITS + L2CACHE_SET_ADDR_BITS);
+  UINT8 L2_hit = 0;
+  UINT8 L2_line = 0;
+
+  // 检查L2 Cache是否命中
+  for (int i = 0; i < L2CACHE_LINE_PER_SET; i++) {
+    if (L2Cache[L2_set].Line[i].Valid &&
+        L2Cache[L2_set].Line[i].Tag == L2_tag) {
+      L2_hit = 1;
+      L2_line = i;
+      break;
+    }
+  }
+
+  if (!L2_hit) {
+    // L2未命中，需要分配一个新的L2缓存行
+    L2_line = GetReplaceLineL2(L2_set);
+
+    // 如果要替换的L2行是脏的，需要先写回内存
+    if (L2Cache[L2_set].Line[L2_line].Valid &&
+        L2Cache[L2_set].Line[L2_line].Dirty) {
+      UINT64 victim_addr =
+          (L2Cache[L2_set].Line[L2_line].Tag
+           << (L2CACHE_DATA_PER_LINE_ADDR_BITS + L2CACHE_SET_ADDR_BITS)) |
+          (L2_set << L2CACHE_DATA_PER_LINE_ADDR_BITS);
+
+      // 写回内存
+      for (UINT32 i = 0; i < L2CACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+        const UINT64 write_addr = victim_addr + i * sizeof(UINT64);
+        const UINT64 *data_ptr =
+            (UINT64 *)&L2Cache[L2_set].Line[L2_line].Data[i * sizeof(UINT64)];
+        WriteMemory(write_addr, *data_ptr);
+      }
+    }
+
+    // 从内存加载完整的L2缓存行
+    UINT64 L2_aligned_addr = Address & ~(L2CACHE_DATA_PER_LINE - 1);
+    for (UINT32 i = 0; i < L2CACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+      const UINT64 read_addr = L2_aligned_addr + i * sizeof(UINT64);
+      const UINT64 data = ReadMemory(read_addr);
+      UINT64 *data_ptr =
+          (UINT64 *)&L2Cache[L2_set].Line[L2_line].Data[i * sizeof(UINT64)];
+      *data_ptr = data;
+    }
+
+    L2Cache[L2_set].Line[L2_line].Valid = 1;
+    L2Cache[L2_set].Line[L2_line].Tag = L2_tag;
+  }
+
+  // 更新L2缓存行中对应的数据
+  UINT64 L1_aligned_addr = Address & ~(DCACHE_DATA_PER_LINE - 1);
+  UINT64 L2_aligned_addr = Address & ~(L2CACHE_DATA_PER_LINE - 1);
+  UINT32 offset_in_L2 = (L1_aligned_addr - L2_aligned_addr);
+
+  // 从L1复制数据到L2
+  for (int i = 0; i < DCACHE_DATA_PER_LINE; i++) {
+    L2Cache[L2_set].Line[L2_line].Data[offset_in_L2 + i] =
+        DCache[L1_set].Line[L1_line].Data[i];
+  }
+
+  // 标记L2缓存行为脏
+  L2Cache[L2_set].Line[L2_line].Dirty = 1;
+  UpdateAgeL2(L2_set, L2_line);
+}
+
+/*
+    从L2 Cache中加载指令到I-Cache
+    如果L2缓存命中，则从L2读取数据
+    如果L2缓存未命中，则从内存读取数据并同时更新L2缓存
+*/
+UINT8 LoadInstFromL2ToICache(UINT64 Address, UINT32 I_set, UINT8 I_line) {
+  UINT32 L2_set = (Address >> L2CACHE_DATA_PER_LINE_ADDR_BITS) % L2CACHE_SET;
+  UINT64 L2_tag =
+      Address >> (L2CACHE_DATA_PER_LINE_ADDR_BITS + L2CACHE_SET_ADDR_BITS);
+  UINT8 L2_hit = 0;
+  UINT8 L2_line = 0;
+
+  // 检查L2 Cache是否命中
+  for (int i = 0; i < L2CACHE_LINE_PER_SET; i++) {
+    if (L2Cache[L2_set].Line[i].Valid &&
+        L2Cache[L2_set].Line[i].Tag == L2_tag) {
+      L2_hit = 1;
+      L2_line = i;
+      break;
+    }
+  }
+
+  if (L2_hit) {
+    // L2命中，从L2读取数据到I-Cache
+    if (DEBUG) {
+      printf("[%s] L2 Cache hit! Loading instruction from L2 to I-Cache "
+             "(Address=%016llX)\n",
+             __func__, Address);
+    }
+
+    // 由于L2缓存行可能比I-Cache大，需要找到正确的偏移量
+    UINT64 I_aligned_addr = Address & ~(ICACHE_DATA_PER_LINE - 1);
+    UINT64 L2_aligned_addr = Address & ~(L2CACHE_DATA_PER_LINE - 1);
+    UINT32 offset_in_L2 = (I_aligned_addr - L2_aligned_addr);
+
+    // 从L2复制数据到I-Cache
+    for (int i = 0; i < ICACHE_DATA_PER_LINE; i++) {
+      ICache[I_set].Line[I_line].Data[i] =
+          L2Cache[L2_set].Line[L2_line].Data[offset_in_L2 + i];
+    }
+
+    // 更新L2的LRU信息
+    UpdateAgeL2(L2_set, L2_line);
+    return 'H'; // L2命中
+  } else {
+    // L2未命中，从内存加载数据
+    if (DEBUG) {
+      printf("[%s] L2 Cache miss! Loading instruction from memory "
+             "(Address=%016llX)\n",
+             __func__, Address);
+    }
+
+    // 首先从内存加载到I-Cache
+    LoadInstCacheLineFromMemory(Address, I_set, I_line);
+
+    // 然后更新L2
+    UINT8 L2_replace_line = GetReplaceLineL2(L2_set);
+
+    // 如果L2中要替换的行是脏的，需要先写回内存
+    if (L2Cache[L2_set].Line[L2_replace_line].Valid &&
+        L2Cache[L2_set].Line[L2_replace_line].Dirty) {
+      UINT64 victim_addr =
+          (L2Cache[L2_set].Line[L2_replace_line].Tag
+           << (L2CACHE_DATA_PER_LINE_ADDR_BITS + L2CACHE_SET_ADDR_BITS)) |
+          (L2_set << L2CACHE_DATA_PER_LINE_ADDR_BITS);
+
+      // 写回内存
+      for (UINT32 i = 0; i < L2CACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+        const UINT64 write_addr = victim_addr + i * sizeof(UINT64);
+        const UINT64 *data_ptr = (UINT64 *)&L2Cache[L2_set]
+                                     .Line[L2_replace_line]
+                                     .Data[i * sizeof(UINT64)];
+        WriteMemory(write_addr, *data_ptr);
+      }
+    }
+    // 从内存加载数据到L2
+    UINT64 L2_aligned_addr = Address & ~(L2CACHE_DATA_PER_LINE - 1);
+    for (UINT32 i = 0; i < L2CACHE_DATA_PER_LINE / sizeof(UINT64); i++) {
+      const UINT64 read_addr = L2_aligned_addr + i * sizeof(UINT64);
+      const UINT64 data = ReadMemory(read_addr);
+      UINT64 *data_ptr = (UINT64 *)&L2Cache[L2_set]
+                             .Line[L2_replace_line]
+                             .Data[i * sizeof(UINT64)];
+      *data_ptr = data;
+    }
+
+    // 更新L2缓存行信息
+    L2Cache[L2_set].Line[L2_replace_line].Valid = 1;
+    L2Cache[L2_set].Line[L2_replace_line].Dirty = 0;
+    L2Cache[L2_set].Line[L2_replace_line].Tag = L2_tag;
+    UpdateAgeL2(L2_set, L2_replace_line);
+
+    return 'M'; // L2未命中
+  }
+}
+
+/*
+ * 访问数据缓存的主函数
+ * 参数：
+ *   Address - 访问的内存地址
+ *   Operation - 'L'表示读取，'S'表示写入，'M'表示修改（先读后写）
+ *   DataSize - 访问的数据大小（1、2、4或8字节）
+ *   StoreValue - 要写入的数据（如果是写入操作）
+ *   LoadResult - 指向读取结果的指针（如果是读取操作）
+ * 返回值：
+ *   'H' - 缓存命中
+ *   'M' - 缓存未命中
+ */
+UINT8 AccessDataCache(UINT64 Address, UINT8 Operation, UINT8 DataSize,
+                      UINT64 StoreValue, UINT64 *LoadResult) {
+  UINT32 Set = (Address >> DCACHE_DATA_PER_LINE_ADDR_BITS) % DCACHE_SET;
+  UINT8 Block = Address % DCACHE_DATA_PER_LINE;
+  UINT64 Tag =
+      Address >> (DCACHE_DATA_PER_LINE_ADDR_BITS + DCACHE_SET_ADDR_BITS);
+  UINT8 HitLine;
+  UINT8 MissFlag = 'M';
+  UINT64 ReadValue = 0;
+
+  char L2Result;
+
+  // 检查命中
+  for (int i = 0; i < DCACHE_LINE_PER_SET; i++) {
+    if (DCache[Set].Line[i].Valid && DCache[Set].Line[i].Tag == Tag) {
+      HitLine = i;
+      MissFlag = 'H';
+      break;
+    }
+  }
+
+  if (MissFlag == 'H') // Cache命中
+  {
+    if (Operation == 'L') // 读操作
+    {
+      // 读取数据，注意这里要按DataSize读取
+      switch (DataSize) {
+      case 1: // 1个字节
+        ReadValue = DCache[Set].Line[HitLine].Data[Block];
+        break;
+      case 2:                 // 2个字节
+        Block = Block & 0xFE; // 需对齐到2字节边界
+        ReadValue = DCache[Set].Line[HitLine].Data[Block + 1];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 0];
+        break;
+      case 4:                 // 4个字节
+        Block = Block & 0xFC; // 需对齐到4字节边界
+        ReadValue = DCache[Set].Line[HitLine].Data[Block + 3];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 2];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 1];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 0];
+        break;
+      case 8:                 // 8个字节
+        Block = Block & 0xF8; // 需对齐到8字节边界
+        ReadValue = DCache[Set].Line[HitLine].Data[Block + 7];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 6];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 5];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 4];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 3];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 2];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 1];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[HitLine].Data[Block + 0];
+        break;
+      }
+      *LoadResult = ReadValue;
+
+      if (DEBUG) {
+        printf("[%s] Address=%016llX Operation=%c DataSize=%u "
+               "StoreValue=%016llX ReadValue=%016llX\n",
+               __func__, Address, Operation, DataSize, StoreValue, ReadValue);
+      }
+    } else if (Operation == 'S' ||
+               Operation == 'M') // 写操作（修改操作在此等价于写操作）
+    {
+      if (DEBUG) {
+        printf("[%s] Address=%016llX Operation=%c DataSize=%u "
+               "StoreValue=%016llX\n",
+               __func__, Address, Operation, DataSize, StoreValue);
+      }
+
+      // 写操作，需要将新的StoreValue更新到CacheLine中
+      switch (DataSize) {
+      case 1: // 1个字节
+        DCache[Set].Line[HitLine].Data[Block + 0] = StoreValue & 0xFF;
+        break;
+      case 2:                 // 2个字节
+        Block = Block & 0xFE; // 需对齐到2字节边界
+        DCache[Set].Line[HitLine].Data[Block + 0] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 1] = StoreValue & 0xFF;
+        break;
+      case 4:                 // 4个字节
+        Block = Block & 0xFC; // 需对齐到4字节边界
+        DCache[Set].Line[HitLine].Data[Block + 0] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 1] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 2] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 3] = StoreValue & 0xFF;
+        break;
+      case 8:                 // 8个字节
+        Block = Block & 0xF8; // 需对齐到8字节边界
+        DCache[Set].Line[HitLine].Data[Block + 0] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 1] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 2] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 3] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 4] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 5] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 6] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[HitLine].Data[Block + 7] = StoreValue & 0xFF;
+        break;
+      }
+      DCache[Set].Line[HitLine].Dirty = 1;
+
+      // 写直达，同时更新L2
+      StoreDataFromL1ToL2(Address, Set, HitLine);
+    }
+    UpdateAgeData(Set, HitLine);
+  } else // Cache未命中
+  {
+    UINT8 replace_Line = GetReplaceLineData(Set);
+    if (DEBUG) {
+      printf(
+          "[%s] Address=%016llX Operation=%c DataSize=%u StoreValue=%016llX\n",
+          __func__, Address, Operation, DataSize, StoreValue);
+    }
+
+    if (Operation == 'L') // 读操作
+    {
+      // 写回脏行到L2
+      if (DCache[Set].Line[replace_Line].Valid &&
+          DCache[Set].Line[replace_Line].Dirty) {
+        UINT64 victim_addr =
+            (DCache[Set].Line[replace_Line].Tag
+             << (DCACHE_DATA_PER_LINE_ADDR_BITS + DCACHE_SET_ADDR_BITS)) |
+            (Set << DCACHE_DATA_PER_LINE_ADDR_BITS);
+        StoreDataFromL1ToL2(victim_addr, Set, replace_Line);
+      }
+
+      // 先从L2加载新行到L1
+      L2Result = LoadDataFromL2ToL1(Address, Set, replace_Line);
+
+      DCache[Set].Line[replace_Line].Valid = 1;
+      DCache[Set].Line[replace_Line].Tag = Tag;
+      DCache[Set].Line[replace_Line].Dirty = 0;
+
+      // 再读取数据，按DataSize读取
+      switch (DataSize) {
+      case 1: // 1个字节
+        ReadValue = DCache[Set].Line[replace_Line].Data[Block];
+        break;
+      case 2:                 // 2个字节
+        Block = Block & 0xFE; // 需对齐到2字节边界
+        ReadValue = DCache[Set].Line[replace_Line].Data[Block + 1];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 0];
+        break;
+      case 4:                 // 4个字节
+        Block = Block & 0xFC; // 需对齐到4字节边界
+        ReadValue = DCache[Set].Line[replace_Line].Data[Block + 3];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 2];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 1];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 0];
+        break;
+      case 8:                 // 8个字节
+        Block = Block & 0xF8; // 需对齐到8字节边界
+        ReadValue = DCache[Set].Line[replace_Line].Data[Block + 7];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 6];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 5];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 4];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 3];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 2];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 1];
+        ReadValue = ReadValue << 8;
+        ReadValue |= DCache[Set].Line[replace_Line].Data[Block + 0];
+        break;
+      }
+      *LoadResult = ReadValue;
+    } else if (Operation == 'S' ||
+               Operation == 'M') // 写操作（修改操作在此等价于写操作）
+    {
+      // 写回脏行到L2
+      if (DCache[Set].Line[replace_Line].Valid &&
+          DCache[Set].Line[replace_Line].Dirty) {
+        UINT64 victim_addr =
+            (DCache[Set].Line[replace_Line].Tag
+             << (DCACHE_DATA_PER_LINE_ADDR_BITS + DCACHE_SET_ADDR_BITS)) |
+            (Set << DCACHE_DATA_PER_LINE_ADDR_BITS);
+        StoreDataFromL1ToL2(victim_addr, Set, replace_Line);
+      }
+
+      // 先从L2加载新行到L1
+      L2Result = LoadDataFromL2ToL1(Address, Set, replace_Line);
+
+      DCache[Set].Line[replace_Line].Valid = 1;
+      DCache[Set].Line[replace_Line].Tag = Tag;
+      DCache[Set].Line[replace_Line].Dirty = 0;
+
+      // 写操作，需要将新的StoreValue更新到CacheLine中
+      switch (DataSize) {
+      case 1: // 1个字节
+        DCache[Set].Line[replace_Line].Data[Block + 0] = StoreValue & 0xFF;
+        break;
+      case 2:                 // 2个字节
+        Block = Block & 0xFE; // 需对齐到2字节边界
+        DCache[Set].Line[replace_Line].Data[Block + 0] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 1] = StoreValue & 0xFF;
+        break;
+      case 4:                 // 4个字节
+        Block = Block & 0xFC; // 需对齐到4字节边界
+        DCache[Set].Line[replace_Line].Data[Block + 0] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 1] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 2] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 3] = StoreValue & 0xFF;
+        break;
+      case 8:                 // 8个字节
+        Block = Block & 0xF8; // 需对齐到8字节边界
+        DCache[Set].Line[replace_Line].Data[Block + 0] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 1] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 2] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 3] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 4] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 5] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 6] = StoreValue & 0xFF;
+        StoreValue = StoreValue >> 8;
+        DCache[Set].Line[replace_Line].Data[Block + 7] = StoreValue & 0xFF;
+        break;
+      }
+      DCache[Set].Line[replace_Line].Dirty = 1;
+
+      // 写直达，同时更新L2
+      StoreDataFromL1ToL2(Address, Set, replace_Line);
+    }
+    UpdateAgeData(Set, replace_Line);
+  }
+
+  // 返回L1的命中/未命中标志
+  return MissFlag;
+}
+
+/*
+ * 访问指令缓存的主函数
+ * 参数：
+ *   Address - 访问的内存地址
+ *   Operation - 通常只用于读取指令，但我们保留此参数以保持接口一致
+ *   InstSize - 指令大小（通常为4字节，但支持1、2、4、8字节）
+ *   InstResult - 指向读取结果的指针
+ * 返回值：
+ *   'H' - 缓存命中
+ *   'M' - 缓存未命中
+ */
+UINT8 AccessInstCache(UINT64 Address, UINT8 Operation, UINT8 InstSize,
+                      UINT64 *InstResult) {
+  UINT32 set = (Address >> ICACHE_DATA_PER_LINE_ADDR_BITS) % ICACHE_SET;
+  UINT8 block = Address % ICACHE_DATA_PER_LINE;
+  UINT64 tag =
+      Address >> (ICACHE_DATA_PER_LINE_ADDR_BITS + ICACHE_SET_ADDR_BITS);
+  UINT8 HitLine;
+  UINT8 MissFlag = 'M';
+  UINT64 ReadValue = 0;
+  UINT32 L2Result;
+
+  *InstResult = 0;
+
+  // 检查命中
+  for (int i = 0; i < ICACHE_LINE_PER_SET; i++) {
+    if (ICache[set].Line[i].Valid && ICache[set].Line[i].Tag == tag) {
+      HitLine = i;
+      MissFlag = 'H';
+      break;
+    }
+  }
+
+  if (MissFlag == 'H') {
+    // 命中处理
+    switch (InstSize) {
+    case 1:                 // 8位指令
+      block = block & 0xFF; // 对齐到1字节边界
+      ReadValue = ICache[set].Line[HitLine].Data[block + 0];
+      break;
+    case 2:                 // 16位指令
+      block = block & 0xFE; // 对齐到2字节边界
+      ReadValue = ICache[set].Line[HitLine].Data[block + 1];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 0];
+      break;
+    case 4:                 // 32位指令
+      block = block & 0xFC; // 对齐到4字节边界
+      ReadValue = ICache[set].Line[HitLine].Data[block + 3];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 2];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 1];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 0];
+      break;
+    case 8:                 // 64位指令(如RISC-V的128位指令集扩展)
+      block = block & 0xF8; // 对齐到8字节边界
+      ReadValue = ICache[set].Line[HitLine].Data[block + 7];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 6];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 5];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 4];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 3];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 2];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 1];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[HitLine].Data[block + 0];
+      break;
+    default:
+      // 不支持的指令长度
+      return 'M';
+    }
+    *InstResult = ReadValue;
+    UpdateAgeInst(set, HitLine);
+  } else {
+    // 未命中处理
+    UINT8 replace_line = GetReplaceLineInst(set);
+
+    // 从L2加载数据到I-Cache
+    L2Result = LoadInstFromL2ToICache(Address, set, replace_line);
+
+    // 重新读取指令
+    switch (InstSize) {
+    case 1:
+      block = block & 0xFF;
+      ReadValue = ICache[set].Line[replace_line].Data[block + 0];
+      break;
+    case 2:
+      block = block & 0xFE;
+      ReadValue = ICache[set].Line[replace_line].Data[block + 1];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 0];
+      break;
+    case 4:
+      block = block & 0xFC;
+      ReadValue = ICache[set].Line[replace_line].Data[block + 3];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 2];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 1];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 0];
+      break;
+    case 8:
+      block = block & 0xF8;
+      ReadValue = ICache[set].Line[replace_line].Data[block + 7];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 6];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 5];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 4];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 3];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 2];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 1];
+      ReadValue = ReadValue << 8;
+      ReadValue |= ICache[set].Line[replace_line].Data[block + 0];
+      break;
+    default:
+      // 不支持的指令长度
+      return 'M';
+    }
+    *InstResult = ReadValue;
+    ICache[set].Line[replace_line].Valid = 1;
+    ICache[set].Line[replace_line].Tag = tag;
+    UpdateAgeInst(set, replace_line);
+  }
+
+  // 返回I-Cache的命中/未命中标志
+  return MissFlag;
+}
--- a/cachelab/CacheHelper.c
+++ b/cachelab/CacheHelper.c
@@ -0,0 +1,792 @@
+///////////////////////////////////////////////////////////////////////
+////  Copyright 2022 by mars.                                        //
+///////////////////////////////////////////////////////////////////////
+
+#include <stdlib.h>
+#include <stdio.h>
+#include <string.h>
+#include <assert.h>
+#include <time.h>
+#include "getopt.h"
+#include "cbsl.h"
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); }}
+
+/*
+fcn  ideal%     #items   #buckets  dup%  fl   add_usec  find_usec  del-all usec
+---  ------ ---------- ---------- -----  -- ---------- ----------  ------------
+OAT   89.1%     597731     524288    0%  ok     317292     179676         59726
+FNV   88.6%     597731     262144    0%  ok     226650     220626         61619
+JEN   87.8%     597731     524288    0%  ok     321989     175945         59956
+BER   86.4%     597731     262144    0%  ok     198477     179332         60901
+SAX   70.4%     597731     524288    0%  ok     270281     196427         64064
+SFH   69.2%     597731     524288    0%  ok     289843     165105         61860
+FNV1A_Pippip_Yurii 更快？？
+*/
+
+// 使用OAT hash算法，以获得最高性能
+#include "uthash.h"
+#undef HASH_FUNCTION
+//#define HASH_FUNCTION HASH_OAT
+#define HASH_FUNCTION(keyptr,keylen,hashv) (hashv) = FNV1A_Pippip_Yurii((UINT64 *)keyptr)
+
+#define VERBOSE_MSG	0
+
+#ifdef _WIN32
+#define ZLIB_WINAPI
+#endif
+
+#include "common.h"
+
+#ifdef _WIN64
+#pragma comment(lib,"..\\zstd\\libzstd_static-win64.lib")
+#elif  _WIN32
+#pragma comment(lib,"..\\zstd\\libzstd_static-win32.lib")
+#endif
+
+/*
+	构建一个用Hash表访问的Memory，以便能够紧凑存放稀疏、随机的Memory数据
+*/
+
+struct MemoryDataStruct
+{
+	UINT64 Address;			// 地址（默认是64位字地址）
+	UINT64 Data;			// 数据（默认保存64位字数据）
+	UT_hash_handle memory;	// makes this structure hashable
+} *MemoryHash = NULL;
+
+static void WriteMemoryHash(UINT64 Address, UINT64 WriteValue, UINT8 WriteSize);
+static UINT64 ReadMemoryHash(UINT64 Address, UINT8 ReadSize);
+
+#define MEMORY_TRACE_CHUNK	(1<<20)	// MemoryTrace结构，每次增长1M条记录
+struct MemoryTraceStruct
+{
+	UINT8 Operation;
+	UINT64 Address;
+	UINT8 Size;
+} *MemoryTrace;
+UINT64 MemoryTraceCounter, MemoryTraceCapacity;
+
+/*
+*	统计计数器
+*/
+UINT64 GlobalMemoryModifyCounter;
+UINT64 GlobalMemoryInstCounter;
+UINT64 GlobalMemoryWriteCounter;
+UINT64 GlobalCacheWriteHitCounter;
+UINT64 GlobalMemoryReadCounter;
+UINT64 GlobalCacheReadHitCounter;
+UINT64 GlobalCacheModifyHitCounter;
+UINT64 GlobalSimReadMemoryCounter;
+UINT64 GlobalSimWriteMemoryCounter;
+
+UINT64 GlobalCacheInstHitCounter;
+
+#define CHUNK 16384
+
+static void Trim(char* src)
+{
+	char* begin = src;
+	char* end = src + strlen(src);
+
+	if (begin == end) return;
+
+	while (*begin == ' ' || *begin == '\t')
+		++begin;
+	while ((*end) == '\0' || *end == ' ' || *end == '\t' || *end == '\n' || *end == '\r')
+		--end;
+
+	if (begin > end) {
+		*src = '\0';  return;
+	}
+	while (begin != end) {
+		*src++ = *begin++;
+	}
+
+	*src++ = *end;
+	*src = '\0';
+
+	return;
+}
+
+typedef struct {
+	const char* start;
+	size_t len;
+} token;
+
+// https://stackoverflow.com/a/39286524
+static char** split_space(const char* str, int* field_count)
+{
+	char** array;
+	unsigned int start = 0, stop, toks = 0, t;
+	token* tokens = malloc((strlen(str) + 1) * sizeof(token));
+	for (stop = 0; str[stop]; stop++) {
+		if (str[stop] == ' ' || str[stop] == '\t' || str[stop] == ',')
+		{
+			tokens[toks].start = str + start;
+			tokens[toks].len = stop - start;
+			toks++;
+			start = stop + 1;
+		}
+	}
+	/* Mop up the last token */
+	tokens[toks].start = str + start;
+	tokens[toks].len = stop - start;
+	toks++;
+	array = malloc(toks * sizeof(char*));
+	for (t = 0; t < toks; t++) {
+		/* Calloc makes it nul-terminated */
+		char* token = calloc(tokens[t].len + 1, 1);
+		memcpy(token, tokens[t].start, tokens[t].len);
+		array[t] = token;
+	}
+	free(tokens);
+	*field_count = toks;
+	return array;
+}
+
+#define SR_A ((UINT64)1103515245)
+#define SR_C ((UINT64)12345)
+#define SR_M ((UINT64)1<<32)
+UINT64 Xn;
+
+static void SyncRand(UINT64 Seed)
+{
+	Xn = Seed;
+}
+
+static UINT8 GetRand8()
+{
+	Xn = ((SR_A * Xn + SR_C) % SR_M);
+	return (UINT8)Xn;
+}
+
+static UINT16 GetRand16()
+{
+	Xn = ((SR_A * Xn + SR_C) % SR_M);
+	return (UINT16)Xn;
+}
+
+static UINT32 GetRand32()
+{
+	Xn = ((SR_A * Xn + SR_C) % SR_M);
+	return (UINT32)Xn;
+}
+
+static UINT64 GetRand64()
+{
+	UINT32 Hi, Lo;
+	Hi = GetRand32();
+	Lo = GetRand32();
+
+	return ((UINT64)Hi << 32 | Lo);
+}
+
+//https://www.codeproject.com/articles/716530/fastest-hash-function-for-table-lookups-in-c
+static inline UINT32 FNV1A_Pippip_Yurii(UINT64* Address)
+{
+	const UINT32 PRIME = 591798841; UINT32 hash32; UINT64 hash64 = 14695981039346656037ULL;
+	hash64 = (hash64 ^ *Address) * PRIME;
+	hash32 = (uint32_t)(hash64 ^ (hash64 >> 32));
+	return hash32 ^ (hash32 >> 16);
+}
+
+
+static void InitMemoryHash()
+{
+}
+
+static void FreeMemoryHash()
+{
+	struct MemoryDataStruct* p, * tmp;
+	HASH_ITER(memory, MemoryHash, p, tmp)
+	{
+		HASH_DELETE(memory, MemoryHash, p);
+		free(p);
+	}
+}
+
+static void UpdateMemoryData(UINT64* Location, UINT8 Offset, UINT64 WriteValue, UINT8 WriteSize)
+{
+	UINT64 OriginValue;
+	OriginValue = *Location;
+	switch (WriteSize)
+	{
+	case 1:	// 1个字节
+		Offset = Offset << 3;	// 从字节换算成位
+		OriginValue = (OriginValue & ~((UINT64)0xFF << Offset)) | ((WriteValue & (UINT64)0xFF) << Offset);
+		break;
+	case 2:	// 2个字节
+		Offset = Offset & 0xFE;	// 对齐到2字节边界
+		Offset = Offset << 3;	// 从字节换算成位
+		OriginValue = (OriginValue & ~((UINT64)0xFFFF << Offset)) | ((WriteValue & (UINT64)0xFFFF) << Offset);
+		break;
+	case 4:	// 4个字节
+		Offset = Offset & 0xFC;	// 对齐到4字节边界
+		Offset = Offset << 3;	// 从字节换算成位
+		OriginValue = (OriginValue & ~((UINT64)0xFFFFFFFF << Offset)) | ((WriteValue & (UINT64)0xFFFFFFFF) << Offset);
+		break;
+	case 8:	// 8个字节
+		OriginValue = WriteValue;
+		break;
+	}
+	*Location = OriginValue;
+}
+
+static void WriteMemoryHash(UINT64 Address, UINT64 WriteValue, UINT8 WriteSize)
+{
+	UINT64 AlignAddress;
+	UINT8 Offset;
+	struct MemoryDataStruct* s;
+
+	AlignAddress = Address & 0xFFFFFFFFFFFFFFF8;
+	Offset = Address & 0x7;
+
+	HASH_FIND(memory, MemoryHash, &AlignAddress, sizeof(AlignAddress), s);
+	if (s == NULL)
+	{
+		// 没有在MemoryData中命中
+		s = (struct MemoryDataStruct*)malloc(sizeof(struct MemoryDataStruct));
+		s->Address = AlignAddress;
+		s->Data = 0xDEADBEEFDEADC0DE;
+		HASH_ADD(memory, MemoryHash, Address, sizeof(AlignAddress), s);
+	}
+	UpdateMemoryData(&(s->Data), Offset, WriteValue, WriteSize);
+}
+
+static UINT64 ReadMemoryHash(UINT64 Address, UINT8 ReadSize)
+{
+	UINT64 AlignAddress;
+	UINT8 Offset;
+	struct MemoryDataStruct* s;
+	UINT64 OriginValue, ReadValue;
+
+	AlignAddress = Address & 0xFFFFFFFFFFFFFFF8;
+	Offset = Address & 0x7;
+
+	HASH_FIND(memory, MemoryHash, &AlignAddress, sizeof(AlignAddress), s);
+	if (s == NULL)
+	{
+		// 没有在MemoryData中命中，出错了！
+		if (VERBOSE_MSG)
+			printf("[%s] 试图从一个未初始化的内存读取数据Address=%016llX！\n", __func__, Address);
+		OriginValue = 0xDEADBEEFDEADC0DE;
+	}
+	else
+	{
+		OriginValue = s->Data;
+	}
+
+	/*
+	*  根据Offset和Size，对读出的数据进行修正，对齐到小端
+	*/
+	ReadValue = OriginValue;
+	switch (ReadSize)
+	{
+	case 1:	// 1个字节
+		Offset = Offset << 3;	// 从字节换算成位
+		ReadValue = (OriginValue >> Offset) & 0xFF;
+		break;
+	case 2:	// 2个字节
+		Offset = Offset & 0xFE;	// 对齐到2字节边界
+		Offset = Offset << 3;	// 从字节换算成位
+		ReadValue = (OriginValue >> Offset) & 0xFFFF;
+		break;
+	case 4:	// 4个字节
+		Offset = Offset & 0xFC;	// 对齐到4字节边界
+		Offset = Offset << 3;	// 从字节换算成位
+		ReadValue = (OriginValue >> Offset) & 0xFFFFFFFF;
+		break;
+	case 8:	// 8个字节
+		ReadValue = OriginValue;
+		break;
+
+	}
+	return ReadValue;
+}
+
+UINT64 ReadMemory(UINT64 Address)
+{
+	GlobalSimReadMemoryCounter++;
+	return ReadMemoryHash(Address, 8);
+}
+
+void WriteMemory(UINT64 Address, UINT64 WriteData)
+{
+	GlobalSimWriteMemoryCounter++;
+	WriteMemoryHash(Address, WriteData, 8);
+}
+
+static void MemoryTraceStat()
+{
+	UINT64 i;
+
+	GlobalMemoryInstCounter = 0;
+	GlobalMemoryReadCounter = 0;
+	GlobalMemoryWriteCounter = 0;
+	GlobalMemoryModifyCounter = 0;
+
+	for (i = 0; i < MemoryTraceCounter; i++)
+	{
+		if (MemoryTrace[i].Operation == 'I')
+			GlobalMemoryInstCounter++;
+		else if (MemoryTrace[i].Operation == 'L')
+			GlobalMemoryReadCounter++;
+		else if (MemoryTrace[i].Operation == 'S')
+			GlobalMemoryWriteCounter++;
+		else if (MemoryTrace[i].Operation == 'M')
+			GlobalMemoryModifyCounter++;
+	}
+}
+
+static int process_TRACE_line(char* linebuf, UINT64 lineno)
+{
+	int i;
+	int ret = 0;
+	UINT8 Operation;
+	UINT64 Address;
+	UINT8 Size;
+
+	UINT64 RandValue64;
+
+	// 删除行首、行尾空白回车等
+	Trim(linebuf);
+	int linelen = (int)strlen(linebuf);
+	// 跳过空行
+	if (linelen == 0)
+		return 0;
+	// 跳过超长的行
+	if (linelen >= 100)
+		return 0;
+	// 跳过注释行
+	if (linebuf[0] == '#' || linebuf[0] == '/' || linebuf[0] == '=' || linebuf[0] == '-')
+		return 0;
+	//printf("lineno=%llu\n", lineno);
+	char** pt;
+	int field_count;
+	pt = split_space(linebuf, &field_count);
+
+	if (field_count == 3 || field_count == 4)
+	{
+		// 格式： Operation Address,Size
+		Operation = pt[0][0];
+		if (field_count == 3)
+		{
+			Address = strtoull(pt[1], NULL, 16);
+			Size = atoi(pt[2]);
+		}
+		else
+		{
+			Address = strtoull(pt[2], NULL, 16);
+			Size = atoi(pt[3]);
+		}
+
+		if (Operation != 'I' && Operation != 'L' && Operation != 'S' && Operation != 'M')
+		{
+			if (VERBOSE_MSG)
+				printf("[%s] line %lld 操作类型错误，不是I、L、S、M！ %s\n", __func__, lineno, linebuf);
+			ret = -1;
+		}
+		else if (Size != 1 && Size != 2 && Size != 4 && Size != 8)
+		{
+			if (VERBOSE_MSG)
+				printf("[%s] line %lld 数据大小错误，不是1、2、4、8！ %s\n", __func__, lineno, linebuf);
+			ret = -1;
+		}
+		else
+		{
+			RandValue64 = GetRand64();
+
+			// 初始化阶段，需要将所有地址的数据，设置为随机值
+			WriteMemoryHash(Address, RandValue64, Size);
+
+			if (MemoryTraceCounter >= MemoryTraceCapacity)
+			{
+				if (VERBOSE_MSG)
+					printf("[%s] line %lld 扩展内存到%llu！\n", __func__, lineno, MemoryTraceCapacity + MEMORY_TRACE_CHUNK);
+				MemoryTrace = (struct MemoryTraceStruct*)realloc(MemoryTrace, (MemoryTraceCapacity + MEMORY_TRACE_CHUNK) * sizeof(struct MemoryTraceStruct));
+				if (MemoryTrace == NULL)
+				{
+					printf("[%s] line %lld 分配内存失败！\n", __func__, lineno);
+					ret = -1;
+				}
+				else
+					MemoryTraceCapacity += MEMORY_TRACE_CHUNK;
+			}
+
+			if (MemoryTrace)
+			{
+				MemoryTrace[MemoryTraceCounter].Operation = Operation;
+				MemoryTrace[MemoryTraceCounter].Address = Address;
+				MemoryTrace[MemoryTraceCounter].Size = Size;
+				MemoryTraceCounter++;
+
+				ret = 0;
+			}
+		}
+	}
+	else
+	{
+		printf("[%s] line %lld 格式错误！[fields=%d] %s\n", __func__, lineno, field_count, linebuf);
+		ret = -1;
+	}
+
+	for (i = 0; i < field_count; i++)
+		free(pt[i]);
+	free(pt);
+	return ret;
+}
+
+static int parse_TRACE_file(char* filename)
+{
+	UINT64 lineno;
+	int ret_parse_line = 0;
+	clock_t tick1, tick2;
+	cbsl_errors cbsl_ret = cbsl_error;
+	char linebuf[CHUNK];
+
+	tick1 = clock();
+	cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, filename);
+	if (ctx == NULL)
+	{
+		printf("[%s] 不能以读方式打开Trace文件 %s\n", __func__, filename);
+		return -1;
+	}
+
+	lineno = 0;
+	do
+	{
+		lineno++;
+		cbsl_ret = cbsl_readline(ctx, linebuf, sizeof(linebuf));
+		CBSL_ERROR_CHECK(cbsl_ret);	// 从文件中读取1行
+
+		ret_parse_line = process_TRACE_line(linebuf, lineno);		// 分析处理1行
+		if (ret_parse_line == 1 || cbsl_ret == cbsl_end)
+			break;
+
+		if (lineno % 10000 == 0)
+		{
+			printf("\33[?25l[%s] ====已处理%llu行====\r", __func__, lineno);	// 隐藏光标，显示进度
+		}
+	} while (1);
+
+	printf("\n\33[?25h");	// 显示光标
+	CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+	tick2 = clock();
+
+	MemoryTraceStat();
+	printf("[%s] +-----------------------------------------------------+\n", __func__);
+	printf("[%s] |  Memory Trace数量                 \t : %10llu    |\n", __func__, MemoryTraceCounter);
+	printf("[%s] |    Instruction操作数量            \t : %10llu    |\n", __func__, GlobalMemoryInstCounter);
+	printf("[%s] |    Data Load操作数量              \t : %10llu    |\n", __func__, GlobalMemoryReadCounter);
+	printf("[%s] |    Data Store操作数量             \t : %10llu    |\n", __func__, GlobalMemoryWriteCounter);
+	printf("[%s] |    Data Modify操作数量            \t : %10llu    |\n", __func__, GlobalMemoryModifyCounter);
+	printf("[%s] | 时间耗费（ms）                    \t : %10.0f    |\n", __func__, ((float)(tick2 - tick1) / CLOCKS_PER_SEC) * 1000.0);
+	printf("[%s] +-----------------------------------------------------+\n", __func__);
+
+	if (MemoryTraceCounter == 0)
+		return -1;
+	return 0;
+}
+
+int SimTrace()
+{
+	int ret = 0;
+	UINT32 i;
+	UINT8 Operation;
+	UINT64 Address;
+	UINT8 Size;
+
+	UINT64 RandValue64;
+	UINT64 DataFromCache;
+	UINT64 DataFromMemory;
+	UINT8 MissFlag;
+
+	clock_t tick1, tick2;
+	tick1 = clock();
+
+	GlobalMemoryInstCounter = 0;
+	GlobalMemoryReadCounter = 0;
+	GlobalMemoryWriteCounter = 0;
+	GlobalMemoryModifyCounter = 0;
+
+	GlobalCacheInstHitCounter = 0;
+	GlobalCacheReadHitCounter = 0;
+	GlobalCacheWriteHitCounter = 0;
+	GlobalCacheModifyHitCounter = 0;
+
+	GlobalSimReadMemoryCounter = 0;
+	GlobalSimWriteMemoryCounter = 0;
+
+	for (i = 0; i < MemoryTraceCounter; i++)
+	{
+		Operation = MemoryTrace[i].Operation;
+		Address = MemoryTrace[i].Address;
+		Size = MemoryTrace[i].Size;
+
+		if (Operation == 'L' || Operation == 'S' || Operation == 'M')
+		{
+			RandValue64 = GetRand64();
+			MissFlag = AccessDataCache(Address, Operation, Size, RandValue64, &DataFromCache);
+			if (Operation == 'S' || Operation == 'M')
+			{
+				WriteMemoryHash(Address, RandValue64, Size);
+				if (Operation == 'S')
+				{
+					GlobalMemoryWriteCounter++;
+					if (MissFlag == 'H')
+					{
+						GlobalCacheWriteHitCounter++;
+					}
+				}
+				else if (Operation == 'M')
+				{
+					GlobalMemoryModifyCounter++;
+					if (MissFlag == 'H')
+					{
+						GlobalCacheModifyHitCounter++;
+					}
+				}
+			}
+			else if (Operation == 'L')
+			{
+				GlobalMemoryReadCounter++;
+				if (MissFlag == 'H')
+				{
+					DataFromMemory = ReadMemoryHash(Address, Size);
+					if (DataFromMemory == DataFromCache)
+						GlobalCacheReadHitCounter++;
+					else
+					{
+						printf("[%s] 关键错误！数据Cache读错误，内存地址=%016llX 内存数据=%016llX Cache读数据=%016llX 大小%d字节\n", __func__, Address, DataFromMemory, DataFromCache, Size);
+						ret = -1;
+						break;
+					}
+				}
+			}
+		}
+		else if (Operation == 'I')
+		{
+			MissFlag = AccessInstCache(Address, Operation, Size, &DataFromCache);
+			GlobalMemoryInstCounter++;
+			if (MissFlag == 'H')
+			{
+				DataFromMemory = ReadMemoryHash(Address, Size);
+				if (DataFromMemory == DataFromCache)
+					GlobalCacheInstHitCounter++;
+				else
+				{
+					printf("[%s] 关键错误！指令Cache读错误，内存地址=%016llX 内存数据=%016llX Cache读数据=%016llX 大小%d字节\n", __func__, Address, DataFromMemory, DataFromCache, Size);
+					ret = -1;
+					break;
+				}
+			}
+		}
+	}
+	tick2 = clock();
+	printf("[%s] +-----------------------------------------------------+\n", __func__);
+	printf("[%s] |  Memory Trace数量                \t : %10llu    |\n", __func__, MemoryTraceCounter);
+	printf("[%s] |    Instruction操作数量           \t : %10llu    |\n", __func__, GlobalMemoryInstCounter);
+	printf("[%s] |    Data Load操作数量             \t : %10llu    |\n", __func__, GlobalMemoryReadCounter);
+	printf("[%s] |    Data Store操作数量            \t : %10llu    |\n", __func__, GlobalMemoryWriteCounter);
+	printf("[%s] |    Data Modify操作数量           \t : %10llu    |\n", __func__, GlobalMemoryModifyCounter);
+	printf("[%s] |    Instruction操作Cache命中数量  \t : %10llu    |\n", __func__, GlobalCacheInstHitCounter);
+	printf("[%s] |    Data Load操作Cache命中数量    \t : %10llu    |\n", __func__, GlobalCacheReadHitCounter);
+	printf("[%s] |    Data Store操作Cache命中数量   \t : %10llu    |\n", __func__, GlobalCacheWriteHitCounter);
+	printf("[%s] |    Data Modify操作Cache命中数量  \t : %10llu    |\n", __func__, GlobalCacheModifyHitCounter);
+	printf("[%s] |  Cache访存数量                   \t : %10llu    |\n", __func__, GlobalSimReadMemoryCounter + GlobalSimWriteMemoryCounter);
+	printf("[%s] |    Cache读存储器数量             \t : %10llu    |\n", __func__, GlobalSimReadMemoryCounter);
+	printf("[%s] |    Cache写存储器数量             \t : %10llu    |\n", __func__, GlobalSimWriteMemoryCounter);
+	printf("[%s] |  Data Cache命中率                \t : %9.2f%%    |\n", __func__, (double)((GlobalCacheReadHitCounter + GlobalCacheWriteHitCounter + GlobalCacheModifyHitCounter) * 100) / (double)(GlobalMemoryReadCounter + GlobalMemoryWriteCounter + GlobalMemoryModifyCounter));
+	printf("[%s] |  Inst Cache命中率                \t : %9.2f%%    |\n", __func__, (GlobalMemoryInstCounter == 0) ? 0 : (double)(GlobalCacheInstHitCounter * 100) / (double)GlobalMemoryInstCounter);
+	printf("[%s] |  时间耗费（ms）                  \t : %10.0f    |\n", __func__, ((float)(tick2 - tick1) / CLOCKS_PER_SEC) * 1000.0);
+	printf("[%s] +-----------------------------------------------------+\n", __func__);
+	return ret;
+}
+void DisplayHelp(char* argv[])
+{
+	printf("[%s] 请在Cache.c中，实现你自己的Cache，然后编译项目，执行。\n", __func__);
+	printf("[%s] 从文本格式压缩文件中读取Trace:\t%s <trace>.zst\n", __func__, argv[0]);
+	printf("[%s]     例如: %s ./traces/dave.trace.zst\n", __func__, argv[0]);
+	printf("[%s] 将文本格式的Trace转换到bin格式:\t%s -w <trace>.zst\n", __func__, argv[0]);
+	printf("[%s] 从bin格式文件中读取Trace:\t\t%s -r <trace>.bin.zst\n", __func__, argv[0]);
+	printf("[%s] 提示：从bin中读取Trace速度要远远快于从文本格式中读取。\n", __func__);
+}
+
+int main(int argc, char* argv[])
+{
+	int ret_val = -1;
+	UINT8 ReadBinFileFlag, WriteBinFileFlag, ReadTxtFileFlag;
+	char* pfilename;
+	char pfilename_bin[CHUNK];
+	clock_t tick1, tick2;
+	UINT64 i;
+
+	printf("[%s] Cache模拟器框架 v3.0 by mars, 2022\n", __func__);
+
+	pfilename = NULL;
+	ReadBinFileFlag = 0;
+	WriteBinFileFlag = 0;
+	ReadTxtFileFlag = 1;
+	/* check arguments */
+	while (1) {
+		int c = getopt(argc, argv, "-hrw");
+		if (c == -1) break;
+
+		switch (c) {
+		case 'h': DisplayHelp(argv); return 1;
+		case 'r': ReadBinFileFlag = 1; ReadTxtFileFlag = 0; break;
+		case 'w': WriteBinFileFlag = 1; ReadTxtFileFlag = 0; break;
+		case 1: pfilename = optarg; break;
+		}
+	}
+
+	if ((ReadBinFileFlag == 1 || WriteBinFileFlag == 1 || ReadTxtFileFlag == 1) && pfilename == NULL)
+	{
+		DisplayHelp(argv);
+		return 1;
+	}
+
+	InitMemoryHash();
+	printf("[%s] 初始化存储器，读入Trace文件[%s]，请稍后...\n", __func__, pfilename);
+
+	if (ReadTxtFileFlag || WriteBinFileFlag)
+	{
+		MemoryTrace = (struct MemoryTraceStruct*)malloc(MEMORY_TRACE_CHUNK * sizeof(struct MemoryTraceStruct));
+		MemoryTraceCounter = 0;
+		MemoryTraceCapacity = MEMORY_TRACE_CHUNK;
+		ret_val = parse_TRACE_file(pfilename);
+		if (ret_val != 0)
+		{
+			FreeMemoryHash();
+			if (MemoryTrace)
+				free(MemoryTrace);
+			printf("[%s] 解压缩文件失败 %s\n", __func__, argv[1]);
+			return -1;
+		}
+
+		if (WriteBinFileFlag)
+		{
+			// 将内存中的MemoryTrace保存到bin文件中
+			int filenamelen = (int)strlen(pfilename);
+			memcpy(pfilename_bin, pfilename, filenamelen);
+			pfilename_bin[filenamelen] = '\0';
+			if (filenamelen > 5)
+			{
+				if ((pfilename_bin[filenamelen - 4] == '.' && pfilename_bin[filenamelen - 3] == 'z' && pfilename_bin[filenamelen - 2] == 's' && pfilename_bin[filenamelen - 1] == 't') ||
+					(pfilename_bin[filenamelen - 4] == '.' && pfilename_bin[filenamelen - 3] == 'Z' && pfilename_bin[filenamelen - 2] == 'S' && pfilename_bin[filenamelen - 1] == 'T'))
+				{
+					pfilename_bin[filenamelen - 3] = 'b';
+					pfilename_bin[filenamelen - 2] = 'i';
+					pfilename_bin[filenamelen - 1] = 'n';
+					pfilename_bin[filenamelen - 0] = '.';
+					pfilename_bin[filenamelen + 1] = 'z';
+					pfilename_bin[filenamelen + 2] = 's';
+					pfilename_bin[filenamelen + 3] = 't';
+					pfilename_bin[filenamelen + 4] = '\0';
+
+					cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, pfilename_bin);
+					if (ctx == NULL)
+					{
+						printf("[%s] 不能以写方式打开文件 %s\n", __func__, pfilename_bin);
+						ret_val = -1;
+					}
+					else
+					{
+						CBSL_ERROR_CHECK(cbsl_write(ctx, &MemoryTraceCounter, sizeof(MemoryTraceCounter)));
+						CBSL_ERROR_CHECK(cbsl_write(ctx, MemoryTrace, MemoryTraceCounter * sizeof(struct MemoryTraceStruct)));
+						CBSL_ERROR_CHECK(cbsl_close(ctx));
+						printf("[%s] 已经将Trace保存到文件中 %s\n", __func__, pfilename_bin);
+						ret_val = 0;
+					}
+				}
+				else
+				{
+					printf("[%s] 文件扩展名不是.zst或者.ZST！不能转换！\n", __func__);
+					ret_val = -1;
+				}
+			}
+			else
+			{
+				printf("[%s] 文件名长度不足5字符！不能转换！\n", __func__);
+				ret_val = -1;
+			}
+
+			FreeMemoryHash();
+			if (MemoryTrace)
+				free(MemoryTrace);
+			return ret_val;
+		}
+	}
+	else if (ReadBinFileFlag)
+	{
+		cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, pfilename);
+		if (ctx == NULL)
+		{
+			printf("[%s] 不能以读方式打开文件 %s\n", __func__, pfilename);
+			ret_val = -1;
+		}
+		else
+		{
+			tick1 = clock();
+			CBSL_ERROR_CHECK(cbsl_read(ctx, &MemoryTraceCounter, sizeof(MemoryTraceCounter)));
+			{
+				MemoryTrace = (struct MemoryTraceStruct*)malloc(MemoryTraceCounter * sizeof(struct MemoryTraceStruct));
+				MemoryTraceCapacity = MemoryTraceCounter;
+
+				CBSL_ERROR_CHECK(cbsl_read(ctx, MemoryTrace, MemoryTraceCounter * sizeof(struct MemoryTraceStruct)));
+				CBSL_ERROR_CHECK(cbsl_close(ctx));
+				{
+					// 初始化阶段，需要将所有地址的数据，设置为随机值
+					UINT64 RandValue64;
+					for (i = 0; i < MemoryTraceCounter; i++)
+					{
+						RandValue64 = GetRand64();
+						WriteMemoryHash(MemoryTrace[i].Address, RandValue64, MemoryTrace[i].Size);
+					}
+
+					MemoryTraceStat();
+					tick2 = clock();
+					printf("[%s] +-----------------------------------------------------+\n", __func__);
+					printf("[%s] |  Memory Trace数量                 \t : %10llu    |\n", __func__, MemoryTraceCounter);
+					printf("[%s] |    Instruction操作数量            \t : %10llu    |\n", __func__, GlobalMemoryInstCounter);
+					printf("[%s] |    Data Load操作数量              \t : %10llu    |\n", __func__, GlobalMemoryReadCounter);
+					printf("[%s] |    Data Store操作数量             \t : %10llu    |\n", __func__, GlobalMemoryWriteCounter);
+					printf("[%s] |    Data Modify操作数量            \t : %10llu    |\n", __func__, GlobalMemoryModifyCounter);
+					printf("[%s] | 时间耗费（ms）                    \t : %10.0f    |\n", __func__, ((float)(tick2 - tick1) / CLOCKS_PER_SEC) * 1000.0);
+					printf("[%s] +-----------------------------------------------------+\n", __func__);
+					printf("[%s] 已经将Trace从文件中读取 %s\n", __func__, pfilename);
+					ret_val = 0;
+				}
+			}
+		}
+
+		if (ret_val == -1)
+		{
+			if (MemoryTrace)
+				free(MemoryTrace);
+			FreeMemoryHash();
+			return ret_val;
+		}
+	}
+	printf("[%s] 处理Trace文件完毕\n", __func__);
+	InitDataCache();
+	InitInstCache();
+	printf("[%s] 开始Cache模拟，请稍后...\n", __func__);
+	ret_val = SimTrace();
+	if (ret_val != 0)
+	{
+		FreeMemoryHash();
+		if (MemoryTrace)
+			free(MemoryTrace);
+		printf("[%s] Cache模拟失败\n", __func__);
+		return -1;
+	}
+	else
+		printf("[%s] Cache模拟成功完成\n", __func__);
+	if (MemoryTrace)
+		free(MemoryTrace);
+	FreeMemoryHash();
+	return 0;
+}
--- a/cachelab/Makefile
+++ b/cachelab/Makefile
@@ -0,0 +1,29 @@
+# Copyright 2022 by mars
+
+# Description: Makefile for building a Cache Simulator.
+#
+
+
+LDFLAGS += 
+
+LDLIBS   += -lzstd
+
+
+CPPFLAGS := -Ofast -Wall -Wextra -Winit-self \
+           -Wno-unused-function -fPIC -W -Wcast-qual -Wpointer-arith -Icbsl/include
+#CPPFLAGS := -O3 -Wall -Wextra -Winline -Winit-self -Wno-sequence-point\
+           -Wno-unused-function -Wno-inline -fPIC -W -Wcast-qual -Wpointer-arith -Icbsl/include
+
+#CPPFLAGS := -g
+PROGRAMS := Cache
+
+objects = Cache.o CacheHelper.o getopt.o cbsl/src/buffer.o cbsl/src/file.o cbsl/src/flush.o cbsl/src/read.o cbsl/src/record.o cbsl/src/utils.o cbsl/src/write.o
+
+all: $(PROGRAMS)
+
+Cache : $(objects)
+	icpx $(CPPFLAGS) $(LDFLAGS) -o $@ $^ $(LDLIBS)
+	rm -f $(objects)
+
+clean:
+	rm -f $(PROGRAMS) $(objects)
--- a/cachelab/MyCache/MyCache.sln
+++ b/cachelab/MyCache/MyCache.sln
@@ -0,0 +1,31 @@
+
+Microsoft Visual Studio Solution File, Format Version 12.00
+# Visual Studio Version 16
+VisualStudioVersion = 16.0.31829.152
+MinimumVisualStudioVersion = 10.0.40219.1
+Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "MyCache", "MyCache.vcxproj", "{A5677060-D4C9-432A-A29F-858971B64066}"
+EndProject
+Global
+	GlobalSection(SolutionConfigurationPlatforms) = preSolution
+		Debug|x64 = Debug|x64
+		Debug|x86 = Debug|x86
+		Release|x64 = Release|x64
+		Release|x86 = Release|x86
+	EndGlobalSection
+	GlobalSection(ProjectConfigurationPlatforms) = postSolution
+		{A5677060-D4C9-432A-A29F-858971B64066}.Debug|x64.ActiveCfg = Debug|x64
+		{A5677060-D4C9-432A-A29F-858971B64066}.Debug|x64.Build.0 = Debug|x64
+		{A5677060-D4C9-432A-A29F-858971B64066}.Debug|x86.ActiveCfg = Debug|Win32
+		{A5677060-D4C9-432A-A29F-858971B64066}.Debug|x86.Build.0 = Debug|Win32
+		{A5677060-D4C9-432A-A29F-858971B64066}.Release|x64.ActiveCfg = Release|x64
+		{A5677060-D4C9-432A-A29F-858971B64066}.Release|x64.Build.0 = Release|x64
+		{A5677060-D4C9-432A-A29F-858971B64066}.Release|x86.ActiveCfg = Release|Win32
+		{A5677060-D4C9-432A-A29F-858971B64066}.Release|x86.Build.0 = Release|Win32
+	EndGlobalSection
+	GlobalSection(SolutionProperties) = preSolution
+		HideSolutionNode = FALSE
+	EndGlobalSection
+	GlobalSection(ExtensibilityGlobals) = postSolution
+		SolutionGuid = {D4625C4E-654D-406B-A238-D6F64DAF03BB}
+	EndGlobalSection
+EndGlobal
--- a/cachelab/MyCache/MyCache.vcxproj
+++ b/cachelab/MyCache/MyCache.vcxproj
@@ -0,0 +1,158 @@
+<?xml version="1.0" encoding="utf-8"?>
+<Project DefaultTargets="Build" xmlns="http://schemas.microsoft.com/developer/msbuild/2003">
+  <ItemGroup Label="ProjectConfigurations">
+    <ProjectConfiguration Include="Debug|Win32">
+      <Configuration>Debug</Configuration>
+      <Platform>Win32</Platform>
+    </ProjectConfiguration>
+    <ProjectConfiguration Include="Release|Win32">
+      <Configuration>Release</Configuration>
+      <Platform>Win32</Platform>
+    </ProjectConfiguration>
+    <ProjectConfiguration Include="Debug|x64">
+      <Configuration>Debug</Configuration>
+      <Platform>x64</Platform>
+    </ProjectConfiguration>
+    <ProjectConfiguration Include="Release|x64">
+      <Configuration>Release</Configuration>
+      <Platform>x64</Platform>
+    </ProjectConfiguration>
+  </ItemGroup>
+  <PropertyGroup Label="Globals">
+    <VCProjectVersion>16.0</VCProjectVersion>
+    <Keyword>Win32Proj</Keyword>
+    <ProjectGuid>{a5677060-d4c9-432a-a29f-858971b64066}</ProjectGuid>
+    <RootNamespace>MyCache</RootNamespace>
+    <WindowsTargetPlatformVersion>10.0</WindowsTargetPlatformVersion>
+  </PropertyGroup>
+  <Import Project="$(VCTargetsPath)\Microsoft.Cpp.Default.props" />
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>true</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|Win32'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>false</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <WholeProgramOptimization>true</WholeProgramOptimization>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|x64'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>true</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|x64'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>false</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <WholeProgramOptimization>true</WholeProgramOptimization>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <Import Project="$(VCTargetsPath)\Microsoft.Cpp.props" />
+  <ImportGroup Label="ExtensionSettings">
+  </ImportGroup>
+  <ImportGroup Label="Shared">
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Release|Win32'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Debug|x64'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Release|x64'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <PropertyGroup Label="UserMacros" />
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'">
+    <LinkIncremental>true</LinkIncremental>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|Win32'">
+    <LinkIncremental>false</LinkIncremental>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|x64'">
+    <LinkIncremental>true</LinkIncremental>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|x64'">
+    <LinkIncremental>false</LinkIncremental>
+  </PropertyGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>WIN32;_DEBUG;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Release|Win32'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <FunctionLevelLinking>true</FunctionLevelLinking>
+      <IntrinsicFunctions>true</IntrinsicFunctions>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>WIN32;NDEBUG;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <EnableCOMDATFolding>true</EnableCOMDATFolding>
+      <OptimizeReferences>true</OptimizeReferences>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Debug|x64'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>_DEBUG;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+      <AdditionalIncludeDirectories>..\zstd;..\cbsl\include;%(AdditionalIncludeDirectories)</AdditionalIncludeDirectories>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Release|x64'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <FunctionLevelLinking>true</FunctionLevelLinking>
+      <IntrinsicFunctions>true</IntrinsicFunctions>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>NDEBUG;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+      <AdditionalIncludeDirectories>..\zstd;..\cbsl\include;%(AdditionalIncludeDirectories)</AdditionalIncludeDirectories>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <EnableCOMDATFolding>true</EnableCOMDATFolding>
+      <OptimizeReferences>true</OptimizeReferences>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemGroup>
+    <ClCompile Include="..\Cache.c" />
+    <ClCompile Include="..\CacheHelper.c" />
+    <ClCompile Include="..\cbsl\src\buffer.c" />
+    <ClCompile Include="..\cbsl\src\file.c" />
+    <ClCompile Include="..\cbsl\src\flush.c" />
+    <ClCompile Include="..\cbsl\src\read.c" />
+    <ClCompile Include="..\cbsl\src\record.c" />
+    <ClCompile Include="..\cbsl\src\utils.c" />
+    <ClCompile Include="..\cbsl\src\write.c" />
+    <ClCompile Include="..\getopt.c" />
+  </ItemGroup>
+  <Import Project="$(VCTargetsPath)\Microsoft.Cpp.targets" />
+  <ImportGroup Label="ExtensionTargets">
+  </ImportGroup>
+</Project>
--- a/cachelab/Readme.txt
+++ b/cachelab/Readme.txt
@@ -0,0 +1,26 @@
+注意！你只能修改Cache.c文件，其他文件请勿修改！
+
+
+Linux:
+  1. make
+  2. ./Cache traces/long.trace.zst
+
+提醒:Linux下需要安装libzstd-dev软件包，例如apt install libzstd-dev zstd
+
+Windows VS 2019:
+  1. 进入MyCache目录，打开MyCache.sln
+  2. 编译即可生成可执行文件
+  3. 启动命令行窗口， 运行.\MyCache.exe traces/long.trace.zst
+
+
+提示：在traces目录下，有多个trace可以跑。
+
+
+自行生成trace文件：
+1、安装valgrind，Ubuntu下，可以使用apt install valgrind完成；
+2、运行valgrind生成某个应用的trace文件。比如，为了生成ls命令运行时的trace，可以输入下列命令：
+valgrind --tool=lackey -v --trace-mem=yes --log-file=ls.trace ls -l
+3、将生成的trace文件打包为zst压缩格式，例如
+   zstd ls.trace -o ls.trace.zst
+4、使用Cache跑这个trace：
+   ./Cache ./ls.trace.zst
--- a/cachelab/cbsl/CMakeLists.txt
+++ b/cachelab/cbsl/CMakeLists.txt
@@ -0,0 +1,125 @@
+#
+# Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+cmake_minimum_required(VERSION 3.3)
+
+enable_testing()
+
+set(CMAKE_C_STANDARD 99)
+
+project(cbsl
+        VERSION   2019.5.0
+        LANGUAGES C Fortran
+        )
+
+
+if (CMAKE_BUILD_TYPE)
+  string(TOUPPER "${CMAKE_BUILD_TYPE}" uppercase_CMAKE_BUILD_TYPE)
+  if (NOT uppercase_CMAKE_BUILD_TYPE MATCHES "^(DEBUG|RELEASE|RELWITHDEBINFO|MINSIZEREL)$")
+    message(FATAL_ERROR "Invalid value for CMAKE_BUILD_TYPE: ${CMAKE_BUILD_TYPE}")
+  endif()
+
+  if (${uppercase_CMAKE_BUILD_TYPE} MATCHES "DEBUG")
+    set(CBSL_DEBUG 1)
+  endif ()
+endif ()
+
+
+if (INSTALL_ZSTD)
+  message(STATUS "Enable installation Zstandard library version 1.4.0")
+  include(ExternalProject)
+  ExternalProject_Add(zstd
+    GIT_REPOSITORY   "https://github.com/facebook/zstd.git"
+    GIT_TAG          "v1.4.0"
+    PREFIX           "${CMAKE_BINARY_DIR}/zstd"
+    SOURCE_SUBDIR    "build/cmake"
+    CMAKE_ARGS       -D CMAKE_BUILD_TYPE=${CMAKE_BUILD_TYPE} -D CMAKE_INSTALL_PREFIX=${CMAKE_INSTALL_PREFIX}
+    STEP_TARGETS     install
+    EXCLUDE_FROM_ALL on
+  )
+  include_directories(${CMAKE_INSTALL_PREFIX}/include)
+  link_directories(${CMAKE_INSTALL_PREFIX}/lib)
+endif ()
+find_library(ZSTD_LIB NAMES "zstd")
+
+
+include(CheckCCompilerFlag)
+CHECK_C_COMPILER_FLAG("-Wall"            C_HAS_WALL)
+CHECK_C_COMPILER_FLAG("-Wshadow"         C_HAS_WSHADOW)
+CHECK_C_COMPILER_FLAG("-Werror"          C_HAS_WERROR)
+CHECK_C_COMPILER_FLAG("-pedantic-errors" C_HAS_PEDANTIC_ERRORS)
+
+set(ADD_C_EXTRA_FLAGS)
+
+if (C_HAS_WALL)
+  set(ADD_C_EXTRA_FLAGS "${ADD_C_EXTRA_FLAGS} -Wall")
+endif ()
+
+if (C_HAS_WSHADOW)
+  set(ADD_C_EXTRA_FLAGS "${ADD_C_EXTRA_FLAGS} -Wshadow")
+endif ()
+
+if (C_HAS_WERROR)
+  set(ADD_C_EXTRA_FLAGS "${ADD_C_EXTRA_FLAGS} -Werror")
+endif ()
+
+if (C_HAS_PEDANTIC_ERRORS)
+  set(ADD_C_EXTRA_FLAGS "${ADD_C_EXTRA_FLAGS} -pedantic-errors")
+endif ()
+
+set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${ADD_C_EXTRA_FLAGS}")
+
+
+include(CheckFortranCompilerFlag)
+CHECK_Fortran_COMPILER_FLAG("-Wall -Wextra"    Fortran_HAS_WALL_EXTRA)
+CHECK_Fortran_COMPILER_FLAG("-Wshadow"         Fortran_HAS_WERROR)
+CHECK_Fortran_COMPILER_FLAG("-pedantic-errors" Fortran_HAS_PEDANTIC_ERRORS)
+
+set(ADD_Fortran_EXTRA_FLAGS)
+
+if (Fortran_HAS_WALL_EXTRA)
+  set(ADD_Fortran_EXTRA_FLAGS "${ADD_Fortran_EXTRA_FLAGS} -Wall -Wextra")
+endif ()
+
+if (Fortran_HAS_WERROR)
+  set(ADD_Fortran_EXTRA_FLAGS "${ADD_Fortran_EXTRA_FLAGS} -Werror")
+endif ()
+
+if (Fortran_HAS_PEDANTIC_ERRORS)
+  set(ADD_Fortran_EXTRA_FLAGS "${ADD_Fortran_EXTRA_FLAGS} -pedantic-errors")
+endif ()
+
+set(CMAKE_Fortran_FLAGS "${CMAKE_Fortran_FLAGS} ${ADD_Fortran_EXTRA_FLAGS}")
+
+
+include_directories(${PROJECT_SOURCE_DIR}/include)
+include_directories(${PROJECT_BINARY_DIR}/include)
+set(CMAKE_Fortran_MODULE_DIRECTORY ${PROJECT_BINARY_DIR}/include)
+
+
+set(CBSL_LIB  "cbsl")
+set(CBSL_FLIB "${CBSL_LIB}f")
+
+add_subdirectory(include)
+add_subdirectory(src)
+add_subdirectory(examples)
+add_subdirectory(tests)
+add_subdirectory(benchmarks)
+
+if (INSTALL_ZSTD)
+  # install zstd before building the library
+  add_dependencies(${CBSL_FLIB} ${CBSL_LIB})
+  add_dependencies(${CBSL_LIB}  zstd-install)
+endif ()
--- a/cachelab/cbsl/LICENSE
+++ b/cachelab/cbsl/LICENSE
@@ -0,0 +1,202 @@
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
--- a/cachelab/cbsl/README.md
+++ b/cachelab/cbsl/README.md
@@ -0,0 +1,93 @@
+# CBSL: Compressed Binary Serialization Library
+
+## What's this?
+
+The library provides the binary serialization with the compression by [Zstandard](https://facebook.github.io/zstd/).
+A motivation of the library is to implement the data-compressed checkpoint/restart, which is well-known technique to recover computer failures in high-performance computing.
+This library aims to simple and lightweight access for users.
+
+The library support C99 or later, and Fortran 2008 or later: perhaps we use the features are all supported by major compilers.
+
+## How to build and test
+
+The library uses [CMake](https://cmake.org/) version 3.3.x or later.
+
+    $ cmake --version
+    cmake version 3.14.3
+ 
+    CMake suite maintained and supported by Kitware (kitware.com/cmake).
+    $ mkdir build && cd build
+    $ cmake -D CMAKE_BUILD_TYPE=Release -D CMAKE_INSTALL_PREFIX=/install/path ..
+    $ make
+    $ make test
+    $ make install
+
+## Do you need help to install `zstd` package?
+
+We can build and install `zstd` automatically in the build process.
+Please pass `-D INSTALL_ZSTD=on` to cmake, we will install `zstd` package where `CMAKE_INSTALL_PREFIX` directory before building the library.
+
+    $ cmake -D CMAKE_BUILD_TYPE=Release -D CMAKE_INSTALL_PREFIX=/install/path -D INSTALL_ZSTD=on ..
+    $ make
+    $ make test
+    $ make install
+
+## Test environments
+
+1. CMake version 3.14.3
+2. GCC version 4.8.5
+3. Zstandard version 1.4.0
+4. CentOS Linux release 7.5.1804 (Core)
+
+## Benchmark
+
+We provide the library performance benchmark with best and worst case.
+Please be reminded that **the benchmark results not indicate the performance of Zstandard**, these measure the overhead (use cost) of this library.
+
+1. Best case : all data is zero filled (A compression ratio achieves up to 99%)
+2. Worst case : data is generated by rand() (A compression ratio is lower than 1%)
+
+`benchmark` target executes the benchmarks.
+
+    ...
+    $ make benchmark
+    min data size = 262144.00 [B]
+    max data size = 134217728.00 [B]
+    data is zero filled (maximum compression)
+    <write data [Byte]> <time [seconds]> <speed [MiB/sec]>
+    262144    0.002397    109.360615
+    524288    0.002887    181.572393
+    1048576    0.003440    304.827177
+    ...
+
+## Use `zstd` command
+
+A compressed file by the library can be decompressed by `zstd` command.
+
+## License
+
+    Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+  
+    Licensed under the Apache License, Version 2.0 (the "License");
+    you may not use this file except in compliance with the License.
+    You may obtain a copy of the License at
+  
+        http://www.apache.org/licenses/LICENSE-2.0
+  
+    Unless required by applicable law or agreed to in writing, software
+    distributed under the License is distributed on an "AS IS" BASIS,
+    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+    See the License for the specific language governing permissions and
+    limitations under the License.
+
+## Future work
+
+1. API error code
+2. Refectoring tests
+
+## NOTE
+
+### Unsupported binary compatibility
+
+The library does not support the binary compatibility and endianness conversion, which is required on the communication across machine.
+If you want it, please consider using other serialization libraries such as [MessagePack](https://msgpack.org/).
--- a/cachelab/cbsl/benchmarks/CMakeLists.txt
+++ b/cachelab/cbsl/benchmarks/CMakeLists.txt
@@ -0,0 +1,46 @@
+#
+# Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+include(CheckLibraryExists)
+CHECK_LIBRARY_EXISTS(rt clock_gettime "time.h" HAVE_CLOCK_GETTIME)
+
+if (HAVE_CLOCK_GETTIME)
+  link_libraries(rt)
+else ()
+  include(CheckFunctionExists)
+  CHECK_FUNCTION_EXISTS(gettimeofday HAVE_GETTIMEOFDAY)
+  if (not HAVE_GETTIMEOFDAY)
+    message(WARNING "Benchmark program uses low resolution timer...")
+  endif ()
+endif ()
+
+configure_file(${CMAKE_CURRENT_SOURCE_DIR}/config.h.in ${CMAKE_CURRENT_BINARY_DIR}/config.h)
+
+link_libraries(${CBSL_LIB} ${ZSTD_LIB} m)
+include_directories(${CMAKE_CURRENT_BINARY_DIR})
+
+
+add_executable(serialize   serialize.c)
+add_executable(deserialize deserialize.c)
+
+add_custom_target(benchmark_serialize_bestcase   ./serialize   18 27 -f DEPENDS serialize)
+add_custom_target(benchmark_deserialize_bestcase ./deserialize 18 27 -f DEPENDS deserialize benchmark_serialize_bestcase)
+add_custom_target(benchmark_fast DEPENDS benchmark_serialize_bestcase benchmark_deserialize_bestcase)
+
+add_custom_target(benchmark_serialize_worstcase   ./serialize   18 27 -r DEPENDS serialize)
+add_custom_target(benchmark_deserialize_worstcase ./deserialize 18 27 -r DEPENDS deserialize benchmark_serialize_worstcase)
+add_custom_target(benchmark_slow DEPENDS benchmark_serialize_worstcase benchmark_deserialize_worstcase)
+
+add_custom_target(benchmark DEPENDS benchmark_fast benchmark_slow)
--- a/cachelab/cbsl/benchmarks/config.h.in
+++ b/cachelab/cbsl/benchmarks/config.h.in
@@ -0,0 +1,22 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#ifndef CBSL_BENCHMARK_CONFIG_INCLUDED
+#define CBSL_BENCHMARK_CONFIG_INCLUDED
+
+#cmakedefine01 HAVE_CLOCK_GETTIME
+#cmakedefine01 HAVE_GETTIMEOFDAY
+
+#endif /* CBSL_BENCHMARK_CONFIG_INCLUDED */
--- a/cachelab/cbsl/benchmarks/deserialize.c
+++ b/cachelab/cbsl/benchmarks/deserialize.c
@@ -0,0 +1,99 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#ifdef HAVE_GETTIMEOFDAY
+#include <sys/time.h>
+#endif
+#include <math.h>
+#include <cbsl.h>
+
+#include "config.h"
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void deserialize_bench(double ds);
+extern double seconds();
+
+int main(int argc, char** argv)
+{
+  if (argc <= 2)
+    exit(1);
+
+  int max_data_size_exp2, min_data_size_exp2;
+  sscanf(argv[1], "%d", &min_data_size_exp2);
+  sscanf(argv[2], "%d", &max_data_size_exp2);
+  printf("min data size = %.2lf [B]\n", pow(2,min_data_size_exp2));
+  printf("max data size = %.2lf [B]\n", pow(2,max_data_size_exp2));
+
+  srand((unsigned int)(time(NULL)));
+
+  printf("<read data [Byte]> <time [seconds]> <speed [MiB/sec]>\n");
+
+  for (int i = min_data_size_exp2; i <= max_data_size_exp2; ++i)
+  {
+    deserialize_bench(pow(2,i));
+  }
+
+  return 0;
+}
+
+void deserialize_bench(double ds)
+{
+  const uint64_t data_size = (uint64_t)(ds);
+
+  char cname[128];
+  sprintf(cname, "serialize_%lu.zst", data_size);
+
+  byte_t* a = (byte_t*)(malloc(data_size));
+
+  cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+
+  const double beg = seconds();
+  {
+    CBSL_ERROR_CHECK(cbsl_read(ctx, a, data_size));
+  }
+  const double end = seconds();
+  const double rt  = end - beg;
+
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+  printf("%lu    %lf    %lf\n", data_size, rt, (data_size/rt)/1.0e6);
+
+  free(a);
+}
+
+double seconds() {
+#if defined(HAVE_CLOCK_GETTIME)
+  struct timespec ts;
+  clock_gettime(CLOCK_REALTIME, &ts);
+  return ts.tv_sec + (ts.tv_nsec / 1.0e9);
+#elif defined(HAVE_GETTIMEOFDAY)
+  struct timeval tv;
+  gettimeofday(&tv, NULL);
+  return tv.tv_sec + (ts.tv_usec / 1.0e6);
+#else
+  return (double)(clock() / CLOCKS_PER_SEC);
+#endif
+}
--- a/cachelab/cbsl/benchmarks/serialize.c
+++ b/cachelab/cbsl/benchmarks/serialize.c
@@ -0,0 +1,136 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#include <string.h>
+#ifdef HAVE_GETTIMEOFDAY
+#include <sys/time.h>
+#endif
+#include <math.h>
+#include <cbsl.h>
+
+#include "config.h"
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void serialize_bench(double ds);
+extern void rand_byte_t(uint64_t n, byte_t* a);
+extern void zero_filled(uint64_t n, byte_t* a);
+extern double seconds();
+
+int rand_generate = 0;
+
+int main(int argc, char** argv)
+{
+  if (argc < 4)
+    exit(1);
+
+  int max_data_size_exp2, min_data_size_exp2;
+  sscanf(argv[1], "%d", &min_data_size_exp2);
+  sscanf(argv[2], "%d", &max_data_size_exp2);
+  printf("min data size = %.2lf [B]\n", pow(2,min_data_size_exp2));
+  printf("max data size = %.2lf [B]\n", pow(2,max_data_size_exp2));
+
+  rand_generate = (strcmp(argv[3],"-r") == 0);
+
+  if (rand_generate)
+  {
+    printf("data is random generated (stressful compression)\n");
+  }
+  else
+  {
+    printf("data is zero filled (maximum compression)\n");
+  }
+
+  srand((unsigned int)(time(NULL)));
+
+  printf("<write data [Byte]> <time [seconds]> <speed [MiB/sec]>\n");
+
+  for (int i = min_data_size_exp2; i <= max_data_size_exp2; ++i)
+  {
+    serialize_bench(pow(2,i));
+  }
+
+  return 0;
+}
+
+void serialize_bench(double ds)
+{
+  const uint64_t data_size = (uint64_t)(ds);
+
+  char cname[128];
+  sprintf(cname, "serialize_%lu.zst", data_size);
+
+  byte_t* a = (byte_t*)(malloc(data_size));
+  if (rand_generate)
+  {
+    rand_byte_t(data_size / sizeof(byte_t), a);
+  }
+  else
+  {
+    zero_filled(data_size / sizeof(byte_t), a);
+  }
+
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+
+  const double beg = seconds();
+  {
+    CBSL_ERROR_CHECK(cbsl_write(ctx, a, data_size));
+    CBSL_ERROR_CHECK(cbsl_flush(ctx));
+  }
+  const double end = seconds();
+  const double wt  = end - beg;
+
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+  printf("%lu    %lf    %lf\n", data_size, wt, (data_size/wt)/1.0e6);
+
+  free(a);
+}
+
+void rand_byte_t(uint64_t data_size, byte_t* a)
+{
+  for(uint64_t i = 0; i < data_size; ++i)
+    a[i] = rand() % 255;
+}
+
+void zero_filled(uint64_t n, byte_t* a)
+{
+  for(uint64_t i = 0; i < n; ++i)
+    a[i] = 0; /* all data fills zero */
+}
+
+double seconds() {
+#if defined(HAVE_CLOCK_GETTIME)
+  struct timespec ts;
+  clock_gettime(CLOCK_REALTIME, &ts);
+  return ts.tv_sec + (ts.tv_nsec / 1.0e9);
+#elif defined(HAVE_GETTIMEOFDAY)
+  struct timeval tv;
+  gettimeofday(&tv, NULL);
+  return tv.tv_sec + (ts.tv_usec / 1.0e6);
+#else
+  return (double)(clock() / CLOCKS_PER_SEC);
+#endif
+}
--- a/cachelab/cbsl/examples/CMakeLists.txt
+++ b/cachelab/cbsl/examples/CMakeLists.txt
@@ -0,0 +1,22 @@
+#
+# Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+add_executable(simple_usage simple_usage.c)
+add_dependencies(simple_usage ${CBSL_LIB})
+target_link_libraries(simple_usage ${CBSL_LIB} ${ZSTD_LIB})
+
+add_executable(recommend_usage recommend_usage.c)
+add_dependencies(recommend_usage ${CBSL_LIB})
+target_link_libraries(recommend_usage ${CBSL_LIB} ${ZSTD_LIB})
--- a/cachelab/cbsl/examples/recommend_usage.c
+++ b/cachelab/cbsl/examples/recommend_usage.c
@@ -0,0 +1,101 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+#define CHECK_BINARY(X,Y)    {if (memcmp(&(X),&(Y),sizeof((X))) != 0) { fprintf(stderr, "error: binary check %s == %s\n", (#X), (#Y)); exit(1); }}
+#define CHECK(X)             {if (!(X)) { fprintf(stderr, "error: %s\n", (#X)); }}
+#define SAFE_FREE(X)         {if ((X) != NULL) { free((X)); }}
+
+static const int    data0 = 43;
+static const double data1 = 3.14159265;
+static const int    data2 = 14142;
+
+extern void checkpoint_restart(cbsl_mode, int*, double*, int*, int**);
+
+char cname[128];
+
+int main(int argc, char** argv)
+{
+  int    c0;
+  double c1;
+  int    c2;
+  int*   a0;
+
+  if (argc < 2)
+    return 1;
+
+  sprintf(cname, "checkpoint.zst");
+
+  cbsl_mode mode = cbsl_unknown_mode;
+  if (strcmp(argv[1],"-c") == 0)
+  {
+    mode = cbsl_store_mode;
+    c0 = data0;
+    c1 = data1;
+    c2 = data2;
+    a0 = (int*)(malloc(sizeof(int) * 42));
+    for (int i = 0; i < 42; ++i)
+      a0[i] = 42;
+  }
+  else if (strcmp(argv[1],"-r") == 0)
+  {
+    mode = cbsl_load_mode;
+    c0 = c1 = c2 = 0;
+    a0 = NULL;
+  }
+  else
+  {
+    return 1;
+  }
+
+  checkpoint_restart(mode, &c0, &c1, &c2, &a0);
+
+  CHECK_BINARY(c0, data0);
+  CHECK_BINARY(c1, data1);
+  CHECK_BINARY(c2, data2);
+
+  for (int i = 0; i < 42; ++i)
+  {
+    CHECK(a0[i] == 42);
+  }
+
+  SAFE_FREE(a0);
+
+  return 0;
+}
+
+void checkpoint_restart(cbsl_mode mode, int* c0, double* c1, int* c2, int** a0)
+{
+  int a0_size;
+  cbsl_ctx* ctx = cbsl_open(mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_record(ctx, c0, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_record(ctx, c1, sizeof(double)));
+  CBSL_ERROR_CHECK(cbsl_record(ctx, c2, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_record(ctx, &a0_size, sizeof(int)));
+  if (mode == cbsl_load_mode)
+    (*a0) = (int*)(malloc(sizeof(int) * a0_size));
+  CBSL_ERROR_CHECK(cbsl_record(ctx, (*a0), sizeof(int) * a0_size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
--- a/cachelab/cbsl/examples/simple_usage.c
+++ b/cachelab/cbsl/examples/simple_usage.c
@@ -0,0 +1,99 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#include <string.h>
+#include <cbsl.h>
+
+#define ARRAY_SIZE(X)        (sizeof((X))/sizeof(*(X)))
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); }}
+
+int    a[1024]; /* 4 KiB */
+double b[1024]; /* 8 KiB */
+
+extern void save(void);
+extern void load(void);
+extern void rand_int(int, int*);
+extern void rand_double(int, double*);
+
+char cname[128];
+
+int main(int argc, char** argv) {
+  srand((unsigned int)(time(NULL)));
+
+  sprintf(cname, "checkpoint.zst");
+
+  if (strcmp(argv[1],"-c") == 0)
+  {
+    rand_int(ARRAY_SIZE(a), a);
+    rand_double(ARRAY_SIZE(b), b);
+    save();
+  }
+  else if (strcmp(argv[1],"-r") == 0)
+  {
+    load();
+  }
+  else
+  {
+    return 1;
+  }
+
+  return 0;
+}
+
+void save(void) {
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, "./checkpoint.data");
+
+  if (ctx == NULL) {
+    fprintf(stderr, "error: cbsl_open save\n");
+    exit(1);
+  }
+
+  CBSL_ERROR_CHECK(cbsl_write(ctx, a, sizeof(a)));
+  CBSL_ERROR_CHECK(cbsl_write(ctx, b, sizeof(b)));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+  printf("before compressed a[%d] = %d\n", 124, a[124]);
+  printf("before compressed b[%d] = %e\n", 514, b[514]);
+}
+
+void load(void) {
+  cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, "./checkpoint.data");
+
+  if (ctx == NULL) {
+    fprintf(stderr, "error: cbsl_open load\n");
+    exit(1);
+  }
+
+  CBSL_ERROR_CHECK(cbsl_read(ctx, a, sizeof(a)));
+  CBSL_ERROR_CHECK(cbsl_read(ctx, b, sizeof(b)));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+  printf("decompressed a[%d] = %d\n", 124, a[124]);
+  printf("decompressed b[%d] = %e\n", 514, b[514]);
+}
+
+
+void rand_int(int n, int *v) {
+  for(int i = 0; i < n; ++i)
+    v[i] = rand();
+}
+
+void rand_double(int n, double *v) {
+  for(int i = 0; i < n; ++i)
+    v[i] = 1.0 / (double)(rand());
+}
--- a/cachelab/cbsl/include/CMakeLists.txt
+++ b/cachelab/cbsl/include/CMakeLists.txt
@@ -0,0 +1,23 @@
+#
+# Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+configure_file(${CMAKE_CURRENT_SOURCE_DIR}/cbsl_config.h.in
+               ${CMAKE_CURRENT_BINARY_DIR}/cbsl_config.h)
+
+install(FILES
+        ${CMAKE_CURRENT_SOURCE_DIR}/cbsl.h
+        ${CMAKE_CURRENT_BINARY_DIR}/cbsl_config.h
+        TYPE INCLUDE
+        )
--- a/cachelab/cbsl/include/cbsl.h
+++ b/cachelab/cbsl/include/cbsl.h
@@ -0,0 +1,63 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#ifndef CBSL_HEADER_INCLUDED
+#define CBSL_HEADER_INCLUDED
+
+#if defined(__cplusplus)
+extern "C" {
+#endif
+
+#include <stdint.h>
+#include "cbsl_config.h"
+
+	typedef enum
+	{
+		cbsl_load_mode = 1,
+		cbsl_store_mode = 2,
+		cbsl_unknown_mode = -1
+	}
+	cbsl_mode;
+
+	typedef enum
+	{
+		cbsl_success = 0,
+		cbsl_end = 1,
+		cbsl_error = -1
+	}
+	cbsl_errors;
+
+	typedef struct cbsl_ctx_ cbsl_ctx;
+
+
+	cbsl_ctx* cbsl_open(cbsl_mode open_mode, char* path);
+	cbsl_errors    cbsl_close(cbsl_ctx* ctx);
+	cbsl_errors    cbsl_flush(cbsl_ctx* ctx);
+
+	cbsl_errors    cbsl_write(cbsl_ctx* ctx, const void* data, uint64_t size);
+	cbsl_errors    cbsl_read(cbsl_ctx* ctx, void* data, uint64_t size);
+	cbsl_errors    cbsl_readline(cbsl_ctx* ctx, char* linebuf, uint64_t size);
+	cbsl_errors    cbsl_record(cbsl_ctx* ctx, void* data, uint64_t size);
+	cbsl_errors    cbsl_record_heap(cbsl_ctx* ctx, void** data, uint64_t* size);
+
+	cbsl_mode      cbsl_get_mode(cbsl_ctx* ctx);
+	cbsl_errors    cbsl_set_compression_level(cbsl_ctx* ctx, int clevel);
+	int            cbsl_get_compression_level(cbsl_ctx* ctx);
+
+#if defined(__cplusplus)
+} /* extern "C" */
+#endif
+
+#endif /* CBSL_HEADER_INCLUDED */
--- a/cachelab/cbsl/include/cbsl_config.h
+++ b/cachelab/cbsl/include/cbsl_config.h
@@ -0,0 +1,27 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#ifndef CBSL_CONFIG_HEADER_INCLUDED
+#define CBSL_CONFIG_HEADER_INCLUDED
+
+#define CBSL_VERSION          201950
+#define CBSL_VERSION_STRING   "2019.5.0"
+#define CBSL_MAJOR_VERSION    2019
+#define CBSL_MINOR_VERSION    5
+#define CBSL_PATCH_VERSION    0
+
+ /* #undef CBSL_DEBUG */
+
+#endif /* CBSL_CONFIG_HEADER_INCLUDED */
--- a/cachelab/cbsl/include/cbsl_config.h.in
+++ b/cachelab/cbsl/include/cbsl_config.h.in
@@ -0,0 +1,27 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#ifndef CBSL_CONFIG_HEADER_INCLUDED
+#define CBSL_CONFIG_HEADER_INCLUDED
+
+#define CBSL_VERSION          @cbsl_VERSION_MAJOR@@cbsl_VERSION_MINOR@@cbsl_VERSION_PATCH@
+#define CBSL_VERSION_STRING   "@cbsl_VERSION@"
+#define CBSL_MAJOR_VERSION    @cbsl_VERSION_MAJOR@
+#define CBSL_MINOR_VERSION    @cbsl_VERSION_MINOR@
+#define CBSL_PATCH_VERSION    @cbsl_VERSION_PATCH@
+
+#cmakedefine CBSL_DEBUG
+
+#endif /* CBSL_CONFIG_HEADER_INCLUDED */
--- a/cachelab/cbsl/references.md
+++ b/cachelab/cbsl/references.md
@@ -0,0 +1,443 @@
+# CBSL library references
+
+# Build and link libraries
+
+## C
+
+```bash
+export CBSL_INCLUDE_PATH=${CBSL_INSTALLED_PATH}/include
+export CBSL_LIBRARY_PATH=${CBSL_INSTALLED_PATH}/lib
+
+cc -c xcbsl_use_code.c -I${CBSL_INCLUDE_PATH}
+cc -o xcbsl_use_program ${OBJS} -lcbsl -lzstd -L${CBSL_LIBRARY_PATH}
+```
+
+## Fortran
+
+```bash
+export CBSL_INCLUDE_PATH=${CBSL_INSTALLED_PATH}/include
+export CBSL_LIBRARY_PATH=${CBSL_INSTALLED_PATH}/lib
+
+f95 -c xcbslf_use_code.f95 -I${CBSL_INCLUDE_PATH}
+f95 -o xcbslf_use_program ${OBJS} -lcbslf -lcbsl -lzstd -L${CBSL_LIBRARY_PATH}
+```
+
+# API
+
+We provide `cbslf` module for using the library in Fortran application.
+
+## Versioning
+
+|Version|Value                  |
+|-------|-----------------------|
+|major  |release year (ex. 2019)|
+|minor  |release month (ex. 5)  |
+|patch  |patch version (0-9)    |
+
+### C
+
+```c
+#define CBSL_VERSION        // full version (integer)
+#define CBSL_VERSION_STRING // full version (string)
+#define CBSL_MAJOR_VERSION  // major
+#define CBSL_MINOR_VERSION  // minor
+#define CBSL_PATCH_VERSION  // patch
+```
+
+### Fortran
+
+```fortran
+integer(8),   parameter :: CBSL_VERSION
+character(*), parameter :: CBSL_VERSION_STRING
+integer(4),   parameter :: CBSL_MAJOR_VERSION
+integer(4),   parameter :: CBSL_MINOR_VERSION
+integer(4),   parameter :: CBSL_PATCH_VERSION
+```
+
+## Types
+
+### C
+
+```c
+// library context
+typedef struct cbsl_ctx_ cbsl_ctx;
+```
+### Fortran
+
+```fortran
+type(cbslf_context)
+```
+
+## Constant values
+
+### C
+
+```c
+// Context mode
+typedef enum
+{
+  cbsl_load_mode,    // deserialize mode
+  cbsl_store_mode,   // serialize mode
+  cbsl_unknown_mode  // unknown
+}
+cbsl_mode;
+
+// Errors
+typedef enum
+{
+  cbsl_success,  // no error
+  cbsl_error     // function happens any error
+}
+cbsl_errors;
+```
+
+### Fortran
+
+```fortran
+integer(4), parameter :: cbslf_load_mode
+integer(4), parameter :: cbslf_store_mode
+integer(4), parameter :: cbslf_unknown_mode
+
+integer(4), parameter :: cbslf_success
+integer(4), parameter :: cbslf_errors
+```
+
+## API
+
+### C
+
+```c
+/*
+   [brief]
+        open serialized data file stream.
+   [arguments]
+        open_mode: specifies load/store mode
+        path     : data file path
+   [return]
+        success  : return context pointer
+        fail     : NULL pointer
+ */
+cbsl_ctx* cbsl_open(cbsl_mode open_mode, char* path);
+
+/*
+   [brief]
+        close serialized data file stream.
+        this function calls cbsl_flush() before closing stream.
+   [arguments]
+        ctx      : context pointer
+   [return]
+        success  : cbsl_success
+        fail     : cbsl_error
+ */
+cbsl_errors cbsl_close(cbsl_ctx* ctx);
+
+/*
+   [brief]
+        flush file stream.
+        this function executes data compression and write to file stream.
+   [arguments]
+        ctx      : context pointer
+   [return]
+        success  : cbsl_success
+        fail     : cbsl_error
+ */
+cbsl_errors cbsl_flush(cbsl_ctx* ctx);
+
+/*
+   [brief]
+        the data stores with compression.
+        this function stores internal buffer to stored data.
+        When the stored data fills enough size to compress, this function calls cbsl_flush().
+   [arguments]
+        ctx      : context pointer
+        data     : write data pointer (must be allocated)
+        size     : byte size of data
+   [return]
+        success  : cbsl_success
+        fail     : cbsl_error
+ */
+cbsl_errors cbsl_write(cbsl_ctx* ctx, const void* data, uint64_t size);
+
+/*
+   [brief]
+        the data loads with decompression.
+        this function decompresses data from a file stream, and loads from internal decompressed buffer.
+   [arguments]
+        ctx      : context pointer
+        data     : read data pointer (must be allocated)
+        size     : byte size of data
+   [return]
+        success  : cbsl_success
+        fail     : cbsl_error
+ */
+cbsl_errors cbsl_read(cbsl_ctx* ctx, void* data, uint64_t size);
+
+/*
+   [brief]
+        the data loads/stores with compression/decompression.
+        this function calls cbsl_read()/cbsl_write() by context mode to help the implementation of checkpoint/restart in the application.
+   [argumetns]
+        ctx      : context pointer
+        data     : read/write data pointer (must be allocated)
+        size     : byte size of data
+   [return]
+        success  : cbsl_success
+        fail     : cbsl_error
+ */
+cbsl_errors cbsl_record(cbsl_ctx* ctx, void* data, uint64_t size);
+
+/*
+   [brief]
+        this is a specialized function of cbsl_record() for heap allocated array.
+        the function loads/stores array data size [bytes] and array values from/to a file stream.
+        an array will be allocated on heap memory by malloc() routine if `data` is null pointer.
+   [arguments]
+        ctx      : context pointer
+        data     : read/write data pointer (it accepts NULL pointer)
+        size     : byte size of data
+   [return]
+        success  : cbsl_success
+        fail     : cbsl_error
+ */
+cbsl_errors cbsl_record_heap(cbsl_ctx* ctx, void** data, uint64_t* size);
+
+/*
+   [brief]
+        gets context mode.
+   [arguments]
+        ctx      : context pointer
+   [return]
+        success  : context mode
+ */
+cbsl_mode cbsl_get_mode(cbsl_ctx* ctx);
+
+/*
+   [brief]
+        sets zstd compression level of serialized data.
+   [arguments]
+        ctx      : context pointer
+        clevel   : compression level 1-22 (zstd 1.4.0)
+   [return]
+        success  : cbsl_success
+        fail     : cbsl_error
+ */
+cbsl_errors cbsl_set_compression_level(cbsl_ctx* ctx, int clevel);
+
+/*
+   [brief]
+        gets zstd compression level of serialized data.
+   [arguments]
+        ctx      : context pointer
+   [return]
+        success  : compression level 1-22 (zstd 1.4.0)
+        fail     : -1
+ */
+int cbsl_get_compression_level(cbsl_ctx* ctx);
+```
+
+### Fortran
+
+```fortran
+!
+! [brief]
+!      open serialized data file stream.
+! [arguments]
+!      open_mode: specifies load/store mode
+!      path     : data file path
+!      errcode  : error code
+! [return]
+!      success  : return context pointer
+!      fail     : NULL pointer
+!
+function cbslf_open(open_mode, path, errcode) result(ctx)
+  integer(4),   intent(in)          :: open_mode
+  character(*), intent(in)          :: path
+  integer(4), intent(out), optional :: errcode
+  type(cbslf_context)               :: ctx
+end function
+
+!
+! [brief]
+!      close serialized data file stream.
+!      this subroutine calls cbslf_flush() before closing stream.
+! [arguments]
+!      ctx      : context pointer
+!      errcode  : error code
+!
+subroutine cbslf_close(ctx, errcode)
+  type(cbslf_context), intent(in)   :: ctx
+  integer(4), intent(out), optional :: errcode
+end subroutine
+
+!
+! [brief]
+!      flush file stream.
+!      this subroutine executes data compression and write to file stream.
+! [arguments]
+!      ctx      : context pointer
+!      errcode  : error code
+!
+subroutine cbslf_flush(ctx, errcode)
+  type(cbslf_context), intent(in)   :: ctx
+  integer(4), intent(out), optional :: errcode
+end subroutine
+
+!
+! [brief]
+!      this is a generic interface.
+!      the data stores with compression.
+!      this subroutine stores internal buffer to stored data.
+!      When the stored data fills enough size to compress, this subroutine calls cbslf_flush().
+! [supported types]
+!      scalar   : logical, character(*)
+!      +array   : integer(4), integer(8), real(4), real(8), complex(4), complex(8) by up to 7-dimensional array
+! [arguments]
+!      ctx      : context pointer
+!      data     : write data (array must be allocated)
+!      errcode  : error code
+!
+interface cbslf_write(ctx, data, errcode)
+  type(cbslf_context), intent(in)   :: ctx
+  GENERIC_TYPE,         intent(in)  :: data
+  integer(4), intent(out), optional :: errcode
+end interface
+
+!
+! [brief]
+!      this is a generic interface.
+!      the data loads with decompression.
+!      this subroutine decompresses data from a file stream, and loads from internal decompressed buffer.
+! [supported types]
+!      scalar   : logical, character(*)
+!      +array   : integer(4), integer(8), real(4), real(8), complex(4), complex(8) by 7-dimensional array
+! [arguments]
+!      ctx      : context pointer
+!      data     : write data (array must be allocated)
+!      errcode  : error code
+!
+interface cbslf_read(ctx, data, errcode)
+  type(cbslf_context), intent(in)   :: ctx
+  GENERIC_TYPE,         intent(out) :: data
+  integer(4), intent(out), optional :: errcode
+end interface
+
+!
+! [brief]
+!      this is a generic interface.
+!      the data loads/stores with compression/decompression.
+!      this subroutine calls cbsl_read()/cbsl_write() by context mode to help the implementation of checkpoint/restart in the application.
+! [supported types]
+!      scalar   : logical, character(*)
+!      +array   : integer(4), integer(8), real(4), real(8), complex(4), complex(8) by up to 7-dimensional array
+! [arguments]
+!      ctx      : context pointer
+!      data     : read/write data (array must be allocated)
+!      size     : byte size of data
+!      errcode  : error code (return value)
+!
+interface cbslf_record(ctx, data, errcode)
+  type(cbslf_context), intent(in)     :: ctx
+  GENERIC_TYPE,         intent(inout) :: data
+  integer(4), intent(out), optional   :: errcode
+end interface
+
+!
+! [brief]
+!      this is a generic interface for allocatable array.
+!      the data loads/stores with compression/decompression.
+!      this subroutine calls cbsl_read()/cbsl_write() by context mode to help the implementation of checkpoint/restart in the application.
+!      this subroutine behaves as like as cbsl_record_heap() in C API.
+!      an array will be allocated on the memory if it is not allocated.
+! [supported types]
+!      array    : integer(4), integer(8), real(4), real(8), complex(4), complex(8) by up to 7-dimensional array
+! [arguments]
+!      ctx      : context pointer
+!      data     : read/write data (accepts not allocated array)
+!      size     : byte size of data
+!      errcode  : error code
+!
+interface cbslf_record_heap(ctx, data, errcode)
+  type(cbslf_context), intent(in)     :: ctx
+  GENERIC_TYPE,         intent(inout) :: data
+  integer(4), intent(out), optional   :: errcode
+end interface
+
+!
+! [brief]
+!      gets context mode.
+! [arguments]
+!      ctx      : context pointer
+!      errcode  : error code (return value)
+! [return]
+!      success  : context mode
+!
+function cbslf_get_mode(ctx, errcode) result(mode)
+  type(cbslf_context), intent(in)   :: ctx
+  integer(4), intent(out), optional :: errcode
+  integer(4)                        :: mode
+end function
+
+!
+! [brief]
+!      sets zstd compression level of serialized data.
+! [arguments]
+!      ctx      : context pointer
+!      clevel   : compression level 1-22 (zstd 1.4.0)
+!      errcode  : error code (return value)
+!
+subroutine cbslf_set_compression_level(ctx, clevel)
+  type(cbslf_context), intent(in)   :: ctx
+  ingeter(4),           intent(in)  :: clevel
+  integer(4), intent(out), optional :: errcode
+end subroutine
+
+!
+! [brief]
+!      gets zstd compression level of serialized data.
+! [arguments]
+!      ctx      : context pointer
+! [return]
+!      success  : compression level 1-22 (zstd 1.4.0)
+!      fail     : -1
+!
+function cbslf_get_compression_level(ctx, errcode) result(clevel)
+  type(cbslf_context), intent(in)   :: ctx
+  integer(4), intent(out), optional :: errcode
+  ingeter(4),                       :: clevel
+end function
+```
+
+## Data format
+
+```
+BDATA: binary data                  [1 byte]
+BSIZE: total size of binary data    [4 bytes]
+RSIZE: rank size of a fortran array [4 bytes]
+NRANK: number of rank size of a fortran array
+
+sizeof(TYPE):     gets byte size of TYPE
+Array-value-type: element type of an array
+```
+
+### Header
+
+```
+[BDATA * 8]: cbsl library version (64-bit integer)
+```
+
+### C API
+
+```
+Scalar data: HEAD -> [BDATA * sizeof(Scalar)] -> TAIL
+Array data : HEAD -> [BSIZE][BDATA * sizeof(Array-value-type) * BSIZE] -> TAIL
+```
+
+### Fortran API
+
+```
+Scalar data: HEAD -> [BDATA * sizeof(Scalar)] -> TAIL
+Array data : HEAD -> [BSIZE][ARRAY_LOWER_BOUNDS][ARRAY_UPPER_BOUNDS][BDATA * sizeof(Array-value-type) * BSIZE] -> TAIL
+
+ARRAY_LOWER_BOUNDS: lower bounds of a fortran array [RSIZE * NRANK]
+ARRAY_UPPER_BOUNDS: upper bounds of a fortran array [RSIZE * NRANK]
+```
--- a/cachelab/cbsl/src/CMakeLists.txt
+++ b/cachelab/cbsl/src/CMakeLists.txt
@@ -0,0 +1,46 @@
+#
+# Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+set(LIB_SOURCES
+    buffer.c
+    file.c
+    utils.c
+    flush.c
+    write.c
+    read.c
+    record.c
+    )
+
+set(FLIB_SOURCES
+    ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90
+    )
+configure_file(fortran_bindings.f90.in ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90.in.2)
+
+find_program(CPP cpp)
+if (CPP_NOTFOUND)
+  message(FATAL_ERROR "C preprocessor (cpp) command not found.")
+endif ()
+add_custom_command(OUTPUT ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90
+                   COMMAND ${CPP} ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90.in.2 ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90
+                   COMMAND ${CMAKE_COMMAND} -P ${CMAKE_CURRENT_SOURCE_DIR}/gen_fortran_bindings.cmake ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90
+                   DEPENDS ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90.in.2
+                  )
+add_custom_target(generate_preprocessed_fortran_file SOURCES ${CMAKE_CURRENT_BINARY_DIR}/fortran_bindings.f90)
+
+add_library(${CBSL_LIB}  ${LIB_SOURCES})
+add_library(${CBSL_FLIB} ${FLIB_SOURCES})
+
+install(TARGETS ${CBSL_LIB} ${CBSL_FLIB})
+install(FILES "${CMAKE_Fortran_MODULE_DIRECTORY}/${CBSL_FLIB}.mod" DESTINATION include)
--- a/cachelab/cbsl/src/buffer.c
+++ b/cachelab/cbsl/src/buffer.c
@@ -0,0 +1,85 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdint.h>
+
+#include "./cbsl_internal.h"
+
+cbsl_errors create_streaming_buffers(cbsl_ctx* ctx)
+{
+	ZSTD_CCtx* zstd_cctx = NULL;
+	ZSTD_DCtx* zstd_dctx = NULL;
+	uint64_t in_buffer_size;
+	uint64_t out_buffer_size;
+	void* in_buffer = NULL;
+	void* out_buffer = NULL;
+	void* line_buffer = NULL;
+
+	switch (ctx->mode)
+	{
+	case cbsl_load_mode:
+		zstd_dctx = ZSTD_createDCtx();
+		if (zstd_dctx == NULL) return cbsl_error;
+		in_buffer_size = ZSTD_DStreamInSize();
+		out_buffer_size = ZSTD_DStreamOutSize();
+		break;
+	case cbsl_store_mode:
+		zstd_cctx = ZSTD_createCCtx();
+		if (zstd_cctx == NULL) return cbsl_error;
+		in_buffer_size = ZSTD_CStreamInSize();
+		out_buffer_size = ZSTD_CStreamOutSize();
+		break;
+	default:
+		return cbsl_error;
+	}
+
+	in_buffer = (byte_t*)(malloc(in_buffer_size));
+	out_buffer = (byte_t*)(malloc(out_buffer_size));
+	line_buffer = (byte_t*)(malloc(CBSL_LINEBUF_SIZE));
+
+	if (in_buffer == NULL || out_buffer == NULL || line_buffer == NULL)
+	{
+		CBSL_SAFE_FREE_ZSTD_CCTX(zstd_cctx);
+		CBSL_SAFE_FREE_ZSTD_DCTX(zstd_dctx);
+		CBSL_SAFE_FREE(in_buffer);
+		CBSL_SAFE_FREE(out_buffer);
+		CBSL_SAFE_FREE(line_buffer);
+		return cbsl_error;
+	}
+
+	ctx->zstd_cctx = zstd_cctx;
+	ctx->zstd_dctx = zstd_dctx;
+	ctx->in_buffer = in_buffer;
+	ctx->out_buffer = out_buffer;
+	ctx->line_buffer = line_buffer;
+
+	ctx->in_buffer_size = in_buffer_size;
+	ctx->out_buffer_size = out_buffer_size;
+
+	ctx->in_buffer_pos = 0;
+	ctx->out_buffer_pos = 0;
+
+	ctx->in_buffer_used = 0;
+	ctx->out_buffer_used = 0;
+	ctx->line_buffer_used = 0;
+	ctx->line_buffer_read_from_zst = 0;
+
+	ctx->zstd_buf_end = 0;
+	ctx->zstd_file_end = 0;
+
+	return cbsl_success;
+}
--- a/cachelab/cbsl/src/cbsl_internal.h
+++ b/cachelab/cbsl/src/cbsl_internal.h
@@ -0,0 +1,78 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#ifndef CBSL_INTERNAL_HEADER_INCLUDED
+#define CBSL_INTERNAL_HEADER_INCLUDED
+
+#include <stdio.h>
+#include <stdint.h>
+#include <zstd.h>
+
+#include <cbsl.h>
+
+#define CBSL_LINEBUF_SIZE	8192
+
+typedef unsigned char byte_t;
+
+struct cbsl_ctx_
+{
+	FILE* fp;
+	ZSTD_CCtx* zstd_cctx;
+	ZSTD_DCtx* zstd_dctx;
+	byte_t* in_buffer;
+	byte_t* out_buffer;
+	uint64_t      in_buffer_size;
+	uint64_t      out_buffer_size;
+	uint64_t      in_buffer_pos;
+	uint64_t      in_buffer_used;
+	uint64_t      out_buffer_pos;
+	uint64_t      out_buffer_used;
+	cbsl_mode     mode;
+
+	// support readline
+	byte_t		zstd_buf_end;
+	byte_t		zstd_file_end;
+	byte_t* line_buffer;
+	uint64_t      line_buffer_used;
+	uint64_t		line_buffer_read_from_zst;
+};
+
+cbsl_errors create_streaming_buffers(cbsl_ctx* ctx);
+
+#define MIN(x, y) (x) < (y) ? (x) : (y)
+
+#ifdef CBSL_DEBUG
+# include <assert.h>
+# define CBSL_ASSERT(COND)       { assert((COND)); }
+# define CBSL_DEBUG_MESSAGE(...) { fprintf(stderr, __VA_ARGS__); }
+#else
+# define CBSL_ASSERT(COND)       /* */
+# define CBSL_DEBUG_MESSAGE(...) /* */
+#endif
+
+/* error check */
+#define CBSL_CHECK_COND_MSG_IMPL(X,MSG,FINALIZE)      { if (!(X)) { fprintf(stderr, "%s at %s l.%d: condition error %s; %s\n", __func__, __FILE__, __LINE__, (#X), (MSG)); FINALIZE; } }
+#define CBSL_CHECK_COND(X)                            CBSL_CHECK_COND_MSG_IMPL((X), "", /* noreturn */)
+#define CBSL_CHECK_COND_AND_RETURN(X,RETCODE)         CBSL_CHECK_COND_MSG_IMPL((X), "", { return (RETCODE); })
+#define CBSL_CHECK_COND_MSG_AND_RETURN(X,MSG,RETCODE) CBSL_CHECK_COND_MSG_IMPL((X), (MSG), { return (RETCODE); })
+
+/* safe memory control */
+#define CBSL_SAFE_FREE_RESOURCE(X,FREEFUNC) { if ((X) != NULL) { (FREEFUNC)((X)); (X) = NULL; } }
+#define CBSL_SAFE_FCLOSE(X)                 CBSL_SAFE_FREE_RESOURCE((X), fclose);
+#define CBSL_SAFE_FREE(X)                   CBSL_SAFE_FREE_RESOURCE((X), free)
+#define CBSL_SAFE_FREE_ZSTD_CCTX(X)         CBSL_SAFE_FREE_RESOURCE((X), ZSTD_freeCCtx)
+#define CBSL_SAFE_FREE_ZSTD_DCTX(X)         CBSL_SAFE_FREE_RESOURCE((X), ZSTD_freeDCtx)
+
+#endif /* CBSL_INTERNAL_HEADER_INCLUDED */
--- a/cachelab/cbsl/src/file.c
+++ b/cachelab/cbsl/src/file.c
@@ -0,0 +1,94 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdint.h>
+
+#include "./cbsl_internal.h"
+
+static
+cbsl_ctx* cbsl_open_safe_finalize(cbsl_ctx** ctx)
+{
+	if (*ctx != NULL)
+	{
+		cbsl_close(*ctx);
+	}
+	return NULL;
+}
+
+cbsl_ctx* cbsl_open(cbsl_mode mode, char* path)
+{
+	CBSL_CHECK_COND_AND_RETURN(path != NULL, NULL);
+
+	cbsl_ctx* ctx = (cbsl_ctx*)(malloc(sizeof(cbsl_ctx)));
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, NULL);
+
+	char const* fopen_mode;
+	switch (mode)
+	{
+	case cbsl_load_mode:  fopen_mode = "rb"; break;
+	case cbsl_store_mode: fopen_mode = "wb"; break;
+	default:              free(ctx);         return NULL;
+	}
+
+#ifdef _WIN32
+	errno_t err;
+	FILE* fp;
+	err = fopen_s(&fp, path, fopen_mode);
+	CBSL_CHECK_COND_AND_RETURN(err == 0, cbsl_open_safe_finalize(&ctx));
+#else
+	FILE* fp = fopen(path, fopen_mode);
+	CBSL_CHECK_COND_AND_RETURN(fp != NULL, cbsl_open_safe_finalize(&ctx));
+#endif
+
+	ctx->mode = mode;
+	ctx->fp = fp;
+	CBSL_CHECK_COND_AND_RETURN(create_streaming_buffers(ctx) == cbsl_success, cbsl_open_safe_finalize(&ctx));
+
+	/*
+	uint64_t file_version;
+	if (mode == cbsl_load_mode)
+	{
+	  file_version = 0;
+	  CBSL_CHECK_COND_AND_RETURN(cbsl_read(ctx, &file_version, sizeof(file_version)) == cbsl_success, cbsl_open_safe_finalize(&ctx));
+	  CBSL_CHECK_COND_AND_RETURN(file_version == CBSL_VERSION, cbsl_open_safe_finalize(&ctx));
+	}
+	else if (mode == cbsl_store_mode)
+	{
+	  file_version = CBSL_VERSION;
+	  CBSL_CHECK_COND_AND_RETURN(cbsl_write(ctx, &file_version, sizeof(file_version)) == cbsl_success, cbsl_open_safe_finalize(&ctx));
+	}
+	*/
+
+	return ctx;
+}
+
+cbsl_errors cbsl_close(cbsl_ctx* ctx)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_success);
+	if (ctx->mode == cbsl_store_mode)
+	{
+		cbsl_flush(ctx);
+	}
+	CBSL_SAFE_FREE_ZSTD_CCTX(ctx->zstd_cctx);
+	CBSL_SAFE_FREE_ZSTD_DCTX(ctx->zstd_dctx);
+	CBSL_SAFE_FREE(ctx->in_buffer);
+	CBSL_SAFE_FREE(ctx->out_buffer);
+	CBSL_SAFE_FREE(ctx->line_buffer);
+	CBSL_SAFE_FCLOSE(ctx->fp);
+	CBSL_SAFE_FREE(ctx);
+	return cbsl_success;
+}
--- a/cachelab/cbsl/src/flush.c
+++ b/cachelab/cbsl/src/flush.c
@@ -0,0 +1,55 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdint.h>
+
+#include "./cbsl_internal.h"
+
+static
+cbsl_errors flush_serialize(cbsl_ctx* ctx)
+{
+	if (ctx->in_buffer_used > 0)
+	{
+		ZSTD_inBuffer input = { ctx->in_buffer, ctx->in_buffer_used, 0 };
+		ZSTD_EndDirective mode = (ctx->in_buffer_used < ctx->in_buffer_size) ? ZSTD_e_end : ZSTD_e_continue;
+		do
+		{
+			ZSTD_outBuffer output = { ctx->out_buffer, ctx->out_buffer_size, 0 };
+			const size_t remaining = ZSTD_compressStream2(ctx->zstd_cctx, &output, &input, mode);
+			CBSL_CHECK_COND_MSG_AND_RETURN(!ZSTD_isError(remaining), ZSTD_getErrorName(remaining), cbsl_error);
+
+			const size_t written = fwrite(ctx->out_buffer, 1, output.pos, ctx->fp);
+			CBSL_CHECK_COND_AND_RETURN(written == output.pos, cbsl_error);
+		} while (input.pos < input.size);
+
+		ctx->in_buffer_used = 0;
+	}
+
+	fflush(ctx->fp);
+
+	return cbsl_success;
+}
+
+cbsl_errors cbsl_flush(cbsl_ctx* ctx)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	if (ctx->mode == cbsl_store_mode)
+	{
+		return flush_serialize(ctx);
+	}
+	return cbsl_success;
+}
--- a/cachelab/cbsl/src/fortran_bindings.f90.in
+++ b/cachelab/cbsl/src/fortran_bindings.f90.in
@@ -0,0 +1,471 @@
+!
+!  Copyright 2019 Yuta Hirokawa (University of Tsukuba)
+!
+!  Licensed under the Apache License, Version 2.0 (the "License");
+!  you may not use this file except in compliance with the License.
+!  You may obtain a copy of the License at
+!
+!      http://www.apache.org/licenses/LICENSE-2.0
+!
+!  Unless required by applicable law or agreed to in writing, software
+!  distributed under the License is distributed on an "AS IS" BASIS,
+!  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+!  See the License for the specific language governing permissions and
+!  limitations under the License.
+!
+module cbslf
+  use, intrinsic :: iso_c_binding
+  implicit none
+
+  type cbslf_context
+    integer(c_intptr_t) :: ctx
+  end type
+  public :: cbslf_context
+
+  public :: cbslf_store_mode
+  public :: cbslf_load_mode
+  public :: cbslf_unknown_mode
+
+  public :: cbslf_success
+  public :: cbslf_error
+
+  public :: cbslf_open
+  public :: cbslf_close
+  public :: cbslf_flush
+
+  public :: cbslf_write
+  public :: cbslf_read
+  public :: cbslf_record
+  public :: cbslf_record_heap
+
+  public :: cbslf_get_mode
+  public :: cbslf_set_compression_level
+  public :: cbslf_get_compression_level
+
+#define PASTE(a,b) a##b
+#define CONCAT(a,b) PASTE(a,b)
+
+#define SET_ERRCODE(CODE) \
+        if (present(errcode)) errcode = CODE
+
+#define SET_ERRCODE_COND(COND) \
+        if (present(errcode)) then \
+__NL__    if (COND) then \
+__NL__      errcode = cbslf_success \
+__NL__    else \
+__NL__      errcode = cbslf_error \
+__NL__    end if \
+__NL__  end if
+
+#define FORTRAN_ARRAY_1       :
+#define FORTRAN_ARRAY_2       :,:
+#define FORTRAN_ARRAY_3       :,:,:
+#define FORTRAN_ARRAY_4       :,:,:,:
+#define FORTRAN_ARRAY_5       :,:,:,:,:
+#define FORTRAN_ARRAY_6       :,:,:,:,:,:
+#define FORTRAN_ARRAY_7       :,:,:,:,:,:,:
+
+#define FORTRAN_ARRAY_VALUE_1 1
+#define FORTRAN_ARRAY_VALUE_2 1,1
+#define FORTRAN_ARRAY_VALUE_3 1,1,1
+#define FORTRAN_ARRAY_VALUE_4 1,1,1,1
+#define FORTRAN_ARRAY_VALUE_5 1,1,1,1,1
+#define FORTRAN_ARRAY_VALUE_6 1,1,1,1,1,1
+#define FORTRAN_ARRAY_VALUE_7 1,1,1,1,1,1,1
+
+#define FORTRAN_ARRAY_SHAPE_1 lb(1):ub(1)
+#define FORTRAN_ARRAY_SHAPE_2 lb(1):ub(1),lb(2):ub(2)
+#define FORTRAN_ARRAY_SHAPE_3 lb(1):ub(1),lb(2):ub(2),lb(3):ub(3)
+#define FORTRAN_ARRAY_SHAPE_4 lb(1):ub(1),lb(2):ub(2),lb(3):ub(3),lb(4):ub(4)
+#define FORTRAN_ARRAY_SHAPE_5 lb(1):ub(1),lb(2):ub(2),lb(3):ub(3),lb(4):ub(4),lb(5):ub(5)
+#define FORTRAN_ARRAY_SHAPE_6 lb(1):ub(1),lb(2):ub(2),lb(3):ub(3),lb(4):ub(4),lb(5):ub(5),lb(6):ub(6)
+#define FORTRAN_ARRAY_SHAPE_7 lb(1):ub(1),lb(2):ub(2),lb(3):ub(3),lb(4):ub(4),lb(5):ub(5),lb(6):ub(6),lb(7):ub(7)
+
+#define DECLARE_SCALAR_INTERFACE(SAVE_LOAD,ROUTINE_NAME)  \
+          module procedure CONCAT(CONCAT(SAVE_LOAD,_scalar_),ROUTINE_NAME)
+
+#define DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,DIMS)  \
+          module procedure CONCAT(CONCAT(SAVE_LOAD,CONCAT(_array_,DIMS)),CONCAT(_,ROUTINE_NAME))
+
+#define DECLARE_ARRAY_INTERFACE(SAVE_LOAD,ROUTINE_NAME) \
+          DECLARE_SCALAR_INTERFACE(SAVE_LOAD,ROUTINE_NAME) \
+__NL__    DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,1) \
+__NL__    DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,2) \
+__NL__    DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,3) \
+__NL__    DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,4) \
+__NL__    DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,5) \
+__NL__    DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,6) \
+__NL__    DECLARE_ARRAY_INTERFACE_N(SAVE_LOAD,ROUTINE_NAME,7) \
+
+#define DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,DIMS)  \
+          module procedure CONCAT(CONCAT(SAVE_LOAD,CONCAT(_array_heap_,DIMS)),CONCAT(_,ROUTINE_NAME))
+
+#define DECLARE_ARRAY_INTERFACE_ALLOCATABLE(SAVE_LOAD,ROUTINE_NAME) \
+          DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,1) \
+__NL__    DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,2) \
+__NL__    DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,3) \
+__NL__    DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,4) \
+__NL__    DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,5) \
+__NL__    DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,6) \
+__NL__    DECLARE_ARRAY_INTERFACE_ALLOCATABLE_N(SAVE_LOAD,ROUTINE_NAME,7)
+
+#define IMPLEMENT_SCALAR_INTERFACE(ROUTINE_NAME,DATA_TYPE)  \
+          subroutine CONCAT(write_scalar_,ROUTINE_NAME)(ctx, val, errcode) \
+__NL__      use, intrinsic :: iso_c_binding, only: c_sizeof \
+__NL__      implicit none \
+__NL__      type(cbslf_context), intent(in) :: ctx \
+__NL__      DATA_TYPE, target, intent(in) :: val \
+__NL__      integer(4), intent(out), optional :: errcode \
+__NL__      integer(c_int64_t) :: psize \
+__NL__      integer(4) :: ret \
+__NL__      psize = c_sizeof(val) \
+__NL__      ret = cbsl_write(ctx%ctx, loc(val), psize) \
+__NL__      SET_ERRCODE(ret) \
+__NL__    end subroutine \
+__NL__    subroutine CONCAT(read_scalar_,ROUTINE_NAME)(ctx, val, errcode) \
+__NL__      use, intrinsic :: iso_c_binding, only: c_sizeof \
+__NL__      implicit none \
+__NL__      type(cbslf_context), intent(in) :: ctx \
+__NL__      DATA_TYPE, target, intent(out) :: val \
+__NL__      integer(4), intent(out), optional :: errcode \
+__NL__      integer(c_int64_t) :: psize \
+__NL__      integer(4) :: ret \
+__NL__      psize = c_sizeof(val) \
+__NL__      ret = cbsl_read(ctx%ctx, loc(val), psize) \
+__NL__      SET_ERRCODE(ret) \
+__NL__    end subroutine \
+__NL__    subroutine CONCAT(record_scalar_,ROUTINE_NAME)(ctx, val, errcode) \
+__NL__      use, intrinsic :: iso_c_binding, only: c_sizeof \
+__NL__      implicit none \
+__NL__      type(cbslf_context), intent(in) :: ctx \
+__NL__      DATA_TYPE, target, intent(inout) :: val \
+__NL__      integer(4), intent(out), optional :: errcode \
+__NL__      integer(c_int64_t) :: psize \
+__NL__      integer(4) :: ret \
+__NL__      psize = c_sizeof(val) \
+__NL__      ret = cbsl_record(ctx%ctx, loc(val), psize) \
+__NL__      SET_ERRCODE(ret) \
+__NL__    end subroutine
+
+#define IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,DIMS)  \
+__NL__    subroutine CONCAT(CONCAT(write_array_,CONCAT(DIMS,_)),ROUTINE_NAME)(ctx, val, errcode) \
+__NL__      use, intrinsic :: iso_c_binding, only: c_sizeof, c_int64_t \
+__NL__      implicit none \
+__NL__      type(cbslf_context), intent(in) :: ctx \
+__NL__      DATA_TYPE, intent(in) :: val(CONCAT(FORTRAN_ARRAY_,DIMS)) \
+__NL__      integer(4), intent(out), optional :: errcode \
+__NL__      integer(4) :: lb(DIMS),ub(DIMS),nsize,i \
+__NL__      integer(c_int64_t) :: bsize \
+__NL__      integer(4) :: ret \
+__NL__      nsize   = size(val, kind=kind(nsize)) \
+__NL__      do i=1,size(lb) \
+__NL__        lb(i) = lbound(val, i, kind(lb(i))) \
+__NL__        ub(i) = ubound(val, i, kind(ub(i))) \
+__NL__      end do \
+__NL__      call cbslf_write(ctx, nsize, ret) \
+__NL__      bsize = size(lb) * c_sizeof(val(CONCAT(FORTRAN_ARRAY_VALUE_,DIMS))) \
+__NL__      ret   = iand(cbsl_write(ctx%ctx, loc(lb), bsize), ret) \
+__NL__      ret   = iand(cbsl_write(ctx%ctx, loc(ub), bsize), ret) \
+__NL__      bsize = nsize * c_sizeof(val(CONCAT(FORTRAN_ARRAY_VALUE_,DIMS))) \
+__NL__      ret   = iand(cbsl_write(ctx%ctx, loc(val), bsize), ret) \
+__NL__      SET_ERRCODE(ret) \
+__NL__    end subroutine \
+__NL__    subroutine CONCAT(CONCAT(read_array_,CONCAT(DIMS,_)),ROUTINE_NAME)(ctx, val, errcode) \
+__NL__      use, intrinsic :: iso_c_binding, only: c_sizeof, c_int64_t \
+__NL__      implicit none \
+__NL__      type(cbslf_context), intent(in) :: ctx \
+__NL__      DATA_TYPE, intent(out) :: val(CONCAT(FORTRAN_ARRAY_,DIMS)) \
+__NL__      integer(4), intent(out), optional :: errcode \
+__NL__      integer(4) :: lb(DIMS),ub(DIMS),nsize \
+__NL__      integer(c_int64_t) :: bsize \
+__NL__      integer(4) :: ret \
+__NL__      ret = cbslf_error \
+__NL__      if (size(val) > 0) then \
+__NL__        call cbslf_read(ctx, nsize, ret) \
+__NL__        if (ret == cbslf_success .and. nsize > 0) then \
+__NL__          bsize = size(lb) * c_sizeof(val(CONCAT(FORTRAN_ARRAY_VALUE_,DIMS))) \
+__NL__          ret   = iand(cbsl_read(ctx%ctx, loc(lb), bsize), ret) \
+__NL__          ret   = iand(cbsl_read(ctx%ctx, loc(ub), bsize), ret) \
+__NL__          bsize = nsize * c_sizeof(val(CONCAT(FORTRAN_ARRAY_VALUE_,DIMS))) \
+__NL__          ret   = iand(cbsl_read(ctx%ctx, loc(val), bsize), ret) \
+__NL__        else \
+__NL__          ret = cbslf_error \
+__NL__        end if \
+__NL__      end if \
+__NL__      SET_ERRCODE(ret) \
+__NL__    end subroutine \
+__NL__    subroutine CONCAT(CONCAT(record_array_,CONCAT(DIMS,_)),ROUTINE_NAME)(ctx, val, errcode) \
+__NL__      use, intrinsic :: iso_c_binding, only: c_sizeof, c_int64_t \
+__NL__      implicit none \
+__NL__      type(cbslf_context), intent(in) :: ctx \
+__NL__      DATA_TYPE, allocatable, intent(inout) :: val(CONCAT(FORTRAN_ARRAY_,DIMS)) \
+__NL__      integer(4), intent(out), optional :: errcode \
+__NL__      integer(4) :: mode,ret \
+__NL__      mode = cbslf_get_mode(ctx) \
+__NL__      select case(mode) \
+__NL__        case(cbslf_store_mode) \
+__NL__          call cbslf_write(ctx, val, ret) \
+__NL__        case(cbslf_load_mode) \
+__NL__          call cbslf_read(ctx, val, ret) \
+__NL__        case default \
+__NL__          ret = cbslf_error \
+__NL__      end select \
+__NL__      SET_ERRCODE(ret) \
+__NL__    end subroutine \
+__NL__    subroutine CONCAT(CONCAT(record_array_heap_,CONCAT(DIMS,_)),ROUTINE_NAME)(ctx, val, errcode) \
+__NL__      use, intrinsic :: iso_c_binding, only: c_sizeof, c_int64_t \
+__NL__      implicit none \
+__NL__      type(cbslf_context), intent(in) :: ctx \
+__NL__      DATA_TYPE, allocatable, intent(inout) :: val(CONCAT(FORTRAN_ARRAY_,DIMS)) \
+__NL__      integer(4), intent(out), optional :: errcode \
+__NL__      integer(4) :: lb(DIMS),ub(DIMS),nsize,mode \
+__NL__      integer(4) :: ret \
+__NL__      integer(c_int64_t) :: bsize \
+__NL__      mode = cbslf_get_mode(ctx) \
+__NL__      select case(mode) \
+__NL__        case(cbslf_store_mode) \
+__NL__          call cbslf_write(ctx, val, ret) \
+__NL__        case(cbslf_load_mode) \
+__NL__          if (allocated(val)) then \
+__NL__            call cbslf_read(ctx, val, ret) \
+__NL__          else \
+__NL__            call cbslf_read(ctx, nsize, ret) \
+__NL__            if (ret == cbslf_success .and. nsize > 0) then \
+__NL__              bsize = size(lb) * c_sizeof(val(CONCAT(FORTRAN_ARRAY_VALUE_,DIMS))) \
+__NL__              ret   = iand(cbsl_read(ctx%ctx, loc(lb), bsize), ret) \
+__NL__              ret   = iand(cbsl_read(ctx%ctx, loc(ub), bsize), ret) \
+__NL__              allocate(val(CONCAT(FORTRAN_ARRAY_SHAPE_,DIMS))) \
+__NL__              bsize = nsize * c_sizeof(val(CONCAT(FORTRAN_ARRAY_VALUE_,DIMS))) \
+__NL__              ret   = iand(cbsl_read(ctx%ctx, loc(val), bsize), ret) \
+__NL__            else \
+__NL__              ret = cbslf_error \
+__NL__            end if \
+__NL__          end if \
+__NL__        case default \
+__NL__          ret = cbslf_error \
+__NL__      end select \
+__NL__      SET_ERRCODE(ret) \
+__NL__    end subroutine
+
+#define IMPLEMENT_ARRAY_INTERFACE(ROUTINE_NAME,DATA_TYPE)  \
+          IMPLEMENT_SCALAR_INTERFACE(ROUTINE_NAME,DATA_TYPE) \
+          IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,1) \
+          IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,2) \
+          IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,3) \
+          IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,4) \
+          IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,5) \
+          IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,6) \
+          IMPLEMENT_ARRAY_INTERFACE_N(ROUTINE_NAME,DATA_TYPE,7)
+
+!======
+private
+
+  integer(8),   parameter :: CBSL_VERSION         = @cbsl_VERSION_MAJOR@@cbsl_VERSION_MINOR@@cbsl_VERSION_PATCH@
+  character(*), parameter :: CBSL_VERSTION_STRING = '@cbsl_VERSION@'
+  integer(4),   parameter :: CBSL_MAJOR_VERSION   = @cbsl_VERSION_MAJOR@
+  integer(4),   parameter :: CBSL_MINOR_VERSION   = @cbsl_VERSION_MINOR@
+  integer(4),   parameter :: CBSL_PATCH_VERSION   = @cbsl_VERSION_PATCH@
+
+  integer(4), parameter :: cbslf_load_mode    = 1
+  integer(4), parameter :: cbslf_store_mode   = 2
+  integer(4), parameter :: cbslf_unknown_mode = -1
+
+  integer(4), parameter :: cbslf_success = 0
+  integer(4), parameter :: cbslf_error   = -1
+
+  ! C function interfaces
+  interface
+    function cbsl_open(open_mode, path) result(ctx) &
+        bind(C,name='cbsl_open')
+      use, intrinsic :: iso_c_binding
+      integer(c_int),value,  intent(in) :: open_mode
+      character(kind=c_char),intent(in) :: path(*)
+      integer(c_intptr_t) :: ctx
+    end function
+
+    function cbsl_close(ctx) result(retcode) &
+        bind(C,name='cbsl_close')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_int) :: retcode
+    end function
+
+    function cbsl_flush(ctx) result(retcode) &
+        bind(C,name='cbsl_flush')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_int) :: retcode
+    end function
+
+    function cbsl_get_mode(ctx) result(retcode) &
+        bind(C,name='cbsl_get_mode')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_int) :: retcode
+    end function
+
+    function cbsl_write(ctx, pdata, psize) result(retcode) &
+        bind(C,name='cbsl_write')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_intptr_t),value,intent(in) :: pdata
+      integer(c_int64_t),value,intent(in)  :: psize
+      integer(c_int) :: retcode
+    end function
+
+    function cbsl_read(ctx, pdata, psize) result(retcode) &
+        bind(C,name='cbsl_read')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_intptr_t),value,intent(in) :: pdata
+      integer(c_int64_t),value,intent(in)  :: psize
+      integer(c_int) :: retcode
+    end function
+
+    function cbsl_record(ctx, pdata, psize) result(retcode) &
+        bind(C,name='cbsl_record')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_intptr_t),value,intent(in) :: pdata
+      integer(c_int64_t),value,intent(in)  :: psize
+      integer(c_int) :: retcode
+    end function
+
+    ! cbsl_record_heap() not binds because the function uses malloc()
+
+    function cbsl_set_compression_level(ctx,clevel) result(retcode) &
+        bind(C,name='cbsl_set_compression_level')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_int),value,intent(in) :: clevel
+      integer(c_int) :: retcode
+    end function
+
+    function cbsl_get_compression_level(ctx) result(clevel) &
+        bind(C,name='cbsl_get_compression_level')
+      use, intrinsic :: iso_c_binding
+      integer(c_intptr_t),value,intent(in) :: ctx
+      integer(c_int) :: clevel
+    end function
+  end interface
+
+  ! Generic routines
+  interface cbslf_write
+    DECLARE_SCALAR_INTERFACE(write,character)
+    DECLARE_SCALAR_INTERFACE(write,logical)
+
+    DECLARE_ARRAY_INTERFACE(write,integer4)
+    DECLARE_ARRAY_INTERFACE(write,integer8)
+    DECLARE_ARRAY_INTERFACE(write,sreal)
+    DECLARE_ARRAY_INTERFACE(write,dreal)
+    DECLARE_ARRAY_INTERFACE(write,ccomplex)
+    DECLARE_ARRAY_INTERFACE(write,zcomplex)
+  end interface
+
+  interface cbslf_read
+    DECLARE_SCALAR_INTERFACE(read,character)
+    DECLARE_SCALAR_INTERFACE(read,logical)
+
+    DECLARE_ARRAY_INTERFACE(read,integer4)
+    DECLARE_ARRAY_INTERFACE(read,integer8)
+    DECLARE_ARRAY_INTERFACE(read,sreal)
+    DECLARE_ARRAY_INTERFACE(read,dreal)
+    DECLARE_ARRAY_INTERFACE(read,ccomplex)
+    DECLARE_ARRAY_INTERFACE(read,zcomplex)
+  end interface
+
+  interface cbslf_record
+    DECLARE_SCALAR_INTERFACE(record,character)
+    DECLARE_SCALAR_INTERFACE(record,logical)
+
+    DECLARE_ARRAY_INTERFACE(record,integer4)
+    DECLARE_ARRAY_INTERFACE(record,integer8)
+    DECLARE_ARRAY_INTERFACE(record,sreal)
+    DECLARE_ARRAY_INTERFACE(record,dreal)
+    DECLARE_ARRAY_INTERFACE(record,ccomplex)
+    DECLARE_ARRAY_INTERFACE(record,zcomplex)
+  end interface
+
+  interface cbslf_record_heap
+    DECLARE_ARRAY_INTERFACE_ALLOCATABLE(record,integer4)
+    DECLARE_ARRAY_INTERFACE_ALLOCATABLE(record,integer8)
+    DECLARE_ARRAY_INTERFACE_ALLOCATABLE(record,sreal)
+    DECLARE_ARRAY_INTERFACE_ALLOCATABLE(record,dreal)
+    DECLARE_ARRAY_INTERFACE_ALLOCATABLE(record,ccomplex)
+    DECLARE_ARRAY_INTERFACE_ALLOCATABLE(record,zcomplex)
+  end interface
+
+contains
+  IMPLEMENT_SCALAR_INTERFACE(character,character(*,kind=c_char))
+  IMPLEMENT_SCALAR_INTERFACE(logical,logical(c_bool))
+
+  IMPLEMENT_ARRAY_INTERFACE(integer4,integer(c_int32_t))
+  IMPLEMENT_ARRAY_INTERFACE(integer8,integer(c_int64_t))
+  IMPLEMENT_ARRAY_INTERFACE(sreal,real(c_float))
+  IMPLEMENT_ARRAY_INTERFACE(dreal,real(c_double))
+  IMPLEMENT_ARRAY_INTERFACE(ccomplex,complex(c_float_complex))
+  IMPLEMENT_ARRAY_INTERFACE(zcomplex,complex(c_double_complex))
+
+  function cbslf_open(open_mode, path, errcode) result(ctx)
+    implicit none
+    integer(4),   intent(in)            :: open_mode
+    character(*), intent(in)            :: path
+    integer(4),   intent(out), optional :: errcode
+    type(cbslf_context) :: ctx
+    character(1,c_char)  :: cpath(len_trim(path)+1)
+    integer(4) :: n,i
+    n = len_trim(path, kind=4)
+    do i=1,n
+      cpath(i) = path(i:i)
+    end do
+    cpath(n+1) = c_null_char
+    ctx%ctx = cbsl_open(open_mode, cpath)
+    SET_ERRCODE_COND(ctx%ctx /= 0) ! is not null pointer
+  end function
+
+  subroutine cbslf_close(ctx, errcode)
+    implicit none
+    type(cbslf_context), intent(in)            :: ctx
+    integer(4),          intent(out), optional :: errcode
+    integer(4) :: ret
+    ret = cbsl_close(ctx%ctx)
+    SET_ERRCODE(ret)
+  end subroutine
+
+  subroutine cbslf_flush(ctx, errcode)
+    implicit none
+    type(cbslf_context), intent(in)            :: ctx
+    integer(4),          intent(out), optional :: errcode
+    integer(4) :: ret
+    ret = cbsl_flush(ctx%ctx)
+    SET_ERRCODE(ret)
+  end subroutine
+
+  function cbslf_get_mode(ctx, errcode) result(open_mode)
+    implicit none
+    type(cbslf_context), intent(in)            :: ctx
+    integer(4),          intent(out), optional :: errcode
+    integer(4) :: open_mode
+    open_mode = cbsl_get_mode(ctx%ctx)
+    SET_ERRCODE_COND(open_mode == cbslf_unknown_mode)
+  end function
+
+  subroutine cbslf_set_compression_level(ctx, clevel, errcode)
+    implicit none
+    type(cbslf_context), intent(in)            :: ctx
+    integer(4),          intent(in)            :: clevel
+    integer(4),          intent(out), optional :: errcode
+    integer(4) :: ret
+    ret = cbsl_set_compression_level(ctx%ctx, clevel)
+    SET_ERRCODE(ret)
+  end subroutine
+
+  function cbslf_get_compression_level(ctx, errcode) result(clevel)
+    implicit none
+    type(cbslf_context), intent(in)            :: ctx
+    integer(4),          intent(out), optional :: errcode
+    integer(4) :: clevel
+    clevel = cbsl_get_compression_level(ctx%ctx)
+    SET_ERRCODE_COND(clevel > 0)
+  end function
+end module
--- a/cachelab/cbsl/src/gen_fortran_bindings.cmake
+++ b/cachelab/cbsl/src/gen_fortran_bindings.cmake
@@ -0,0 +1,31 @@
+#
+# Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+cmake_minimum_required(VERSION 3.3)
+
+if (${CMAKE_ARGC} LESS 4)
+  message(FATAL_ERROR "Usage ${CMAKE_ARGV2} <input file> <output file>")
+endif ()
+
+set(INPUT_FILE  ${CMAKE_ARGV3})
+if (CMAKE_ARGV4)
+  set(OUTPUT_FILE ${CMAKE_ARGV4})
+else ()
+  set(OUTPUT_FILE ${CMAKE_ARGV3})
+endif ()
+
+file(READ ${INPUT_FILE} FBIND_SOURCE_TEXT)
+string(REGEX REPLACE "__NL__" "\n" FBIND_GEN_TEXT ${FBIND_SOURCE_TEXT})
+file(WRITE ${OUTPUT_FILE} ${FBIND_GEN_TEXT})
--- a/cachelab/cbsl/src/read.c
+++ b/cachelab/cbsl/src/read.c
@@ -0,0 +1,208 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdint.h>
+#include <string.h>
+#include <zstd.h>
+
+#include "./cbsl_internal.h"
+
+static
+cbsl_errors streaming_read_immediate(cbsl_ctx* ctx, void* data, uint64_t size)
+{
+	CBSL_DEBUG_MESSAGE("%s: call\n", __func__);
+
+	/* previous all decompressed data loaded */
+	CBSL_CHECK_COND_AND_RETURN(ctx->out_buffer_pos >= ctx->out_buffer_used, cbsl_error);
+
+	ZSTD_outBuffer output = { data, size, 0 }; /* decompressed data stores directly */
+	while (output.pos < output.size)
+	{
+		/* previous read data from file */
+		if (ctx->in_buffer_pos < ctx->in_buffer_used)
+		{
+			/* input buffer has remained data from the previous decompression */
+			memmove(ctx->in_buffer, ctx->in_buffer + ctx->in_buffer_pos, ctx->in_buffer_used - ctx->in_buffer_pos);
+			ctx->in_buffer_used -= ctx->in_buffer_pos;
+		}
+		else
+		{
+			ctx->in_buffer_used = 0ULL;
+		}
+		ctx->in_buffer_pos = 0ULL;
+
+		ctx->in_buffer_used += fread(ctx->in_buffer + ctx->in_buffer_used, 1, ctx->in_buffer_size - ctx->in_buffer_used, ctx->fp);
+
+		ZSTD_inBuffer input = { ctx->in_buffer, ctx->in_buffer_used, ctx->in_buffer_pos };
+		while (input.pos < input.size && output.pos < output.size)
+		{
+			const size_t ret = ZSTD_decompressStream(ctx->zstd_dctx, &output, &input);
+			CBSL_CHECK_COND_MSG_AND_RETURN(!ZSTD_isError(ret), ZSTD_getErrorName(ret), cbsl_error);
+		}
+		ctx->in_buffer_used = input.size;
+		ctx->in_buffer_pos = input.pos;
+	}
+	CBSL_ASSERT(output.pos == output.size);
+	ctx->out_buffer_pos = output.pos;
+	ctx->out_buffer_used = output.size;
+
+	return cbsl_success;
+}
+
+static
+uint64_t read_from_buffer(cbsl_ctx* ctx, byte_t* data, uint64_t size)
+{
+	uint64_t read = 0;
+	if (ctx->out_buffer_pos < ctx->out_buffer_used)
+	{
+		const uint64_t read_size = MIN(ctx->out_buffer_used - ctx->out_buffer_pos, size);
+		memcpy(data, ctx->out_buffer + ctx->out_buffer_pos, read_size);
+		ctx->out_buffer_pos += read_size;
+		read = read_size;
+	}
+	return read;
+}
+
+static
+cbsl_errors streaming_read_buffered(cbsl_ctx* ctx, void* data, uint64_t size)
+{
+	CBSL_DEBUG_MESSAGE("%s: call\n", __func__);
+
+	size_t zstd_ret = -1;
+
+	/* memcpy from the previous decompression data */
+	uint64_t read = read_from_buffer(ctx, data, size);
+
+	byte_t* pdata = (byte_t*)(data);
+
+	/* streaming decompression and memcpy */
+	while (read < size)
+	{
+		if (ctx->in_buffer_pos < ctx->in_buffer_used)
+		{
+			/* input buffer has remained data from the previous decompression */
+			memmove(ctx->in_buffer, ctx->in_buffer + ctx->in_buffer_pos, ctx->in_buffer_used - ctx->in_buffer_pos);
+			ctx->in_buffer_used -= ctx->in_buffer_pos;
+		}
+		else
+		{
+			/* input buffer is already consumed by the previous decompression */
+			ctx->in_buffer_used = 0;
+		}
+		ctx->in_buffer_pos = 0ULL;
+
+		ctx->in_buffer_used += fread(ctx->in_buffer + ctx->in_buffer_used, 1, ctx->in_buffer_size - ctx->in_buffer_used, ctx->fp);
+
+		if (ctx->in_buffer_used == 0)   // 从文件中，读取不到数据了，无法解压
+			break;
+		ZSTD_inBuffer input = { ctx->in_buffer, ctx->in_buffer_used, ctx->in_buffer_pos };
+		while (input.pos < input.size && read < size)
+		{
+			ZSTD_outBuffer output = { ctx->out_buffer, ctx->out_buffer_size, 0 };
+			zstd_ret = ZSTD_decompressStream(ctx->zstd_dctx, &output, &input);
+			CBSL_CHECK_COND_MSG_AND_RETURN(!ZSTD_isError(zstd_ret), ZSTD_getErrorName(zstd_ret), cbsl_error);
+			ctx->out_buffer_pos = 0ULL;
+			ctx->out_buffer_used = output.pos;
+			read += read_from_buffer(ctx, pdata + read, size - read);
+		}
+		ctx->in_buffer_pos = input.pos;
+		ctx->in_buffer_used = input.size;
+
+		if (zstd_ret == 0)
+		{
+			// zstd stream end
+			ctx->zstd_file_end = 1;
+			break;
+		}
+	}
+	if (ctx->zstd_file_end == 1 && ctx->out_buffer_pos == ctx->out_buffer_used)
+		ctx->zstd_buf_end = 1;
+	CBSL_ASSERT(read == size || ctx->zstd_end == 1);
+
+	ctx->line_buffer_read_from_zst = read;
+
+	return cbsl_success;
+}
+
+cbsl_errors cbsl_read(cbsl_ctx* ctx, void* data, uint64_t size)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(ctx->mode == cbsl_load_mode, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(data != NULL, cbsl_error);
+
+	CBSL_DEBUG_MESSAGE("read: %lu bytes\n", size);
+
+	if (size > ctx->out_buffer_size)
+	{
+		/* data size is larger than compression buffer */
+		return streaming_read_immediate(ctx, data, size);
+	}
+	else
+	{
+		return streaming_read_buffered(ctx, data, size);
+	}
+}
+
+// readline from stream
+cbsl_errors cbsl_readline(cbsl_ctx* ctx, char* data, uint64_t size)
+{
+	cbsl_errors ret = cbsl_success;
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(ctx->mode == cbsl_load_mode, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(data != NULL, cbsl_error);
+
+	CBSL_DEBUG_MESSAGE("%s: %lu bytes\n", __func__, size);
+	uint64_t line_buffer_space = 0;
+	line_buffer_space = CBSL_LINEBUF_SIZE - ctx->line_buffer_used;
+
+	if (ctx->zstd_buf_end == 0)
+	{
+		if (line_buffer_space > ctx->out_buffer_size)
+		{
+			/* line_buffer size is larger than compression buffer */
+			ret = streaming_read_immediate(ctx, ctx->line_buffer + ctx->line_buffer_used, line_buffer_space);
+		}
+		else
+		{
+			ret = streaming_read_buffered(ctx, ctx->line_buffer + ctx->line_buffer_used, line_buffer_space);
+		}
+		ctx->line_buffer_used += ctx->line_buffer_read_from_zst;
+	}
+
+	uint64_t i;
+	char* ptr;
+	ptr = (char*)ctx->line_buffer;
+	data[0] = '\0';
+	for (i = 0; i < ctx->line_buffer_used; i++)
+	{
+		if (*ptr == '\n' || *ptr == '\r')
+		{
+			CBSL_CHECK_COND_AND_RETURN(size >= i - 1, cbsl_error);
+			memcpy(data, ctx->line_buffer, i + 1);
+			memmove(ctx->line_buffer, ctx->line_buffer + i + 1, ctx->line_buffer_used - i - 1);
+			ctx->line_buffer_used -= i + 1;
+			data[i + 1] = '\0';
+			break;
+		}
+		ptr++;
+	}
+
+	if (ctx->line_buffer_used == 0)
+		return cbsl_end;
+	else
+		return ret;
+}
--- a/cachelab/cbsl/src/record.c
+++ b/cachelab/cbsl/src/record.c
@@ -0,0 +1,70 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdint.h>
+#include <stdlib.h>
+
+#include "./cbsl_internal.h"
+
+cbsl_errors cbsl_record(cbsl_ctx* ctx, void* data, uint64_t size)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(data != NULL, cbsl_error);
+
+	switch (ctx->mode)
+	{
+	case cbsl_load_mode:  return cbsl_read(ctx, data, size);
+	case cbsl_store_mode: return cbsl_write(ctx, data, size);
+	default:              return cbsl_error;
+	}
+}
+
+cbsl_errors cbsl_record_heap(cbsl_ctx* ctx, void** data, uint64_t* size)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(data != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(size != NULL, cbsl_error);
+
+	switch (ctx->mode)
+	{
+	case cbsl_load_mode:
+	{
+		uint64_t rsize;
+		void* rdata = *data;
+		CBSL_CHECK_COND_AND_RETURN(cbsl_read(ctx, &rsize, sizeof(rsize)) == cbsl_success, cbsl_error);
+		if (rdata == NULL)
+		{
+			CBSL_CHECK_COND_AND_RETURN((rdata = malloc(rsize)) != NULL, cbsl_error);
+		}
+		else
+		{
+			CBSL_CHECK_COND_AND_RETURN(rsize == *size, cbsl_error);
+		}
+		CBSL_CHECK_COND_AND_RETURN(cbsl_read(ctx, rdata, rsize) == cbsl_success, cbsl_error);
+		*size = rsize;
+		*data = rdata;
+	}
+	break;
+	case cbsl_store_mode:
+	{
+		CBSL_CHECK_COND_AND_RETURN(cbsl_write(ctx, size, sizeof(*size)) == cbsl_success, cbsl_error);
+		CBSL_CHECK_COND_AND_RETURN(cbsl_write(ctx, *data, *size) == cbsl_success, cbsl_error);
+	}
+	break;
+	default:
+		return cbsl_error;
+	}
+	return cbsl_success;
+}
--- a/cachelab/cbsl/src/utils.c
+++ b/cachelab/cbsl/src/utils.c
@@ -0,0 +1,49 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include "./cbsl_internal.h"
+
+ /* FIXME: implicit declaration??? */
+extern ZSTDLIB_API size_t ZSTD_CCtx_getParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, int* value);
+
+
+cbsl_mode cbsl_get_mode(cbsl_ctx* ctx)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_unknown_mode);
+	return ctx->mode;
+}
+
+cbsl_errors cbsl_set_compression_level(cbsl_ctx* ctx, int clevel)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(ctx->mode == cbsl_store_mode, cbsl_error);
+
+	const size_t ret = ZSTD_CCtx_setParameter(ctx->zstd_cctx, ZSTD_c_compressionLevel, clevel);
+	CBSL_CHECK_COND_MSG_AND_RETURN(!ZSTD_isError(ret), ZSTD_getErrorName(ret), cbsl_error);
+
+	return cbsl_success;
+}
+
+int cbsl_get_compression_level(cbsl_ctx* ctx)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(ctx->mode == cbsl_store_mode, cbsl_error);
+
+	int clevel;
+	const size_t ret = ZSTD_CCtx_getParameter(ctx->zstd_cctx, ZSTD_c_compressionLevel, &clevel);
+	CBSL_CHECK_COND_MSG_AND_RETURN(!ZSTD_isError(ret), ZSTD_getErrorName(ret), cbsl_error);
+
+	return clevel;
+}
--- a/cachelab/cbsl/src/write.c
+++ b/cachelab/cbsl/src/write.c
@@ -0,0 +1,101 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdint.h>
+#include <string.h>
+
+#include "./cbsl_internal.h"
+
+static
+cbsl_errors streaming_write_flush(cbsl_ctx* ctx, uint64_t size)
+{
+	if (ctx->in_buffer_used > 0 && ctx->in_buffer_used + size > ctx->in_buffer_size)
+	{
+		CBSL_CHECK_COND_AND_RETURN(cbsl_flush(ctx) == cbsl_success, cbsl_error);
+	}
+	return cbsl_success;
+}
+
+static
+cbsl_errors streaming_write_immediate(cbsl_ctx* ctx, const void* data, uint64_t size)
+{
+	CBSL_DEBUG_MESSAGE("%s: call\n", __func__);
+	CBSL_CHECK_COND_AND_RETURN(streaming_write_flush(ctx, size) == cbsl_success, cbsl_error);
+
+	uint64_t written = 0;
+	const byte_t* pdata = (const byte_t*)(data);
+	while (written < size)
+	{
+		/* compressing data copies to internal input buffer */
+		const uint64_t write_size = MIN(size - written, ctx->in_buffer_size);
+		memcpy(ctx->in_buffer, pdata + written, write_size);
+		written += write_size;
+
+		ZSTD_inBuffer input = { ctx->in_buffer, write_size, 0 };
+		ZSTD_EndDirective mode = (size - written < ctx->in_buffer_size) ? ZSTD_e_end : ZSTD_e_continue;
+		do
+		{
+			ZSTD_outBuffer output = { ctx->out_buffer, ctx->out_buffer_size, 0 };
+			const size_t remaining = ZSTD_compressStream2(ctx->zstd_cctx, &output, &input, mode);
+			CBSL_CHECK_COND_MSG_AND_RETURN(!ZSTD_isError(remaining), ZSTD_getErrorName(remaining), cbsl_error);
+			CBSL_CHECK_COND_AND_RETURN(fwrite(ctx->out_buffer, 1, output.pos, ctx->fp) == output.pos, cbsl_error);
+		} while (input.pos < input.size);
+		CBSL_ASSERT(input.pos == input.size);
+	}
+	CBSL_ASSERT(written == size);
+
+	return cbsl_success;
+}
+
+static
+cbsl_errors streaming_write_buffered(cbsl_ctx* ctx, const void* data, uint64_t size)
+{
+	CBSL_DEBUG_MESSAGE("%s: call\n", __func__);
+	CBSL_CHECK_COND_AND_RETURN(streaming_write_flush(ctx, size) == cbsl_success, cbsl_error);
+
+	uint64_t written = 0;
+	const byte_t* pdata = (const byte_t*)(data);
+	do
+	{
+		const uint64_t write_size = MIN(size - written, ctx->in_buffer_size);
+		memcpy(ctx->in_buffer, pdata + written, write_size);
+		ctx->in_buffer_used = write_size;
+		CBSL_CHECK_COND_AND_RETURN(cbsl_flush(ctx) == cbsl_success, cbsl_error);
+		written += write_size;
+	} while (written < size);
+	CBSL_ASSERT(written == size);
+
+	return cbsl_success;
+}
+
+cbsl_errors cbsl_write(cbsl_ctx* ctx, const void* data, uint64_t size)
+{
+	CBSL_CHECK_COND_AND_RETURN(ctx != NULL, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(ctx->mode == cbsl_store_mode, cbsl_error);
+	CBSL_CHECK_COND_AND_RETURN(data != NULL, cbsl_error);
+
+	CBSL_DEBUG_MESSAGE("write: %lu bytes\n", size);
+	if (size > ctx->in_buffer_size)
+	{
+		/* data size is larger than compression buffer */
+		return streaming_write_immediate(ctx, data, size);
+	}
+	else
+	{
+		return streaming_write_buffered(ctx, data, size);
+	}
+}
--- a/cachelab/cbsl/tests/CMakeLists.txt
+++ b/cachelab/cbsl/tests/CMakeLists.txt
@@ -0,0 +1,106 @@
+#
+# Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+link_libraries(${CBSL_LIB} ${ZSTD_LIB})
+
+add_executable(scalar_data scalar_data.c)
+add_executable(single_array single_array.c)
+add_executable(multi_array multi_array.c)
+add_executable(utility utility.c)
+add_executable(split_compression split_compression.c)
+add_executable(variable_size_array variable_size_array.c)
+add_executable(various_size_array various_size_array.c)
+
+add_executable(cbsl_record       cbsl_record.c)
+add_executable(cbsl_record_array cbsl_record_array.c)
+
+add_executable(fortran_bindings fortran_bindings.f90)
+target_link_libraries(fortran_bindings ${CBSL_FLIB} ${CBSL_LIB} ${ZSTD_LIB})
+
+add_test(NAME utility COMMAND utility)
+
+
+#
+# very short data compression/decompression
+#
+add_test(NAME scalar_data_compression   COMMAND scalar_data -c)
+add_test(NAME scalar_data_decompression COMMAND scalar_data -d)
+set_tests_properties(scalar_data_decompression PROPERTIES DEPENDS scalar_data_compression)
+
+
+#
+# boundary checking with single array
+#
+function(add_simple_test_size_boundary DATA_SIZE)
+  math(EXPR DATA_SIZE_B "${DATA_SIZE} - 1")
+  add_test(NAME single_array_${DATA_SIZE_B} COMMAND single_array ${DATA_SIZE_B})
+  add_test(NAME single_array_${DATA_SIZE}   COMMAND single_array ${DATA_SIZE})
+  math(EXPR DATA_SIZE_B "${DATA_SIZE} + 1")
+  add_test(NAME single_array_${DATA_SIZE_B} COMMAND single_array ${DATA_SIZE_B})
+endfunction()
+
+foreach(count RANGE 10 20)
+  math(EXPR DATA_SIZE "1 << ${count}")
+  add_simple_test_size_boundary(${DATA_SIZE})
+endforeach()
+
+
+#
+# boundary checking with multiple arrays
+#
+function(add_multiple_test_size NUM_VARS)
+  foreach(count RANGE 10 20)
+    math(EXPR DATA_SIZE "1 << ${count}")
+    add_test(NAME multi_array_${DATA_SIZE}_by_${NUM_VARS}  COMMAND multi_array ${NUM_VARS} ${DATA_SIZE})
+  endforeach()
+endfunction()
+
+add_multiple_test_size(2)
+add_multiple_test_size(3)
+add_multiple_test_size(11)
+
+
+#
+# test compression/decompression form
+#
+add_test(NAME variable_size_array COMMAND variable_size_array)
+math(EXPR DATA_SIZE "1 << 17")
+add_test(NAME buffered_read_write COMMAND variable_size_array ${DATA_SIZE})
+math(EXPR DATA_SIZE "(1 << 17) + 1")
+add_test(NAME immediate_read_write COMMAND variable_size_array ${DATA_SIZE})
+
+add_test(NAME various_size_array COMMAND various_size_array)
+
+
+add_test(NAME cbsl_record        COMMAND cbsl_record)
+add_test(NAME cbsl_record_array  COMMAND cbsl_record_array)
+
+
+#
+# large array compression/decompression by splitting small block
+#
+math(EXPR BLOCK_SIZE "1 << 18") # 256 KiB
+math(EXPR TOTAL_SIZE "1 << 28") # 256 MiB
+add_test(NAME split_compression_256KiB_256MiB COMMAND split_compression ${BLOCK_SIZE} ${TOTAL_SIZE})
+
+math(EXPR BLOCK_SIZE "(1 << 18) - (1 << 16)") # 192 KiB
+math(EXPR TOTAL_SIZE "1 << 28")               # 256 MiB
+add_test(NAME split_compression_192KiB_256MiB COMMAND split_compression ${BLOCK_SIZE} ${TOTAL_SIZE})
+
+
+#
+# Fortran bindings API
+#
+add_test(NAME fortran_bindings COMMAND fortran_bindings)
--- a/cachelab/cbsl/tests/cbsl_record.c
+++ b/cachelab/cbsl/tests/cbsl_record.c
@@ -0,0 +1,64 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+#define CHECK_BINARY(X,Y)    {if (memcmp(&(X),&(Y),sizeof((X))) != 0) { fprintf(stderr, "error: binary check %s == %s\n", (#X), (#Y)); exit(1); }}
+
+static const int    data0 = 43;
+static const double data1 = 3.14159265;
+static const int    data2 = 14142;
+
+extern void record(cbsl_mode, int*, double*, int*);
+
+char cname[128];
+
+int main(int argc, char** argv)
+{
+  sprintf(cname, "check_record_scalar.zst");
+
+  int    c0 = data0;
+  double c1 = data1;
+  int    c2 = data2;
+  record(cbsl_store_mode, &c0, &c1, &c2);
+
+  c0 = c2 = 0;
+  c1 = 0;
+  record(cbsl_load_mode, &c0, &c1, &c2);
+
+  CHECK_BINARY(c0, data0);
+  CHECK_BINARY(c1, data1);
+  CHECK_BINARY(c2, data2);
+
+  return 0;
+}
+
+void record(cbsl_mode mode, int* c0, double* c1, int* c2)
+{
+  cbsl_ctx* ctx = cbsl_open(mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_record(ctx, c0, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_record(ctx, c1, sizeof(double)));
+  CBSL_ERROR_CHECK(cbsl_record(ctx, c2, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
--- a/cachelab/cbsl/tests/cbsl_record_array.c
+++ b/cachelab/cbsl/tests/cbsl_record_array.c
@@ -0,0 +1,96 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+#define CHECK(X)             {if (!(X)) { fprintf(stderr, "error: check %s\n", (#X)); exit(1); }}
+#define CHECK_BINARY(X,Y)    {if (memcmp(&(X),&(Y),sizeof((X))) != 0) { fprintf(stderr, "error: binary check %s == %s\n", (#X), (#Y)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void rand_byte_t(uint64_t data_size, byte_t* a);
+extern void record(cbsl_mode, uint64_t* size, void** data);
+
+char cname[128];
+
+int main(int argc, char** argv)
+{
+  sprintf(cname, "check_record_scalar.zst");
+
+  uint64_t size = 1024 * 1024 * sizeof(byte_t);
+  byte_t*  data = (byte_t*)(malloc(size));
+
+  rand_byte_t(size, data);
+  record(cbsl_store_mode, &size, (void**) &data);
+
+  uint64_t rsize = 0;
+  byte_t*  rdata = NULL;
+  record(cbsl_load_mode, &rsize, (void**) &rdata);
+
+  CHECK(size == rsize);
+  CHECK(rdata != NULL);
+  for (uint64_t i = 0; i < (size/sizeof(byte_t)); ++i)
+  {
+    if (data[i] != rdata[i])
+    {
+      fprintf(stderr, "1: mismatch!\n");
+      exit(1);
+    }
+    else
+    {
+      rdata[i] = 0;
+    }
+  }
+
+  CHECK(size == rsize);
+  CHECK(rdata != NULL);
+  record(cbsl_load_mode, &rsize, (void**) &rdata);
+
+  for (uint64_t i = 0; i < (size/sizeof(byte_t)); ++i)
+  {
+    if (data[i] != rdata[i])
+    {
+      fprintf(stderr, "2: mismatch!\n");
+      exit(1);
+    }
+  }
+
+  free(data);
+  free(rdata);
+
+  return 0;
+}
+
+void record(cbsl_mode mode, uint64_t* size, void** data)
+{
+  cbsl_ctx* ctx = cbsl_open(mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_record_heap(ctx, data, size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void rand_byte_t(uint64_t data_size, byte_t* a)
+{
+  for(uint64_t i = 0; i < data_size; ++i)
+    a[i] = rand() % 255;
+}
--- a/cachelab/cbsl/tests/fortran_bindings.f90
+++ b/cachelab/cbsl/tests/fortran_bindings.f90
@@ -0,0 +1,159 @@
+!
+! Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+!
+! Licensed under the Apache License, Version 2.0 (the "License");
+! you may not use this file except in compliance with the License.
+! You may obtain a copy of the License at
+!
+!     http://www.apache.org/licenses/LICENSE-2.0
+!
+! Unless required by applicable law or agreed to in writing, software
+! distributed under the License is distributed on an "AS IS" BASIS,
+! WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+! See the License for the specific language governing permissions and
+! limitations under the License.
+!
+program test_fortran_bindings
+  use cbslf
+  integer, parameter :: array_size = 100000
+  real :: source_stack_array(array_size), dest_stack_array(array_size)
+  real, allocatable :: source_heap_array(:), dest_heap_array(:), dest_heap_array2(:)
+  character(128) :: source_string, dest_string
+  character(*), parameter :: cname = 'data_fortran.zst'
+
+  allocate(source_heap_array(array_size))
+  allocate(dest_heap_array(array_size))
+  call random_number(source_stack_array)
+  call random_number(source_heap_array)
+
+  source_string = 'abcdefgABCDEFG%'
+  dest_string   = ''
+
+  print *, 'serialize...'
+  call serialize
+
+  print *, 'deserialize...'
+  call deserialize
+
+  print *, 'compare...'
+  if (.not. compare_real_array(array_size, source_stack_array, dest_stack_array)) then
+    print *, 'fail: compare stack array'
+    stop 1
+  end if
+
+  if (.not. compare_real_array(array_size, source_heap_array, dest_heap_array)) then
+    print *, 'fail: compare heap array'
+    stop 1
+  end if
+
+  if (.not. compare_real_array(array_size, source_heap_array, dest_heap_array2)) then
+    print *, 'fail: compare heap array'
+    stop 1
+  end if
+
+  if (trim(source_string) /= trim(dest_string)) then
+    print *, 'fail: compare string'
+    stop 1
+  end if
+
+contains
+  subroutine serialize
+    implicit none
+    type(cbslf_context) :: ctx
+    integer(4) :: errcode
+
+    ctx = cbslf_open(cbslf_store_mode, cname, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_open(store)'
+      stop 1
+    end if
+
+    call cbslf_set_compression_level(ctx, 10, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_set_compression_level'
+      stop 1
+    end if
+
+    call cbslf_write(ctx, source_stack_array, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_write(stack array)'
+      stop 1
+    end if
+
+    call cbslf_write(ctx, source_heap_array, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_write(heap array)'
+      stop 1
+    end if
+
+    call cbslf_write(ctx, source_heap_array, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_write(heap array2)'
+      stop 1
+    end if
+
+    call cbslf_write(ctx, source_string, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_write(string)'
+      stop 1
+    end if
+
+    call cbslf_close(ctx)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_close'
+      stop 1
+    end if
+  end subroutine
+
+  subroutine deserialize
+    implicit none
+    type(cbslf_context) :: ctx
+    integer(4) :: errcode
+    ctx = cbslf_open(cbslf_load_mode, cname, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_open(load)'
+      stop 1
+    end if
+
+    call cbslf_read(ctx, dest_stack_array, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_read(stack array)'
+      stop 1
+    end if
+
+    call cbslf_read(ctx, dest_heap_array, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_read(heap array)'
+      stop 1
+    end if
+
+    call cbslf_record_heap(ctx, dest_heap_array2, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_record_heap(heap array2)'
+      stop 1
+    end if
+
+    call cbslf_read(ctx, dest_string, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_read(string)'
+      stop 1
+    end if
+
+    call cbslf_close(ctx, errcode)
+    if (errcode /= cbslf_success) then
+      print *, 'fail: cbslf_close'
+      stop 1
+    end if
+  end subroutine
+
+  function compare_real_array(n, a, b) result(ret)
+    implicit none
+    integer, intent(in) :: n
+    real,    intent(in) :: a(n), b(n)
+    logical :: ret
+    integer :: i
+    do i=1,n
+      ret = (abs(a(i) - b(i)) <= epsilon(a(i)))
+    end do
+  end function
+end program
--- a/cachelab/cbsl/tests/multi_array.c
+++ b/cachelab/cbsl/tests/multi_array.c
@@ -0,0 +1,150 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#include <math.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void compress(uint64_t num_vars, uint64_t data_size, byte_t** a);
+extern void raw_write(uint64_t num_vars, uint64_t data_size, byte_t** a);
+extern void decompress(uint64_t num_vars, uint64_t data_size, byte_t** a);
+extern void raw_read(uint64_t num_vars, uint64_t data_size, byte_t** a);
+extern void rand_byte_t(uint64_t data_size, byte_t* a);
+
+char cname[128], sname[128];
+
+int main(int argc, char** argv)
+{
+  if (argc <= 2)
+    exit(1);
+
+  uint64_t data_size, num_vars;
+  sscanf(argv[1], "%lu", &num_vars);
+  sscanf(argv[2], "%lu", &data_size);
+  data_size = data_size / num_vars;
+
+  printf("variables = %lu\n", num_vars);
+  printf("data size = %lf [MiB] * %lu\n", (double)(data_size)/pow(2,20), num_vars);
+
+  sprintf(cname, "multiple_compressed_%lu.zst", data_size * num_vars);
+  sprintf(sname, "multiple_raw_%lu.dat", data_size);
+
+  srand((unsigned int)(time(NULL)));
+
+  byte_t** a = malloc(sizeof(byte_t*) * num_vars);
+  byte_t** b = malloc(sizeof(byte_t*) * num_vars);
+  byte_t** c = malloc(sizeof(byte_t*) * num_vars);
+  for(uint64_t i = 0; i < num_vars; ++i)
+  {
+    a[i] = (byte_t*)(malloc(data_size));
+    rand_byte_t(data_size / sizeof(byte_t), a[i]);
+    b[i] = (byte_t*)(malloc(data_size));
+    c[i] = (byte_t*)(malloc(data_size));
+  }
+
+  compress(num_vars, data_size, a);
+  raw_write(num_vars, data_size, a);
+
+  decompress(num_vars, data_size, b);
+  raw_read(num_vars, data_size, c);
+
+  for(uint64_t i = 0; i < num_vars; ++i)
+  {
+    for(uint64_t j = 0; j < data_size; ++j)
+    {
+      if (b[i][j] != c[i][j])
+      {
+        fprintf(stderr, "mismatch!\n");
+        exit(1);
+      }
+    }
+  }
+
+  for(uint64_t i = 0; i < num_vars; ++i)
+  {
+    free(a[i]);
+    free(b[i]);
+    free(c[i]);
+  }
+  free(a);
+  free(b);
+  free(c);
+
+  return 0;
+}
+
+void compress(uint64_t num_vars, uint64_t data_size, byte_t** a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+  for(uint64_t i = 0; i < num_vars; ++i)
+    CBSL_ERROR_CHECK(cbsl_write(ctx, a[i], data_size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_write(uint64_t num_vars, uint64_t data_size, byte_t** a)
+{
+  FILE* fp = fopen(sname, "wb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen\n");
+    exit(1);
+  }
+  for(int i = 0; i < num_vars; ++i)
+    fwrite(a[i], 1, data_size, fp);
+  fclose(fp);
+}
+
+void decompress(uint64_t num_vars, uint64_t data_size, byte_t** a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+  for(uint64_t i = 0; i < num_vars; ++i)
+    CBSL_ERROR_CHECK(cbsl_read(ctx, a[i], data_size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_read(uint64_t num_vars, uint64_t data_size, byte_t** a)
+{
+  FILE* fp = fopen(sname, "rb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen\n");
+    exit(1);
+  }
+  for(uint64_t i = 0; i < num_vars; ++i)
+    fread(a[i], 1, data_size, fp);
+  fclose(fp);
+}
+
+void rand_byte_t(uint64_t data_size, byte_t* a)
+{
+  for(uint64_t i = 0; i < data_size; ++i)
+    a[i] = rand() % 255;
+}
--- a/cachelab/cbsl/tests/scalar_data.c
+++ b/cachelab/cbsl/tests/scalar_data.c
@@ -0,0 +1,111 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+#define CHECK_BINARY(X,Y)    {if (memcmp(&(X),&(Y),sizeof((X))) != 0) { fprintf(stderr, "error: binary check %s == %s\n", (#X), (#Y)); exit(1); }}
+
+static const int    data0 = 43;
+static const double data1 = 3.14159265;
+static const int    data2 = 14142;
+
+extern void compress();
+extern void decompress();
+
+char cname[128], sname[128];
+
+int main(int argc, char** argv)
+{
+  if (argc < 2)
+    return 1;
+
+  sprintf(cname, "scalar_compressed.zst");
+  sprintf(sname, "scalar_raw.dat");
+
+  if (strcmp(argv[1],"-c") == 0)
+    compress();
+  else if (strcmp(argv[1],"-d") == 0)
+    decompress();
+  else
+    return 1;
+
+  return 0;
+}
+
+void compress()
+{
+  const int    c0 = data0;
+  const double c1 = data1;
+  const int    c2 = data2;
+
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_write(ctx, &c0, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_write(ctx, &c1, sizeof(double)));
+  CBSL_ERROR_CHECK(cbsl_write(ctx, &c2, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+  FILE* fp = fopen(sname, "wb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen\n");
+    exit(1);
+  }
+  fwrite(&c0, sizeof(int),    1, fp);
+  fwrite(&c1, sizeof(double), 1, fp);
+  fwrite(&c2, sizeof(int),    1, fp);
+  fclose(fp);
+}
+
+void decompress()
+{
+  int    d0, r0;
+  double d1, r1;
+  int    d2, r2;
+
+  cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_read(ctx, &d0, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_read(ctx, &d1, sizeof(double)));
+  CBSL_ERROR_CHECK(cbsl_read(ctx, &d2, sizeof(int)));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+  FILE* fp = fopen(sname, "rb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen\n");
+    exit(1);
+  }
+  fread(&r0, sizeof(int),    1, fp);
+  fread(&r1, sizeof(double), 1, fp);
+  fread(&r2, sizeof(int),    1, fp);
+  fclose(fp);
+
+  CHECK_BINARY(d0, r0); CHECK_BINARY(d0, data0);
+  CHECK_BINARY(d1, r1); CHECK_BINARY(d1, data1);
+  CHECK_BINARY(d2, r2); CHECK_BINARY(d2, data2);
+}
--- a/cachelab/cbsl/tests/single_array.c
+++ b/cachelab/cbsl/tests/single_array.c
@@ -0,0 +1,129 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#include <math.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void compress(uint64_t data_size, const byte_t* a);
+extern void raw_write(uint64_t data_size, const byte_t* a);
+extern void decompress(uint64_t data_size, byte_t* a);
+extern void raw_read(uint64_t data_size, byte_t* a);
+
+extern void rand_byte_t(uint64_t data_size, byte_t* a);
+
+char cname[128], sname[128];
+
+int main(int argc, char** argv)
+{
+  if (argc < 2)
+    exit(1);
+
+  int data_size;
+  sscanf(argv[1], "%d", &data_size);
+  printf("data size = %lf [MiB]\n", (double)(data_size)/pow(2,20));
+
+  sprintf(cname, "simple_compressed_%d.zst", data_size);
+  sprintf(sname, "simple_raw_%d.dat", data_size);
+
+  srand((unsigned int)(time(NULL)));
+
+  byte_t* a = (byte_t*)(malloc(data_size));
+  rand_byte_t(data_size / sizeof(byte_t), a);
+  
+  compress(data_size, a);
+  raw_write(data_size, a);
+
+  byte_t* b = (byte_t*)(malloc(data_size));
+  byte_t* c = (byte_t*)(malloc(data_size));
+
+  decompress(data_size, b);
+  raw_read(data_size, c);
+
+  for (uint64_t i = 0; i < data_size; ++i)
+  {
+    if (a[i] != b[i])
+    {
+      fprintf(stderr, "mismatch!\n");
+      exit(1);
+    }
+  }
+
+  free(a);
+  free(b);
+  free(c);
+
+  return 0;
+}
+
+void compress(uint64_t data_size, const byte_t* a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open(cbsl_store_mode)\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_write(ctx, a, data_size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_write(uint64_t data_size, const byte_t* a)
+{
+  FILE* fp = fopen(sname, "wb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen(wb)\n");
+    exit(1);
+  }
+  fwrite(a, 1, data_size, fp);
+  fclose(fp);
+}
+
+void decompress(uint64_t data_size, byte_t* a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open(cbsl_load_mode)\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_read(ctx, a, data_size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_read(uint64_t data_size, byte_t* a)
+{
+  FILE* fp = fopen(sname, "rb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen(rb)\n");
+    exit(1);
+  }
+  fread(a, 1, data_size, fp);
+  fclose(fp);
+}
+
+void rand_byte_t(uint64_t data_size, byte_t* a)
+{
+  for(uint64_t i = 0; i < data_size; ++i)
+    a[i] = rand() % 255;
+}
--- a/cachelab/cbsl/tests/split_compression.c
+++ b/cachelab/cbsl/tests/split_compression.c
@@ -0,0 +1,93 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+#define CHECK_BINARY(X,Y)    {if (memcmp(&(X),&(Y),sizeof((X))) != 0) { fprintf(stderr, "error: binary check %s == %s\n", (#X), (#Y)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void record(cbsl_mode, int, byte_t*, int);
+extern void rand_byte_t(int n, byte_t* a);
+
+char cname[128];
+
+int main(int argc, char** argv)
+{
+  if (argc < 3)
+    return 1;
+
+  sprintf(cname, "split.zst");
+
+  int block_size, total_size;
+  sscanf(argv[1], "%d\n", &block_size);
+  sscanf(argv[2], "%d\n", &total_size);
+
+  if (total_size < block_size)
+    return 2;
+
+  byte_t* a = malloc(sizeof(byte_t) * total_size);
+  byte_t* b = malloc(sizeof(byte_t) * total_size);
+  rand_byte_t(total_size, a);
+
+  record(cbsl_store_mode, total_size, a, block_size);
+  record(cbsl_load_mode,    total_size, b, block_size);
+
+  for (int i = 0; i < total_size; ++i)
+  {
+    if (a[i] != b[i])
+    {
+      fprintf(stderr, "mismatch!\n");
+      exit(1);
+    }
+  }
+
+  return 0;
+}
+
+void record(cbsl_mode mode, int total_size, byte_t* a, int block_size)
+{
+  cbsl_ctx* ctx = cbsl_open(mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+
+  int total = 0;
+  do
+  {
+    int size = (total_size - total < block_size) ? total_size - total : block_size;
+    CBSL_ERROR_CHECK(cbsl_record(ctx, a + total, size));
+    total += size;
+  }
+  while(total < total_size);
+  if (total != total_size)
+  {
+    fprintf(stderr, "total != total_size\n");
+    exit(1);
+  }
+
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void rand_byte_t(int n, byte_t* a) {
+  for(int i = 0; i < n; ++i)
+    a[i] = rand() % 255;
+}
--- a/cachelab/cbsl/tests/utility.c
+++ b/cachelab/cbsl/tests/utility.c
@@ -0,0 +1,43 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+#define CHECK(X)             {if (!(X)) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+
+char cname[128];
+
+int main(int argc, char** argv)
+{
+  sprintf(cname, "data.zst");
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open\n");
+    exit(1);
+  }
+
+  CHECK(cbsl_get_mode(ctx) == cbsl_store_mode);
+  CBSL_ERROR_CHECK(cbsl_set_compression_level(ctx, 20));
+  CHECK(cbsl_get_compression_level(ctx) == 20);
+
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+
+  return 0;
+}
--- a/cachelab/cbsl/tests/variable_size_array.c
+++ b/cachelab/cbsl/tests/variable_size_array.c
@@ -0,0 +1,155 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#include <math.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void compress(uint64_t data_size, const byte_t* a);
+extern void raw_write(uint64_t data_size, const byte_t* a);
+extern void decompress(uint64_t* data_size, byte_t** a);
+extern void raw_read(uint64_t* data_size, byte_t** a);
+
+extern uint64_t rand_size();
+extern void     rand_byte_t(uint64_t data_size, byte_t* a);
+
+char cname[128], sname[128];
+
+int main(int argc, char** argv)
+{
+  sprintf(cname, "varsize_compressed.zst");
+  sprintf(sname, "varsize_raw.dat");
+
+  srand((unsigned int)(time(NULL)));
+
+  uint64_t data_size;
+  if (argc >= 2)
+  {
+    sscanf(argv[1], "%lu\n", &data_size);
+    printf("specified data size: %lu byte\n", data_size);
+  }
+  else
+  {
+    data_size = rand_size();
+    printf("random generate data size: %lu byte\n", data_size);
+  }
+
+  byte_t* a = (byte_t*)(malloc(data_size));
+  rand_byte_t(data_size / sizeof(byte_t), a);
+  
+  compress(data_size, a);
+  raw_write(data_size, a);
+
+  uint64_t b_data_size; byte_t* b;
+  uint64_t c_data_size; byte_t* c;
+
+  decompress(&b_data_size, &b);
+  raw_read(&c_data_size, &c);
+
+  if (data_size != b_data_size || b_data_size != c_data_size)
+  {
+    fprintf(stderr, "data size is mismatch!\n");
+    exit(1);
+  }
+
+  for (uint64_t i = 0; i < data_size; ++i)
+  {
+    if (a[i] != b[i] || b[i] != c[i])
+    {
+      fprintf(stderr, "data value is mismatch!\n");
+      exit(1);
+    }
+  }
+
+  free(a);
+  free(b);
+  free(c);
+
+  return 0;
+}
+
+void compress(uint64_t data_size, const byte_t* a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open(cbsl_store_mode)\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_write(ctx, &data_size, sizeof(data_size)));
+  CBSL_ERROR_CHECK(cbsl_write(ctx, a, data_size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_write(uint64_t data_size, const byte_t* a)
+{
+  FILE* fp = fopen(sname, "wb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen(wb)\n");
+    exit(1);
+  }
+  fwrite(&data_size, 1, sizeof(data_size), fp);
+  fwrite(a, 1, data_size, fp);
+  fclose(fp);
+}
+
+void decompress(uint64_t* data_size, byte_t** a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open(cbsl_load_mode)\n");
+    exit(1);
+  }
+  CBSL_ERROR_CHECK(cbsl_read(ctx, data_size, sizeof(data_size)));
+  *a = (byte_t*)(malloc(sizeof(byte_t) * *data_size));
+  CBSL_ERROR_CHECK(cbsl_read(ctx, *a, *data_size));
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_read(uint64_t* data_size, byte_t** a)
+{
+  FILE* fp = fopen(sname, "rb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen(rb)\n");
+    exit(1);
+  }
+  fread(data_size, 1, sizeof(data_size), fp);
+  *a = (byte_t*)(malloc(sizeof(byte_t) * *data_size));
+  fread(*a, 1, *data_size, fp);
+  fclose(fp);
+}
+
+uint64_t rand_size()
+{
+  const uint64_t min_data_size = 1024;
+  const uint64_t max_data_size = 1048576; /* 1 MiB */
+  uint64_t size = rand() % max_data_size;
+  return (size < min_data_size) ? min_data_size : size;
+}
+
+void rand_byte_t(uint64_t data_size, byte_t* a)
+{
+  for(uint64_t i = 0; i < data_size; ++i)
+    a[i] = rand() % 255;
+}
--- a/cachelab/cbsl/tests/various_size_array.c
+++ b/cachelab/cbsl/tests/various_size_array.c
@@ -0,0 +1,189 @@
+/*
+ * Copyright 2019 Yuta Hirokawa (University of Tsukuba, Japan)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#include <math.h>
+#include <cbsl.h>
+
+#define CBSL_ERROR_CHECK(X)  {if ((X) == cbsl_error) { fprintf(stderr, "error: %s\n", (#X)); exit(1); }}
+
+typedef unsigned char byte_t;
+
+extern void compress(uint64_t n, uint64_t* sizes, byte_t** a);
+extern void raw_write(uint64_t n, uint64_t* sizes, byte_t** a);
+extern void decompress(uint64_t n, uint64_t* sizes, byte_t** a);
+extern void raw_read(uint64_t n, uint64_t* sizes, byte_t** a);
+
+extern uint64_t rand_size();
+extern void     rand_byte_t(uint64_t data_size, byte_t* a);
+
+char cname[128], sname[128];
+
+int main(int argc, char** argv)
+{
+  sprintf(cname, "various_compressed.zst");
+  sprintf(sname, "various_raw.dat");
+
+  srand((unsigned int)(time(NULL)));
+
+  uint64_t num_vars;
+  if (argc < 2)
+  {
+    num_vars = rand() % 100 + 2;
+  }
+  else
+  {
+    sscanf(argv[1], "%lu\n", &num_vars);
+  }
+  printf("number of array (data sets): %lu\n", num_vars);
+
+  byte_t**  a = (byte_t**)(malloc(sizeof(byte_t**) * num_vars));
+  byte_t**  b = (byte_t**)(malloc(sizeof(byte_t**) * num_vars));
+  byte_t**  c = (byte_t**)(malloc(sizeof(byte_t**) * num_vars));
+  uint64_t* asizes = (uint64_t*)(malloc(sizeof(uint64_t*) * num_vars));
+  uint64_t* bsizes = (uint64_t*)(malloc(sizeof(uint64_t*) * num_vars));
+  uint64_t* csizes = (uint64_t*)(malloc(sizeof(uint64_t*) * num_vars));
+
+  for(uint64_t i = 0; i < num_vars; ++i)
+  {
+    asizes[i] = rand_size();
+    a[i] = (byte_t*)(malloc(sizeof(byte_t*) * asizes[i]));
+    rand_byte_t(asizes[i] / sizeof(byte_t), a[i]);
+    printf("array[%lu] = %lu bytes\n", i, asizes[i]);
+
+    b[i] = (byte_t*)(malloc(sizeof(byte_t*) * asizes[i]));
+    c[i] = (byte_t*)(malloc(sizeof(byte_t*) * asizes[i]));
+  }
+  
+  compress(num_vars, asizes, a);
+  raw_write(num_vars, asizes, a);
+
+  decompress(num_vars, bsizes, b);
+  raw_read(num_vars, csizes, c);
+
+  for (uint64_t i = 0; i < num_vars; ++i)
+  {
+    if (asizes[i] != bsizes[i] || bsizes[i] != csizes[i])
+    {
+      fprintf(stderr, "array size is mismatch!\n");
+      exit(1);
+    }
+  }
+
+  for (uint64_t i = 0; i < num_vars; ++i)
+  for (uint64_t j = 0; j < asizes[i]; ++j)
+  {
+    if (a[i][j] != b[i][j] || b[i][j] != c[i][j])
+    {
+      fprintf(stderr, "data value is mismatch! (a,b,c)[%lu][%lu]\n", i, j);
+      exit(1);
+    }
+  }
+
+  for (uint64_t i = 0; i < num_vars; ++i)
+  {
+    free(a[i]);
+    free(b[i]);
+    free(c[i]);
+  }
+  free(a);
+  free(b);
+  free(c);
+  free(asizes);
+  free(bsizes);
+  free(csizes);
+
+  return 0;
+}
+
+void compress(uint64_t n, uint64_t* sizes, byte_t** a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_store_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open(cbsl_store_mode)\n");
+    exit(1);
+  }
+  for (uint64_t i = 0; i < n; ++i)
+  {
+    CBSL_ERROR_CHECK(cbsl_write(ctx, &sizes[i], sizeof(sizes[i])));
+    CBSL_ERROR_CHECK(cbsl_write(ctx, a[i], sizes[i]));
+  }
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_write(uint64_t n, uint64_t* sizes, byte_t** a)
+{
+  FILE* fp = fopen(sname, "wb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen(wb)\n");
+    exit(1);
+  }
+  for (uint64_t i = 0; i < n; ++i)
+  {
+    fwrite(&sizes[i], 1, sizeof(sizes[i]), fp);
+    fwrite(a[i], 1, sizes[i], fp);
+  }
+  fclose(fp);
+}
+
+void decompress(uint64_t n, uint64_t* sizes, byte_t** a)
+{
+  cbsl_ctx* ctx = cbsl_open(cbsl_load_mode, cname);
+  if (ctx == NULL)
+  {
+    fprintf(stderr, "error: cbsl_open(cbsl_load_mode)\n");
+    exit(1);
+  }
+  for (uint64_t i = 0; i < n; ++i)
+  {
+    CBSL_ERROR_CHECK(cbsl_read(ctx, &sizes[i], sizeof(sizes[i])));
+    CBSL_ERROR_CHECK(cbsl_read(ctx, a[i], sizes[i]));
+  }
+  CBSL_ERROR_CHECK(cbsl_close(ctx));
+}
+
+void raw_read(uint64_t n, uint64_t* sizes, byte_t** a)
+{
+  FILE* fp = fopen(sname, "rb");
+  if (fp == NULL)
+  {
+    fprintf(stderr, "error: fopen(rb)\n");
+    exit(1);
+  }
+  for (uint64_t i = 0; i < n; ++i)
+  {
+    fread(&sizes[i], 1, sizeof(sizes[i]), fp);
+    fread(a[i], 1, sizes[i], fp);
+  }
+  fclose(fp);
+}
+
+uint64_t rand_size()
+{
+  const uint64_t min_data_size = 1024;
+  const uint64_t max_data_size = 1048576; /* 1 MiB */
+  uint64_t size = rand() % max_data_size;
+  return (size < min_data_size) ? min_data_size : size;
+}
+
+void rand_byte_t(uint64_t data_size, byte_t* a)
+{
+  for(uint64_t i = 0; i < data_size; ++i)
+    a[i] = rand() % 255;
+}
--- a/cachelab/common.h
+++ b/cachelab/common.h
@@ -0,0 +1,22 @@
+///////////////////////////////////////////////////////////////////////
+////  Copyright 2022 by mars.                                        //
+///////////////////////////////////////////////////////////////////////
+
+#ifndef __TRACE_COMMON_H__
+#define __TRACE_COMMON_H__
+
+typedef unsigned char      UINT8;
+typedef unsigned short     UINT16;
+typedef unsigned int       UINT32;
+typedef int                INT32;
+typedef unsigned long long UINT64;
+
+void InitDataCache(void);
+UINT8 AccessDataCache(UINT64 Address, UINT8 Operation, UINT8 DataSize, UINT64 StoreValue, UINT64* LoadResult);
+
+void InitInstCache(void);
+UINT8 AccessInstCache(UINT64 Address, UINT8 Operation, UINT8 InstSize, UINT64* InstResult);
+
+UINT64 ReadMemory(UINT64 Address);
+void WriteMemory(UINT64 Address, UINT64 WriteData);
+#endif
--- a/cachelab/getopt.c
+++ b/cachelab/getopt.c
@@ -0,0 +1,250 @@
+/*****************************************************************************
+* getopt.c - competent and free getopt library.
+* $Header: /cvsroot/freegetopt/freegetopt/getopt.c,v 1.2 2003/10/26 03:10:20 vindaci Exp $
+*
+* Copyright (c)2002-2003 Mark K. Kim
+* All rights reserved.
+*
+* Redistribution and use in source and binary forms, with or without
+* modification, are permitted provided that the following conditions
+* are met:
+*
+*   * Redistributions of source code must retain the above copyright
+*     notice, this list of conditions and the following disclaimer.
+*
+*   * Redistributions in binary form must reproduce the above copyright
+*     notice, this list of conditions and the following disclaimer in
+*     the documentation and/or other materials provided with the
+*     distribution.
+*
+*   * Neither the original author of this software nor the names of its
+*     contributors may be used to endorse or promote products derived
+*     from this software without specific prior written permission.
+*
+* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
+* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
+* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
+* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
+* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
+* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
+* THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
+* DAMAGE.
+*/
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include "getopt.h"
+
+
+// static const char* ID = "$Id: getopt.c,v 1.2 2003/10/26 03:10:20 vindaci Exp $";
+
+
+char* optarg = NULL;
+int optind = 0;
+int opterr = 1;
+int optopt = '?';
+
+
+static char** prev_argv = NULL;        /* Keep a copy of argv and argc to */
+static int prev_argc = 0;              /*    tell if getopt params change */
+static int argv_index = 0;             /* Option we're checking */
+static int argv_index2 = 0;            /* Option argument we're checking */
+static int opt_offset = 0;             /* Index into compounded "-option" */
+static int dashdash = 0;               /* True if "--" option reached */
+static int nonopt = 0;                 /* How many nonopts we've found */
+
+static void increment_index()
+{
+	/* Move onto the next option */
+	if (argv_index < argv_index2)
+	{
+		while (prev_argv[++argv_index] && prev_argv[argv_index][0] != '-'
+			&& argv_index < argv_index2 + 1);
+	}
+	else argv_index++;
+	opt_offset = 1;
+}
+
+
+/*
+* Permutes argv[] so that the argument currently being processed is moved
+* to the end.
+*/
+static int permute_argv_once()
+{
+	/* Movability check */
+	if (argv_index + nonopt >= prev_argc) return 1;
+	/* Move the current option to the end, bring the others to front */
+	else
+	{
+		char* tmp = prev_argv[argv_index];
+
+		/* Move the data */
+		memmove(&prev_argv[argv_index], &prev_argv[argv_index + 1],
+			sizeof(char**) * (prev_argc - argv_index - 1));
+		prev_argv[prev_argc - 1] = tmp;
+
+		nonopt++;
+		return 0;
+	}
+}
+
+
+int getopt(int argc, char** argv, char* optstr)
+{
+	int c = 0;
+
+	/* If we have new argv, reinitialize */
+	if (prev_argv != argv || prev_argc != argc)
+	{
+		/* Initialize variables */
+		prev_argv = argv;
+		prev_argc = argc;
+		argv_index = 1;
+		argv_index2 = 1;
+		opt_offset = 1;
+		dashdash = 0;
+		nonopt = 0;
+	}
+
+	/* Jump point in case we want to ignore the current argv_index */
+getopt_top:
+
+	/* Misc. initializations */
+	optarg = NULL;
+
+	/* Dash-dash check */
+	if (argv[argv_index] && !strcmp(argv[argv_index], "--"))
+	{
+		dashdash = 1;
+		increment_index();
+	}
+
+	/* If we're at the end of argv, that's it. */
+	if (argv[argv_index] == NULL)
+	{
+		c = -1;
+	}
+	/* Are we looking at a string? Single dash is also a string */
+	else if (dashdash || argv[argv_index][0] != '-' || !strcmp(argv[argv_index], "-"))
+	{
+		/* If we want a string... */
+		if (optstr[0] == '-')
+		{
+			c = 1;
+			optarg = argv[argv_index];
+			increment_index();
+		}
+		/* If we really don't want it (we're in POSIX mode), we're done */
+		else if (optstr[0] == '+')// || getenv("POSIXLY_CORRECT"))
+		{
+			c = -1;
+
+			/* Everything else is a non-opt argument */
+			nonopt = argc - argv_index;
+		}
+		/* If we mildly don't want it, then move it back */
+		else
+		{
+			if (!permute_argv_once()) goto getopt_top;
+			else c = -1;
+		}
+	}
+	/* Otherwise we're looking at an option */
+	else
+	{
+		char* opt_ptr = NULL;
+
+		/* Grab the option */
+		c = argv[argv_index][opt_offset++];
+
+		/* Is the option in the optstr? */
+		if (optstr[0] == '-') opt_ptr = strchr(optstr + 1, c);
+		else opt_ptr = strchr(optstr, c);
+		/* Invalid argument */
+		if (!opt_ptr)
+		{
+			if (opterr)
+			{
+				fprintf(stderr, "%s: invalid option -- %c\n", argv[0], c);
+			}
+
+			optopt = c;
+			c = '?';
+
+			/* Move onto the next option */
+			increment_index();
+		}
+		/* Option takes argument */
+		else if (opt_ptr[1] == ':')
+		{
+			/* ie, -oARGUMENT, -xxxoARGUMENT, etc. */
+			if (argv[argv_index][opt_offset] != '\0')
+			{
+				optarg = &argv[argv_index][opt_offset];
+				increment_index();
+			}
+			/* ie, -o ARGUMENT (only if it's a required argument) */
+			else if (opt_ptr[2] != ':')
+			{
+				/* One of those "you're not expected to understand this" moment */
+				if (argv_index2 < argv_index) argv_index2 = argv_index;
+				while (argv[++argv_index2] && argv[argv_index2][0] == '-');
+				optarg = argv[argv_index2];
+
+				/* Don't cross into the non-option argument list */
+				if (argv_index2 + nonopt >= prev_argc) optarg = NULL;
+
+				/* Move onto the next option */
+				increment_index();
+			}
+			else
+			{
+				/* Move onto the next option */
+				increment_index();
+			}
+
+			/* In case we got no argument for an option with required argument */
+			if (optarg == NULL && opt_ptr[2] != ':')
+			{
+				optopt = c;
+				c = '?';
+
+				if (opterr)
+				{
+					fprintf(stderr, "%s: option requires an argument -- %c\n",
+						argv[0], optopt);
+				}
+			}
+		}
+		/* Option does not take argument */
+		else
+		{
+			/* Next argv_index */
+			if (argv[argv_index][opt_offset] == '\0')
+			{
+				increment_index();
+			}
+		}
+	}
+
+	/* Calculate optind */
+	if (c == -1)
+	{
+		optind = argc - nonopt;
+	}
+	else
+	{
+		optind = argv_index;
+	}
+
+	return c;
+}
+
+
+/* vim:ts=3
+*/
--- a/cachelab/getopt.h
+++ b/cachelab/getopt.h
@@ -0,0 +1,63 @@
+/*****************************************************************************
+* getopt.h - competent and free getopt library.
+* $Header: /cvsroot/freegetopt/freegetopt/getopt.h,v 1.2 2003/10/26 03:10:20 vindaci Exp $
+*
+* Copyright (c)2002-2003 Mark K. Kim
+* All rights reserved.
+*
+* Redistribution and use in source and binary forms, with or without
+* modification, are permitted provided that the following conditions
+* are met:
+*
+*   * Redistributions of source code must retain the above copyright
+*     notice, this list of conditions and the following disclaimer.
+*
+*   * Redistributions in binary form must reproduce the above copyright
+*     notice, this list of conditions and the following disclaimer in
+*     the documentation and/or other materials provided with the
+*     distribution.
+*
+*   * Neither the original author of this software nor the names of its
+*     contributors may be used to endorse or promote products derived
+*     from this software without specific prior written permission.
+*
+* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
+* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
+* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
+* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
+* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
+* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
+* THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
+* DAMAGE.
+*/
+#ifndef GETOPT_H_
+#define GETOPT_H_
+
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+
+	extern char* optarg;
+	extern int optind;
+	extern int opterr;
+	extern int optopt;
+
+	int getopt(int argc, char** argv, char* optstr);
+
+
+#ifdef __cplusplus
+}
+#endif
+
+
+#endif /* GETOPT_H_ */
+
+
+/* vim:ts=3
+*/
--- a/cachelab/traces/dave.trace.zst
+++ b/cachelab/traces/dave.trace.zst
--- a/cachelab/traces/gedit.trace.zst
+++ b/cachelab/traces/gedit.trace.zst
--- a/cachelab/traces/long.trace.zst
+++ b/cachelab/traces/long.trace.zst
--- a/cachelab/traces/trans.trace.zst
+++ b/cachelab/traces/trans.trace.zst
--- a/cachelab/traces/yi.trace.zst
+++ b/cachelab/traces/yi.trace.zst
--- a/cachelab/traces/yi2.trace.zst
+++ b/cachelab/traces/yi2.trace.zst
--- a/cachelab/uthash.h
+++ b/cachelab/uthash.h
--- a/cachelab/zstd/libzstd_static-win32.lib
+++ b/cachelab/zstd/libzstd_static-win32.lib
--- a/cachelab/zstd/libzstd_static-win64.lib
+++ b/cachelab/zstd/libzstd_static-win64.lib
--- a/cachelab/zstd/zdict.h
+++ b/cachelab/zstd/zdict.h
@@ -0,0 +1,452 @@
+/*
+ * Copyright (c) Yann Collet, Facebook, Inc.
+ * All rights reserved.
+ *
+ * This source code is licensed under both the BSD-style license (found in the
+ * LICENSE file in the root directory of this source tree) and the GPLv2 (found
+ * in the COPYING file in the root directory of this source tree).
+ * You may select, at your option, one of the above-listed licenses.
+ */
+
+#ifndef DICTBUILDER_H_001
+#define DICTBUILDER_H_001
+
+#if defined (__cplusplus)
+extern "C" {
+#endif
+
+
+/*======  Dependencies  ======*/
+#include <stddef.h>  /* size_t */
+
+
+/* =====   ZDICTLIB_API : control library symbols visibility   ===== */
+#ifndef ZDICTLIB_VISIBILITY
+#  if defined(__GNUC__) && (__GNUC__ >= 4)
+#    define ZDICTLIB_VISIBILITY __attribute__ ((visibility ("default")))
+#  else
+#    define ZDICTLIB_VISIBILITY
+#  endif
+#endif
+#if defined(ZSTD_DLL_EXPORT) && (ZSTD_DLL_EXPORT==1)
+#  define ZDICTLIB_API __declspec(dllexport) ZDICTLIB_VISIBILITY
+#elif defined(ZSTD_DLL_IMPORT) && (ZSTD_DLL_IMPORT==1)
+#  define ZDICTLIB_API __declspec(dllimport) ZDICTLIB_VISIBILITY /* It isn't required but allows to generate better code, saving a function pointer load from the IAT and an indirect jump.*/
+#else
+#  define ZDICTLIB_API ZDICTLIB_VISIBILITY
+#endif
+
+/*******************************************************************************
+ * Zstd dictionary builder
+ *
+ * FAQ
+ * ===
+ * Why should I use a dictionary?
+ * ------------------------------
+ *
+ * Zstd can use dictionaries to improve compression ratio of small data.
+ * Traditionally small files don't compress well because there is very little
+ * repetition in a single sample, since it is small. But, if you are compressing
+ * many similar files, like a bunch of JSON records that share the same
+ * structure, you can train a dictionary on ahead of time on some samples of
+ * these files. Then, zstd can use the dictionary to find repetitions that are
+ * present across samples. This can vastly improve compression ratio.
+ *
+ * When is a dictionary useful?
+ * ----------------------------
+ *
+ * Dictionaries are useful when compressing many small files that are similar.
+ * The larger a file is, the less benefit a dictionary will have. Generally,
+ * we don't expect dictionary compression to be effective past 100KB. And the
+ * smaller a file is, the more we would expect the dictionary to help.
+ *
+ * How do I use a dictionary?
+ * --------------------------
+ *
+ * Simply pass the dictionary to the zstd compressor with
+ * `ZSTD_CCtx_loadDictionary()`. The same dictionary must then be passed to
+ * the decompressor, using `ZSTD_DCtx_loadDictionary()`. There are other
+ * more advanced functions that allow selecting some options, see zstd.h for
+ * complete documentation.
+ *
+ * What is a zstd dictionary?
+ * --------------------------
+ *
+ * A zstd dictionary has two pieces: Its header, and its content. The header
+ * contains a magic number, the dictionary ID, and entropy tables. These
+ * entropy tables allow zstd to save on header costs in the compressed file,
+ * which really matters for small data. The content is just bytes, which are
+ * repeated content that is common across many samples.
+ *
+ * What is a raw content dictionary?
+ * ---------------------------------
+ *
+ * A raw content dictionary is just bytes. It doesn't have a zstd dictionary
+ * header, a dictionary ID, or entropy tables. Any buffer is a valid raw
+ * content dictionary.
+ *
+ * How do I train a dictionary?
+ * ----------------------------
+ *
+ * Gather samples from your use case. These samples should be similar to each
+ * other. If you have several use cases, you could try to train one dictionary
+ * per use case.
+ *
+ * Pass those samples to `ZDICT_trainFromBuffer()` and that will train your
+ * dictionary. There are a few advanced versions of this function, but this
+ * is a great starting point. If you want to further tune your dictionary
+ * you could try `ZDICT_optimizeTrainFromBuffer_cover()`. If that is too slow
+ * you can try `ZDICT_optimizeTrainFromBuffer_fastCover()`.
+ *
+ * If the dictionary training function fails, that is likely because you
+ * either passed too few samples, or a dictionary would not be effective
+ * for your data. Look at the messages that the dictionary trainer printed,
+ * if it doesn't say too few samples, then a dictionary would not be effective.
+ *
+ * How large should my dictionary be?
+ * ----------------------------------
+ *
+ * A reasonable dictionary size, the `dictBufferCapacity`, is about 100KB.
+ * The zstd CLI defaults to a 110KB dictionary. You likely don't need a
+ * dictionary larger than that. But, most use cases can get away with a
+ * smaller dictionary. The advanced dictionary builders can automatically
+ * shrink the dictionary for you, and select the smallest size that doesn't
+ * hurt compression ratio too much. See the `shrinkDict` parameter.
+ * A smaller dictionary can save memory, and potentially speed up
+ * compression.
+ *
+ * How many samples should I provide to the dictionary builder?
+ * ------------------------------------------------------------
+ *
+ * We generally recommend passing ~100x the size of the dictionary
+ * in samples. A few thousand should suffice. Having too few samples
+ * can hurt the dictionaries effectiveness. Having more samples will
+ * only improve the dictionaries effectiveness. But having too many
+ * samples can slow down the dictionary builder.
+ *
+ * How do I determine if a dictionary will be effective?
+ * -----------------------------------------------------
+ *
+ * Simply train a dictionary and try it out. You can use zstd's built in
+ * benchmarking tool to test the dictionary effectiveness.
+ *
+ *   # Benchmark levels 1-3 without a dictionary
+ *   zstd -b1e3 -r /path/to/my/files
+ *   # Benchmark levels 1-3 with a dictionary
+ *   zstd -b1e3 -r /path/to/my/files -D /path/to/my/dictionary
+ *
+ * When should I retrain a dictionary?
+ * -----------------------------------
+ *
+ * You should retrain a dictionary when its effectiveness drops. Dictionary
+ * effectiveness drops as the data you are compressing changes. Generally, we do
+ * expect dictionaries to "decay" over time, as your data changes, but the rate
+ * at which they decay depends on your use case. Internally, we regularly
+ * retrain dictionaries, and if the new dictionary performs significantly
+ * better than the old dictionary, we will ship the new dictionary.
+ *
+ * I have a raw content dictionary, how do I turn it into a zstd dictionary?
+ * -------------------------------------------------------------------------
+ *
+ * If you have a raw content dictionary, e.g. by manually constructing it, or
+ * using a third-party dictionary builder, you can turn it into a zstd
+ * dictionary by using `ZDICT_finalizeDictionary()`. You'll also have to
+ * provide some samples of the data. It will add the zstd header to the
+ * raw content, which contains a dictionary ID and entropy tables, which
+ * will improve compression ratio, and allow zstd to write the dictionary ID
+ * into the frame, if you so choose.
+ *
+ * Do I have to use zstd's dictionary builder?
+ * -------------------------------------------
+ *
+ * No! You can construct dictionary content however you please, it is just
+ * bytes. It will always be valid as a raw content dictionary. If you want
+ * a zstd dictionary, which can improve compression ratio, use
+ * `ZDICT_finalizeDictionary()`.
+ *
+ * What is the attack surface of a zstd dictionary?
+ * ------------------------------------------------
+ *
+ * Zstd is heavily fuzz tested, including loading fuzzed dictionaries, so
+ * zstd should never crash, or access out-of-bounds memory no matter what
+ * the dictionary is. However, if an attacker can control the dictionary
+ * during decompression, they can cause zstd to generate arbitrary bytes,
+ * just like if they controlled the compressed data.
+ *
+ ******************************************************************************/
+
+
+/*! ZDICT_trainFromBuffer():
+ *  Train a dictionary from an array of samples.
+ *  Redirect towards ZDICT_optimizeTrainFromBuffer_fastCover() single-threaded, with d=8, steps=4,
+ *  f=20, and accel=1.
+ *  Samples must be stored concatenated in a single flat buffer `samplesBuffer`,
+ *  supplied with an array of sizes `samplesSizes`, providing the size of each sample, in order.
+ *  The resulting dictionary will be saved into `dictBuffer`.
+ * @return: size of dictionary stored into `dictBuffer` (<= `dictBufferCapacity`)
+ *          or an error code, which can be tested with ZDICT_isError().
+ *  Note:  Dictionary training will fail if there are not enough samples to construct a
+ *         dictionary, or if most of the samples are too small (< 8 bytes being the lower limit).
+ *         If dictionary training fails, you should use zstd without a dictionary, as the dictionary
+ *         would've been ineffective anyways. If you believe your samples would benefit from a dictionary
+ *         please open an issue with details, and we can look into it.
+ *  Note: ZDICT_trainFromBuffer()'s memory usage is about 6 MB.
+ *  Tips: In general, a reasonable dictionary has a size of ~ 100 KB.
+ *        It's possible to select smaller or larger size, just by specifying `dictBufferCapacity`.
+ *        In general, it's recommended to provide a few thousands samples, though this can vary a lot.
+ *        It's recommended that total size of all samples be about ~x100 times the target size of dictionary.
+ */
+ZDICTLIB_API size_t ZDICT_trainFromBuffer(void* dictBuffer, size_t dictBufferCapacity,
+                                    const void* samplesBuffer,
+                                    const size_t* samplesSizes, unsigned nbSamples);
+
+typedef struct {
+    int      compressionLevel;   /*< optimize for a specific zstd compression level; 0 means default */
+    unsigned notificationLevel;  /*< Write log to stderr; 0 = none (default); 1 = errors; 2 = progression; 3 = details; 4 = debug; */
+    unsigned dictID;             /*< force dictID value; 0 means auto mode (32-bits random value)
+                                  *   NOTE: The zstd format reserves some dictionary IDs for future use.
+                                  *         You may use them in private settings, but be warned that they
+                                  *         may be used by zstd in a public dictionary registry in the future.
+                                  *         These dictionary IDs are:
+                                  *           - low range  : <= 32767
+                                  *           - high range : >= (2^31)
+                                  */
+} ZDICT_params_t;
+
+/*! ZDICT_finalizeDictionary():
+ * Given a custom content as a basis for dictionary, and a set of samples,
+ * finalize dictionary by adding headers and statistics according to the zstd
+ * dictionary format.
+ *
+ * Samples must be stored concatenated in a flat buffer `samplesBuffer`,
+ * supplied with an array of sizes `samplesSizes`, providing the size of each
+ * sample in order. The samples are used to construct the statistics, so they
+ * should be representative of what you will compress with this dictionary.
+ *
+ * The compression level can be set in `parameters`. You should pass the
+ * compression level you expect to use in production. The statistics for each
+ * compression level differ, so tuning the dictionary for the compression level
+ * can help quite a bit.
+ *
+ * You can set an explicit dictionary ID in `parameters`, or allow us to pick
+ * a random dictionary ID for you, but we can't guarantee no collisions.
+ *
+ * The dstDictBuffer and the dictContent may overlap, and the content will be
+ * appended to the end of the header. If the header + the content doesn't fit in
+ * maxDictSize the beginning of the content is truncated to make room, since it
+ * is presumed that the most profitable content is at the end of the dictionary,
+ * since that is the cheapest to reference.
+ *
+ * `maxDictSize` must be >= max(dictContentSize, ZSTD_DICTSIZE_MIN).
+ *
+ * @return: size of dictionary stored into `dstDictBuffer` (<= `maxDictSize`),
+ *          or an error code, which can be tested by ZDICT_isError().
+ * Note: ZDICT_finalizeDictionary() will push notifications into stderr if
+ *       instructed to, using notificationLevel>0.
+ * NOTE: This function currently may fail in several edge cases including:
+ *         * Not enough samples
+ *         * Samples are uncompressible
+ *         * Samples are all exactly the same
+ */
+ZDICTLIB_API size_t ZDICT_finalizeDictionary(void* dstDictBuffer, size_t maxDictSize,
+                                const void* dictContent, size_t dictContentSize,
+                                const void* samplesBuffer, const size_t* samplesSizes, unsigned nbSamples,
+                                ZDICT_params_t parameters);
+
+
+/*======   Helper functions   ======*/
+ZDICTLIB_API unsigned ZDICT_getDictID(const void* dictBuffer, size_t dictSize);  /**< extracts dictID; @return zero if error (not a valid dictionary) */
+ZDICTLIB_API size_t ZDICT_getDictHeaderSize(const void* dictBuffer, size_t dictSize);  /* returns dict header size; returns a ZSTD error code on failure */
+ZDICTLIB_API unsigned ZDICT_isError(size_t errorCode);
+ZDICTLIB_API const char* ZDICT_getErrorName(size_t errorCode);
+
+
+
+#ifdef ZDICT_STATIC_LINKING_ONLY
+
+/* ====================================================================================
+ * The definitions in this section are considered experimental.
+ * They should never be used with a dynamic library, as they may change in the future.
+ * They are provided for advanced usages.
+ * Use them only in association with static linking.
+ * ==================================================================================== */
+
+#define ZDICT_DICTSIZE_MIN    256
+/* Deprecated: Remove in v1.6.0 */
+#define ZDICT_CONTENTSIZE_MIN 128
+
+/*! ZDICT_cover_params_t:
+ *  k and d are the only required parameters.
+ *  For others, value 0 means default.
+ */
+typedef struct {
+    unsigned k;                  /* Segment size : constraint: 0 < k : Reasonable range [16, 2048+] */
+    unsigned d;                  /* dmer size : constraint: 0 < d <= k : Reasonable range [6, 16] */
+    unsigned steps;              /* Number of steps : Only used for optimization : 0 means default (40) : Higher means more parameters checked */
+    unsigned nbThreads;          /* Number of threads : constraint: 0 < nbThreads : 1 means single-threaded : Only used for optimization : Ignored if ZSTD_MULTITHREAD is not defined */
+    double splitPoint;           /* Percentage of samples used for training: Only used for optimization : the first nbSamples * splitPoint samples will be used to training, the last nbSamples * (1 - splitPoint) samples will be used for testing, 0 means default (1.0), 1.0 when all samples are used for both training and testing */
+    unsigned shrinkDict;         /* Train dictionaries to shrink in size starting from the minimum size and selects the smallest dictionary that is shrinkDictMaxRegression% worse than the largest dictionary. 0 means no shrinking and 1 means shrinking  */
+    unsigned shrinkDictMaxRegression; /* Sets shrinkDictMaxRegression so that a smaller dictionary can be at worse shrinkDictMaxRegression% worse than the max dict size dictionary. */
+    ZDICT_params_t zParams;
+} ZDICT_cover_params_t;
+
+typedef struct {
+    unsigned k;                  /* Segment size : constraint: 0 < k : Reasonable range [16, 2048+] */
+    unsigned d;                  /* dmer size : constraint: 0 < d <= k : Reasonable range [6, 16] */
+    unsigned f;                  /* log of size of frequency array : constraint: 0 < f <= 31 : 1 means default(20)*/
+    unsigned steps;              /* Number of steps : Only used for optimization : 0 means default (40) : Higher means more parameters checked */
+    unsigned nbThreads;          /* Number of threads : constraint: 0 < nbThreads : 1 means single-threaded : Only used for optimization : Ignored if ZSTD_MULTITHREAD is not defined */
+    double splitPoint;           /* Percentage of samples used for training: Only used for optimization : the first nbSamples * splitPoint samples will be used to training, the last nbSamples * (1 - splitPoint) samples will be used for testing, 0 means default (0.75), 1.0 when all samples are used for both training and testing */
+    unsigned accel;              /* Acceleration level: constraint: 0 < accel <= 10, higher means faster and less accurate, 0 means default(1) */
+    unsigned shrinkDict;         /* Train dictionaries to shrink in size starting from the minimum size and selects the smallest dictionary that is shrinkDictMaxRegression% worse than the largest dictionary. 0 means no shrinking and 1 means shrinking  */
+    unsigned shrinkDictMaxRegression; /* Sets shrinkDictMaxRegression so that a smaller dictionary can be at worse shrinkDictMaxRegression% worse than the max dict size dictionary. */
+
+    ZDICT_params_t zParams;
+} ZDICT_fastCover_params_t;
+
+/*! ZDICT_trainFromBuffer_cover():
+ *  Train a dictionary from an array of samples using the COVER algorithm.
+ *  Samples must be stored concatenated in a single flat buffer `samplesBuffer`,
+ *  supplied with an array of sizes `samplesSizes`, providing the size of each sample, in order.
+ *  The resulting dictionary will be saved into `dictBuffer`.
+ * @return: size of dictionary stored into `dictBuffer` (<= `dictBufferCapacity`)
+ *          or an error code, which can be tested with ZDICT_isError().
+ *          See ZDICT_trainFromBuffer() for details on failure modes.
+ *  Note: ZDICT_trainFromBuffer_cover() requires about 9 bytes of memory for each input byte.
+ *  Tips: In general, a reasonable dictionary has a size of ~ 100 KB.
+ *        It's possible to select smaller or larger size, just by specifying `dictBufferCapacity`.
+ *        In general, it's recommended to provide a few thousands samples, though this can vary a lot.
+ *        It's recommended that total size of all samples be about ~x100 times the target size of dictionary.
+ */
+ZDICTLIB_API size_t ZDICT_trainFromBuffer_cover(
+          void *dictBuffer, size_t dictBufferCapacity,
+    const void *samplesBuffer, const size_t *samplesSizes, unsigned nbSamples,
+          ZDICT_cover_params_t parameters);
+
+/*! ZDICT_optimizeTrainFromBuffer_cover():
+ * The same requirements as above hold for all the parameters except `parameters`.
+ * This function tries many parameter combinations and picks the best parameters.
+ * `*parameters` is filled with the best parameters found,
+ * dictionary constructed with those parameters is stored in `dictBuffer`.
+ *
+ * All of the parameters d, k, steps are optional.
+ * If d is non-zero then we don't check multiple values of d, otherwise we check d = {6, 8}.
+ * if steps is zero it defaults to its default value.
+ * If k is non-zero then we don't check multiple values of k, otherwise we check steps values in [50, 2000].
+ *
+ * @return: size of dictionary stored into `dictBuffer` (<= `dictBufferCapacity`)
+ *          or an error code, which can be tested with ZDICT_isError().
+ *          On success `*parameters` contains the parameters selected.
+ *          See ZDICT_trainFromBuffer() for details on failure modes.
+ * Note: ZDICT_optimizeTrainFromBuffer_cover() requires about 8 bytes of memory for each input byte and additionally another 5 bytes of memory for each byte of memory for each thread.
+ */
+ZDICTLIB_API size_t ZDICT_optimizeTrainFromBuffer_cover(
+          void* dictBuffer, size_t dictBufferCapacity,
+    const void* samplesBuffer, const size_t* samplesSizes, unsigned nbSamples,
+          ZDICT_cover_params_t* parameters);
+
+/*! ZDICT_trainFromBuffer_fastCover():
+ *  Train a dictionary from an array of samples using a modified version of COVER algorithm.
+ *  Samples must be stored concatenated in a single flat buffer `samplesBuffer`,
+ *  supplied with an array of sizes `samplesSizes`, providing the size of each sample, in order.
+ *  d and k are required.
+ *  All other parameters are optional, will use default values if not provided
+ *  The resulting dictionary will be saved into `dictBuffer`.
+ * @return: size of dictionary stored into `dictBuffer` (<= `dictBufferCapacity`)
+ *          or an error code, which can be tested with ZDICT_isError().
+ *          See ZDICT_trainFromBuffer() for details on failure modes.
+ *  Note: ZDICT_trainFromBuffer_fastCover() requires 6 * 2^f bytes of memory.
+ *  Tips: In general, a reasonable dictionary has a size of ~ 100 KB.
+ *        It's possible to select smaller or larger size, just by specifying `dictBufferCapacity`.
+ *        In general, it's recommended to provide a few thousands samples, though this can vary a lot.
+ *        It's recommended that total size of all samples be about ~x100 times the target size of dictionary.
+ */
+ZDICTLIB_API size_t ZDICT_trainFromBuffer_fastCover(void *dictBuffer,
+                    size_t dictBufferCapacity, const void *samplesBuffer,
+                    const size_t *samplesSizes, unsigned nbSamples,
+                    ZDICT_fastCover_params_t parameters);
+
+/*! ZDICT_optimizeTrainFromBuffer_fastCover():
+ * The same requirements as above hold for all the parameters except `parameters`.
+ * This function tries many parameter combinations (specifically, k and d combinations)
+ * and picks the best parameters. `*parameters` is filled with the best parameters found,
+ * dictionary constructed with those parameters is stored in `dictBuffer`.
+ * All of the parameters d, k, steps, f, and accel are optional.
+ * If d is non-zero then we don't check multiple values of d, otherwise we check d = {6, 8}.
+ * if steps is zero it defaults to its default value.
+ * If k is non-zero then we don't check multiple values of k, otherwise we check steps values in [50, 2000].
+ * If f is zero, default value of 20 is used.
+ * If accel is zero, default value of 1 is used.
+ *
+ * @return: size of dictionary stored into `dictBuffer` (<= `dictBufferCapacity`)
+ *          or an error code, which can be tested with ZDICT_isError().
+ *          On success `*parameters` contains the parameters selected.
+ *          See ZDICT_trainFromBuffer() for details on failure modes.
+ * Note: ZDICT_optimizeTrainFromBuffer_fastCover() requires about 6 * 2^f bytes of memory for each thread.
+ */
+ZDICTLIB_API size_t ZDICT_optimizeTrainFromBuffer_fastCover(void* dictBuffer,
+                    size_t dictBufferCapacity, const void* samplesBuffer,
+                    const size_t* samplesSizes, unsigned nbSamples,
+                    ZDICT_fastCover_params_t* parameters);
+
+typedef struct {
+    unsigned selectivityLevel;   /* 0 means default; larger => select more => larger dictionary */
+    ZDICT_params_t zParams;
+} ZDICT_legacy_params_t;
+
+/*! ZDICT_trainFromBuffer_legacy():
+ *  Train a dictionary from an array of samples.
+ *  Samples must be stored concatenated in a single flat buffer `samplesBuffer`,
+ *  supplied with an array of sizes `samplesSizes`, providing the size of each sample, in order.
+ *  The resulting dictionary will be saved into `dictBuffer`.
+ * `parameters` is optional and can be provided with values set to 0 to mean "default".
+ * @return: size of dictionary stored into `dictBuffer` (<= `dictBufferCapacity`)
+ *          or an error code, which can be tested with ZDICT_isError().
+ *          See ZDICT_trainFromBuffer() for details on failure modes.
+ *  Tips: In general, a reasonable dictionary has a size of ~ 100 KB.
+ *        It's possible to select smaller or larger size, just by specifying `dictBufferCapacity`.
+ *        In general, it's recommended to provide a few thousands samples, though this can vary a lot.
+ *        It's recommended that total size of all samples be about ~x100 times the target size of dictionary.
+ *  Note: ZDICT_trainFromBuffer_legacy() will send notifications into stderr if instructed to, using notificationLevel>0.
+ */
+ZDICTLIB_API size_t ZDICT_trainFromBuffer_legacy(
+    void* dictBuffer, size_t dictBufferCapacity,
+    const void* samplesBuffer, const size_t* samplesSizes, unsigned nbSamples,
+    ZDICT_legacy_params_t parameters);
+
+
+/* Deprecation warnings */
+/* It is generally possible to disable deprecation warnings from compiler,
+   for example with -Wno-deprecated-declarations for gcc
+   or _CRT_SECURE_NO_WARNINGS in Visual.
+   Otherwise, it's also possible to manually define ZDICT_DISABLE_DEPRECATE_WARNINGS */
+#ifdef ZDICT_DISABLE_DEPRECATE_WARNINGS
+#  define ZDICT_DEPRECATED(message) ZDICTLIB_API   /* disable deprecation warnings */
+#else
+#  define ZDICT_GCC_VERSION (__GNUC__ * 100 + __GNUC_MINOR__)
+#  if defined (__cplusplus) && (__cplusplus >= 201402) /* C++14 or greater */
+#    define ZDICT_DEPRECATED(message) [[deprecated(message)]] ZDICTLIB_API
+#  elif defined(__clang__) || (ZDICT_GCC_VERSION >= 405)
+#    define ZDICT_DEPRECATED(message) ZDICTLIB_API __attribute__((deprecated(message)))
+#  elif (ZDICT_GCC_VERSION >= 301)
+#    define ZDICT_DEPRECATED(message) ZDICTLIB_API __attribute__((deprecated))
+#  elif defined(_MSC_VER)
+#    define ZDICT_DEPRECATED(message) ZDICTLIB_API __declspec(deprecated(message))
+#  else
+#    pragma message("WARNING: You need to implement ZDICT_DEPRECATED for this compiler")
+#    define ZDICT_DEPRECATED(message) ZDICTLIB_API
+#  endif
+#endif /* ZDICT_DISABLE_DEPRECATE_WARNINGS */
+
+ZDICT_DEPRECATED("use ZDICT_finalizeDictionary() instead")
+size_t ZDICT_addEntropyTablesFromBuffer(void* dictBuffer, size_t dictContentSize, size_t dictBufferCapacity,
+                                  const void* samplesBuffer, const size_t* samplesSizes, unsigned nbSamples);
+
+
+#endif   /* ZDICT_STATIC_LINKING_ONLY */
+
+#if defined (__cplusplus)
+}
+#endif
+
+#endif   /* DICTBUILDER_H_001 */
--- a/cachelab/zstd/zstd.h
+++ b/cachelab/zstd/zstd.h
--- a/cachelab/zstd/zstd_errors.h
+++ b/cachelab/zstd/zstd_errors.h
@@ -0,0 +1,96 @@
+/*
+ * Copyright (c) Yann Collet, Facebook, Inc.
+ * All rights reserved.
+ *
+ * This source code is licensed under both the BSD-style license (found in the
+ * LICENSE file in the root directory of this source tree) and the GPLv2 (found
+ * in the COPYING file in the root directory of this source tree).
+ * You may select, at your option, one of the above-listed licenses.
+ */
+
+#ifndef ZSTD_ERRORS_H_398273423
+#define ZSTD_ERRORS_H_398273423
+
+#if defined (__cplusplus)
+extern "C" {
+#endif
+
+/*===== dependency =====*/
+#include <stddef.h>   /* size_t */
+
+
+/* =====   ZSTDERRORLIB_API : control library symbols visibility   ===== */
+#ifndef ZSTDERRORLIB_VISIBILITY
+#  if defined(__GNUC__) && (__GNUC__ >= 4)
+#    define ZSTDERRORLIB_VISIBILITY __attribute__ ((visibility ("default")))
+#  else
+#    define ZSTDERRORLIB_VISIBILITY
+#  endif
+#endif
+#if defined(ZSTD_DLL_EXPORT) && (ZSTD_DLL_EXPORT==1)
+#  define ZSTDERRORLIB_API __declspec(dllexport) ZSTDERRORLIB_VISIBILITY
+#elif defined(ZSTD_DLL_IMPORT) && (ZSTD_DLL_IMPORT==1)
+#  define ZSTDERRORLIB_API __declspec(dllimport) ZSTDERRORLIB_VISIBILITY /* It isn't required but allows to generate better code, saving a function pointer load from the IAT and an indirect jump.*/
+#else
+#  define ZSTDERRORLIB_API ZSTDERRORLIB_VISIBILITY
+#endif
+
+/*-*********************************************
+ *  Error codes list
+ *-*********************************************
+ *  Error codes _values_ are pinned down since v1.3.1 only.
+ *  Therefore, don't rely on values if you may link to any version < v1.3.1.
+ *
+ *  Only values < 100 are considered stable.
+ *
+ *  note 1 : this API shall be used with static linking only.
+ *           dynamic linking is not yet officially supported.
+ *  note 2 : Prefer relying on the enum than on its value whenever possible
+ *           This is the only supported way to use the error list < v1.3.1
+ *  note 3 : ZSTD_isError() is always correct, whatever the library version.
+ **********************************************/
+typedef enum {
+  ZSTD_error_no_error = 0,
+  ZSTD_error_GENERIC  = 1,
+  ZSTD_error_prefix_unknown                = 10,
+  ZSTD_error_version_unsupported           = 12,
+  ZSTD_error_frameParameter_unsupported    = 14,
+  ZSTD_error_frameParameter_windowTooLarge = 16,
+  ZSTD_error_corruption_detected = 20,
+  ZSTD_error_checksum_wrong      = 22,
+  ZSTD_error_dictionary_corrupted      = 30,
+  ZSTD_error_dictionary_wrong          = 32,
+  ZSTD_error_dictionaryCreation_failed = 34,
+  ZSTD_error_parameter_unsupported   = 40,
+  ZSTD_error_parameter_outOfBound    = 42,
+  ZSTD_error_tableLog_tooLarge       = 44,
+  ZSTD_error_maxSymbolValue_tooLarge = 46,
+  ZSTD_error_maxSymbolValue_tooSmall = 48,
+  ZSTD_error_stabilityCondition_notRespected = 50,
+  ZSTD_error_stage_wrong       = 60,
+  ZSTD_error_init_missing      = 62,
+  ZSTD_error_memory_allocation = 64,
+  ZSTD_error_workSpace_tooSmall= 66,
+  ZSTD_error_dstSize_tooSmall = 70,
+  ZSTD_error_srcSize_wrong    = 72,
+  ZSTD_error_dstBuffer_null   = 74,
+  /* following error codes are __NOT STABLE__, they can be removed or changed in future versions */
+  ZSTD_error_frameIndex_tooLarge = 100,
+  ZSTD_error_seekableIO          = 102,
+  ZSTD_error_dstBuffer_wrong     = 104,
+  ZSTD_error_srcBuffer_wrong     = 105,
+  ZSTD_error_maxCode = 120  /* never EVER use this value directly, it can change in future versions! Use ZSTD_isError() instead */
+} ZSTD_ErrorCode;
+
+/*! ZSTD_getErrorCode() :
+    convert a `size_t` function result into a `ZSTD_ErrorCode` enum type,
+    which can be used to compare with enum list published above */
+ZSTDERRORLIB_API ZSTD_ErrorCode ZSTD_getErrorCode(size_t functionResult);
+ZSTDERRORLIB_API const char* ZSTD_getErrorString(ZSTD_ErrorCode code);   /**< Same as ZSTD_getErrorName, but using a `ZSTD_ErrorCode` enum argument */
+
+
+#if defined (__cplusplus)
+}
+#endif
+
+#endif /* ZSTD_ERRORS_H_398273423 */
--- a/malloclab/Makefile
+++ b/malloclab/Makefile
@@ -0,0 +1,26 @@
+# Copyright 2022 by mars
+
+# Description: Makefile for building a malloc/free Simulator.
+#
+
+
+LDFLAGS += 
+
+LDLIBS   += 
+
+CPPFLAGS := -O3 -Wall -Wextra -Winline -Winit-self -Wno-sequence-point\
+           -Wno-unused-function -Wno-inline -fPIC -W -Wcast-qual -Wpointer-arith -Wno-unused-parameter
+
+#CPPFLAGS := -g
+PROGRAMS := malloc
+
+objects = clock.o fcyc.o fsecs.o mdriver.o memlib.o mm.o
+
+all: $(PROGRAMS)
+
+malloc : $(objects)
+	clang $(CPPFLAGS) $(LDFLAGS) -o $@ $^ $(LDLIBS)
+	rm -f $(objects)
+
+clean:
+	rm -f $(PROGRAMS) $(objects)
--- a/malloclab/Readme.txt
+++ b/malloclab/Readme.txt
@@ -0,0 +1,20 @@
+动态内存分配器实验
+
+你需要修改mm.c（你只能修改此文件，其他文件不能修改），使之能够处理内存分配（mm_malloc）、内存释放（mm_free）、内存扩张（mm_realloc）等功能。
+你可以修改traces目录下的TRACE_LIST.txt，以运行不同的trace。
+你需要跑尽可能多的trace，并在评分中拿到尽可能的高分。
+
+【注意】并不是所有trace都可以跑的。有些trace内部包含了错误的操作，是跑不通的。比如：
+1、试图realloc一个不存在的指针
+2、试图free一个不存在的指针
+
+Linux：
+1、make
+2、./malloc -t traces
+
+Windows:
+1、用VS2019打开工程myMalloc/myMalloc.sln，编译
+2、生成可执行代码，myMalloc -t traces
+
+
+【提交】你需要将mm.c修改为mm_201900221122.c，其中后面是你的学号。提交到educoder上。你只需要提交mm.c文件。
--- a/malloclab/clock.c
+++ b/malloclab/clock.c
@@ -0,0 +1,107 @@
+#include <stdio.h>
+#include <stdlib.h>
+#include <time.h>
+#ifdef _WIN32
+#include <windows.h>
+#include <intrin.h>
+#else
+#include <unistd.h>
+#endif
+#include "clock.h"
+
+void start_counter(void);
+double get_counter(void);
+
+/*
+ * Routines for using the cycle counter
+ */
+
+ /* $begin x86cyclecounter */
+ /* Initialize the cycle counter */
+static unsigned cyc_hi = 0;
+static unsigned cyc_lo = 0;
+
+
+/* Set *hi and *lo to the high and low order bits  of the cycle counter.
+   Implementation requires assembly code to use the rdtsc instruction. */
+void access_counter(unsigned* hi, unsigned* lo)
+{
+#ifdef _WIN32
+	long long counter;
+	counter = __rdtsc();
+	(*hi) = (unsigned int)(counter >> 32);
+	(*lo) = (unsigned int)counter;
+#else
+	asm("rdtsc; movl %%edx,%0; movl %%eax,%1"   /* Read cycle counter */
+		: "=r" (*hi), "=r" (*lo)                /* and move results to */
+		: /* No input */                        /* the two outputs */
+		: "%edx", "%eax");
+#endif
+}
+
+/* Record the current value of the cycle counter. */
+void start_counter(void)
+{
+	access_counter(&cyc_hi, &cyc_lo);
+}
+
+/* Return the number of cycles since the last call to start_counter. */
+double get_counter(void)
+{
+	unsigned ncyc_hi, ncyc_lo;
+	unsigned hi, lo, borrow;
+	double result;
+
+	/* Get cycle counter */
+	access_counter(&ncyc_hi, &ncyc_lo);
+
+	/* Do double precision subtraction */
+	lo = ncyc_lo - cyc_lo;
+	borrow = lo > ncyc_lo;
+	hi = ncyc_hi - cyc_hi - borrow;
+	result = (double)hi * (1 << 30) * 4 + lo;
+	if (result < 0) {
+		printf("[%s]错误！counter返回了负值：%.0f\n", __func__, result);
+	}
+	return result;
+}
+
+void make_CPU_busy(void)
+{
+	volatile double old_tick, new_tick;
+	start_counter();
+	old_tick = get_counter();
+	new_tick = get_counter();
+	while (new_tick - old_tick < 1000000000)
+		new_tick = get_counter();
+}
+
+/* $begin mhz */
+/* Estimate the clock rate by measuring the cycles that elapse */
+/* while sleeping for sleeptime seconds */
+double mhz_full(int verbose, int sleeptime)
+{
+	double rate;
+
+	if (verbose)
+		printf("[%s]准备开始测量处理器性能，睡眠时间=%d秒\n", __func__, sleeptime);
+	start_counter();
+#ifdef _WIN32
+	Sleep(sleeptime * 1000);
+#else
+	sleep(sleeptime);
+#endif
+	rate = get_counter() / (1e6 * sleeptime);
+	if (verbose)
+		printf("[%s]处理器主频 ~= %.1f MHz\n", __func__, rate);
+	return rate;
+}
+/* $end mhz */
+
+/* Version using a default sleeptime */
+double mhz(int verbose)
+{
+	return mhz_full(verbose, 2);
+}
+
+
--- a/malloclab/clock.h
+++ b/malloclab/clock.h
@@ -0,0 +1,10 @@
+/* Routines for using cycle counter */
+
+/* Start the counter */
+void start_counter(void);
+
+/* Get # cycles since counter started */
+double get_counter(void);
+
+double mhz(int verbose);
+void make_CPU_busy(void);
--- a/malloclab/config.h
+++ b/malloclab/config.h
@@ -0,0 +1,71 @@
+#ifndef __CONGIF_H_
+#define __CONFIG_H_
+
+/*
+ * config.h - malloc lab configuration file
+ *
+ * Copyright (c) 2002, R. Bryant and D. O'Hallaron, All rights reserved.
+ * May not be used, modified, or copied without permission.
+ */
+
+/*
+ * This is the default path where the driver will look for the
+ * default tracefiles. You can override it at runtime with the -t flag.
+ */
+#define TRACEDIR "./traces/"
+
+/*
+ * This is the list of default tracefiles in TRACEDIR that the driver
+ * will use for testing. Modify this if you want to add or delete
+ * traces from the driver's test suite. For example, if you don't want
+ * your students to implement realloc, you can delete the last two
+ * traces.
+ */
+#define DEFAULT_TRACEFILES \
+  "amptjp-bal.rep",\
+  "cccp-bal.rep",\
+  "cp-decl-bal.rep",\
+  "expr-bal.rep",\
+  "coalescing-bal.rep",\
+  "random-bal.rep",\
+  "random2-bal.rep",\
+  "binary-bal.rep",\
+  "binary2-bal.rep"
+
+/*
+ * This constant gives the estimated performance of the libc malloc
+ * package using our traces on some reference system, typically the
+ * same kind of system the students use. Its purpose is to cap the
+ * contribution of throughput to the performance index. Once the
+ * students surpass the AVG_LIBC_THRUPUT, they get no further benefit
+ * to their score.  This deters students from building extremely fast,
+ * but extremely stupid malloc packages.
+ */
+#define AVG_LIBC_THRUPUT      500E3  /* 500 Kops/sec */
+//#define AVG_LIBC_THRUPUT      53000000  /* 5300 Kops/sec */
+
+ /* 
+  * This constant determines the contributions of space utilization
+  * (UTIL_WEIGHT) and throughput (1 - UTIL_WEIGHT) to the performance
+  * index.  
+  */
+#define UTIL_WEIGHT .60
+
+/* 
+ * Alignment requirement in bytes (either 4 or 8) 
+ */
+#define ALIGNMENT 8  
+
+/* 
+ * Maximum heap size in bytes 
+ */
+#define MAX_HEAP (20*(1<<20))  /* 20 MB */
+
+/*****************************************************************************
+ * Set exactly one of these USE_xxx constants to "1" to select a timing method
+ *****************************************************************************/
+#define USE_FCYC   1   /* cycle counter w/K-best scheme (x86 & Alpha only) */
+#define USE_ITIMER 0   /* interval timer (any Unix box) */
+#define USE_GETTOD 0   /* gettimeofday (any Unix box) */
+
+#endif /* __CONFIG_H */
--- a/malloclab/fcyc.c
+++ b/malloclab/fcyc.c
@@ -0,0 +1,230 @@
+/*
+ * fcyc.c - Estimate the time (in CPU cycles) used by a function f
+ *
+ * Copyright (c) 2002, R. Bryant and D. O'Hallaron, All rights reserved.
+ * May not be used, modified, or copied without permission.
+ *
+ * Uses the cycle timer routines in clock.c to estimate the
+ * the time in CPU cycles for a function f.
+ */
+#include <stdlib.h>
+#include <time.h>
+#include <stdio.h>
+
+#include "fcyc.h"
+#include "clock.h"
+
+ /* Default values */
+#define K 3                  /* Value of K in K-best scheme */
+#define MAXSAMPLES 20        /* Give up after MAXSAMPLES */
+#define EPSILON 0.01         /* K samples should be EPSILON of each other*/
+#define CLEAR_CACHE 0        /* Clear cache before running test function */
+#define CACHE_BYTES (1<<19)  /* Max cache size in bytes */
+#define CACHE_BLOCK 32       /* Cache block size in bytes */
+
+static int kbest = K;
+static int maxsamples = MAXSAMPLES;
+static double epsilon = EPSILON;
+static int clear_cache = CLEAR_CACHE;
+static int cache_bytes = CACHE_BYTES;
+static int cache_block = CACHE_BLOCK;
+
+static int* cache_buf = NULL;
+
+static double* values = NULL;
+static int samplecount = 0;
+
+/* for debugging only */
+#define KEEP_VALS 0
+#define KEEP_SAMPLES 0
+
+#if KEEP_SAMPLES
+static double* samples = NULL;
+#endif
+
+/*
+ * init_sampler - Start new sampling process
+ */
+static void init_sampler(void)
+{
+	if (values)
+		free(values);
+	values = calloc(kbest, sizeof(double));
+#if KEEP_SAMPLES
+	if (samples)
+		free(samples);
+	/* Allocate extra for wraparound analysis */
+	samples = calloc(maxsamples + kbest, sizeof(double));
+#endif
+	samplecount = 0;
+}
+
+/*
+ * add_sample - Add new sample
+ */
+static void add_sample(double val)
+{
+	int pos = 0;
+	if (samplecount < kbest) {
+		pos = samplecount;
+		values[pos] = val;
+	}
+	else if (val < values[kbest - 1]) {
+		pos = kbest - 1;
+		values[pos] = val;
+	}
+#if KEEP_SAMPLES
+	samples[samplecount] = val;
+#endif
+	samplecount++;
+	/* Insertion sort */
+	while (pos > 0 && values[pos - 1] > values[pos]) {
+		double temp = values[pos - 1];
+		values[pos - 1] = values[pos];
+		values[pos] = temp;
+		pos--;
+	}
+}
+
+/*
+ * has_converged- Have kbest minimum measurements converged within epsilon?
+ */
+static int has_converged(void)
+{
+	return
+		(samplecount >= kbest) &&
+		((1 + epsilon) * values[0] >= values[kbest - 1]);
+}
+
+/*
+ * clear - Code to clear cache
+ */
+static volatile int sink = 0;
+
+static void clear(void)
+{
+	int x = sink;
+	int* cptr, * cend;
+	int incr = cache_block / sizeof(int);
+	if (!cache_buf) {
+		cache_buf = malloc(cache_bytes);
+		if (!cache_buf) {
+			printf("[%s]致命错误：当试图清除cache时，malloc返回null\n", __func__);
+			exit(1);
+		}
+	}
+	cptr = (int*)cache_buf;
+	cend = cptr + cache_bytes / sizeof(int);
+	while (cptr < cend) {
+		x += *cptr;
+		cptr += incr;
+	}
+	sink = x;
+}
+
+/*
+ * fcyc - Use K-best scheme to estimate the running time of function f
+ */
+double fcyc(test_funct f, void* argp)
+{
+	double result;
+	init_sampler();
+	make_CPU_busy();
+	do {
+		double cyc;
+		if (clear_cache)
+			clear();
+		start_counter();
+		f(argp);
+		cyc = get_counter();
+		add_sample(cyc);
+	} while (!has_converged() && samplecount < maxsamples);
+#ifdef DEBUG
+	{
+		int i;
+		printf(" %d smallest values: [", kbest);
+		for (i = 0; i < kbest; i++)
+			printf("%.0f%s", values[i], i == kbest - 1 ? "]\n" : ", ");
+	}
+#endif
+	result = values[0];
+#if !KEEP_VALS
+	free(values);
+	values = NULL;
+#endif
+	return result;
+}
+
+
+/*************************************************************
+ * Set the various parameters used by the measurement routines
+ ************************************************************/
+
+ /*
+  * set_fcyc_clear_cache - When set, will run code to clear cache
+  *     before each measurement.
+  *     Default = 0
+  */
+void set_fcyc_clear_cache(int clear)
+{
+	clear_cache = clear;
+}
+
+/*
+ * set_fcyc_cache_size - Set size of cache to use when clearing cache
+ *     Default = 1<<19 (512KB)
+ */
+void set_fcyc_cache_size(int bytes)
+{
+	if (bytes != cache_bytes) {
+		cache_bytes = bytes;
+		if (cache_buf) {
+			free(cache_buf);
+			cache_buf = NULL;
+		}
+	}
+}
+
+/*
+ * set_fcyc_cache_block - Set size of cache block
+ *     Default = 32
+ */
+void set_fcyc_cache_block(int bytes) {
+	cache_block = bytes;
+}
+
+
+
+/*
+ * set_fcyc_k - Value of K in K-best measurement scheme
+ *     Default = 3
+ */
+void set_fcyc_k(int k)
+{
+	kbest = k;
+}
+
+/*
+ * set_fcyc_maxsamples - Maximum number of samples attempting to find
+ *     K-best within some tolerance.
+ *     When exceeded, just return best sample found.
+ *     Default = 20
+ */
+void set_fcyc_maxsamples(int maxsamples_arg)
+{
+	maxsamples = maxsamples_arg;
+}
+
+/*
+ * set_fcyc_epsilon - Tolerance required for K-best
+ *     Default = 0.01
+ */
+void set_fcyc_epsilon(double epsilon_arg)
+{
+	epsilon = epsilon_arg;
+}
+
+
+
+
+
--- a/malloclab/fcyc.h
+++ b/malloclab/fcyc.h
@@ -0,0 +1,68 @@
+/*
+ * fcyc.h - prototypes for the routines in fcyc.c that estimate the
+ *     time in CPU cycles used by a test function f
+ * 
+ * Copyright (c) 2002, R. Bryant and D. O'Hallaron, All rights reserved.
+ * May not be used, modified, or copied without permission.
+ *
+ */
+
+/* The test function takes a generic pointer as input */
+typedef void (*test_funct)(void *);
+
+/* Compute number of cycles used by test function f */
+double fcyc(test_funct f, void* argp);
+
+/*********************************************************
+ * Set the various parameters used by measurement routines 
+ *********************************************************/
+
+/* 
+ * set_fcyc_clear_cache - When set, will run code to clear cache 
+ *     before each measurement. 
+ *     Default = 0
+ */
+void set_fcyc_clear_cache(int clear);
+
+/* 
+ * set_fcyc_cache_size - Set size of cache to use when clearing cache 
+ *     Default = 1<<19 (512KB)
+ */
+void set_fcyc_cache_size(int bytes);
+
+/* 
+ * set_fcyc_cache_block - Set size of cache block 
+ *     Default = 32
+ */
+void set_fcyc_cache_block(int bytes);
+
+/* 
+ * set_fcyc_compensate- When set, will attempt to compensate for 
+ *     timer interrupt overhead 
+ *     Default = 0
+ */
+void set_fcyc_compensate(int compensate_arg);
+
+/* 
+ * set_fcyc_k - Value of K in K-best measurement scheme
+ *     Default = 3
+ */
+void set_fcyc_k(int k);
+
+/* 
+ * set_fcyc_maxsamples - Maximum number of samples attempting to find 
+ *     K-best within some tolerance.
+ *     When exceeded, just return best sample found.
+ *     Default = 20
+ */
+void set_fcyc_maxsamples(int maxsamples_arg);
+
+/* 
+ * set_fcyc_epsilon - Tolerance required for K-best
+ *     Default = 0.01
+ */
+void set_fcyc_epsilon(double epsilon_arg);
+
+
+
+
--- a/malloclab/fsecs.c
+++ b/malloclab/fsecs.c
@@ -0,0 +1,43 @@
+/****************************
+ * High-level timing wrappers
+ ****************************/
+#include <stdio.h>
+#include "fsecs.h"
+#include "fcyc.h"
+#include "clock.h"
+ //#include "ftimer.h"
+#include "config.h"
+
+static double Mhz;  /* estimated CPU clock frequency */
+
+extern int verbose; /* -v option in mdriver.c */
+
+/*
+ * init_fsecs - initialize the timing package
+ */
+void init_fsecs(void)
+{
+	Mhz = 0; /* keep gcc -Wall happy */
+
+	if (verbose)
+		printf("[%s]通过cycle计数器来测量性能.\n", __func__);
+
+	/* set key parameters for the fcyc package */
+	set_fcyc_maxsamples(200);
+	set_fcyc_clear_cache(1);
+	set_fcyc_epsilon(0.01);
+	set_fcyc_k(3);
+	Mhz = mhz(verbose > 0);
+	//    printf("[%s]Your CPU is %fMhz\n",__func__, Mhz);
+}
+
+/*
+ * fsecs - Return the running time of a function f (in seconds)
+ */
+double fsecs(fsecs_test_funct f, void* argp)
+{
+	double cycles = fcyc(f, argp);
+	return cycles / (Mhz * 1e6);
+}
+
+
--- a/malloclab/fsecs.h
+++ b/malloclab/fsecs.h
@@ -0,0 +1,4 @@
+typedef void (*fsecs_test_funct)(void *);
+
+void init_fsecs(void);
+double fsecs(fsecs_test_funct f, void *argp);
--- a/malloclab/getopt.c
+++ b/malloclab/getopt.c
@@ -0,0 +1,250 @@
+/*****************************************************************************
+* getopt.c - competent and free getopt library.
+* $Header: /cvsroot/freegetopt/freegetopt/getopt.c,v 1.2 2003/10/26 03:10:20 vindaci Exp $
+*
+* Copyright (c)2002-2003 Mark K. Kim
+* All rights reserved.
+*
+* Redistribution and use in source and binary forms, with or without
+* modification, are permitted provided that the following conditions
+* are met:
+*
+*   * Redistributions of source code must retain the above copyright
+*     notice, this list of conditions and the following disclaimer.
+*
+*   * Redistributions in binary form must reproduce the above copyright
+*     notice, this list of conditions and the following disclaimer in
+*     the documentation and/or other materials provided with the
+*     distribution.
+*
+*   * Neither the original author of this software nor the names of its
+*     contributors may be used to endorse or promote products derived
+*     from this software without specific prior written permission.
+*
+* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
+* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
+* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
+* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
+* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
+* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
+* THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
+* DAMAGE.
+*/
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include "getopt.h"
+
+
+static const char* ID = "$Id: getopt.c,v 1.2 2003/10/26 03:10:20 vindaci Exp $";
+
+
+char* optarg = NULL;
+int optind = 0;
+int opterr = 1;
+int optopt = '?';
+
+
+static char** prev_argv = NULL;        /* Keep a copy of argv and argc to */
+static int prev_argc = 0;              /*    tell if getopt params change */
+static int argv_index = 0;             /* Option we're checking */
+static int argv_index2 = 0;            /* Option argument we're checking */
+static int opt_offset = 0;             /* Index into compounded "-option" */
+static int dashdash = 0;               /* True if "--" option reached */
+static int nonopt = 0;                 /* How many nonopts we've found */
+
+static void increment_index()
+{
+	/* Move onto the next option */
+	if (argv_index < argv_index2)
+	{
+		while (prev_argv[++argv_index] && prev_argv[argv_index][0] != '-'
+			&& argv_index < argv_index2 + 1);
+	}
+	else argv_index++;
+	opt_offset = 1;
+}
+
+
+/*
+* Permutes argv[] so that the argument currently being processed is moved
+* to the end.
+*/
+static int permute_argv_once()
+{
+	/* Movability check */
+	if (argv_index + nonopt >= prev_argc) return 1;
+	/* Move the current option to the end, bring the others to front */
+	else
+	{
+		char* tmp = prev_argv[argv_index];
+
+		/* Move the data */
+		memmove(&prev_argv[argv_index], &prev_argv[argv_index + 1],
+			sizeof(char**) * (prev_argc - argv_index - 1));
+		prev_argv[prev_argc - 1] = tmp;
+
+		nonopt++;
+		return 0;
+	}
+}
+
+
+int getopt(int argc, char** argv, char* optstr)
+{
+	int c = 0;
+
+	/* If we have new argv, reinitialize */
+	if (prev_argv != argv || prev_argc != argc)
+	{
+		/* Initialize variables */
+		prev_argv = argv;
+		prev_argc = argc;
+		argv_index = 1;
+		argv_index2 = 1;
+		opt_offset = 1;
+		dashdash = 0;
+		nonopt = 0;
+	}
+
+	/* Jump point in case we want to ignore the current argv_index */
+getopt_top:
+
+	/* Misc. initializations */
+	optarg = NULL;
+
+	/* Dash-dash check */
+	if (argv[argv_index] && !strcmp(argv[argv_index], "--"))
+	{
+		dashdash = 1;
+		increment_index();
+	}
+
+	/* If we're at the end of argv, that's it. */
+	if (argv[argv_index] == NULL)
+	{
+		c = -1;
+	}
+	/* Are we looking at a string? Single dash is also a string */
+	else if (dashdash || argv[argv_index][0] != '-' || !strcmp(argv[argv_index], "-"))
+	{
+		/* If we want a string... */
+		if (optstr[0] == '-')
+		{
+			c = 1;
+			optarg = argv[argv_index];
+			increment_index();
+		}
+		/* If we really don't want it (we're in POSIX mode), we're done */
+		else if (optstr[0] == '+')// || getenv("POSIXLY_CORRECT"))
+		{
+			c = -1;
+
+			/* Everything else is a non-opt argument */
+			nonopt = argc - argv_index;
+		}
+		/* If we mildly don't want it, then move it back */
+		else
+		{
+			if (!permute_argv_once()) goto getopt_top;
+			else c = -1;
+		}
+	}
+	/* Otherwise we're looking at an option */
+	else
+	{
+		char* opt_ptr = NULL;
+
+		/* Grab the option */
+		c = argv[argv_index][opt_offset++];
+
+		/* Is the option in the optstr? */
+		if (optstr[0] == '-') opt_ptr = strchr(optstr + 1, c);
+		else opt_ptr = strchr(optstr, c);
+		/* Invalid argument */
+		if (!opt_ptr)
+		{
+			if (opterr)
+			{
+				fprintf(stderr, "%s: invalid option -- %c\n", argv[0], c);
+			}
+
+			optopt = c;
+			c = '?';
+
+			/* Move onto the next option */
+			increment_index();
+		}
+		/* Option takes argument */
+		else if (opt_ptr[1] == ':')
+		{
+			/* ie, -oARGUMENT, -xxxoARGUMENT, etc. */
+			if (argv[argv_index][opt_offset] != '\0')
+			{
+				optarg = &argv[argv_index][opt_offset];
+				increment_index();
+			}
+			/* ie, -o ARGUMENT (only if it's a required argument) */
+			else if (opt_ptr[2] != ':')
+			{
+				/* One of those "you're not expected to understand this" moment */
+				if (argv_index2 < argv_index) argv_index2 = argv_index;
+				while (argv[++argv_index2] && argv[argv_index2][0] == '-');
+				optarg = argv[argv_index2];
+
+				/* Don't cross into the non-option argument list */
+				if (argv_index2 + nonopt >= prev_argc) optarg = NULL;
+
+				/* Move onto the next option */
+				increment_index();
+			}
+			else
+			{
+				/* Move onto the next option */
+				increment_index();
+			}
+
+			/* In case we got no argument for an option with required argument */
+			if (optarg == NULL && opt_ptr[2] != ':')
+			{
+				optopt = c;
+				c = '?';
+
+				if (opterr)
+				{
+					fprintf(stderr, "%s: option requires an argument -- %c\n",
+						argv[0], optopt);
+				}
+			}
+		}
+		/* Option does not take argument */
+		else
+		{
+			/* Next argv_index */
+			if (argv[argv_index][opt_offset] == '\0')
+			{
+				increment_index();
+			}
+		}
+	}
+
+	/* Calculate optind */
+	if (c == -1)
+	{
+		optind = argc - nonopt;
+	}
+	else
+	{
+		optind = argv_index;
+	}
+
+	return c;
+}
+
+
+/* vim:ts=3
+*/
--- a/malloclab/getopt.h
+++ b/malloclab/getopt.h
@@ -0,0 +1,63 @@
+/*****************************************************************************
+* getopt.h - competent and free getopt library.
+* $Header: /cvsroot/freegetopt/freegetopt/getopt.h,v 1.2 2003/10/26 03:10:20 vindaci Exp $
+*
+* Copyright (c)2002-2003 Mark K. Kim
+* All rights reserved.
+*
+* Redistribution and use in source and binary forms, with or without
+* modification, are permitted provided that the following conditions
+* are met:
+*
+*   * Redistributions of source code must retain the above copyright
+*     notice, this list of conditions and the following disclaimer.
+*
+*   * Redistributions in binary form must reproduce the above copyright
+*     notice, this list of conditions and the following disclaimer in
+*     the documentation and/or other materials provided with the
+*     distribution.
+*
+*   * Neither the original author of this software nor the names of its
+*     contributors may be used to endorse or promote products derived
+*     from this software without specific prior written permission.
+*
+* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
+* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
+* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
+* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
+* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
+* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
+* THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
+* DAMAGE.
+*/
+#ifndef GETOPT_H_
+#define GETOPT_H_
+
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+
+	extern char* optarg;
+	extern int optind;
+	extern int opterr;
+	extern int optopt;
+
+	int getopt(int argc, char** argv, char* optstr);
+
+
+#ifdef __cplusplus
+}
+#endif
+
+
+#endif /* GETOPT_H_ */
+
+
+/* vim:ts=3
+*/
--- a/malloclab/malloc
+++ b/malloclab/malloc
--- a/malloclab/mdriver.c
+++ b/malloclab/mdriver.c
--- a/malloclab/memlib.c
+++ b/malloclab/memlib.c
@@ -0,0 +1,112 @@
+/*
+ * memlib.c - a module that simulates the memory system.  Needed because it
+ *            allows us to interleave calls from the student's malloc package
+ *            with the system's malloc package in libc.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <assert.h>
+#ifndef _WIN32
+#include <unistd.h>
+#endif
+#include <string.h>
+#include <errno.h>
+
+#include "memlib.h"
+#include "config.h"
+
+ /* private variables */
+static char* mem_start_brk;  /* points to first byte of heap */
+static char* mem_brk;        /* points to last byte of heap */
+static char* mem_max_addr;   /* largest legal heap address */
+
+#ifdef _WIN32
+#include <windows.h>
+int getpagesize(void)
+{
+	SYSTEM_INFO system_info;
+	GetSystemInfo(&system_info);
+	return system_info.dwPageSize;
+}
+#endif
+
+/*
+ * mem_init - initialize the memory system model
+ */
+void mem_init(void)
+{
+	/* allocate the storage we will use to model the available VM */
+	if ((mem_start_brk = (char*)malloc(MAX_HEAP)) == NULL) {
+		printf("[%s]malloc失败\n", __func__);
+		exit(1);
+	}
+
+	mem_max_addr = mem_start_brk + MAX_HEAP;  /* max legal heap address */
+	mem_brk = mem_start_brk;                  /* heap is empty initially */
+}
+
+/*
+ * mem_deinit - free the storage used by the memory system model
+ */
+void mem_deinit(void)
+{
+	free(mem_start_brk);
+}
+
+/*
+ * mem_reset_brk - reset the simulated brk pointer to make an empty heap
+ */
+void mem_reset_brk()
+{
+	mem_brk = mem_start_brk;
+}
+
+/*
+ * mem_sbrk - simple model of the sbrk function. Extends the heap
+ *    by incr bytes and returns the start address of the new area. In
+ *    this model, the heap cannot be shrunk.
+ */
+void* mem_sbrk(int incr)
+{
+	char* old_brk = mem_brk;
+
+	if ((incr < 0) || ((mem_brk + incr) > mem_max_addr)) {
+		errno = ENOMEM;
+		printf("[%s]失败: 内存已被耗光...\n", __func__);
+		return (void*)-1;
+	}
+	mem_brk += incr;
+	return (void*)old_brk;
+}
+
+/*
+ * mem_heap_lo - return address of the first heap byte
+ */
+void* mem_heap_lo()
+{
+	return (void*)mem_start_brk;
+}
+
+/*
+ * mem_heap_hi - return address of last heap byte
+ */
+void* mem_heap_hi()
+{
+	return (void*)(mem_brk - 1);
+}
+
+/*
+ * mem_heapsize() - returns the heap size in bytes
+ */
+size_t mem_heapsize()
+{
+	return (size_t)(mem_brk - mem_start_brk);
+}
+
+/*
+ * mem_pagesize() - returns the page size of the system
+ */
+size_t mem_pagesize()
+{
+	return (size_t)getpagesize();
+}
--- a/malloclab/memlib.h
+++ b/malloclab/memlib.h
@@ -0,0 +1,13 @@
+#ifndef _WIN32
+#include <unistd.h>
+#endif
+
+void mem_init(void);               
+void mem_deinit(void);
+void *mem_sbrk(int incr);
+void mem_reset_brk(void); 
+void *mem_heap_lo(void);
+void *mem_heap_hi(void);
+size_t mem_heapsize(void);
+size_t mem_pagesize(void);
+
--- a/malloclab/method.md
+++ b/malloclab/method.md
@@ -0,0 +1,76 @@
+# 动态内存分配器实验修改思路
+
+## 实验目标
+实现一个动态内存分配器，支持以下功能：
+1. 内存分配（`mm_malloc`）
+2. 内存释放（`mm_free`）
+3. 内存扩展（`mm_realloc`）
+
+并通过 `traces` 目录下的测试用例，尽可能提高评分。
+
+## 修改内容
+
+### 1. 算法设计思想
+- 使用 **隐式空闲链表** 管理内存块。
+- 每个块包含头部和尾部，用于存储块大小和分配状态。
+- 分配时，使用 **首次适配算法** 找到合适的空闲块。
+- 释放时，合并相邻的空闲块以减少内存碎片。
+- 通过对齐和块分割优化内存利用率。
+
+### 2. 代码实现
+#### 主要宏定义
+- `PACK(size, alloc)`：将块大小和分配位打包成一个字。
+- `GET` 和 `PUT`：读取和写入地址处的字。
+- `HDRP` 和 `FTRP`：计算块的头部和尾部地址。
+- `NEXT_BLKP` 和 `PREV_BLKP`：计算下一个和前一个块的地址。
+
+#### 核心函数
+1. **`mm_init`**
+   - 初始化堆，创建序言块和结尾块。
+   - 扩展堆以初始化空闲块。
+
+2. **`extend_heap`**
+   - 扩展堆的大小，分配新的空闲块。
+   - 初始化新块的头部、尾部和结尾块。
+
+3. **`coalesce`**
+   - 合并相邻的空闲块，减少内存碎片。
+   - 根据前后块的分配状态，处理 4 种情况。
+
+4. **`mm_malloc`**
+   - 调整请求大小以满足对齐要求。
+   - 使用 `find_fit` 查找合适的空闲块。
+   - 如果没有合适的块，扩展堆。
+
+5. **`mm_free`**
+   - 将块标记为空闲。
+   - 调用 `coalesce` 合并相邻空闲块。
+
+6. **`mm_realloc`**
+   - 如果新大小小于当前块大小，直接返回。
+   - 如果新大小大于当前块大小，分配新块并复制数据。
+
+7. **`find_fit`**
+   - 遍历隐式链表，找到第一个满足大小要求的空闲块。
+
+8. **`place`**
+   - 将请求大小的块放入空闲块中。
+   - 如果剩余空间足够大，分割块。
+
+### 3. 测试与优化
+- 修改 `TRACE_LIST.txt`，运行不同的 trace 文件。
+- 使用 `make` 和 `./malloc -t traces` 测试实现。
+- 优化分配和释放逻辑，提高效率和性能。
+
+## 当前状态
+- **正确性**：所有 trace 文件均通过测试。
+- **效率**：平均效率为 77%。
+- **性能**：评分为 84/100。
+
+## 后续优化方向
+1. 使用 **显式空闲链表** 或 **分离空闲链表** 提高查找效率。
+2. 动态调整堆扩展策略，减少不必要的扩展。
+3. 优化块分割和合并逻辑，进一步减少内存碎片。
+
+## 提交要求
+- 将 `mm.c` 文件重命名为 `mm_学号.c`，并提交到指定平台。
--- a/malloclab/mm.c
+++ b/malloclab/mm.c
@@ -0,0 +1,297 @@
+#define MAX(x, y) ((x) > (y) ? (x) : (y))
+/*
+ * mm-naive.c - 参考实现，是一个最快的、最低效率的malloc.
+ *
+ * 在这个参考实现中，分配一个块，仅仅是增加brk指针，
+ * 块内部全部是载荷数据，块内没有header或者footer等
+ * 管理用的数据信息。分配出去的块，永远不释放或者回收。
+ * 重分配函数（realloc）的实现，是直接通过mm_malloc和mm_free实现的
+ *
+ * 亲们请注意：你需要把此段注释，替换成你的算法设计思想。用描述性
+ * 的话来说清楚。
+ * 请将此文件，重新命名为mm_201309060024.c（就是mm_你的学号.c）
+ */
+#include <assert.h>
+#include <stdio.h>
+#include <stdlib.h>
+
+#ifndef _WIN32
+#include <unistd.h>
+#endif
+#include <string.h>
+
+#include "memlib.h"
+#include "mm.h"
+
+/*********************************************************
+ * 亲们请注意：开始之前，请把下面的信息修改为你的个人信息
+ ********************************************************/
+team_t team = {
+    /* 团队名字 */
+    "8-Bit Brainstorm",
+    /* 团队老大的名字 */
+    "Cikki",
+    /* 团队老大的email地址 */
+    "c_gh0s7@nudt.edu.cn",
+    /* 团队其他成员的名字 (如果没有，就空着) */
+    "",
+    /* 团队其他成员的email地址 (如果没有，就空着) */
+    ""};
+
+/* 基本常量和宏定义 */
+#define ALIGNMENT 8 /* 将块对齐到8字节（双字） */
+#define ALIGN(size)                                                            \
+  (((size) + (ALIGNMENT - 1)) & ~0x7) /* 向上舍入到最近的8的倍数 */
+#define SIZE_T_SIZE (ALIGN(sizeof(size_t)))
+
+/* 内存分配器的关键参数 */
+#define WSIZE 4             /* 字（word）的大小 = 4字节 */
+#define DSIZE 8             /* 双字（double word）的大小 = 8字节 */
+#define CHUNKSIZE (1 << 12) /* 扩展堆时的默认大小 = 4096字节 = 4KB */
+
+/* 用于操作头部和脚部的宏 */
+#define PACK(size, alloc) ((size) | (alloc)) /* 将大小和已分配位打包成一个字 \
+                                              */
+#define GET(p) (*(unsigned int *)(p))        /* 读取指针p处的一个字 */
+#define PUT(p, val) (*(unsigned int *)(p) = (val)) /* 在指针p处写入一个字 */
+
+/* 从头部或脚部获取大小和已分配位 */
+#define GET_SIZE(p) (GET(p) & ~0x7) /* 获取块大小，去掉低3位的标志位 */
+#define GET_ALLOC(p) (GET(p) & 0x1) /* 获取已分配位（0=空闲，1=已分配）*/
+
+/* 给定块指针bp，计算块的头部和脚部位置 */
+#define HDRP(bp) ((char *)(bp) - WSIZE) /* 指向块头部的指针 */
+#define FTRP(bp)                                                               \
+  ((char *)(bp) + GET_SIZE(HDRP(bp)) - DSIZE) /* 指向块脚部的指针 */
+
+/* 给定块指针bp，计算下一个和前一个块的地址 */
+#define NEXT_BLKP(bp)                                                          \
+  ((char *)(bp) + GET_SIZE(((char *)(bp) - WSIZE))) /* 下一个块的指针 */
+#define PREV_BLKP(bp)                                                          \
+  ((char *)(bp) - GET_SIZE(((char *)(bp) - DSIZE))) /* 前一个块的指针 */
+
+static char *heap_listp; /* 指向堆的第一个块的指针 */
+
+static void *extend_heap(size_t words);
+static void *coalesce(void *bp);
+static void *find_fit(size_t asize);
+static void place(void *bp, size_t asize);
+
+static void print_block(int request_id, int payload);
+
+/*
+ * mm_init - 初始化内存分配器
+ * 创建初始空堆，包括序言块和结尾块
+ * 返回值：成功返回0，错误返回-1
+ */
+int mm_init(void) {
+  // 创建初始空堆
+  if ((heap_listp = mem_sbrk(4 * WSIZE)) == (void *)-1)
+    return -1;
+  PUT(heap_listp, 0);                            // 对齐填充
+  PUT(heap_listp + (1 * WSIZE), PACK(DSIZE, 1)); // 序言块头部
+  PUT(heap_listp + (2 * WSIZE), PACK(DSIZE, 1)); // 序言块尾部
+  PUT(heap_listp + (3 * WSIZE), PACK(0, 1));     // 结尾块
+  heap_listp += (2 * WSIZE);
+
+  // 扩展空堆
+  if (extend_heap(CHUNKSIZE / WSIZE) == NULL)
+    return -1;
+  return 0;
+}
+
+/*
+ * extend_heap - 通过增加brk指针来扩展堆
+ * 参数 words: 请求的字数（以字为单位）
+ * 返回值：指向新分配区域的指针，如果出错则返回NULL
+ */
+static void *extend_heap(size_t words) {
+  char *bp;
+  size_t size;
+
+  // 分配偶数个字以保持对齐
+  size = (words % 2) ? (words + 1) * WSIZE : words * WSIZE;
+  if ((long)(bp = mem_sbrk(size)) == -1)
+    return NULL;
+
+  // 初始化空闲块头部/尾部和结尾块
+  PUT(HDRP(bp), PACK(size, 0));         // 空闲块头部
+  PUT(FTRP(bp), PACK(size, 0));         // 空闲块尾部
+  PUT(HDRP(NEXT_BLKP(bp)), PACK(0, 1)); // 新的结尾块
+
+  return coalesce(bp);
+}
+
+/*
+ * coalesce - 合并相邻的空闲块
+ * 参数 bp: 指向刚被释放的块的指针
+ * 返回值：指向合并后的块的指针
+ *
+ * 有四种情况：
+ * Case 1：前后块都已分配
+ * Case 2：前块已分配，后块空闲
+ * Case 3：前块空闲，后块已分配
+ * Case 4：前后块都空闲
+ */
+static void *coalesce(void *bp) {
+  size_t prev_alloc = GET_ALLOC(FTRP(PREV_BLKP(bp)));
+  size_t next_alloc = GET_ALLOC(HDRP(NEXT_BLKP(bp)));
+  size_t size = GET_SIZE(HDRP(bp));
+
+  if (prev_alloc && next_alloc) { // Case 1
+    return bp;
+  } else if (prev_alloc && !next_alloc) { // Case 2
+    size += GET_SIZE(HDRP(NEXT_BLKP(bp)));
+    PUT(HDRP(bp), PACK(size, 0));
+    PUT(FTRP(bp), PACK(size, 0));
+  } else if (!prev_alloc && next_alloc) { // Case 3
+    size += GET_SIZE(HDRP(PREV_BLKP(bp)));
+    PUT(FTRP(bp), PACK(size, 0));
+    PUT(HDRP(PREV_BLKP(bp)), PACK(size, 0));
+    bp = PREV_BLKP(bp);
+  } else { // Case 4
+    size += GET_SIZE(HDRP(PREV_BLKP(bp))) + GET_SIZE(FTRP(NEXT_BLKP(bp)));
+    PUT(HDRP(PREV_BLKP(bp)), PACK(size, 0));
+    PUT(FTRP(NEXT_BLKP(bp)), PACK(size, 0));
+    bp = PREV_BLKP(bp);
+  }
+  return bp;
+}
+
+/*
+ * mm_malloc - 分配一个大小为size字节的块
+ * 参数 size: 请求的字节数
+ * 返回值：指向新分配块的指针，如果错误则返回NULL
+ *
+ * 分配策略：
+ * 1. 调整请求大小为8字节对齐
+ * 2. 搜索空闲链表找到第一个适合的块
+ * 3. 如果没有找到合适的块，扩展堆
+ */
+void *mm_malloc(size_t size) {
+  size_t asize;      // 调整后的块大小
+  size_t extendsize; // 如果没有合适的块，扩展堆的大小
+  char *bp;
+
+  if (size == 0)
+    return NULL;
+
+  if (size <= DSIZE)
+    asize = 2 * DSIZE;
+  else
+    asize = DSIZE * ((size + (DSIZE) + (DSIZE - 1)) / DSIZE);
+
+  if ((bp = find_fit(asize)) != NULL) {
+    place(bp, asize);
+    return bp;
+  }
+
+  extendsize = MAX(asize, CHUNKSIZE);
+  if ((bp = extend_heap(extendsize / WSIZE)) == NULL)
+    return NULL;
+  place(bp, asize);
+  return bp;
+}
+
+/*
+ * mm_free - 释放一个之前分配的块
+ * 参数 bp: 指向要释放的块的指针
+ *
+ * 处理步骤：
+ * 1. 标记块为空闲（更新头部和脚部）
+ * 2. 合并相邻的空闲块（如果有的话）
+ */
+void mm_free(void *bp) {
+  if (bp == NULL)
+    return;
+
+  size_t size = GET_SIZE(HDRP(bp));
+  PUT(HDRP(bp), PACK(size, 0));
+  PUT(FTRP(bp), PACK(size, 0));
+  coalesce(bp);
+}
+
+/*
+ * mm_realloc - 调整一个已分配块的大小
+ * 参数：
+ *   ptr - 指向旧块的指针
+ *   size - 请求的新大小
+ * 返回值：指向新块的指针
+ *
+ * 处理策略：
+ * 1. 如果ptr为NULL，等同于malloc
+ * 2. 如果size为0，等同于free
+ * 3. 分配新块，复制数据，释放旧块
+ */
+void *mm_realloc(void *ptr, size_t size) {
+  if (ptr == NULL)
+    return mm_malloc(size);
+
+  if (size == 0) {
+    mm_free(ptr);
+    return NULL;
+  }
+
+  void *newptr = mm_malloc(size);
+  if (newptr == NULL)
+    return NULL;
+
+  size_t copySize = GET_SIZE(HDRP(ptr)) - DSIZE;
+  if (size < copySize)
+    copySize = size;
+  memcpy(newptr, ptr, copySize);
+  mm_free(ptr);
+  return newptr;
+}
+
+/*
+ * find_fit - 使用首次适配搜索，查找满足所需大小的空闲块
+ * 参数 asize: 调整后的块大小
+ * 返回值：找到则返回块指针，否则返回NULL
+ */
+static void *find_fit(size_t asize) {
+  void *bp;
+
+  for (bp = heap_listp; GET_SIZE(HDRP(bp)) > 0; bp = NEXT_BLKP(bp)) {
+    if (!GET_ALLOC(HDRP(bp)) && (asize <= GET_SIZE(HDRP(bp)))) {
+      return bp;
+    }
+  }
+  return NULL;
+}
+
+/*
+ * place - 将请求的块放置在空闲块的起始位置
+ * 参数：
+ *   bp - 空闲块指针
+ *   asize - 请求的大小
+ *
+ * 如果剩余部分足够大（>= 2*DSIZE），则分割块
+ */
+static void place(void *bp, size_t asize) {
+  size_t csize = GET_SIZE(HDRP(bp));
+
+  if ((csize - asize) >= (2 * DSIZE)) {
+    PUT(HDRP(bp), PACK(asize, 1));
+    PUT(FTRP(bp), PACK(asize, 1));
+    bp = NEXT_BLKP(bp);
+    PUT(HDRP(bp), PACK(csize - asize, 0));
+    PUT(FTRP(bp), PACK(csize - asize, 0));
+  } else {
+    PUT(HDRP(bp), PACK(csize, 1));
+    PUT(FTRP(bp), PACK(csize, 1));
+  }
+}
+
+/*
+ * mm_heapcheck - 目前暂不支持堆检查，可以不用修改
+ */
+void mm_heapcheck(void) {}
+
+/*
+ * 输出一块数据 - 用于heapcheck，然而在此并没有什么用，可以不用修改
+ */
+
+static void print_block(int request_id, int payload) {
+  printf("\n[%s]$BLOCK %d %d\n", __func__, request_id, payload);
+}
--- a/malloclab/mm.h
+++ b/malloclab/mm.h
@@ -0,0 +1,23 @@
+#include <stdio.h>
+
+extern int mm_init (void);
+extern void *mm_malloc (size_t size);
+extern void mm_free (void *ptr);
+extern void *mm_realloc(void *ptr, size_t size);
+extern void mm_heapcheck(void);
+
+/* 
+ * Students work in teams of one or two.  Teams enter their team name, 
+ * personal names and login IDs in a struct of this
+ * type in their bits.c file.
+ */
+typedef struct {
+    char *teamname; /* ID1+ID2 or ID1 */
+    char *name1;    /* full name of first member */
+    char *id1;      /* login ID of first member */
+    char *name2;    /* full name of second member (if any) */
+    char *id2;      /* login ID of second member */
+} team_t;
+
+extern team_t team;
+
--- a/malloclab/myMalloc/myMalloc.sln
+++ b/malloclab/myMalloc/myMalloc.sln
@@ -0,0 +1,31 @@
+
+Microsoft Visual Studio Solution File, Format Version 12.00
+# Visual Studio Version 16
+VisualStudioVersion = 16.0.31829.152
+MinimumVisualStudioVersion = 10.0.40219.1
+Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "myMalloc", "myMalloc.vcxproj", "{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}"
+EndProject
+Global
+	GlobalSection(SolutionConfigurationPlatforms) = preSolution
+		Debug|x64 = Debug|x64
+		Debug|x86 = Debug|x86
+		Release|x64 = Release|x64
+		Release|x86 = Release|x86
+	EndGlobalSection
+	GlobalSection(ProjectConfigurationPlatforms) = postSolution
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Debug|x64.ActiveCfg = Debug|x64
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Debug|x64.Build.0 = Debug|x64
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Debug|x86.ActiveCfg = Debug|Win32
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Debug|x86.Build.0 = Debug|Win32
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Release|x64.ActiveCfg = Release|x64
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Release|x64.Build.0 = Release|x64
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Release|x86.ActiveCfg = Release|Win32
+		{5C1ED0A5-23CE-4040-A263-C9C69E0BEAC7}.Release|x86.Build.0 = Release|Win32
+	EndGlobalSection
+	GlobalSection(SolutionProperties) = preSolution
+		HideSolutionNode = FALSE
+	EndGlobalSection
+	GlobalSection(ExtensibilityGlobals) = postSolution
+		SolutionGuid = {975E549F-4459-4716-891C-6BF59727C24E}
+	EndGlobalSection
+EndGlobal
--- a/malloclab/myMalloc/myMalloc.vcxproj
+++ b/malloclab/myMalloc/myMalloc.vcxproj
@@ -0,0 +1,153 @@
+<?xml version="1.0" encoding="utf-8"?>
+<Project DefaultTargets="Build" xmlns="http://schemas.microsoft.com/developer/msbuild/2003">
+  <ItemGroup Label="ProjectConfigurations">
+    <ProjectConfiguration Include="Debug|Win32">
+      <Configuration>Debug</Configuration>
+      <Platform>Win32</Platform>
+    </ProjectConfiguration>
+    <ProjectConfiguration Include="Release|Win32">
+      <Configuration>Release</Configuration>
+      <Platform>Win32</Platform>
+    </ProjectConfiguration>
+    <ProjectConfiguration Include="Debug|x64">
+      <Configuration>Debug</Configuration>
+      <Platform>x64</Platform>
+    </ProjectConfiguration>
+    <ProjectConfiguration Include="Release|x64">
+      <Configuration>Release</Configuration>
+      <Platform>x64</Platform>
+    </ProjectConfiguration>
+  </ItemGroup>
+  <PropertyGroup Label="Globals">
+    <VCProjectVersion>16.0</VCProjectVersion>
+    <Keyword>Win32Proj</Keyword>
+    <ProjectGuid>{5c1ed0a5-23ce-4040-a263-c9c69e0beac7}</ProjectGuid>
+    <RootNamespace>myMalloc</RootNamespace>
+    <WindowsTargetPlatformVersion>10.0</WindowsTargetPlatformVersion>
+  </PropertyGroup>
+  <Import Project="$(VCTargetsPath)\Microsoft.Cpp.Default.props" />
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>true</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|Win32'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>false</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <WholeProgramOptimization>true</WholeProgramOptimization>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|x64'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>true</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|x64'" Label="Configuration">
+    <ConfigurationType>Application</ConfigurationType>
+    <UseDebugLibraries>false</UseDebugLibraries>
+    <PlatformToolset>v142</PlatformToolset>
+    <WholeProgramOptimization>true</WholeProgramOptimization>
+    <CharacterSet>Unicode</CharacterSet>
+  </PropertyGroup>
+  <Import Project="$(VCTargetsPath)\Microsoft.Cpp.props" />
+  <ImportGroup Label="ExtensionSettings">
+  </ImportGroup>
+  <ImportGroup Label="Shared">
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Release|Win32'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Debug|x64'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <ImportGroup Label="PropertySheets" Condition="'$(Configuration)|$(Platform)'=='Release|x64'">
+    <Import Project="$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props" Condition="exists('$(UserRootDir)\Microsoft.Cpp.$(Platform).user.props')" Label="LocalAppDataPlatform" />
+  </ImportGroup>
+  <PropertyGroup Label="UserMacros" />
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'">
+    <LinkIncremental>true</LinkIncremental>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|Win32'">
+    <LinkIncremental>false</LinkIncremental>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Debug|x64'">
+    <LinkIncremental>true</LinkIncremental>
+  </PropertyGroup>
+  <PropertyGroup Condition="'$(Configuration)|$(Platform)'=='Release|x64'">
+    <LinkIncremental>false</LinkIncremental>
+  </PropertyGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Debug|Win32'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>WIN32;_CRT_SECURE_NO_WARNINGS;_DEBUG;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Release|Win32'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <FunctionLevelLinking>true</FunctionLevelLinking>
+      <IntrinsicFunctions>true</IntrinsicFunctions>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>WIN32;_CRT_SECURE_NO_WARNINGS;NDEBUG;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <EnableCOMDATFolding>true</EnableCOMDATFolding>
+      <OptimizeReferences>true</OptimizeReferences>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Debug|x64'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>_DEBUG;_CRT_SECURE_NO_WARNINGS;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemDefinitionGroup Condition="'$(Configuration)|$(Platform)'=='Release|x64'">
+    <ClCompile>
+      <WarningLevel>Level3</WarningLevel>
+      <FunctionLevelLinking>true</FunctionLevelLinking>
+      <IntrinsicFunctions>true</IntrinsicFunctions>
+      <SDLCheck>true</SDLCheck>
+      <PreprocessorDefinitions>NDEBUG;_CRT_SECURE_NO_WARNINGS;_CONSOLE;%(PreprocessorDefinitions)</PreprocessorDefinitions>
+      <ConformanceMode>true</ConformanceMode>
+    </ClCompile>
+    <Link>
+      <SubSystem>Console</SubSystem>
+      <EnableCOMDATFolding>true</EnableCOMDATFolding>
+      <OptimizeReferences>true</OptimizeReferences>
+      <GenerateDebugInformation>true</GenerateDebugInformation>
+    </Link>
+  </ItemDefinitionGroup>
+  <ItemGroup>
+    <ClCompile Include="..\clock.c" />
+    <ClCompile Include="..\fcyc.c" />
+    <ClCompile Include="..\fsecs.c" />
+    <ClCompile Include="..\getopt.c" />
+    <ClCompile Include="..\mdriver.c" />
+    <ClCompile Include="..\memlib.c" />
+    <ClCompile Include="..\mm.c" />
+  </ItemGroup>
+  <Import Project="$(VCTargetsPath)\Microsoft.Cpp.targets" />
+  <ImportGroup Label="ExtensionTargets">
+  </ImportGroup>
+</Project>
--- a/malloclab/trace_perfect.sh
+++ b/malloclab/trace_perfect.sh
@@ -0,0 +1,22 @@
+#!/bin/bash
+# 检查 traces 目录下所有 trace 文件是否能得到100分
+TRACE_DIR="traces"
+PERFECT_LIST="PERFECT_TRACES.txt"
+
+# 清空 PERFECT_LIST.txt
+> "$PERFECT_LIST"
+
+# 遍历所有 .rep 文件
+for trace in "$TRACE_DIR"/*.rep; do
+    echo "Testing $trace..."
+    # 运行 malloc 并捕获输出
+    output=$(./malloc -f "$trace" 2>&1)
+    
+    # 检查输出中是否包含 "Performance index = 100"
+    if echo "$output" | grep -q "100/100" ; then
+        echo "Perfect score found for $(basename "$trace")"
+        echo "$(basename "$trace")" >> "$PERFECT_LIST"
+    fi
+done
+
+echo "Updated $PERFECT_LIST with traces that achieved perfect scores." 
--- a/malloclab/traces/PERFECT_TRACES.txt
+++ b/malloclab/traces/PERFECT_TRACES.txt
@@ -0,0 +1,8 @@
+amptjp-bal.rep
+amptjp.rep
+cccp-bal.rep
+cccp.rep
+cp-decl-bal.rep
+cp-decl.rep
+expr-bal.rep
+expr.rep
--- a/malloclab/traces/TRACE_LIST.txt
+++ b/malloclab/traces/TRACE_LIST.txt
@@ -0,0 +1,4 @@
+seglist.rep
+short1.rep
+random2.rep
+xterm.rep
--- a/malloclab/traces/TRACE_LIST.txt-ori
+++ b/malloclab/traces/TRACE_LIST.txt-ori
@@ -0,0 +1,4 @@
+seglist.rep
+short1.rep
+random2.rep
+xterm.rep
--- a/malloclab/traces/TRACE_LIST.txt.full
+++ b/malloclab/traces/TRACE_LIST.txt.full
@@ -0,0 +1,56 @@
+amptjp-bal.rep
+amptjp.rep
+bash.rep
+binary2-bal.rep
+binary2.rep
+binary-bal.rep
+binary.rep
+boat.rep
+cccp-bal.rep
+cccp.rep
+chrome.rep
+coalesce-big.rep
+coalescing-bal.rep
+coalescing.rep
+cp-decl-bal.rep
+cp-decl.rep
+exhaust.rep
+expr-bal.rep
+expr.rep
+firefox-reddit2.rep
+firefox-reddit.rep
+firefox.rep
+freeciv.rep
+fs.rep
+hostname.rep
+login.rep
+ls.1.rep
+ls.rep
+malloc-free.rep
+malloc.rep
+merry-go-round.rep
+mutt.rep
+needle.rep
+perl.1.rep
+perl.2.rep
+perl.3.rep
+perl.rep
+pulseaudio.rep
+random2-bal.rep
+random2.rep
+random-bal.rep
+random.rep
+realloc2-bal.rep
+realloc2.rep
+realloc-bal.rep
+realloc.rep
+rm.1.rep
+rm.rep
+seglist.rep
+short1-bal.rep
+short1.rep
+short2-bal.rep
+short2.rep
+stty.rep
+tty.rep
+xterm.rep
--- a/malloclab/traces/TRACE_LIST.txt.per
+++ b/malloclab/traces/TRACE_LIST.txt.per
@@ -0,0 +1,8 @@
+amptjp-bal.rep
+amptjp.rep
+cccp-bal.rep
+cccp.rep
+cp-decl-bal.rep
+cp-decl.rep
+expr-bal.rep
+expr.rep
--- a/malloclab/traces/alaska.rep
+++ b/malloclab/traces/alaska.rep
--- a/malloclab/traces/amptjp-bal.rep
+++ b/malloclab/traces/amptjp-bal.rep
--- a/malloclab/traces/amptjp.rep
+++ b/malloclab/traces/amptjp.rep
--- a/malloclab/traces/bash.rep
+++ b/malloclab/traces/bash.rep
--- a/malloclab/traces/binary-bal.rep
+++ b/malloclab/traces/binary-bal.rep
--- a/malloclab/traces/binary.rep
+++ b/malloclab/traces/binary.rep
--- a/malloclab/traces/binary2-bal.rep
+++ b/malloclab/traces/binary2-bal.rep
--- a/malloclab/traces/binary2.rep
+++ b/malloclab/traces/binary2.rep
--- a/malloclab/traces/boat.rep
+++ b/malloclab/traces/boat.rep
--- a/malloclab/traces/cccp-bal.rep
+++ b/malloclab/traces/cccp-bal.rep
--- a/Show More
+++ b/Show More
Author	SHA1	Message	Date
CGH0S7	6d5eb3ea2f	nudt csapp 2025 finished	2025-06-18 10:30:41 +08:00
CGH0S7	603789006c	weblab finished	2025-06-08 21:34:30 +08:00
CGH0S7	ccab1d8e49	threadlab finished	2025-06-08 11:25:52 +08:00
CGH0S7	6da43cbff0	threadlab and weblab initialized	2025-06-08 00:58:01 +08:00
CGH0S7	23d48ee092	malloclab patched finally	2025-06-04 17:06:19 +08:00
CGH0S7	628a771975	malloclab patched	2025-06-04 00:49:13 +08:00
CGH0S7	e861bfd45e	malloclab to finish	2025-05-26 19:19:19 +08:00
CGH0S7	4c3ef87f66	malloclab start	2025-05-21 14:41:01 +08:00
CGH0S7	1b0b28f910	shlab finished	2025-05-20 22:09:48 +08:00
CGH0S7	421a8ac1a4	cachelab fixed	2025-04-25 08:29:08 +08:00
CGH0S7	44051e5098	cachelab finished again	2025-04-25 00:36:49 +08:00
CGH0S7	92300134d2	cachelab finished	2025-04-24 22:32:48 +08:00
CGH0S7	ace7a46fb9	cachelab started	2025-04-21 23:52:27 +08:00
CGH0S7	cc99d9b5d9	perflab finished	2025-04-17 23:02:23 +08:00
CGH0S7	ba21f80f3b	matrix fixed	2025-04-12 11:37:07 +08:00